diff --git "a/wandb/run-20220315_195757-3ex43zbl/files/wandb-summary.json" "b/wandb/run-20220315_195757-3ex43zbl/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220315_195757-3ex43zbl/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 6.2245, "train/learning_rate": 2.911104513064133e-05, "train/epoch": 1.68, "train/global_step": 1500, "_runtime": 10153, "_timestamp": 1647384430, "_step": 1500, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 5.0, 5.0, 7.0, 1.0, 0.0, 72.0, 46.0, 19.0, 7.0, 8.0, 7.0, 29287.0, 914.0, 71.0, 22.0, 8.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.0, -89.25390625, -85.5078125, -81.76171875, -78.015625, -74.26953125, -70.5234375, -66.77734375, -63.03125, -59.28515625, -55.5390625, -51.79296875, -48.046875, -44.30078125, -40.5546875, -36.80859375, -33.0625, -29.31640625, -25.5703125, -21.82421875, -18.078125, -14.33203125, -10.5859375, -6.83984375, -3.09375, 0.65234375, 4.3984375, 8.14453125, 11.890625, 15.63671875, 19.3828125, 23.12890625, 26.875, 30.62109375, 34.3671875, 38.11328125, 41.859375, 45.60546875, 49.3515625, 53.09765625, 56.84375, 60.58984375, 64.3359375, 68.08203125, 71.828125, 75.57421875, 79.3203125, 83.06640625, 86.8125, 90.55859375, 94.3046875, 98.05078125, 101.796875, 105.54296875, 109.2890625, 113.03515625, 116.78125, 120.52734375, 124.2734375, 128.01953125, 131.765625, 135.51171875, 139.2578125, 143.00390625, 146.75]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 4.0, 6.0, 10.0, 22.0, 27.0, 34.0, 29.0, 39.0, 45.0, 50.0, 66.0, 59.0, 69.0, 61.0, 64.0, 71.0, 62.0, 46.0, 47.0, 45.0, 30.0, 27.0, 22.0, 14.0, 14.0, 11.0, 3.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.6536750793457, -34.22751998901367, -32.80136489868164, -31.375207901000977, -29.949052810668945, -28.522897720336914, -27.09674072265625, -25.67058563232422, -24.244430541992188, -22.818275451660156, -21.392120361328125, -19.96596336364746, -18.53980827331543, -17.1136531829834, -15.68749713897705, -14.261341094970703, -12.835186004638672, -11.40903091430664, -9.982874870300293, -8.556718826293945, -7.130563735961914, -5.704408168792725, -4.278252601623535, -2.8520965576171875, -1.4259414672851562, 0.00021409988403320312, 1.4263696670532227, 2.852525234222412, 4.278680801391602, 5.704836368560791, 7.1309919357299805, 8.557147979736328, 9.98330307006836, 11.40945816040039, 12.835614204406738, 14.261770248413086, 15.687925338745117, 17.11408042907715, 18.540237426757812, 19.966392517089844, 21.392547607421875, 22.818702697753906, 24.244857788085938, 25.6710147857666, 27.097169876098633, 28.523324966430664, 29.949481964111328, 31.37563705444336, 32.80179214477539, 34.22794723510742, 35.65410232543945, 37.080257415771484, 38.50641632080078, 39.93257141113281, 41.358726501464844, 42.784881591796875, 44.211036682128906, 45.63719177246094, 47.06334686279297, 48.489501953125, 49.91565704345703, 51.34181594848633, 52.76797103881836, 54.19412612915039, 55.62028121948242]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 9.0, 9.0, 13.0, 12.0, 12.0, 11.0, 13.0, 16.0, 10.0, 14.0, 17.0, 21.0, 25.0, 29.0, 28.0, 24.0, 43.0, 41.0, 40.0, 47.0, 44.0, 33.0, 36.0, 32.0, 27.0, 44.0, 48.0, 38.0, 27.0, 24.0, 27.0, 21.0, 20.0, 18.0, 18.0, 15.0, 16.0, 14.0, 9.0, 11.0, 8.0, 7.0, 7.0, 3.0, 9.0, 1.0, 2.0, 4.0, 3.0, 1.0, 2.0], "bins": [-30.464330673217773, -29.572296142578125, -28.68026351928711, -27.78822898864746, -26.896196365356445, -26.004161834716797, -25.11212921142578, -24.220094680786133, -23.328060150146484, -22.436025619506836, -21.54399299621582, -20.651958465576172, -19.759925842285156, -18.867891311645508, -17.97585678100586, -17.083824157714844, -16.191791534423828, -15.299757957458496, -14.407724380493164, -13.515689849853516, -12.6236572265625, -11.731622695922852, -10.83958911895752, -9.947555541992188, -9.055521965026855, -8.163488388061523, -7.271454811096191, -6.379420757293701, -5.487387180328369, -4.595353603363037, -3.703319549560547, -2.811285972595215, -1.9192543029785156, -1.027220606803894, -0.13518691062927246, 0.7568469047546387, 1.6488804817199707, 2.5409140586853027, 3.432948112487793, 4.324981689453125, 5.217015266418457, 6.109048843383789, 7.001082420349121, 7.893116474151611, 8.785150527954102, 9.677183151245117, 10.569217681884766, 11.461251258850098, 12.35328483581543, 13.245318412780762, 14.137351989746094, 15.029386520385742, 15.921419143676758, 16.813453674316406, 17.705486297607422, 18.59752082824707, 19.48955535888672, 20.381589889526367, 21.273622512817383, 22.16565704345703, 23.057689666748047, 23.949724197387695, 24.841758728027344, 25.73379135131836, 26.625823974609375]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 15.0, 22.0, 24.0, 26.0, 28.0, 77.0, 106.0, 153.0, 235.0, 313.0, 437.0, 693.0, 969.0, 1480.0, 2146.0, 3115.0, 4553.0, 6683.0, 9978.0, 14330.0, 21524.0, 31327.0, 46596.0, 69768.0, 111900.0, 223754.0, 196708.0, 102575.0, 64611.0, 42971.0, 29183.0, 19803.0, 13421.0, 9066.0, 6318.0, 4358.0, 2877.0, 1982.0, 1405.0, 870.0, 695.0, 438.0, 332.0, 208.0, 141.0, 97.0, 91.0, 40.0, 39.0, 20.0, 14.0, 12.0, 11.0, 8.0, 7.0, 6.0, 1.0, 1.0], "bins": [-88.9375, -86.150390625, -83.36328125, -80.576171875, -77.7890625, -75.001953125, -72.21484375, -69.427734375, -66.640625, -63.853515625, -61.06640625, -58.279296875, -55.4921875, -52.705078125, -49.91796875, -47.130859375, -44.34375, -41.556640625, -38.76953125, -35.982421875, -33.1953125, -30.408203125, -27.62109375, -24.833984375, -22.046875, -19.259765625, -16.47265625, -13.685546875, -10.8984375, -8.111328125, -5.32421875, -2.537109375, 0.25, 3.037109375, 5.82421875, 8.611328125, 11.3984375, 14.185546875, 16.97265625, 19.759765625, 22.546875, 25.333984375, 28.12109375, 30.908203125, 33.6953125, 36.482421875, 39.26953125, 42.056640625, 44.84375, 47.630859375, 50.41796875, 53.205078125, 55.9921875, 58.779296875, 61.56640625, 64.353515625, 67.140625, 69.927734375, 72.71484375, 75.501953125, 78.2890625, 81.076171875, 83.86328125, 86.650390625, 89.4375]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 5.0, 4.0, 6.0, 6.0, 10.0, 7.0, 7.0, 9.0, 4.0, 14.0, 13.0, 14.0, 6.0, 17.0, 20.0, 27.0, 21.0, 26.0, 31.0, 37.0, 48.0, 73.0, 81.0, 96.0, 61.0, 49.0, 42.0, 28.0, 36.0, 28.0, 29.0, 23.0, 17.0, 18.0, 18.0, 6.0, 14.0, 6.0, 10.0, 9.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0], "bins": [-37.59375, -36.52099609375, -35.4482421875, -34.37548828125, -33.302734375, -32.22998046875, -31.1572265625, -30.08447265625, -29.01171875, -27.93896484375, -26.8662109375, -25.79345703125, -24.720703125, -23.64794921875, -22.5751953125, -21.50244140625, -20.4296875, -19.35693359375, -18.2841796875, -17.21142578125, -16.138671875, -15.06591796875, -13.9931640625, -12.92041015625, -11.84765625, -10.77490234375, -9.7021484375, -8.62939453125, -7.556640625, -6.48388671875, -5.4111328125, -4.33837890625, -3.265625, -2.19287109375, -1.1201171875, -0.04736328125, 1.025390625, 2.09814453125, 3.1708984375, 4.24365234375, 5.31640625, 6.38916015625, 7.4619140625, 8.53466796875, 9.607421875, 10.68017578125, 11.7529296875, 12.82568359375, 13.8984375, 14.97119140625, 16.0439453125, 17.11669921875, 18.189453125, 19.26220703125, 20.3349609375, 21.40771484375, 22.48046875, 23.55322265625, 24.6259765625, 25.69873046875, 26.771484375, 27.84423828125, 28.9169921875, 29.98974609375, 31.0625]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 5.0, 7.0, 9.0, 9.0, 8.0, 8.0, 12.0, 17.0, 12.0, 19.0, 20.0, 24.0, 38.0, 31.0, 47.0, 48.0, 61.0, 51.0, 59.0, 56.0, 48.0, 48.0, 46.0, 37.0, 52.0, 33.0, 35.0, 27.0, 19.0, 26.0, 16.0, 19.0, 12.0, 9.0, 7.0, 3.0, 2.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0], "bins": [-26.355745315551758, -25.658567428588867, -24.96139144897461, -24.26421356201172, -23.567035675048828, -22.86985969543457, -22.17268180847168, -21.475505828857422, -20.77832794189453, -20.08115005493164, -19.383974075317383, -18.686796188354492, -17.989620208740234, -17.292442321777344, -16.595264434814453, -15.898087501525879, -15.200910568237305, -14.50373363494873, -13.806556701660156, -13.109378814697266, -12.412201881408691, -11.715024948120117, -11.017847061157227, -10.320670127868652, -9.623493194580078, -8.926316261291504, -8.22913932800293, -7.531961441040039, -6.834784507751465, -6.137607574462891, -5.440430164337158, -4.743252754211426, -4.046075820922852, -3.3488986492156982, -2.651721477508545, -1.9545443058013916, -1.2573671340942383, -0.560189962387085, 0.13698720932006836, 0.8341646194458008, 1.531341552734375, 2.2285187244415283, 2.9256958961486816, 3.622873067855835, 4.320050239562988, 5.0172271728515625, 5.714404582977295, 6.411581993103027, 7.108758926391602, 7.805935859680176, 8.50311279296875, 9.20029067993164, 9.897467613220215, 10.594644546508789, 11.29182243347168, 11.988999366760254, 12.686176300048828, 13.383353233337402, 14.080530166625977, 14.777708053588867, 15.474884986877441, 16.172061920166016, 16.869239807128906, 17.566417694091797, 18.263593673706055]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 12.0, 7.0, 9.0, 19.0, 10.0, 19.0, 17.0, 24.0, 27.0, 23.0, 19.0, 39.0, 40.0, 40.0, 48.0, 39.0, 50.0, 43.0, 44.0, 53.0, 47.0, 40.0, 47.0, 43.0, 33.0, 31.0, 34.0, 19.0, 25.0, 17.0, 20.0, 10.0, 8.0, 9.0, 11.0, 10.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.76949691772461, -25.030296325683594, -24.29109764099121, -23.551897048950195, -22.812698364257812, -22.073497772216797, -21.33429718017578, -20.595096588134766, -19.855897903442383, -19.116697311401367, -18.377498626708984, -17.63829803466797, -16.899097442626953, -16.15989875793457, -15.420698165893555, -14.681498527526855, -13.942298889160156, -13.203099250793457, -12.463899612426758, -11.724699020385742, -10.985499382019043, -10.246299743652344, -9.507099151611328, -8.767899513244629, -8.02869987487793, -7.2895002365112305, -6.550300121307373, -5.811100006103516, -5.071900367736816, -4.332700729370117, -3.5935006141662598, -2.8543004989624023, -2.115100860595703, -1.3759009838104248, -0.6367011070251465, 0.10249876976013184, 0.8416986465454102, 1.5808985233306885, 2.320098400115967, 3.059298515319824, 3.7984981536865234, 4.537697792053223, 5.27689790725708, 6.0160980224609375, 6.755297660827637, 7.494497299194336, 8.233697891235352, 8.97289752960205, 9.71209716796875, 10.45129680633545, 11.190496444702148, 11.929697036743164, 12.668896675109863, 13.408096313476562, 14.147296905517578, 14.886496543884277, 15.625696182250977, 16.364896774291992, 17.104095458984375, 17.84329605102539, 18.582496643066406, 19.32169532775879, 20.060895919799805, 20.800094604492188, 21.539295196533203]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 5.0, 10.0, 19.0, 17.0, 21.0, 39.0, 53.0, 88.0, 105.0, 170.0, 240.0, 406.0, 658.0, 943.0, 1399.0, 2358.0, 3811.0, 6306.0, 10525.0, 17724.0, 30226.0, 53161.0, 96010.0, 192532.0, 466094.0, 1024207.0, 1162778.0, 614647.0, 246847.0, 116119.0, 61634.0, 34652.0, 20180.0, 11771.0, 7047.0, 4270.0, 2639.0, 1661.0, 1035.0, 659.0, 417.0, 282.0, 167.0, 125.0, 76.0, 44.0, 37.0, 28.0, 15.0, 11.0, 8.0, 4.0, 0.0, 4.0, 1.0, 1.0], "bins": [-23.71875, -23.024169921875, -22.32958984375, -21.635009765625, -20.9404296875, -20.245849609375, -19.55126953125, -18.856689453125, -18.162109375, -17.467529296875, -16.77294921875, -16.078369140625, -15.3837890625, -14.689208984375, -13.99462890625, -13.300048828125, -12.60546875, -11.910888671875, -11.21630859375, -10.521728515625, -9.8271484375, -9.132568359375, -8.43798828125, -7.743408203125, -7.048828125, -6.354248046875, -5.65966796875, -4.965087890625, -4.2705078125, -3.575927734375, -2.88134765625, -2.186767578125, -1.4921875, -0.797607421875, -0.10302734375, 0.591552734375, 1.2861328125, 1.980712890625, 2.67529296875, 3.369873046875, 4.064453125, 4.759033203125, 5.45361328125, 6.148193359375, 6.8427734375, 7.537353515625, 8.23193359375, 8.926513671875, 9.62109375, 10.315673828125, 11.01025390625, 11.704833984375, 12.3994140625, 13.093994140625, 13.78857421875, 14.483154296875, 15.177734375, 15.872314453125, 16.56689453125, 17.261474609375, 17.9560546875, 18.650634765625, 19.34521484375, 20.039794921875, 20.734375]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 5.0, 6.0, 6.0, 9.0, 6.0, 16.0, 13.0, 13.0, 20.0, 18.0, 17.0, 27.0, 29.0, 38.0, 29.0, 37.0, 33.0, 39.0, 45.0, 37.0, 53.0, 47.0, 52.0, 43.0, 30.0, 38.0, 41.0, 34.0, 32.0, 34.0, 28.0, 14.0, 17.0, 22.0, 15.0, 10.0, 12.0, 9.0, 11.0, 5.0, 4.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-15.6171875, -15.1591796875, -14.701171875, -14.2431640625, -13.78515625, -13.3271484375, -12.869140625, -12.4111328125, -11.953125, -11.4951171875, -11.037109375, -10.5791015625, -10.12109375, -9.6630859375, -9.205078125, -8.7470703125, -8.2890625, -7.8310546875, -7.373046875, -6.9150390625, -6.45703125, -5.9990234375, -5.541015625, -5.0830078125, -4.625, -4.1669921875, -3.708984375, -3.2509765625, -2.79296875, -2.3349609375, -1.876953125, -1.4189453125, -0.9609375, -0.5029296875, -0.044921875, 0.4130859375, 0.87109375, 1.3291015625, 1.787109375, 2.2451171875, 2.703125, 3.1611328125, 3.619140625, 4.0771484375, 4.53515625, 4.9931640625, 5.451171875, 5.9091796875, 6.3671875, 6.8251953125, 7.283203125, 7.7412109375, 8.19921875, 8.6572265625, 9.115234375, 9.5732421875, 10.03125, 10.4892578125, 10.947265625, 11.4052734375, 11.86328125, 12.3212890625, 12.779296875, 13.2373046875, 13.6953125]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 7.0, 7.0, 18.0, 27.0, 36.0, 59.0, 112.0, 147.0, 224.0, 380.0, 604.0, 998.0, 1770.0, 2956.0, 5304.0, 9388.0, 16770.0, 30481.0, 56977.0, 106311.0, 201056.0, 385881.0, 757437.0, 1139210.0, 708924.0, 362159.0, 188552.0, 99252.0, 53350.0, 28865.0, 15701.0, 8892.0, 5103.0, 2938.0, 1630.0, 1063.0, 611.0, 381.0, 245.0, 162.0, 96.0, 70.0, 31.0, 34.0, 15.0, 12.0, 13.0, 9.0, 6.0, 2.0, 1.0, 2.0, 1.0], "bins": [-22.40625, -21.755859375, -21.10546875, -20.455078125, -19.8046875, -19.154296875, -18.50390625, -17.853515625, -17.203125, -16.552734375, -15.90234375, -15.251953125, -14.6015625, -13.951171875, -13.30078125, -12.650390625, -12.0, -11.349609375, -10.69921875, -10.048828125, -9.3984375, -8.748046875, -8.09765625, -7.447265625, -6.796875, -6.146484375, -5.49609375, -4.845703125, -4.1953125, -3.544921875, -2.89453125, -2.244140625, -1.59375, -0.943359375, -0.29296875, 0.357421875, 1.0078125, 1.658203125, 2.30859375, 2.958984375, 3.609375, 4.259765625, 4.91015625, 5.560546875, 6.2109375, 6.861328125, 7.51171875, 8.162109375, 8.8125, 9.462890625, 10.11328125, 10.763671875, 11.4140625, 12.064453125, 12.71484375, 13.365234375, 14.015625, 14.666015625, 15.31640625, 15.966796875, 16.6171875, 17.267578125, 17.91796875, 18.568359375, 19.21875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 7.0, 11.0, 13.0, 11.0, 15.0, 22.0, 34.0, 44.0, 49.0, 66.0, 81.0, 95.0, 103.0, 127.0, 166.0, 215.0, 249.0, 289.0, 387.0, 366.0, 337.0, 266.0, 247.0, 195.0, 141.0, 131.0, 111.0, 71.0, 59.0, 41.0, 29.0, 26.0, 32.0, 11.0, 9.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.46875, -8.2138671875, -7.958984375, -7.7041015625, -7.44921875, -7.1943359375, -6.939453125, -6.6845703125, -6.4296875, -6.1748046875, -5.919921875, -5.6650390625, -5.41015625, -5.1552734375, -4.900390625, -4.6455078125, -4.390625, -4.1357421875, -3.880859375, -3.6259765625, -3.37109375, -3.1162109375, -2.861328125, -2.6064453125, -2.3515625, -2.0966796875, -1.841796875, -1.5869140625, -1.33203125, -1.0771484375, -0.822265625, -0.5673828125, -0.3125, -0.0576171875, 0.197265625, 0.4521484375, 0.70703125, 0.9619140625, 1.216796875, 1.4716796875, 1.7265625, 1.9814453125, 2.236328125, 2.4912109375, 2.74609375, 3.0009765625, 3.255859375, 3.5107421875, 3.765625, 4.0205078125, 4.275390625, 4.5302734375, 4.78515625, 5.0400390625, 5.294921875, 5.5498046875, 5.8046875, 6.0595703125, 6.314453125, 6.5693359375, 6.82421875, 7.0791015625, 7.333984375, 7.5888671875, 7.84375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 3.0, 1.0, 4.0, 5.0, 8.0, 7.0, 8.0, 14.0, 11.0, 21.0, 28.0, 25.0, 24.0, 40.0, 47.0, 52.0, 57.0, 54.0, 79.0, 64.0, 68.0, 66.0, 43.0, 42.0, 40.0, 42.0, 32.0, 25.0, 20.0, 22.0, 12.0, 10.0, 9.0, 2.0, 7.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.973779678344727, -21.361480712890625, -20.749181747436523, -20.13688087463379, -19.524581909179688, -18.912282943725586, -18.299983978271484, -17.687685012817383, -17.07538604736328, -16.46308708190918, -15.850787162780762, -15.23848819732666, -14.626188278198242, -14.01388931274414, -13.401590347290039, -12.789291381835938, -12.176990509033203, -11.564691543579102, -10.952391624450684, -10.340092658996582, -9.727792739868164, -9.115493774414062, -8.503194808959961, -7.890895366668701, -7.278595924377441, -6.666296482086182, -6.053997039794922, -5.44169807434082, -4.8293986320495605, -4.217099189758301, -3.60479998588562, -2.9925007820129395, -2.3802013397216797, -1.7679020166397095, -1.1556026935577393, -0.543303370475769, 0.06899595260620117, 0.6812953948974609, 1.2935945987701416, 1.9058938026428223, 2.518193244934082, 3.130492687225342, 3.7427918910980225, 4.355091094970703, 4.967390537261963, 5.579689979553223, 6.191988945007324, 6.804288387298584, 7.416587829589844, 8.028886795043945, 8.641186714172363, 9.253485679626465, 9.865785598754883, 10.478084564208984, 11.090383529663086, 11.702682495117188, 12.314982414245605, 12.927281379699707, 13.539581298828125, 14.151880264282227, 14.764179229736328, 15.376479148864746, 15.988778114318848, 16.601078033447266, 17.213376998901367]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 3.0, 5.0, 4.0, 9.0, 10.0, 8.0, 11.0, 12.0, 11.0, 17.0, 23.0, 31.0, 22.0, 33.0, 41.0, 39.0, 32.0, 27.0, 39.0, 38.0, 43.0, 45.0, 45.0, 48.0, 40.0, 40.0, 34.0, 42.0, 38.0, 18.0, 24.0, 21.0, 26.0, 17.0, 24.0, 18.0, 11.0, 11.0, 6.0, 11.0, 8.0, 6.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.264737129211426, -14.750859260559082, -14.236982345581055, -13.723104476928711, -13.209226608276367, -12.695348739624023, -12.18147087097168, -11.667593955993652, -11.153716087341309, -10.639838218688965, -10.125961303710938, -9.612083435058594, -9.09820556640625, -8.584327697753906, -8.070449829101562, -7.556572914123535, -7.042695045471191, -6.528817176818848, -6.014939785003662, -5.501062393188477, -4.987184524536133, -4.473306655883789, -3.9594292640686035, -3.445551633834839, -2.931674003601074, -2.4177963733673096, -1.903918743133545, -1.3900411128997803, -0.8761634826660156, -0.362285852432251, 0.15159177780151367, 0.6654694080352783, 1.1793460845947266, 1.6932237148284912, 2.207101345062256, 2.7209789752960205, 3.234856605529785, 3.74873423576355, 4.2626118659973145, 4.7764892578125, 5.290367126464844, 5.8042449951171875, 6.318122386932373, 6.831999778747559, 7.345877647399902, 7.859755516052246, 8.373632431030273, 8.887510299682617, 9.401388168334961, 9.915266036987305, 10.429143905639648, 10.943020820617676, 11.45689868927002, 11.970776557922363, 12.48465347290039, 12.998531341552734, 13.512409210205078, 14.026287078857422, 14.540164947509766, 15.054041862487793, 15.567919731140137, 16.081796646118164, 16.595674514770508, 17.10955238342285, 17.623430252075195]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 6.0, 10.0, 16.0, 16.0, 23.0, 36.0, 70.0, 91.0, 123.0, 173.0, 289.0, 396.0, 562.0, 899.0, 1384.0, 2138.0, 3493.0, 5664.0, 9726.0, 17606.0, 33708.0, 67287.0, 141155.0, 266167.0, 244987.0, 124242.0, 59593.0, 29764.0, 15902.0, 8806.0, 5245.0, 3096.0, 2041.0, 1308.0, 816.0, 541.0, 354.0, 249.0, 150.0, 111.0, 92.0, 71.0, 36.0, 34.0, 20.0, 16.0, 16.0, 7.0, 9.0, 0.0, 4.0, 5.0], "bins": [-10.7890625, -10.4886474609375, -10.188232421875, -9.8878173828125, -9.58740234375, -9.2869873046875, -8.986572265625, -8.6861572265625, -8.3857421875, -8.0853271484375, -7.784912109375, -7.4844970703125, -7.18408203125, -6.8836669921875, -6.583251953125, -6.2828369140625, -5.982421875, -5.6820068359375, -5.381591796875, -5.0811767578125, -4.78076171875, -4.4803466796875, -4.179931640625, -3.8795166015625, -3.5791015625, -3.2786865234375, -2.978271484375, -2.6778564453125, -2.37744140625, -2.0770263671875, -1.776611328125, -1.4761962890625, -1.17578125, -0.8753662109375, -0.574951171875, -0.2745361328125, 0.02587890625, 0.3262939453125, 0.626708984375, 0.9271240234375, 1.2275390625, 1.5279541015625, 1.828369140625, 2.1287841796875, 2.42919921875, 2.7296142578125, 3.030029296875, 3.3304443359375, 3.630859375, 3.9312744140625, 4.231689453125, 4.5321044921875, 4.83251953125, 5.1329345703125, 5.433349609375, 5.7337646484375, 6.0341796875, 6.3345947265625, 6.635009765625, 6.9354248046875, 7.23583984375, 7.5362548828125, 7.836669921875, 8.1370849609375, 8.4375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 4.0, 2.0, 5.0, 5.0, 5.0, 15.0, 12.0, 9.0, 13.0, 13.0, 17.0, 17.0, 14.0, 25.0, 25.0, 38.0, 39.0, 31.0, 47.0, 41.0, 39.0, 45.0, 36.0, 43.0, 30.0, 38.0, 40.0, 39.0, 42.0, 44.0, 31.0, 25.0, 23.0, 22.0, 20.0, 20.0, 13.0, 14.0, 15.0, 15.0, 15.0, 4.0, 3.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.46875, -14.97412109375, -14.4794921875, -13.98486328125, -13.490234375, -12.99560546875, -12.5009765625, -12.00634765625, -11.51171875, -11.01708984375, -10.5224609375, -10.02783203125, -9.533203125, -9.03857421875, -8.5439453125, -8.04931640625, -7.5546875, -7.06005859375, -6.5654296875, -6.07080078125, -5.576171875, -5.08154296875, -4.5869140625, -4.09228515625, -3.59765625, -3.10302734375, -2.6083984375, -2.11376953125, -1.619140625, -1.12451171875, -0.6298828125, -0.13525390625, 0.359375, 0.85400390625, 1.3486328125, 1.84326171875, 2.337890625, 2.83251953125, 3.3271484375, 3.82177734375, 4.31640625, 4.81103515625, 5.3056640625, 5.80029296875, 6.294921875, 6.78955078125, 7.2841796875, 7.77880859375, 8.2734375, 8.76806640625, 9.2626953125, 9.75732421875, 10.251953125, 10.74658203125, 11.2412109375, 11.73583984375, 12.23046875, 12.72509765625, 13.2197265625, 13.71435546875, 14.208984375, 14.70361328125, 15.1982421875, 15.69287109375, 16.1875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 9.0, 11.0, 13.0, 9.0, 15.0, 35.0, 39.0, 64.0, 89.0, 94.0, 158.0, 262.0, 415.0, 683.0, 1248.0, 2313.0, 5101.0, 13822.0, 56400.0, 923970.0, 27431.0, 8634.0, 3483.0, 1737.0, 960.0, 557.0, 327.0, 216.0, 161.0, 86.0, 54.0, 39.0, 34.0, 14.0, 21.0, 12.0, 8.0, 8.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0], "bins": [-24.296875, -23.566650390625, -22.83642578125, -22.106201171875, -21.3759765625, -20.645751953125, -19.91552734375, -19.185302734375, -18.455078125, -17.724853515625, -16.99462890625, -16.264404296875, -15.5341796875, -14.803955078125, -14.07373046875, -13.343505859375, -12.61328125, -11.883056640625, -11.15283203125, -10.422607421875, -9.6923828125, -8.962158203125, -8.23193359375, -7.501708984375, -6.771484375, -6.041259765625, -5.31103515625, -4.580810546875, -3.8505859375, -3.120361328125, -2.39013671875, -1.659912109375, -0.9296875, -0.199462890625, 0.53076171875, 1.260986328125, 1.9912109375, 2.721435546875, 3.45166015625, 4.181884765625, 4.912109375, 5.642333984375, 6.37255859375, 7.102783203125, 7.8330078125, 8.563232421875, 9.29345703125, 10.023681640625, 10.75390625, 11.484130859375, 12.21435546875, 12.944580078125, 13.6748046875, 14.405029296875, 15.13525390625, 15.865478515625, 16.595703125, 17.325927734375, 18.05615234375, 18.786376953125, 19.5166015625, 20.246826171875, 20.97705078125, 21.707275390625, 22.4375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 6.0, 2.0, 6.0, 6.0, 4.0, 3.0, 11.0, 13.0, 8.0, 17.0, 15.0, 18.0, 24.0, 20.0, 22.0, 28.0, 21.0, 49.0, 54.0, 44.0, 31.0, 34.0, 37.0, 38.0, 39.0, 30.0, 31.0, 45.0, 53.0, 28.0, 22.0, 31.0, 35.0, 24.0, 23.0, 16.0, 21.0, 12.0, 19.0, 17.0, 8.0, 13.0, 6.0, 8.0, 3.0, 4.0, 2.0, 6.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.3671875, -10.0299072265625, -9.692626953125, -9.3553466796875, -9.01806640625, -8.6807861328125, -8.343505859375, -8.0062255859375, -7.6689453125, -7.3316650390625, -6.994384765625, -6.6571044921875, -6.31982421875, -5.9825439453125, -5.645263671875, -5.3079833984375, -4.970703125, -4.6334228515625, -4.296142578125, -3.9588623046875, -3.62158203125, -3.2843017578125, -2.947021484375, -2.6097412109375, -2.2724609375, -1.9351806640625, -1.597900390625, -1.2606201171875, -0.92333984375, -0.5860595703125, -0.248779296875, 0.0885009765625, 0.42578125, 0.7630615234375, 1.100341796875, 1.4376220703125, 1.77490234375, 2.1121826171875, 2.449462890625, 2.7867431640625, 3.1240234375, 3.4613037109375, 3.798583984375, 4.1358642578125, 4.47314453125, 4.8104248046875, 5.147705078125, 5.4849853515625, 5.822265625, 6.1595458984375, 6.496826171875, 6.8341064453125, 7.17138671875, 7.5086669921875, 7.845947265625, 8.1832275390625, 8.5205078125, 8.8577880859375, 9.195068359375, 9.5323486328125, 9.86962890625, 10.2069091796875, 10.544189453125, 10.8814697265625, 11.21875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 1.0, 3.0, 3.0, 4.0, 6.0, 11.0, 14.0, 17.0, 33.0, 31.0, 56.0, 67.0, 85.0, 125.0, 190.0, 244.0, 342.0, 502.0, 733.0, 1014.0, 1596.0, 2428.0, 4357.0, 8438.0, 21659.0, 902839.0, 69861.0, 16397.0, 6964.0, 3826.0, 2166.0, 1402.0, 884.0, 675.0, 453.0, 313.0, 221.0, 175.0, 106.0, 75.0, 72.0, 35.0, 38.0, 20.0, 25.0, 13.0, 16.0, 7.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-4.921875, -4.7674560546875, -4.613037109375, -4.4586181640625, -4.30419921875, -4.1497802734375, -3.995361328125, -3.8409423828125, -3.6865234375, -3.5321044921875, -3.377685546875, -3.2232666015625, -3.06884765625, -2.9144287109375, -2.760009765625, -2.6055908203125, -2.451171875, -2.2967529296875, -2.142333984375, -1.9879150390625, -1.83349609375, -1.6790771484375, -1.524658203125, -1.3702392578125, -1.2158203125, -1.0614013671875, -0.906982421875, -0.7525634765625, -0.59814453125, -0.4437255859375, -0.289306640625, -0.1348876953125, 0.01953125, 0.1739501953125, 0.328369140625, 0.4827880859375, 0.63720703125, 0.7916259765625, 0.946044921875, 1.1004638671875, 1.2548828125, 1.4093017578125, 1.563720703125, 1.7181396484375, 1.87255859375, 2.0269775390625, 2.181396484375, 2.3358154296875, 2.490234375, 2.6446533203125, 2.799072265625, 2.9534912109375, 3.10791015625, 3.2623291015625, 3.416748046875, 3.5711669921875, 3.7255859375, 3.8800048828125, 4.034423828125, 4.1888427734375, 4.34326171875, 4.4976806640625, 4.652099609375, 4.8065185546875, 4.9609375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 9.0, 7.0, 9.0, 19.0, 41.0, 105.0, 368.0, 270.0, 60.0, 24.0, 17.0, 10.0, 4.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005702972412109375, -0.000551760196685791, -0.0005332231521606445, -0.000514686107635498, -0.0004961490631103516, -0.0004776120185852051, -0.0004590749740600586, -0.0004405379295349121, -0.0004220008850097656, -0.00040346384048461914, -0.00038492679595947266, -0.00036638975143432617, -0.0003478527069091797, -0.0003293156623840332, -0.0003107786178588867, -0.00029224157333374023, -0.00027370452880859375, -0.00025516748428344727, -0.00023663043975830078, -0.0002180933952331543, -0.0001995563507080078, -0.00018101930618286133, -0.00016248226165771484, -0.00014394521713256836, -0.00012540817260742188, -0.00010687112808227539, -8.83340835571289e-05, -6.979703903198242e-05, -5.125999450683594e-05, -3.272294998168945e-05, -1.4185905456542969e-05, 4.351139068603516e-06, 2.288818359375e-05, 4.1425228118896484e-05, 5.996227264404297e-05, 7.849931716918945e-05, 9.703636169433594e-05, 0.00011557340621948242, 0.0001341104507446289, 0.0001526474952697754, 0.00017118453979492188, 0.00018972158432006836, 0.00020825862884521484, 0.00022679567337036133, 0.0002453327178955078, 0.0002638697624206543, 0.0002824068069458008, 0.00030094385147094727, 0.00031948089599609375, 0.00033801794052124023, 0.0003565549850463867, 0.0003750920295715332, 0.0003936290740966797, 0.00041216611862182617, 0.00043070316314697266, 0.00044924020767211914, 0.0004677772521972656, 0.0004863142967224121, 0.0005048513412475586, 0.0005233883857727051, 0.0005419254302978516, 0.000560462474822998, 0.0005789995193481445, 0.000597536563873291, 0.0006160736083984375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 18.0, 16.0, 31.0, 47.0, 60.0, 84.0, 96.0, 144.0, 204.0, 319.0, 420.0, 659.0, 926.0, 1377.0, 2091.0, 3294.0, 5094.0, 8139.0, 12865.0, 21895.0, 39728.0, 84105.0, 256286.0, 384015.0, 109847.0, 49127.0, 26273.0, 15205.0, 9237.0, 5940.0, 3728.0, 2407.0, 1587.0, 1041.0, 677.0, 480.0, 348.0, 222.0, 173.0, 92.0, 88.0, 50.0, 32.0, 33.0, 16.0, 16.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2890625, -2.217864990234375, -2.14666748046875, -2.075469970703125, -2.0042724609375, -1.933074951171875, -1.86187744140625, -1.790679931640625, -1.719482421875, -1.648284912109375, -1.57708740234375, -1.505889892578125, -1.4346923828125, -1.363494873046875, -1.29229736328125, -1.221099853515625, -1.14990234375, -1.078704833984375, -1.00750732421875, -0.936309814453125, -0.8651123046875, -0.793914794921875, -0.72271728515625, -0.651519775390625, -0.580322265625, -0.509124755859375, -0.43792724609375, -0.366729736328125, -0.2955322265625, -0.224334716796875, -0.15313720703125, -0.081939697265625, -0.0107421875, 0.060455322265625, 0.13165283203125, 0.202850341796875, 0.2740478515625, 0.345245361328125, 0.41644287109375, 0.487640380859375, 0.558837890625, 0.630035400390625, 0.70123291015625, 0.772430419921875, 0.8436279296875, 0.914825439453125, 0.98602294921875, 1.057220458984375, 1.12841796875, 1.199615478515625, 1.27081298828125, 1.342010498046875, 1.4132080078125, 1.484405517578125, 1.55560302734375, 1.626800537109375, 1.697998046875, 1.769195556640625, 1.84039306640625, 1.911590576171875, 1.9827880859375, 2.053985595703125, 2.12518310546875, 2.196380615234375, 2.267578125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 3.0, 7.0, 6.0, 5.0, 7.0, 4.0, 13.0, 16.0, 14.0, 11.0, 18.0, 20.0, 17.0, 23.0, 23.0, 41.0, 31.0, 38.0, 46.0, 66.0, 57.0, 77.0, 69.0, 49.0, 39.0, 37.0, 30.0, 35.0, 29.0, 20.0, 13.0, 22.0, 19.0, 14.0, 15.0, 11.0, 12.0, 13.0, 6.0, 6.0, 7.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.35107421875, -0.3411293029785156, -0.33118438720703125, -0.3212394714355469, -0.3112945556640625, -0.3013496398925781, -0.29140472412109375, -0.2814598083496094, -0.271514892578125, -0.2615699768066406, -0.25162506103515625, -0.24168014526367188, -0.2317352294921875, -0.22179031372070312, -0.21184539794921875, -0.20190048217773438, -0.19195556640625, -0.18201065063476562, -0.17206573486328125, -0.16212081909179688, -0.1521759033203125, -0.14223098754882812, -0.13228607177734375, -0.12234115600585938, -0.112396240234375, -0.10245132446289062, -0.09250640869140625, -0.08256149291992188, -0.0726165771484375, -0.06267166137695312, -0.05272674560546875, -0.042781829833984375, -0.0328369140625, -0.022891998291015625, -0.01294708251953125, -0.003002166748046875, 0.0069427490234375, 0.016887664794921875, 0.02683258056640625, 0.036777496337890625, 0.046722412109375, 0.056667327880859375, 0.06661224365234375, 0.07655715942382812, 0.0865020751953125, 0.09644699096679688, 0.10639190673828125, 0.11633682250976562, 0.12628173828125, 0.13622665405273438, 0.14617156982421875, 0.15611648559570312, 0.1660614013671875, 0.17600631713867188, 0.18595123291015625, 0.19589614868164062, 0.205841064453125, 0.21578598022460938, 0.22573089599609375, 0.23567581176757812, 0.2456207275390625, 0.2555656433105469, 0.26551055908203125, 0.2754554748535156, 0.285400390625]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 1.0, 3.0, 6.0, 3.0, 3.0, 10.0, 6.0, 16.0, 8.0, 24.0, 26.0, 27.0, 30.0, 48.0, 41.0, 53.0, 61.0, 78.0, 74.0, 68.0, 67.0, 57.0, 42.0, 47.0, 36.0, 33.0, 35.0, 15.0, 21.0, 19.0, 9.0, 15.0, 9.0, 3.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.311752319335938, -20.713884353637695, -20.116018295288086, -19.518150329589844, -18.920284271240234, -18.322416305541992, -17.72454833984375, -17.12668228149414, -16.5288143157959, -15.930947303771973, -15.333080291748047, -14.735212326049805, -14.137345314025879, -13.539478302001953, -12.941610336303711, -12.343743324279785, -11.74587631225586, -11.148009300231934, -10.550142288208008, -9.952274322509766, -9.35440731048584, -8.756540298461914, -8.158672332763672, -7.560805320739746, -6.96293830871582, -6.3650712966918945, -5.7672038078308105, -5.169336318969727, -4.571469306945801, -3.973602056503296, -3.375734806060791, -2.777867317199707, -2.1800003051757812, -1.5821330547332764, -0.9842658042907715, -0.3863985538482666, 0.21146869659423828, 0.8093359470367432, 1.407203197479248, 2.005070686340332, 2.602937698364258, 3.2008049488067627, 3.7986721992492676, 4.396539688110352, 4.994406700134277, 5.592273712158203, 6.190141201019287, 6.788008689880371, 7.385875701904297, 7.983742713928223, 8.581609725952148, 9.17947769165039, 9.777344703674316, 10.375211715698242, 10.973079681396484, 11.57094669342041, 12.168813705444336, 12.766680717468262, 13.364547729492188, 13.96241569519043, 14.560282707214355, 15.158149719238281, 15.756017684936523, 16.353885650634766, 16.951751708984375]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 5.0, 9.0, 10.0, 6.0, 11.0, 10.0, 10.0, 23.0, 23.0, 26.0, 28.0, 31.0, 36.0, 41.0, 33.0, 29.0, 34.0, 33.0, 52.0, 41.0, 50.0, 43.0, 46.0, 36.0, 39.0, 39.0, 36.0, 18.0, 24.0, 25.0, 26.0, 15.0, 21.0, 20.0, 13.0, 11.0, 7.0, 10.0, 8.0, 6.0, 3.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.542332649230957, -14.054250717163086, -13.566168785095215, -13.078086853027344, -12.590005874633789, -12.101922988891602, -11.613842010498047, -11.125760078430176, -10.637678146362305, -10.149596214294434, -9.661514282226562, -9.173432350158691, -8.68535041809082, -8.197269439697266, -7.7091875076293945, -7.221105575561523, -6.733023643493652, -6.244941711425781, -5.75685977935791, -5.268778324127197, -4.780696392059326, -4.292614459991455, -3.804532766342163, -3.316451072692871, -2.828369140625, -2.340287208557129, -1.852205514907837, -1.3641237020492554, -0.8760418891906738, -0.38795995712280273, 0.10012173652648926, 0.5882034301757812, 1.0762863159179688, 1.5643681287765503, 2.052449941635132, 2.540531635284424, 3.028613567352295, 3.516695499420166, 4.004776954650879, 4.49285888671875, 4.980940818786621, 5.469022750854492, 5.957104682922363, 6.445186138153076, 6.933268070220947, 7.421350002288818, 7.909431457519531, 8.397513389587402, 8.885595321655273, 9.373677253723145, 9.861759185791016, 10.349841117858887, 10.837923049926758, 11.326004028320312, 11.814085960388184, 12.302167892456055, 12.790249824523926, 13.278331756591797, 13.766413688659668, 14.254495620727539, 14.742576599121094, 15.230659484863281, 15.718740463256836, 16.20682144165039, 16.694904327392578]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 15.0, 26.0, 45.0, 68.0, 83.0, 126.0, 201.0, 322.0, 410.0, 579.0, 931.0, 1410.0, 2100.0, 3286.0, 4997.0, 7708.0, 11915.0, 18942.0, 29885.0, 47147.0, 72510.0, 106796.0, 140469.0, 155847.0, 138985.0, 105210.0, 71399.0, 46205.0, 29039.0, 18502.0, 11618.0, 7366.0, 5034.0, 3117.0, 2039.0, 1372.0, 929.0, 621.0, 414.0, 301.0, 190.0, 132.0, 86.0, 55.0, 50.0, 21.0, 18.0, 14.0, 8.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-16.53125, -16.022216796875, -15.51318359375, -15.004150390625, -14.4951171875, -13.986083984375, -13.47705078125, -12.968017578125, -12.458984375, -11.949951171875, -11.44091796875, -10.931884765625, -10.4228515625, -9.913818359375, -9.40478515625, -8.895751953125, -8.38671875, -7.877685546875, -7.36865234375, -6.859619140625, -6.3505859375, -5.841552734375, -5.33251953125, -4.823486328125, -4.314453125, -3.805419921875, -3.29638671875, -2.787353515625, -2.2783203125, -1.769287109375, -1.26025390625, -0.751220703125, -0.2421875, 0.266845703125, 0.77587890625, 1.284912109375, 1.7939453125, 2.302978515625, 2.81201171875, 3.321044921875, 3.830078125, 4.339111328125, 4.84814453125, 5.357177734375, 5.8662109375, 6.375244140625, 6.88427734375, 7.393310546875, 7.90234375, 8.411376953125, 8.92041015625, 9.429443359375, 9.9384765625, 10.447509765625, 10.95654296875, 11.465576171875, 11.974609375, 12.483642578125, 12.99267578125, 13.501708984375, 14.0107421875, 14.519775390625, 15.02880859375, 15.537841796875, 16.046875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 8.0, 7.0, 5.0, 5.0, 9.0, 5.0, 8.0, 10.0, 18.0, 15.0, 19.0, 24.0, 26.0, 22.0, 35.0, 30.0, 34.0, 30.0, 40.0, 32.0, 39.0, 34.0, 44.0, 41.0, 41.0, 47.0, 42.0, 50.0, 32.0, 33.0, 27.0, 20.0, 20.0, 26.0, 18.0, 23.0, 12.0, 14.0, 13.0, 6.0, 8.0, 9.0, 10.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.515625, -13.102783203125, -12.68994140625, -12.277099609375, -11.8642578125, -11.451416015625, -11.03857421875, -10.625732421875, -10.212890625, -9.800048828125, -9.38720703125, -8.974365234375, -8.5615234375, -8.148681640625, -7.73583984375, -7.322998046875, -6.91015625, -6.497314453125, -6.08447265625, -5.671630859375, -5.2587890625, -4.845947265625, -4.43310546875, -4.020263671875, -3.607421875, -3.194580078125, -2.78173828125, -2.368896484375, -1.9560546875, -1.543212890625, -1.13037109375, -0.717529296875, -0.3046875, 0.108154296875, 0.52099609375, 0.933837890625, 1.3466796875, 1.759521484375, 2.17236328125, 2.585205078125, 2.998046875, 3.410888671875, 3.82373046875, 4.236572265625, 4.6494140625, 5.062255859375, 5.47509765625, 5.887939453125, 6.30078125, 6.713623046875, 7.12646484375, 7.539306640625, 7.9521484375, 8.364990234375, 8.77783203125, 9.190673828125, 9.603515625, 10.016357421875, 10.42919921875, 10.842041015625, 11.2548828125, 11.667724609375, 12.08056640625, 12.493408203125, 12.90625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 15.0, 21.0, 22.0, 46.0, 61.0, 88.0, 145.0, 245.0, 332.0, 429.0, 739.0, 1052.0, 1632.0, 2577.0, 3740.0, 5871.0, 9183.0, 14203.0, 22630.0, 36268.0, 58217.0, 89937.0, 128571.0, 157581.0, 155442.0, 124550.0, 85653.0, 55325.0, 34241.0, 21410.0, 13483.0, 8563.0, 5615.0, 3651.0, 2328.0, 1566.0, 1060.0, 685.0, 457.0, 285.0, 213.0, 137.0, 100.0, 58.0, 41.0, 29.0, 19.0, 13.0, 8.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-16.96875, -16.4375, -15.90625, -15.375, -14.84375, -14.3125, -13.78125, -13.25, -12.71875, -12.1875, -11.65625, -11.125, -10.59375, -10.0625, -9.53125, -9.0, -8.46875, -7.9375, -7.40625, -6.875, -6.34375, -5.8125, -5.28125, -4.75, -4.21875, -3.6875, -3.15625, -2.625, -2.09375, -1.5625, -1.03125, -0.5, 0.03125, 0.5625, 1.09375, 1.625, 2.15625, 2.6875, 3.21875, 3.75, 4.28125, 4.8125, 5.34375, 5.875, 6.40625, 6.9375, 7.46875, 8.0, 8.53125, 9.0625, 9.59375, 10.125, 10.65625, 11.1875, 11.71875, 12.25, 12.78125, 13.3125, 13.84375, 14.375, 14.90625, 15.4375, 15.96875, 16.5, 17.03125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 7.0, 6.0, 9.0, 6.0, 8.0, 3.0, 15.0, 13.0, 16.0, 23.0, 15.0, 20.0, 24.0, 30.0, 30.0, 37.0, 36.0, 35.0, 42.0, 50.0, 46.0, 38.0, 48.0, 41.0, 47.0, 40.0, 30.0, 31.0, 33.0, 21.0, 27.0, 20.0, 19.0, 21.0, 20.0, 17.0, 16.0, 12.0, 21.0, 11.0, 4.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.3828125, -9.09765625, -8.8125, -8.52734375, -8.2421875, -7.95703125, -7.671875, -7.38671875, -7.1015625, -6.81640625, -6.53125, -6.24609375, -5.9609375, -5.67578125, -5.390625, -5.10546875, -4.8203125, -4.53515625, -4.25, -3.96484375, -3.6796875, -3.39453125, -3.109375, -2.82421875, -2.5390625, -2.25390625, -1.96875, -1.68359375, -1.3984375, -1.11328125, -0.828125, -0.54296875, -0.2578125, 0.02734375, 0.3125, 0.59765625, 0.8828125, 1.16796875, 1.453125, 1.73828125, 2.0234375, 2.30859375, 2.59375, 2.87890625, 3.1640625, 3.44921875, 3.734375, 4.01953125, 4.3046875, 4.58984375, 4.875, 5.16015625, 5.4453125, 5.73046875, 6.015625, 6.30078125, 6.5859375, 6.87109375, 7.15625, 7.44140625, 7.7265625, 8.01171875, 8.296875, 8.58203125, 8.8671875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 8.0, 8.0, 8.0, 16.0, 23.0, 26.0, 53.0, 64.0, 99.0, 177.0, 260.0, 406.0, 698.0, 1202.0, 2002.0, 3524.0, 6393.0, 11930.0, 22261.0, 42402.0, 79559.0, 140030.0, 205904.0, 208633.0, 144903.0, 82710.0, 44087.0, 23375.0, 12342.0, 6531.0, 3703.0, 2083.0, 1222.0, 739.0, 440.0, 252.0, 165.0, 106.0, 64.0, 42.0, 39.0, 19.0, 16.0, 13.0, 10.0, 1.0, 8.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.849609375, -3.725555419921875, -3.60150146484375, -3.477447509765625, -3.3533935546875, -3.229339599609375, -3.10528564453125, -2.981231689453125, -2.857177734375, -2.733123779296875, -2.60906982421875, -2.485015869140625, -2.3609619140625, -2.236907958984375, -2.11285400390625, -1.988800048828125, -1.86474609375, -1.740692138671875, -1.61663818359375, -1.492584228515625, -1.3685302734375, -1.244476318359375, -1.12042236328125, -0.996368408203125, -0.872314453125, -0.748260498046875, -0.62420654296875, -0.500152587890625, -0.3760986328125, -0.252044677734375, -0.12799072265625, -0.003936767578125, 0.1201171875, 0.244171142578125, 0.36822509765625, 0.492279052734375, 0.6163330078125, 0.740386962890625, 0.86444091796875, 0.988494873046875, 1.112548828125, 1.236602783203125, 1.36065673828125, 1.484710693359375, 1.6087646484375, 1.732818603515625, 1.85687255859375, 1.980926513671875, 2.10498046875, 2.229034423828125, 2.35308837890625, 2.477142333984375, 2.6011962890625, 2.725250244140625, 2.84930419921875, 2.973358154296875, 3.097412109375, 3.221466064453125, 3.34552001953125, 3.469573974609375, 3.5936279296875, 3.717681884765625, 3.84173583984375, 3.965789794921875, 4.08984375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 12.0, 9.0, 13.0, 15.0, 11.0, 30.0, 27.0, 34.0, 47.0, 44.0, 57.0, 66.0, 84.0, 72.0, 61.0, 71.0, 63.0, 57.0, 43.0, 32.0, 34.0, 29.0, 17.0, 16.0, 12.0, 9.0, 8.0, 9.0, 3.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025272369384765625, -0.00024199485778808594, -0.00023126602172851562, -0.0002205371856689453, -0.000209808349609375, -0.0001990795135498047, -0.00018835067749023438, -0.00017762184143066406, -0.00016689300537109375, -0.00015616416931152344, -0.00014543533325195312, -0.0001347064971923828, -0.0001239776611328125, -0.00011324882507324219, -0.00010251998901367188, -9.179115295410156e-05, -8.106231689453125e-05, -7.033348083496094e-05, -5.9604644775390625e-05, -4.887580871582031e-05, -3.814697265625e-05, -2.7418136596679688e-05, -1.6689300537109375e-05, -5.9604644775390625e-06, 4.76837158203125e-06, 1.5497207641601562e-05, 2.6226043701171875e-05, 3.695487976074219e-05, 4.76837158203125e-05, 5.841255187988281e-05, 6.914138793945312e-05, 7.987022399902344e-05, 9.059906005859375e-05, 0.00010132789611816406, 0.00011205673217773438, 0.0001227855682373047, 0.000133514404296875, 0.0001442432403564453, 0.00015497207641601562, 0.00016570091247558594, 0.00017642974853515625, 0.00018715858459472656, 0.00019788742065429688, 0.0002086162567138672, 0.0002193450927734375, 0.0002300739288330078, 0.00024080276489257812, 0.00025153160095214844, 0.00026226043701171875, 0.00027298927307128906, 0.0002837181091308594, 0.0002944469451904297, 0.00030517578125, 0.0003159046173095703, 0.0003266334533691406, 0.00033736228942871094, 0.00034809112548828125, 0.00035881996154785156, 0.0003695487976074219, 0.0003802776336669922, 0.0003910064697265625, 0.0004017353057861328, 0.0004124641418457031, 0.00042319297790527344, 0.00043392181396484375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 8.0, 7.0, 9.0, 18.0, 18.0, 31.0, 58.0, 67.0, 96.0, 128.0, 209.0, 330.0, 476.0, 744.0, 1147.0, 1749.0, 2706.0, 4314.0, 6604.0, 10611.0, 17501.0, 28489.0, 45630.0, 73100.0, 109762.0, 148382.0, 164561.0, 143789.0, 104642.0, 68993.0, 43239.0, 26905.0, 16471.0, 10120.0, 6309.0, 3953.0, 2594.0, 1574.0, 1098.0, 744.0, 461.0, 290.0, 199.0, 145.0, 82.0, 71.0, 40.0, 29.0, 21.0, 17.0, 14.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.107421875, -3.011627197265625, -2.91583251953125, -2.820037841796875, -2.7242431640625, -2.628448486328125, -2.53265380859375, -2.436859130859375, -2.341064453125, -2.245269775390625, -2.14947509765625, -2.053680419921875, -1.9578857421875, -1.862091064453125, -1.76629638671875, -1.670501708984375, -1.57470703125, -1.478912353515625, -1.38311767578125, -1.287322998046875, -1.1915283203125, -1.095733642578125, -0.99993896484375, -0.904144287109375, -0.808349609375, -0.712554931640625, -0.61676025390625, -0.520965576171875, -0.4251708984375, -0.329376220703125, -0.23358154296875, -0.137786865234375, -0.0419921875, 0.053802490234375, 0.14959716796875, 0.245391845703125, 0.3411865234375, 0.436981201171875, 0.53277587890625, 0.628570556640625, 0.724365234375, 0.820159912109375, 0.91595458984375, 1.011749267578125, 1.1075439453125, 1.203338623046875, 1.29913330078125, 1.394927978515625, 1.49072265625, 1.586517333984375, 1.68231201171875, 1.778106689453125, 1.8739013671875, 1.969696044921875, 2.06549072265625, 2.161285400390625, 2.257080078125, 2.352874755859375, 2.44866943359375, 2.544464111328125, 2.6402587890625, 2.736053466796875, 2.83184814453125, 2.927642822265625, 3.0234375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 8.0, 10.0, 11.0, 7.0, 15.0, 11.0, 17.0, 26.0, 41.0, 36.0, 44.0, 40.0, 52.0, 64.0, 56.0, 59.0, 65.0, 45.0, 60.0, 60.0, 44.0, 34.0, 33.0, 34.0, 26.0, 25.0, 13.0, 14.0, 12.0, 5.0, 7.0, 3.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.41796875, -1.37530517578125, -1.3326416015625, -1.28997802734375, -1.247314453125, -1.20465087890625, -1.1619873046875, -1.11932373046875, -1.07666015625, -1.03399658203125, -0.9913330078125, -0.94866943359375, -0.906005859375, -0.86334228515625, -0.8206787109375, -0.77801513671875, -0.7353515625, -0.69268798828125, -0.6500244140625, -0.60736083984375, -0.564697265625, -0.52203369140625, -0.4793701171875, -0.43670654296875, -0.39404296875, -0.35137939453125, -0.3087158203125, -0.26605224609375, -0.223388671875, -0.18072509765625, -0.1380615234375, -0.09539794921875, -0.052734375, -0.01007080078125, 0.0325927734375, 0.07525634765625, 0.117919921875, 0.16058349609375, 0.2032470703125, 0.24591064453125, 0.28857421875, 0.33123779296875, 0.3739013671875, 0.41656494140625, 0.459228515625, 0.50189208984375, 0.5445556640625, 0.58721923828125, 0.6298828125, 0.67254638671875, 0.7152099609375, 0.75787353515625, 0.800537109375, 0.84320068359375, 0.8858642578125, 0.92852783203125, 0.97119140625, 1.01385498046875, 1.0565185546875, 1.09918212890625, 1.141845703125, 1.18450927734375, 1.2271728515625, 1.26983642578125, 1.3125]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 12.0, 7.0, 8.0, 9.0, 12.0, 23.0, 18.0, 32.0, 35.0, 45.0, 66.0, 71.0, 58.0, 66.0, 77.0, 67.0, 57.0, 67.0, 42.0, 43.0, 39.0, 28.0, 31.0, 33.0, 5.0, 14.0, 12.0, 13.0, 5.0, 1.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.248414993286133, -16.663570404052734, -16.07872772216797, -15.493884086608887, -14.909040451049805, -14.324196815490723, -13.73935317993164, -13.154508590698242, -12.569665908813477, -11.984822273254395, -11.399978637695312, -10.81513500213623, -10.230291366577148, -9.645447731018066, -9.060604095458984, -8.475759506225586, -7.890915870666504, -7.306072235107422, -6.72122859954834, -6.136384963989258, -5.551541328430176, -4.966697692871094, -4.3818535804748535, -3.7970099449157715, -3.2121663093566895, -2.6273226737976074, -2.0424790382385254, -1.4576351642608643, -0.8727915287017822, -0.2879478931427002, 0.29689598083496094, 0.881739616394043, 1.466583251953125, 2.051426887512207, 2.636270523071289, 3.22111439704895, 3.8059580326080322, 4.390801429748535, 4.975645542144775, 5.560489177703857, 6.1453328132629395, 6.7301764488220215, 7.3150200843811035, 7.899864196777344, 8.484707832336426, 9.069551467895508, 9.65439510345459, 10.239238739013672, 10.824082374572754, 11.408926010131836, 11.993769645690918, 12.57861328125, 13.163456916809082, 13.748300552368164, 14.333145141601562, 14.917987823486328, 15.502832412719727, 16.087677001953125, 16.67251968383789, 17.25736427307129, 17.842206954956055, 18.427051544189453, 19.01189422607422, 19.596738815307617, 20.181581497192383]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 5.0, 2.0, 7.0, 7.0, 5.0, 9.0, 6.0, 13.0, 14.0, 16.0, 26.0, 28.0, 22.0, 19.0, 24.0, 21.0, 26.0, 27.0, 23.0, 40.0, 39.0, 33.0, 41.0, 41.0, 35.0, 35.0, 23.0, 31.0, 40.0, 29.0, 36.0, 25.0, 41.0, 33.0, 22.0, 24.0, 15.0, 20.0, 13.0, 14.0, 9.0, 9.0, 16.0, 9.0, 9.0, 3.0, 8.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.502044677734375, -12.089995384216309, -11.677946090698242, -11.265897750854492, -10.853848457336426, -10.44179916381836, -10.029749870300293, -9.617700576782227, -9.205652236938477, -8.79360294342041, -8.381553649902344, -7.9695048332214355, -7.557456016540527, -7.145406723022461, -6.7333574295043945, -6.321308135986328, -5.909258842468262, -5.497209548950195, -5.085160732269287, -4.673111438751221, -4.2610626220703125, -3.849013328552246, -3.4369640350341797, -3.0249149799346924, -2.612865924835205, -2.2008168697357178, -1.788767695426941, -1.376718521118164, -0.9646694660186768, -0.5526204109191895, -0.14057111740112305, 0.27147793769836426, 0.6835269927978516, 1.0955760478973389, 1.5076252222061157, 1.9196743965148926, 2.33172345161438, 2.743772506713867, 3.1558218002319336, 3.567870855331421, 3.979919910430908, 4.391969203948975, 4.804018020629883, 5.216067314147949, 5.628116607666016, 6.040165424346924, 6.45221471786499, 6.864263534545898, 7.276312828063965, 7.688362121582031, 8.100411415100098, 8.512460708618164, 8.924509048461914, 9.33655834197998, 9.748607635498047, 10.160656929016113, 10.57270622253418, 10.984755516052246, 11.396804809570312, 11.808853149414062, 12.220902442932129, 12.632951736450195, 13.045001029968262, 13.457050323486328, 13.869098663330078]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 6.0, 7.0, 14.0, 12.0, 23.0, 49.0, 78.0, 133.0, 194.0, 355.0, 545.0, 847.0, 1262.0, 2042.0, 3100.0, 4711.0, 7278.0, 11296.0, 17505.0, 26564.0, 41331.0, 64899.0, 104335.0, 170000.0, 285220.0, 478909.0, 702261.0, 758994.0, 584745.0, 360680.0, 213525.0, 128841.0, 79983.0, 50678.0, 32653.0, 20998.0, 13899.0, 9156.0, 5951.0, 3922.0, 2593.0, 1620.0, 1073.0, 678.0, 474.0, 328.0, 208.0, 107.0, 75.0, 53.0, 30.0, 16.0, 14.0, 18.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-10.1171875, -9.782470703125, -9.44775390625, -9.113037109375, -8.7783203125, -8.443603515625, -8.10888671875, -7.774169921875, -7.439453125, -7.104736328125, -6.77001953125, -6.435302734375, -6.1005859375, -5.765869140625, -5.43115234375, -5.096435546875, -4.76171875, -4.427001953125, -4.09228515625, -3.757568359375, -3.4228515625, -3.088134765625, -2.75341796875, -2.418701171875, -2.083984375, -1.749267578125, -1.41455078125, -1.079833984375, -0.7451171875, -0.410400390625, -0.07568359375, 0.259033203125, 0.59375, 0.928466796875, 1.26318359375, 1.597900390625, 1.9326171875, 2.267333984375, 2.60205078125, 2.936767578125, 3.271484375, 3.606201171875, 3.94091796875, 4.275634765625, 4.6103515625, 4.945068359375, 5.27978515625, 5.614501953125, 5.94921875, 6.283935546875, 6.61865234375, 6.953369140625, 7.2880859375, 7.622802734375, 7.95751953125, 8.292236328125, 8.626953125, 8.961669921875, 9.29638671875, 9.631103515625, 9.9658203125, 10.300537109375, 10.63525390625, 10.969970703125, 11.3046875]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 3.0, 4.0, 6.0, 3.0, 4.0, 6.0, 5.0, 8.0, 8.0, 20.0, 15.0, 13.0, 18.0, 19.0, 20.0, 17.0, 27.0, 29.0, 16.0, 26.0, 23.0, 27.0, 25.0, 29.0, 40.0, 35.0, 31.0, 29.0, 34.0, 41.0, 27.0, 23.0, 39.0, 33.0, 26.0, 31.0, 32.0, 31.0, 25.0, 20.0, 24.0, 13.0, 7.0, 11.0, 12.0, 10.0, 15.0, 10.0, 7.0, 8.0, 4.0, 5.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-7.546875, -7.3016357421875, -7.056396484375, -6.8111572265625, -6.56591796875, -6.3206787109375, -6.075439453125, -5.8302001953125, -5.5849609375, -5.3397216796875, -5.094482421875, -4.8492431640625, -4.60400390625, -4.3587646484375, -4.113525390625, -3.8682861328125, -3.623046875, -3.3778076171875, -3.132568359375, -2.8873291015625, -2.64208984375, -2.3968505859375, -2.151611328125, -1.9063720703125, -1.6611328125, -1.4158935546875, -1.170654296875, -0.9254150390625, -0.68017578125, -0.4349365234375, -0.189697265625, 0.0555419921875, 0.30078125, 0.5460205078125, 0.791259765625, 1.0364990234375, 1.28173828125, 1.5269775390625, 1.772216796875, 2.0174560546875, 2.2626953125, 2.5079345703125, 2.753173828125, 2.9984130859375, 3.24365234375, 3.4888916015625, 3.734130859375, 3.9793701171875, 4.224609375, 4.4698486328125, 4.715087890625, 4.9603271484375, 5.20556640625, 5.4508056640625, 5.696044921875, 5.9412841796875, 6.1865234375, 6.4317626953125, 6.677001953125, 6.9222412109375, 7.16748046875, 7.4127197265625, 7.657958984375, 7.9031982421875, 8.1484375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 6.0, 5.0, 17.0, 6.0, 23.0, 48.0, 48.0, 89.0, 132.0, 238.0, 363.0, 612.0, 1014.0, 1716.0, 2763.0, 4890.0, 8376.0, 14611.0, 25190.0, 44625.0, 77363.0, 137133.0, 236908.0, 400790.0, 620959.0, 787320.0, 692177.0, 468689.0, 283532.0, 164837.0, 94173.0, 53559.0, 30292.0, 17490.0, 9983.0, 5879.0, 3465.0, 2053.0, 1158.0, 673.0, 431.0, 262.0, 155.0, 103.0, 51.0, 34.0, 20.0, 15.0, 10.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.765625, -11.4161376953125, -11.066650390625, -10.7171630859375, -10.36767578125, -10.0181884765625, -9.668701171875, -9.3192138671875, -8.9697265625, -8.6202392578125, -8.270751953125, -7.9212646484375, -7.57177734375, -7.2222900390625, -6.872802734375, -6.5233154296875, -6.173828125, -5.8243408203125, -5.474853515625, -5.1253662109375, -4.77587890625, -4.4263916015625, -4.076904296875, -3.7274169921875, -3.3779296875, -3.0284423828125, -2.678955078125, -2.3294677734375, -1.97998046875, -1.6304931640625, -1.281005859375, -0.9315185546875, -0.58203125, -0.2325439453125, 0.116943359375, 0.4664306640625, 0.81591796875, 1.1654052734375, 1.514892578125, 1.8643798828125, 2.2138671875, 2.5633544921875, 2.912841796875, 3.2623291015625, 3.61181640625, 3.9613037109375, 4.310791015625, 4.6602783203125, 5.009765625, 5.3592529296875, 5.708740234375, 6.0582275390625, 6.40771484375, 6.7572021484375, 7.106689453125, 7.4561767578125, 7.8056640625, 8.1551513671875, 8.504638671875, 8.8541259765625, 9.20361328125, 9.5531005859375, 9.902587890625, 10.2520751953125, 10.6015625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 7.0, 6.0, 13.0, 13.0, 17.0, 18.0, 15.0, 35.0, 37.0, 41.0, 57.0, 57.0, 78.0, 104.0, 108.0, 121.0, 172.0, 171.0, 190.0, 225.0, 258.0, 269.0, 276.0, 285.0, 248.0, 209.0, 195.0, 169.0, 142.0, 124.0, 103.0, 90.0, 52.0, 53.0, 29.0, 24.0, 17.0, 20.0, 10.0, 10.0, 1.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.734375, -4.5732421875, -4.412109375, -4.2509765625, -4.08984375, -3.9287109375, -3.767578125, -3.6064453125, -3.4453125, -3.2841796875, -3.123046875, -2.9619140625, -2.80078125, -2.6396484375, -2.478515625, -2.3173828125, -2.15625, -1.9951171875, -1.833984375, -1.6728515625, -1.51171875, -1.3505859375, -1.189453125, -1.0283203125, -0.8671875, -0.7060546875, -0.544921875, -0.3837890625, -0.22265625, -0.0615234375, 0.099609375, 0.2607421875, 0.421875, 0.5830078125, 0.744140625, 0.9052734375, 1.06640625, 1.2275390625, 1.388671875, 1.5498046875, 1.7109375, 1.8720703125, 2.033203125, 2.1943359375, 2.35546875, 2.5166015625, 2.677734375, 2.8388671875, 3.0, 3.1611328125, 3.322265625, 3.4833984375, 3.64453125, 3.8056640625, 3.966796875, 4.1279296875, 4.2890625, 4.4501953125, 4.611328125, 4.7724609375, 4.93359375, 5.0947265625, 5.255859375, 5.4169921875, 5.578125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 4.0, 5.0, 5.0, 11.0, 17.0, 16.0, 22.0, 17.0, 23.0, 45.0, 26.0, 45.0, 46.0, 40.0, 65.0, 64.0, 59.0, 66.0, 52.0, 47.0, 56.0, 44.0, 34.0, 33.0, 29.0, 26.0, 18.0, 18.0, 12.0, 11.0, 11.0, 4.0, 6.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.000777244567871, -9.630976676940918, -9.261176109313965, -8.891375541687012, -8.521574974060059, -8.151774406433105, -7.781973838806152, -7.412173271179199, -7.042372703552246, -6.672572135925293, -6.30277156829834, -5.932971000671387, -5.563170433044434, -5.1933698654174805, -4.823569297790527, -4.453768730163574, -4.083968162536621, -3.714167594909668, -3.344367027282715, -2.9745664596557617, -2.6047658920288086, -2.2349653244018555, -1.8651647567749023, -1.4953641891479492, -1.125563621520996, -0.755763053894043, -0.38596248626708984, -0.01616191864013672, 0.3536386489868164, 0.7234392166137695, 1.0932397842407227, 1.4630403518676758, 1.8328399658203125, 2.2026405334472656, 2.5724411010742188, 2.942241668701172, 3.312042236328125, 3.681842803955078, 4.051643371582031, 4.421443939208984, 4.7912445068359375, 5.161045074462891, 5.530845642089844, 5.900646209716797, 6.27044677734375, 6.640247344970703, 7.010047912597656, 7.379848480224609, 7.7496490478515625, 8.119449615478516, 8.489250183105469, 8.859050750732422, 9.228851318359375, 9.598651885986328, 9.968452453613281, 10.338253021240234, 10.708053588867188, 11.07785415649414, 11.447654724121094, 11.817455291748047, 12.187255859375, 12.557056427001953, 12.926856994628906, 13.29665756225586, 13.666458129882812]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [5.0, 2.0, 2.0, 1.0, 4.0, 7.0, 8.0, 8.0, 5.0, 7.0, 8.0, 11.0, 12.0, 20.0, 14.0, 25.0, 23.0, 21.0, 25.0, 24.0, 26.0, 30.0, 25.0, 25.0, 35.0, 32.0, 27.0, 48.0, 31.0, 28.0, 31.0, 38.0, 32.0, 39.0, 33.0, 22.0, 32.0, 34.0, 24.0, 21.0, 21.0, 21.0, 19.0, 21.0, 10.0, 12.0, 14.0, 9.0, 10.0, 10.0, 10.0, 6.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.159399032592773, -8.843890190124512, -8.52838134765625, -8.212872505187988, -7.897363662719727, -7.581854820251465, -7.266345977783203, -6.950837135314941, -6.63532829284668, -6.319819450378418, -6.004310607910156, -5.6888017654418945, -5.373292922973633, -5.057784080505371, -4.742275238037109, -4.426766395568848, -4.111257553100586, -3.795748710632324, -3.4802398681640625, -3.164731025695801, -2.849222183227539, -2.5337133407592773, -2.2182044982910156, -1.902695655822754, -1.5871868133544922, -1.2716779708862305, -0.9561691284179688, -0.640660285949707, -0.3251514434814453, -0.009642601013183594, 0.3058662414550781, 0.6213750839233398, 0.936884880065918, 1.2523937225341797, 1.5679025650024414, 1.8834114074707031, 2.198920249938965, 2.5144290924072266, 2.8299379348754883, 3.14544677734375, 3.4609556198120117, 3.7764644622802734, 4.091973304748535, 4.407482147216797, 4.722990989685059, 5.03849983215332, 5.354008674621582, 5.669517517089844, 5.9850263595581055, 6.300535202026367, 6.616044044494629, 6.931552886962891, 7.247061729431152, 7.562570571899414, 7.878079414367676, 8.193588256835938, 8.5090970993042, 8.824605941772461, 9.140114784240723, 9.455623626708984, 9.771132469177246, 10.086641311645508, 10.40215015411377, 10.717658996582031, 11.033167839050293]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 13.0, 7.0, 19.0, 18.0, 38.0, 49.0, 83.0, 122.0, 190.0, 324.0, 584.0, 970.0, 1674.0, 2996.0, 5217.0, 8892.0, 15891.0, 29157.0, 54332.0, 103590.0, 196558.0, 267115.0, 169303.0, 87812.0, 46387.0, 24774.0, 14069.0, 7798.0, 4360.0, 2576.0, 1478.0, 861.0, 502.0, 282.0, 180.0, 119.0, 68.0, 42.0, 30.0, 20.0, 19.0, 15.0, 12.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.26171875, -5.10406494140625, -4.9464111328125, -4.78875732421875, -4.631103515625, -4.47344970703125, -4.3157958984375, -4.15814208984375, -4.00048828125, -3.84283447265625, -3.6851806640625, -3.52752685546875, -3.369873046875, -3.21221923828125, -3.0545654296875, -2.89691162109375, -2.7392578125, -2.58160400390625, -2.4239501953125, -2.26629638671875, -2.108642578125, -1.95098876953125, -1.7933349609375, -1.63568115234375, -1.47802734375, -1.32037353515625, -1.1627197265625, -1.00506591796875, -0.847412109375, -0.68975830078125, -0.5321044921875, -0.37445068359375, -0.216796875, -0.05914306640625, 0.0985107421875, 0.25616455078125, 0.413818359375, 0.57147216796875, 0.7291259765625, 0.88677978515625, 1.04443359375, 1.20208740234375, 1.3597412109375, 1.51739501953125, 1.675048828125, 1.83270263671875, 1.9903564453125, 2.14801025390625, 2.3056640625, 2.46331787109375, 2.6209716796875, 2.77862548828125, 2.936279296875, 3.09393310546875, 3.2515869140625, 3.40924072265625, 3.56689453125, 3.72454833984375, 3.8822021484375, 4.03985595703125, 4.197509765625, 4.35516357421875, 4.5128173828125, 4.67047119140625, 4.828125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 5.0, 3.0, 12.0, 11.0, 11.0, 5.0, 10.0, 9.0, 13.0, 22.0, 30.0, 16.0, 23.0, 26.0, 27.0, 25.0, 24.0, 28.0, 32.0, 35.0, 37.0, 38.0, 50.0, 33.0, 30.0, 32.0, 42.0, 35.0, 32.0, 37.0, 23.0, 25.0, 22.0, 21.0, 29.0, 18.0, 27.0, 23.0, 11.0, 7.0, 11.0, 15.0, 11.0, 10.0, 8.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.6796875, -9.352294921875, -9.02490234375, -8.697509765625, -8.3701171875, -8.042724609375, -7.71533203125, -7.387939453125, -7.060546875, -6.733154296875, -6.40576171875, -6.078369140625, -5.7509765625, -5.423583984375, -5.09619140625, -4.768798828125, -4.44140625, -4.114013671875, -3.78662109375, -3.459228515625, -3.1318359375, -2.804443359375, -2.47705078125, -2.149658203125, -1.822265625, -1.494873046875, -1.16748046875, -0.840087890625, -0.5126953125, -0.185302734375, 0.14208984375, 0.469482421875, 0.796875, 1.124267578125, 1.45166015625, 1.779052734375, 2.1064453125, 2.433837890625, 2.76123046875, 3.088623046875, 3.416015625, 3.743408203125, 4.07080078125, 4.398193359375, 4.7255859375, 5.052978515625, 5.38037109375, 5.707763671875, 6.03515625, 6.362548828125, 6.68994140625, 7.017333984375, 7.3447265625, 7.672119140625, 7.99951171875, 8.326904296875, 8.654296875, 8.981689453125, 9.30908203125, 9.636474609375, 9.9638671875, 10.291259765625, 10.61865234375, 10.946044921875, 11.2734375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 5.0, 3.0, 4.0, 4.0, 2.0, 6.0, 7.0, 6.0, 10.0, 12.0, 21.0, 28.0, 39.0, 47.0, 48.0, 79.0, 90.0, 137.0, 183.0, 275.0, 407.0, 618.0, 1036.0, 1675.0, 3014.0, 6311.0, 14309.0, 43340.0, 911571.0, 38748.0, 13575.0, 5669.0, 2804.0, 1533.0, 920.0, 581.0, 392.0, 307.0, 174.0, 145.0, 82.0, 75.0, 70.0, 40.0, 46.0, 27.0, 22.0, 18.0, 12.0, 7.0, 4.0, 2.0, 3.0, 6.0, 5.0, 5.0, 1.0, 6.0, 2.0, 0.0, 1.0], "bins": [-12.671875, -12.26904296875, -11.8662109375, -11.46337890625, -11.060546875, -10.65771484375, -10.2548828125, -9.85205078125, -9.44921875, -9.04638671875, -8.6435546875, -8.24072265625, -7.837890625, -7.43505859375, -7.0322265625, -6.62939453125, -6.2265625, -5.82373046875, -5.4208984375, -5.01806640625, -4.615234375, -4.21240234375, -3.8095703125, -3.40673828125, -3.00390625, -2.60107421875, -2.1982421875, -1.79541015625, -1.392578125, -0.98974609375, -0.5869140625, -0.18408203125, 0.21875, 0.62158203125, 1.0244140625, 1.42724609375, 1.830078125, 2.23291015625, 2.6357421875, 3.03857421875, 3.44140625, 3.84423828125, 4.2470703125, 4.64990234375, 5.052734375, 5.45556640625, 5.8583984375, 6.26123046875, 6.6640625, 7.06689453125, 7.4697265625, 7.87255859375, 8.275390625, 8.67822265625, 9.0810546875, 9.48388671875, 9.88671875, 10.28955078125, 10.6923828125, 11.09521484375, 11.498046875, 11.90087890625, 12.3037109375, 12.70654296875, 13.109375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 7.0, 2.0, 4.0, 7.0, 10.0, 13.0, 14.0, 20.0, 17.0, 25.0, 31.0, 23.0, 29.0, 31.0, 43.0, 35.0, 46.0, 54.0, 50.0, 50.0, 40.0, 52.0, 43.0, 40.0, 47.0, 35.0, 41.0, 40.0, 33.0, 24.0, 16.0, 16.0, 12.0, 19.0, 7.0, 4.0, 13.0, 3.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8515625, -10.5333251953125, -10.215087890625, -9.8968505859375, -9.57861328125, -9.2603759765625, -8.942138671875, -8.6239013671875, -8.3056640625, -7.9874267578125, -7.669189453125, -7.3509521484375, -7.03271484375, -6.7144775390625, -6.396240234375, -6.0780029296875, -5.759765625, -5.4415283203125, -5.123291015625, -4.8050537109375, -4.48681640625, -4.1685791015625, -3.850341796875, -3.5321044921875, -3.2138671875, -2.8956298828125, -2.577392578125, -2.2591552734375, -1.94091796875, -1.6226806640625, -1.304443359375, -0.9862060546875, -0.66796875, -0.3497314453125, -0.031494140625, 0.2867431640625, 0.60498046875, 0.9232177734375, 1.241455078125, 1.5596923828125, 1.8779296875, 2.1961669921875, 2.514404296875, 2.8326416015625, 3.15087890625, 3.4691162109375, 3.787353515625, 4.1055908203125, 4.423828125, 4.7420654296875, 5.060302734375, 5.3785400390625, 5.69677734375, 6.0150146484375, 6.333251953125, 6.6514892578125, 6.9697265625, 7.2879638671875, 7.606201171875, 7.9244384765625, 8.24267578125, 8.5609130859375, 8.879150390625, 9.1973876953125, 9.515625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 8.0, 16.0, 14.0, 20.0, 20.0, 40.0, 36.0, 70.0, 88.0, 158.0, 218.0, 280.0, 428.0, 710.0, 1151.0, 1948.0, 3742.0, 8205.0, 22733.0, 920068.0, 60827.0, 14539.0, 5902.0, 2926.0, 1639.0, 940.0, 550.0, 389.0, 278.0, 158.0, 110.0, 97.0, 71.0, 45.0, 33.0, 19.0, 19.0, 16.0, 7.0, 10.0, 5.0, 5.0, 5.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41796875, -2.33685302734375, -2.2557373046875, -2.17462158203125, -2.093505859375, -2.01239013671875, -1.9312744140625, -1.85015869140625, -1.76904296875, -1.68792724609375, -1.6068115234375, -1.52569580078125, -1.444580078125, -1.36346435546875, -1.2823486328125, -1.20123291015625, -1.1201171875, -1.03900146484375, -0.9578857421875, -0.87677001953125, -0.795654296875, -0.71453857421875, -0.6334228515625, -0.55230712890625, -0.47119140625, -0.39007568359375, -0.3089599609375, -0.22784423828125, -0.146728515625, -0.06561279296875, 0.0155029296875, 0.09661865234375, 0.177734375, 0.25885009765625, 0.3399658203125, 0.42108154296875, 0.502197265625, 0.58331298828125, 0.6644287109375, 0.74554443359375, 0.82666015625, 0.90777587890625, 0.9888916015625, 1.07000732421875, 1.151123046875, 1.23223876953125, 1.3133544921875, 1.39447021484375, 1.4755859375, 1.55670166015625, 1.6378173828125, 1.71893310546875, 1.800048828125, 1.88116455078125, 1.9622802734375, 2.04339599609375, 2.12451171875, 2.20562744140625, 2.2867431640625, 2.36785888671875, 2.448974609375, 2.53009033203125, 2.6112060546875, 2.69232177734375, 2.7734375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 6.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 1.0, 4.0, 12.0, 10.0, 13.0, 39.0, 67.0, 110.0, 157.0, 141.0, 139.0, 103.0, 55.0, 54.0, 15.0, 14.0, 8.0, 7.0, 4.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001093149185180664, -0.00010595563799142838, -0.00010259635746479034, -9.923707693815231e-05, -9.587779641151428e-05, -9.251851588487625e-05, -8.915923535823822e-05, -8.579995483160019e-05, -8.244067430496216e-05, -7.908139377832413e-05, -7.57221132516861e-05, -7.236283272504807e-05, -6.900355219841003e-05, -6.5644271671772e-05, -6.228499114513397e-05, -5.892571061849594e-05, -5.556643009185791e-05, -5.220714956521988e-05, -4.884786903858185e-05, -4.548858851194382e-05, -4.2129307985305786e-05, -3.8770027458667755e-05, -3.5410746932029724e-05, -3.205146640539169e-05, -2.8692185878753662e-05, -2.533290535211563e-05, -2.19736248254776e-05, -1.861434429883957e-05, -1.5255063772201538e-05, -1.1895783245563507e-05, -8.536502718925476e-06, -5.177222192287445e-06, -1.817941665649414e-06, 1.541338860988617e-06, 4.900619387626648e-06, 8.259899914264679e-06, 1.161918044090271e-05, 1.4978460967540741e-05, 1.8337741494178772e-05, 2.1697022020816803e-05, 2.5056302547454834e-05, 2.8415583074092865e-05, 3.1774863600730896e-05, 3.513414412736893e-05, 3.849342465400696e-05, 4.185270518064499e-05, 4.521198570728302e-05, 4.857126623392105e-05, 5.193054676055908e-05, 5.528982728719711e-05, 5.8649107813835144e-05, 6.200838834047318e-05, 6.53676688671112e-05, 6.872694939374924e-05, 7.208622992038727e-05, 7.54455104470253e-05, 7.880479097366333e-05, 8.216407150030136e-05, 8.552335202693939e-05, 8.888263255357742e-05, 9.224191308021545e-05, 9.560119360685349e-05, 9.896047413349152e-05, 0.00010231975466012955, 0.00010567903518676758]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 11.0, 6.0, 12.0, 17.0, 22.0, 19.0, 44.0, 55.0, 84.0, 167.0, 193.0, 306.0, 452.0, 680.0, 1025.0, 1597.0, 2524.0, 3966.0, 6596.0, 11104.0, 20280.0, 39802.0, 86085.0, 220162.0, 368685.0, 150283.0, 63589.0, 30729.0, 16216.0, 9047.0, 5472.0, 3267.0, 2085.0, 1317.0, 858.0, 563.0, 371.0, 250.0, 210.0, 121.0, 91.0, 50.0, 50.0, 22.0, 24.0, 17.0, 10.0, 8.0, 4.0, 3.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0, -0.9680633544921875, -0.936126708984375, -0.9041900634765625, -0.87225341796875, -0.8403167724609375, -0.808380126953125, -0.7764434814453125, -0.7445068359375, -0.7125701904296875, -0.680633544921875, -0.6486968994140625, -0.61676025390625, -0.5848236083984375, -0.552886962890625, -0.5209503173828125, -0.489013671875, -0.4570770263671875, -0.425140380859375, -0.3932037353515625, -0.36126708984375, -0.3293304443359375, -0.297393798828125, -0.2654571533203125, -0.2335205078125, -0.2015838623046875, -0.169647216796875, -0.1377105712890625, -0.10577392578125, -0.0738372802734375, -0.041900634765625, -0.0099639892578125, 0.02197265625, 0.0539093017578125, 0.085845947265625, 0.1177825927734375, 0.14971923828125, 0.1816558837890625, 0.213592529296875, 0.2455291748046875, 0.2774658203125, 0.3094024658203125, 0.341339111328125, 0.3732757568359375, 0.40521240234375, 0.4371490478515625, 0.469085693359375, 0.5010223388671875, 0.532958984375, 0.5648956298828125, 0.596832275390625, 0.6287689208984375, 0.66070556640625, 0.6926422119140625, 0.724578857421875, 0.7565155029296875, 0.7884521484375, 0.8203887939453125, 0.852325439453125, 0.8842620849609375, 0.91619873046875, 0.9481353759765625, 0.980072021484375, 1.0120086669921875, 1.0439453125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 4.0, 7.0, 4.0, 4.0, 8.0, 11.0, 8.0, 12.0, 17.0, 23.0, 19.0, 25.0, 34.0, 37.0, 36.0, 37.0, 45.0, 74.0, 70.0, 63.0, 60.0, 55.0, 56.0, 52.0, 44.0, 35.0, 27.0, 27.0, 21.0, 21.0, 19.0, 12.0, 7.0, 6.0, 8.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.3095703125, -0.29970550537109375, -0.2898406982421875, -0.27997589111328125, -0.270111083984375, -0.26024627685546875, -0.2503814697265625, -0.24051666259765625, -0.23065185546875, -0.22078704833984375, -0.2109222412109375, -0.20105743408203125, -0.191192626953125, -0.18132781982421875, -0.1714630126953125, -0.16159820556640625, -0.1517333984375, -0.14186859130859375, -0.1320037841796875, -0.12213897705078125, -0.112274169921875, -0.10240936279296875, -0.0925445556640625, -0.08267974853515625, -0.07281494140625, -0.06295013427734375, -0.0530853271484375, -0.04322052001953125, -0.033355712890625, -0.02349090576171875, -0.0136260986328125, -0.00376129150390625, 0.006103515625, 0.01596832275390625, 0.0258331298828125, 0.03569793701171875, 0.045562744140625, 0.05542755126953125, 0.0652923583984375, 0.07515716552734375, 0.08502197265625, 0.09488677978515625, 0.1047515869140625, 0.11461639404296875, 0.124481201171875, 0.13434600830078125, 0.1442108154296875, 0.15407562255859375, 0.1639404296875, 0.17380523681640625, 0.1836700439453125, 0.19353485107421875, 0.203399658203125, 0.21326446533203125, 0.2231292724609375, 0.23299407958984375, 0.24285888671875, 0.25272369384765625, 0.2625885009765625, 0.27245330810546875, 0.282318115234375, 0.29218292236328125, 0.3020477294921875, 0.31191253662109375, 0.32177734375]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 2.0, 2.0, 5.0, 9.0, 17.0, 17.0, 21.0, 19.0, 21.0, 29.0, 42.0, 37.0, 38.0, 43.0, 62.0, 70.0, 63.0, 48.0, 68.0, 42.0, 52.0, 50.0, 43.0, 33.0, 34.0, 19.0, 19.0, 18.0, 16.0, 11.0, 15.0, 5.0, 6.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.699773788452148, -9.341609954833984, -8.98344612121582, -8.625282287597656, -8.267118453979492, -7.908954620361328, -7.550790309906006, -7.192626476287842, -6.834462642669678, -6.476298809051514, -6.11813497543335, -5.759970664978027, -5.401806831359863, -5.043642997741699, -4.685479164123535, -4.327315330505371, -3.969151496887207, -3.610987663269043, -3.252823829650879, -2.8946597576141357, -2.5364959239959717, -2.1783320903778076, -1.8201680183410645, -1.4620041847229004, -1.1038403511047363, -0.7456764578819275, -0.38751256465911865, -0.02934861183166504, 0.328815221786499, 0.6869790554046631, 1.0451431274414062, 1.4033069610595703, 1.7614707946777344, 2.1196346282958984, 2.4777984619140625, 2.8359625339508057, 3.1941263675689697, 3.552290201187134, 3.910454273223877, 4.268618106842041, 4.626781940460205, 4.984945774078369, 5.343109607696533, 5.7012739181518555, 6.0594377517700195, 6.417601585388184, 6.775765419006348, 7.133929252624512, 7.492093086242676, 7.85025691986084, 8.208420753479004, 8.566584587097168, 8.924748420715332, 9.282912254333496, 9.641077041625977, 9.99924087524414, 10.357404708862305, 10.715568542480469, 11.073732376098633, 11.431896209716797, 11.790060043334961, 12.148223876953125, 12.506387710571289, 12.864551544189453, 13.222715377807617]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [5.0, 2.0, 1.0, 1.0, 4.0, 8.0, 9.0, 8.0, 3.0, 7.0, 6.0, 9.0, 16.0, 13.0, 21.0, 18.0, 23.0, 27.0, 22.0, 23.0, 25.0, 28.0, 31.0, 26.0, 30.0, 31.0, 30.0, 45.0, 31.0, 29.0, 31.0, 33.0, 36.0, 40.0, 33.0, 27.0, 24.0, 34.0, 26.0, 22.0, 21.0, 28.0, 11.0, 24.0, 17.0, 5.0, 17.0, 12.0, 4.0, 13.0, 11.0, 7.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.980996131896973, -8.674165725708008, -8.36733627319336, -8.060505867004395, -7.75367546081543, -7.446845531463623, -7.140015602111816, -6.833185195922852, -6.526355266571045, -6.219525337219238, -5.912694931030273, -5.605865001678467, -5.29903507232666, -4.992204666137695, -4.685374736785889, -4.378544807434082, -4.071714401245117, -3.7648842334747314, -3.4580540657043457, -3.151224136352539, -2.8443939685821533, -2.5375638008117676, -2.230733871459961, -1.9239037036895752, -1.6170735359191895, -1.3102433681488037, -1.0034133195877075, -0.6965832114219666, -0.3897531032562256, -0.08292293548583984, 0.22390711307525635, 0.5307371616363525, 0.8375673294067383, 1.144397497177124, 1.4512275457382202, 1.7580575942993164, 2.064887762069702, 2.371717929840088, 2.6785478591918945, 2.9853780269622803, 3.292208194732666, 3.5990383625030518, 3.9058685302734375, 4.212698459625244, 4.519528388977051, 4.826358795166016, 5.133188724517822, 5.440018653869629, 5.746849060058594, 6.0536789894104, 6.360509395599365, 6.667339324951172, 6.974169731140137, 7.280999660491943, 7.58782958984375, 7.894659996032715, 8.20149040222168, 8.508320808410645, 8.815150260925293, 9.121980667114258, 9.428811073303223, 9.735641479492188, 10.042470932006836, 10.3493013381958, 10.65613079071045]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 6.0, 3.0, 5.0, 10.0, 15.0, 25.0, 41.0, 40.0, 88.0, 128.0, 221.0, 288.0, 464.0, 713.0, 1022.0, 1644.0, 2607.0, 4043.0, 6090.0, 9573.0, 14407.0, 22765.0, 34870.0, 52630.0, 76172.0, 104584.0, 128880.0, 138598.0, 126967.0, 101270.0, 74205.0, 50813.0, 33616.0, 22057.0, 14120.0, 9008.0, 5847.0, 3819.0, 2386.0, 1601.0, 1016.0, 676.0, 436.0, 260.0, 162.0, 133.0, 75.0, 64.0, 35.0, 28.0, 13.0, 6.0, 7.0, 9.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.390625, -9.082275390625, -8.77392578125, -8.465576171875, -8.1572265625, -7.848876953125, -7.54052734375, -7.232177734375, -6.923828125, -6.615478515625, -6.30712890625, -5.998779296875, -5.6904296875, -5.382080078125, -5.07373046875, -4.765380859375, -4.45703125, -4.148681640625, -3.84033203125, -3.531982421875, -3.2236328125, -2.915283203125, -2.60693359375, -2.298583984375, -1.990234375, -1.681884765625, -1.37353515625, -1.065185546875, -0.7568359375, -0.448486328125, -0.14013671875, 0.168212890625, 0.4765625, 0.784912109375, 1.09326171875, 1.401611328125, 1.7099609375, 2.018310546875, 2.32666015625, 2.635009765625, 2.943359375, 3.251708984375, 3.56005859375, 3.868408203125, 4.1767578125, 4.485107421875, 4.79345703125, 5.101806640625, 5.41015625, 5.718505859375, 6.02685546875, 6.335205078125, 6.6435546875, 6.951904296875, 7.26025390625, 7.568603515625, 7.876953125, 8.185302734375, 8.49365234375, 8.802001953125, 9.1103515625, 9.418701171875, 9.72705078125, 10.035400390625, 10.34375]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 6.0, 3.0, 5.0, 5.0, 13.0, 10.0, 15.0, 19.0, 12.0, 11.0, 26.0, 27.0, 26.0, 22.0, 27.0, 29.0, 26.0, 35.0, 36.0, 34.0, 37.0, 27.0, 44.0, 50.0, 42.0, 43.0, 26.0, 29.0, 27.0, 31.0, 21.0, 38.0, 34.0, 20.0, 24.0, 24.0, 16.0, 12.0, 15.0, 17.0, 9.0, 7.0, 5.0, 3.0, 3.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.296875, -8.984130859375, -8.67138671875, -8.358642578125, -8.0458984375, -7.733154296875, -7.42041015625, -7.107666015625, -6.794921875, -6.482177734375, -6.16943359375, -5.856689453125, -5.5439453125, -5.231201171875, -4.91845703125, -4.605712890625, -4.29296875, -3.980224609375, -3.66748046875, -3.354736328125, -3.0419921875, -2.729248046875, -2.41650390625, -2.103759765625, -1.791015625, -1.478271484375, -1.16552734375, -0.852783203125, -0.5400390625, -0.227294921875, 0.08544921875, 0.398193359375, 0.7109375, 1.023681640625, 1.33642578125, 1.649169921875, 1.9619140625, 2.274658203125, 2.58740234375, 2.900146484375, 3.212890625, 3.525634765625, 3.83837890625, 4.151123046875, 4.4638671875, 4.776611328125, 5.08935546875, 5.402099609375, 5.71484375, 6.027587890625, 6.34033203125, 6.653076171875, 6.9658203125, 7.278564453125, 7.59130859375, 7.904052734375, 8.216796875, 8.529541015625, 8.84228515625, 9.155029296875, 9.4677734375, 9.780517578125, 10.09326171875, 10.406005859375, 10.71875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 3.0, 4.0, 11.0, 16.0, 12.0, 25.0, 29.0, 58.0, 72.0, 105.0, 166.0, 220.0, 319.0, 433.0, 698.0, 1025.0, 1489.0, 2040.0, 3225.0, 4797.0, 7121.0, 10883.0, 16519.0, 25226.0, 38052.0, 56567.0, 81792.0, 109944.0, 133072.0, 138298.0, 121275.0, 93905.0, 66874.0, 45291.0, 30061.0, 19662.0, 13139.0, 8629.0, 5598.0, 3855.0, 2539.0, 1788.0, 1185.0, 773.0, 532.0, 373.0, 240.0, 187.0, 122.0, 103.0, 69.0, 52.0, 39.0, 18.0, 11.0, 10.0, 7.0, 4.0, 2.0, 3.0, 2.0], "bins": [-9.8515625, -9.5457763671875, -9.239990234375, -8.9342041015625, -8.62841796875, -8.3226318359375, -8.016845703125, -7.7110595703125, -7.4052734375, -7.0994873046875, -6.793701171875, -6.4879150390625, -6.18212890625, -5.8763427734375, -5.570556640625, -5.2647705078125, -4.958984375, -4.6531982421875, -4.347412109375, -4.0416259765625, -3.73583984375, -3.4300537109375, -3.124267578125, -2.8184814453125, -2.5126953125, -2.2069091796875, -1.901123046875, -1.5953369140625, -1.28955078125, -0.9837646484375, -0.677978515625, -0.3721923828125, -0.06640625, 0.2393798828125, 0.545166015625, 0.8509521484375, 1.15673828125, 1.4625244140625, 1.768310546875, 2.0740966796875, 2.3798828125, 2.6856689453125, 2.991455078125, 3.2972412109375, 3.60302734375, 3.9088134765625, 4.214599609375, 4.5203857421875, 4.826171875, 5.1319580078125, 5.437744140625, 5.7435302734375, 6.04931640625, 6.3551025390625, 6.660888671875, 6.9666748046875, 7.2724609375, 7.5782470703125, 7.884033203125, 8.1898193359375, 8.49560546875, 8.8013916015625, 9.107177734375, 9.4129638671875, 9.71875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 5.0, 3.0, 3.0, 13.0, 5.0, 11.0, 21.0, 21.0, 21.0, 21.0, 22.0, 16.0, 32.0, 27.0, 23.0, 42.0, 37.0, 31.0, 41.0, 42.0, 48.0, 37.0, 45.0, 30.0, 42.0, 44.0, 36.0, 27.0, 27.0, 20.0, 33.0, 32.0, 19.0, 26.0, 10.0, 10.0, 12.0, 15.0, 9.0, 8.0, 6.0, 4.0, 3.0, 4.0, 7.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.859375, -6.6492919921875, -6.439208984375, -6.2291259765625, -6.01904296875, -5.8089599609375, -5.598876953125, -5.3887939453125, -5.1787109375, -4.9686279296875, -4.758544921875, -4.5484619140625, -4.33837890625, -4.1282958984375, -3.918212890625, -3.7081298828125, -3.498046875, -3.2879638671875, -3.077880859375, -2.8677978515625, -2.65771484375, -2.4476318359375, -2.237548828125, -2.0274658203125, -1.8173828125, -1.6072998046875, -1.397216796875, -1.1871337890625, -0.97705078125, -0.7669677734375, -0.556884765625, -0.3468017578125, -0.13671875, 0.0733642578125, 0.283447265625, 0.4935302734375, 0.70361328125, 0.9136962890625, 1.123779296875, 1.3338623046875, 1.5439453125, 1.7540283203125, 1.964111328125, 2.1741943359375, 2.38427734375, 2.5943603515625, 2.804443359375, 3.0145263671875, 3.224609375, 3.4346923828125, 3.644775390625, 3.8548583984375, 4.06494140625, 4.2750244140625, 4.485107421875, 4.6951904296875, 4.9052734375, 5.1153564453125, 5.325439453125, 5.5355224609375, 5.74560546875, 5.9556884765625, 6.165771484375, 6.3758544921875, 6.5859375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 2.0, 5.0, 13.0, 15.0, 24.0, 33.0, 43.0, 57.0, 74.0, 93.0, 160.0, 203.0, 298.0, 496.0, 582.0, 1000.0, 1382.0, 2108.0, 3331.0, 5314.0, 8750.0, 14607.0, 24757.0, 42666.0, 71718.0, 116156.0, 164755.0, 183964.0, 151665.0, 101705.0, 61536.0, 36357.0, 21458.0, 12420.0, 7516.0, 4690.0, 2824.0, 1918.0, 1199.0, 806.0, 553.0, 416.0, 264.0, 192.0, 114.0, 86.0, 58.0, 50.0, 39.0, 26.0, 16.0, 16.0, 13.0, 6.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-2.822265625, -2.729278564453125, -2.63629150390625, -2.543304443359375, -2.4503173828125, -2.357330322265625, -2.26434326171875, -2.171356201171875, -2.078369140625, -1.985382080078125, -1.89239501953125, -1.799407958984375, -1.7064208984375, -1.613433837890625, -1.52044677734375, -1.427459716796875, -1.33447265625, -1.241485595703125, -1.14849853515625, -1.055511474609375, -0.9625244140625, -0.869537353515625, -0.77655029296875, -0.683563232421875, -0.590576171875, -0.497589111328125, -0.40460205078125, -0.311614990234375, -0.2186279296875, -0.125640869140625, -0.03265380859375, 0.060333251953125, 0.1533203125, 0.246307373046875, 0.33929443359375, 0.432281494140625, 0.5252685546875, 0.618255615234375, 0.71124267578125, 0.804229736328125, 0.897216796875, 0.990203857421875, 1.08319091796875, 1.176177978515625, 1.2691650390625, 1.362152099609375, 1.45513916015625, 1.548126220703125, 1.64111328125, 1.734100341796875, 1.82708740234375, 1.920074462890625, 2.0130615234375, 2.106048583984375, 2.19903564453125, 2.292022705078125, 2.385009765625, 2.477996826171875, 2.57098388671875, 2.663970947265625, 2.7569580078125, 2.849945068359375, 2.94293212890625, 3.035919189453125, 3.12890625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 6.0, 1.0, 3.0, 6.0, 4.0, 9.0, 14.0, 9.0, 11.0, 18.0, 14.0, 13.0, 27.0, 28.0, 28.0, 46.0, 39.0, 27.0, 40.0, 48.0, 49.0, 54.0, 50.0, 55.0, 53.0, 46.0, 35.0, 51.0, 40.0, 36.0, 16.0, 22.0, 18.0, 21.0, 13.0, 10.0, 13.0, 8.0, 5.0, 9.0, 8.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00019049644470214844, -0.0001839473843574524, -0.00017739832401275635, -0.0001708492636680603, -0.00016430020332336426, -0.0001577511429786682, -0.00015120208263397217, -0.00014465302228927612, -0.00013810396194458008, -0.00013155490159988403, -0.000125005841255188, -0.00011845678091049194, -0.0001119077205657959, -0.00010535866022109985, -9.880959987640381e-05, -9.226053953170776e-05, -8.571147918701172e-05, -7.916241884231567e-05, -7.261335849761963e-05, -6.606429815292358e-05, -5.951523780822754e-05, -5.2966177463531494e-05, -4.641711711883545e-05, -3.9868056774139404e-05, -3.331899642944336e-05, -2.6769936084747314e-05, -2.022087574005127e-05, -1.3671815395355225e-05, -7.12275505065918e-06, -5.736947059631348e-07, 5.97536563873291e-06, 1.2524425983428955e-05, 1.9073486328125e-05, 2.5622546672821045e-05, 3.217160701751709e-05, 3.8720667362213135e-05, 4.526972770690918e-05, 5.1818788051605225e-05, 5.836784839630127e-05, 6.491690874099731e-05, 7.146596908569336e-05, 7.80150294303894e-05, 8.456408977508545e-05, 9.11131501197815e-05, 9.766221046447754e-05, 0.00010421127080917358, 0.00011076033115386963, 0.00011730939149856567, 0.00012385845184326172, 0.00013040751218795776, 0.0001369565725326538, 0.00014350563287734985, 0.0001500546932220459, 0.00015660375356674194, 0.000163152813911438, 0.00016970187425613403, 0.00017625093460083008, 0.00018279999494552612, 0.00018934905529022217, 0.0001958981156349182, 0.00020244717597961426, 0.0002089962363243103, 0.00021554529666900635, 0.0002220943570137024, 0.00022864341735839844]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 4.0, 4.0, 10.0, 14.0, 26.0, 22.0, 41.0, 66.0, 101.0, 151.0, 282.0, 429.0, 652.0, 1101.0, 1753.0, 2958.0, 4999.0, 8507.0, 15223.0, 27180.0, 47617.0, 84074.0, 139051.0, 193636.0, 193053.0, 136382.0, 82674.0, 46786.0, 26332.0, 14762.0, 8385.0, 4840.0, 2875.0, 1711.0, 1060.0, 631.0, 438.0, 248.0, 170.0, 113.0, 72.0, 37.0, 32.0, 21.0, 9.0, 12.0, 1.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.501953125, -3.398895263671875, -3.29583740234375, -3.192779541015625, -3.0897216796875, -2.986663818359375, -2.88360595703125, -2.780548095703125, -2.677490234375, -2.574432373046875, -2.47137451171875, -2.368316650390625, -2.2652587890625, -2.162200927734375, -2.05914306640625, -1.956085205078125, -1.85302734375, -1.749969482421875, -1.64691162109375, -1.543853759765625, -1.4407958984375, -1.337738037109375, -1.23468017578125, -1.131622314453125, -1.028564453125, -0.925506591796875, -0.82244873046875, -0.719390869140625, -0.6163330078125, -0.513275146484375, -0.41021728515625, -0.307159423828125, -0.2041015625, -0.101043701171875, 0.00201416015625, 0.105072021484375, 0.2081298828125, 0.311187744140625, 0.41424560546875, 0.517303466796875, 0.620361328125, 0.723419189453125, 0.82647705078125, 0.929534912109375, 1.0325927734375, 1.135650634765625, 1.23870849609375, 1.341766357421875, 1.44482421875, 1.547882080078125, 1.65093994140625, 1.753997802734375, 1.8570556640625, 1.960113525390625, 2.06317138671875, 2.166229248046875, 2.269287109375, 2.372344970703125, 2.47540283203125, 2.578460693359375, 2.6815185546875, 2.784576416015625, 2.88763427734375, 2.990692138671875, 3.09375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 4.0, 7.0, 8.0, 5.0, 10.0, 12.0, 16.0, 8.0, 14.0, 14.0, 20.0, 28.0, 35.0, 42.0, 38.0, 41.0, 51.0, 62.0, 64.0, 65.0, 63.0, 54.0, 54.0, 40.0, 42.0, 35.0, 24.0, 22.0, 13.0, 20.0, 20.0, 13.0, 11.0, 8.0, 8.0, 4.0, 6.0, 3.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2646484375, -1.2265472412109375, -1.188446044921875, -1.1503448486328125, -1.11224365234375, -1.0741424560546875, -1.036041259765625, -0.9979400634765625, -0.9598388671875, -0.9217376708984375, -0.883636474609375, -0.8455352783203125, -0.80743408203125, -0.7693328857421875, -0.731231689453125, -0.6931304931640625, -0.655029296875, -0.6169281005859375, -0.578826904296875, -0.5407257080078125, -0.50262451171875, -0.4645233154296875, -0.426422119140625, -0.3883209228515625, -0.3502197265625, -0.3121185302734375, -0.274017333984375, -0.2359161376953125, -0.19781494140625, -0.1597137451171875, -0.121612548828125, -0.0835113525390625, -0.04541015625, -0.0073089599609375, 0.030792236328125, 0.0688934326171875, 0.10699462890625, 0.1450958251953125, 0.183197021484375, 0.2212982177734375, 0.2593994140625, 0.2975006103515625, 0.335601806640625, 0.3737030029296875, 0.41180419921875, 0.4499053955078125, 0.488006591796875, 0.5261077880859375, 0.564208984375, 0.6023101806640625, 0.640411376953125, 0.6785125732421875, 0.71661376953125, 0.7547149658203125, 0.792816162109375, 0.8309173583984375, 0.8690185546875, 0.9071197509765625, 0.945220947265625, 0.9833221435546875, 1.02142333984375, 1.0595245361328125, 1.097625732421875, 1.1357269287109375, 1.173828125]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 2.0, 4.0, 7.0, 7.0, 8.0, 14.0, 17.0, 12.0, 23.0, 21.0, 20.0, 33.0, 38.0, 38.0, 49.0, 38.0, 55.0, 66.0, 55.0, 51.0, 48.0, 50.0, 45.0, 49.0, 49.0, 29.0, 24.0, 24.0, 25.0, 20.0, 10.0, 11.0, 14.0, 10.0, 7.0, 1.0, 9.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.100635528564453, -8.784401893615723, -8.468168258666992, -8.151933670043945, -7.835700035095215, -7.519466400146484, -7.203232288360596, -6.886998176574707, -6.570764541625977, -6.254530906677246, -5.938296794891357, -5.622062683105469, -5.305829048156738, -4.989595413208008, -4.673361301422119, -4.3571271896362305, -4.0408935546875, -3.7246596813201904, -3.408425807952881, -3.0921919345855713, -2.7759580612182617, -2.459724187850952, -2.1434903144836426, -1.827256441116333, -1.5110225677490234, -1.1947886943817139, -0.8785548210144043, -0.5623209476470947, -0.24608707427978516, 0.07014679908752441, 0.386380672454834, 0.7026145458221436, 1.0188493728637695, 1.335083246231079, 1.6513171195983887, 1.9675509929656982, 2.283784866333008, 2.6000187397003174, 2.916252613067627, 3.2324864864349365, 3.548720359802246, 3.8649542331695557, 4.181188106536865, 4.497422218322754, 4.813655853271484, 5.129889488220215, 5.4461236000061035, 5.762357711791992, 6.078591346740723, 6.394824981689453, 6.711059093475342, 7.0272932052612305, 7.343526840209961, 7.659760475158691, 7.97599458694458, 8.292228698730469, 8.6084623336792, 8.92469596862793, 9.240930557250977, 9.557164192199707, 9.873397827148438, 10.189631462097168, 10.505865097045898, 10.822099685668945, 11.138333320617676]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 5.0, 6.0, 10.0, 12.0, 9.0, 10.0, 13.0, 15.0, 15.0, 22.0, 17.0, 18.0, 41.0, 35.0, 33.0, 26.0, 36.0, 40.0, 36.0, 28.0, 54.0, 50.0, 32.0, 46.0, 37.0, 29.0, 32.0, 25.0, 36.0, 31.0, 34.0, 24.0, 24.0, 17.0, 21.0, 16.0, 11.0, 8.0, 12.0, 6.0, 11.0, 5.0, 4.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.335637092590332, -10.967034339904785, -10.598431587219238, -10.229829788208008, -9.861227035522461, -9.492624282836914, -9.124021530151367, -8.75541877746582, -8.386816024780273, -8.018213272094727, -7.649610996246338, -7.281008243560791, -6.912405490875244, -6.5438032150268555, -6.175200462341309, -5.806597709655762, -5.437995433807373, -5.069392681121826, -4.7007904052734375, -4.332187652587891, -3.9635848999023438, -3.594982385635376, -3.226379871368408, -2.8577771186828613, -2.4891746044158936, -2.120572090148926, -1.751969337463379, -1.3833668231964111, -1.0147641897201538, -0.6461615562438965, -0.2775590419769287, 0.09104371070861816, 0.45964622497558594, 0.8282488584518433, 1.1968514919281006, 1.5654540061950684, 1.9340566396713257, 2.302659273147583, 2.671261787414551, 3.0398645401000977, 3.4084670543670654, 3.777069568634033, 4.14567232131958, 4.514274597167969, 4.882877349853516, 5.2514801025390625, 5.620082855224609, 5.988685607910156, 6.357287883758545, 6.725890636444092, 7.0944929122924805, 7.463095664978027, 7.831698417663574, 8.200301170349121, 8.568902969360352, 8.937505722045898, 9.306108474731445, 9.674711227416992, 10.043313980102539, 10.411916732788086, 10.780518531799316, 11.149121284484863, 11.51772403717041, 11.886326789855957, 12.254929542541504]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 8.0, 13.0, 15.0, 36.0, 50.0, 75.0, 141.0, 224.0, 364.0, 575.0, 1023.0, 1648.0, 2588.0, 4397.0, 7268.0, 12189.0, 20341.0, 33711.0, 57234.0, 98207.0, 170767.0, 300558.0, 527666.0, 786609.0, 815083.0, 575380.0, 333290.0, 187786.0, 105997.0, 60920.0, 35796.0, 21217.0, 12769.0, 7915.0, 4801.0, 2918.0, 1772.0, 1080.0, 694.0, 428.0, 265.0, 172.0, 119.0, 68.0, 45.0, 29.0, 13.0, 10.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0], "bins": [-9.6640625, -9.3804931640625, -9.096923828125, -8.8133544921875, -8.52978515625, -8.2462158203125, -7.962646484375, -7.6790771484375, -7.3955078125, -7.1119384765625, -6.828369140625, -6.5447998046875, -6.26123046875, -5.9776611328125, -5.694091796875, -5.4105224609375, -5.126953125, -4.8433837890625, -4.559814453125, -4.2762451171875, -3.99267578125, -3.7091064453125, -3.425537109375, -3.1419677734375, -2.8583984375, -2.5748291015625, -2.291259765625, -2.0076904296875, -1.72412109375, -1.4405517578125, -1.156982421875, -0.8734130859375, -0.58984375, -0.3062744140625, -0.022705078125, 0.2608642578125, 0.54443359375, 0.8280029296875, 1.111572265625, 1.3951416015625, 1.6787109375, 1.9622802734375, 2.245849609375, 2.5294189453125, 2.81298828125, 3.0965576171875, 3.380126953125, 3.6636962890625, 3.947265625, 4.2308349609375, 4.514404296875, 4.7979736328125, 5.08154296875, 5.3651123046875, 5.648681640625, 5.9322509765625, 6.2158203125, 6.4993896484375, 6.782958984375, 7.0665283203125, 7.35009765625, 7.6336669921875, 7.917236328125, 8.2008056640625, 8.484375]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 10.0, 8.0, 5.0, 12.0, 10.0, 9.0, 18.0, 14.0, 22.0, 26.0, 30.0, 28.0, 33.0, 28.0, 30.0, 25.0, 41.0, 36.0, 44.0, 42.0, 41.0, 45.0, 43.0, 31.0, 36.0, 32.0, 34.0, 36.0, 34.0, 22.0, 26.0, 27.0, 20.0, 15.0, 15.0, 12.0, 15.0, 11.0, 8.0, 6.0, 8.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.08984375, -6.85791015625, -6.6259765625, -6.39404296875, -6.162109375, -5.93017578125, -5.6982421875, -5.46630859375, -5.234375, -5.00244140625, -4.7705078125, -4.53857421875, -4.306640625, -4.07470703125, -3.8427734375, -3.61083984375, -3.37890625, -3.14697265625, -2.9150390625, -2.68310546875, -2.451171875, -2.21923828125, -1.9873046875, -1.75537109375, -1.5234375, -1.29150390625, -1.0595703125, -0.82763671875, -0.595703125, -0.36376953125, -0.1318359375, 0.10009765625, 0.33203125, 0.56396484375, 0.7958984375, 1.02783203125, 1.259765625, 1.49169921875, 1.7236328125, 1.95556640625, 2.1875, 2.41943359375, 2.6513671875, 2.88330078125, 3.115234375, 3.34716796875, 3.5791015625, 3.81103515625, 4.04296875, 4.27490234375, 4.5068359375, 4.73876953125, 4.970703125, 5.20263671875, 5.4345703125, 5.66650390625, 5.8984375, 6.13037109375, 6.3623046875, 6.59423828125, 6.826171875, 7.05810546875, 7.2900390625, 7.52197265625, 7.75390625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 6.0, 3.0, 5.0, 18.0, 17.0, 29.0, 47.0, 64.0, 104.0, 167.0, 298.0, 477.0, 760.0, 1267.0, 2111.0, 3581.0, 6183.0, 10266.0, 17885.0, 31137.0, 53326.0, 91862.0, 157211.0, 260222.0, 408987.0, 584105.0, 693864.0, 634464.0, 472190.0, 307763.0, 189606.0, 111194.0, 65211.0, 37753.0, 21698.0, 12456.0, 7316.0, 4318.0, 2549.0, 1489.0, 911.0, 527.0, 306.0, 191.0, 133.0, 92.0, 44.0, 26.0, 26.0, 13.0, 4.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.11328125, -6.88140869140625, -6.6495361328125, -6.41766357421875, -6.185791015625, -5.95391845703125, -5.7220458984375, -5.49017333984375, -5.25830078125, -5.02642822265625, -4.7945556640625, -4.56268310546875, -4.330810546875, -4.09893798828125, -3.8670654296875, -3.63519287109375, -3.4033203125, -3.17144775390625, -2.9395751953125, -2.70770263671875, -2.475830078125, -2.24395751953125, -2.0120849609375, -1.78021240234375, -1.54833984375, -1.31646728515625, -1.0845947265625, -0.85272216796875, -0.620849609375, -0.38897705078125, -0.1571044921875, 0.07476806640625, 0.306640625, 0.53851318359375, 0.7703857421875, 1.00225830078125, 1.234130859375, 1.46600341796875, 1.6978759765625, 1.92974853515625, 2.16162109375, 2.39349365234375, 2.6253662109375, 2.85723876953125, 3.089111328125, 3.32098388671875, 3.5528564453125, 3.78472900390625, 4.0166015625, 4.24847412109375, 4.4803466796875, 4.71221923828125, 4.944091796875, 5.17596435546875, 5.4078369140625, 5.63970947265625, 5.87158203125, 6.10345458984375, 6.3353271484375, 6.56719970703125, 6.799072265625, 7.03094482421875, 7.2628173828125, 7.49468994140625, 7.7265625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 4.0, 2.0, 9.0, 7.0, 16.0, 9.0, 17.0, 17.0, 18.0, 25.0, 30.0, 49.0, 52.0, 70.0, 82.0, 100.0, 102.0, 134.0, 154.0, 166.0, 177.0, 185.0, 254.0, 220.0, 228.0, 225.0, 235.0, 232.0, 199.0, 200.0, 181.0, 130.0, 112.0, 85.0, 74.0, 50.0, 57.0, 39.0, 30.0, 21.0, 21.0, 21.0, 11.0, 14.0, 8.0, 2.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.109375, -3.99591064453125, -3.8824462890625, -3.76898193359375, -3.655517578125, -3.54205322265625, -3.4285888671875, -3.31512451171875, -3.20166015625, -3.08819580078125, -2.9747314453125, -2.86126708984375, -2.747802734375, -2.63433837890625, -2.5208740234375, -2.40740966796875, -2.2939453125, -2.18048095703125, -2.0670166015625, -1.95355224609375, -1.840087890625, -1.72662353515625, -1.6131591796875, -1.49969482421875, -1.38623046875, -1.27276611328125, -1.1593017578125, -1.04583740234375, -0.932373046875, -0.81890869140625, -0.7054443359375, -0.59197998046875, -0.478515625, -0.36505126953125, -0.2515869140625, -0.13812255859375, -0.024658203125, 0.08880615234375, 0.2022705078125, 0.31573486328125, 0.42919921875, 0.54266357421875, 0.6561279296875, 0.76959228515625, 0.883056640625, 0.99652099609375, 1.1099853515625, 1.22344970703125, 1.3369140625, 1.45037841796875, 1.5638427734375, 1.67730712890625, 1.790771484375, 1.90423583984375, 2.0177001953125, 2.13116455078125, 2.24462890625, 2.35809326171875, 2.4715576171875, 2.58502197265625, 2.698486328125, 2.81195068359375, 2.9254150390625, 3.03887939453125, 3.15234375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 5.0, 4.0, 12.0, 11.0, 12.0, 11.0, 13.0, 25.0, 18.0, 32.0, 39.0, 52.0, 50.0, 56.0, 59.0, 71.0, 58.0, 63.0, 61.0, 65.0, 45.0, 38.0, 44.0, 31.0, 25.0, 20.0, 18.0, 11.0, 13.0, 14.0, 9.0, 2.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.388318061828613, -7.10281229019165, -6.8173065185546875, -6.531800270080566, -6.2462944984436035, -5.960788726806641, -5.6752824783325195, -5.389776706695557, -5.104270935058594, -4.818765163421631, -4.533259391784668, -4.247753143310547, -3.962247371673584, -3.676741600036621, -3.391235589981079, -3.105729579925537, -2.820223808288574, -2.5347180366516113, -2.2492120265960693, -1.963706135749817, -1.6782002449035645, -1.392694354057312, -1.1071884632110596, -0.8216825723648071, -0.5361766815185547, -0.25067079067230225, 0.034835100173950195, 0.32034099102020264, 0.6058468818664551, 0.8913527727127075, 1.17685866355896, 1.4623645544052124, 1.7478704452514648, 2.0333762168884277, 2.3188822269439697, 2.6043882369995117, 2.8898940086364746, 3.1753997802734375, 3.4609057903289795, 3.7464118003845215, 4.031917572021484, 4.317423343658447, 4.60292911529541, 4.888435363769531, 5.173941135406494, 5.459446907043457, 5.744953155517578, 6.030458927154541, 6.315964698791504, 6.601470470428467, 6.88697624206543, 7.172482490539551, 7.457988262176514, 7.743494033813477, 8.029000282287598, 8.314505577087402, 8.600011825561523, 8.885518074035645, 9.17102336883545, 9.45652961730957, 9.742034912109375, 10.027541160583496, 10.313047409057617, 10.598552703857422, 10.884058952331543]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [5.0, 1.0, 5.0, 3.0, 1.0, 9.0, 3.0, 7.0, 1.0, 7.0, 7.0, 8.0, 14.0, 10.0, 13.0, 9.0, 8.0, 19.0, 24.0, 21.0, 28.0, 27.0, 35.0, 30.0, 31.0, 37.0, 31.0, 34.0, 33.0, 26.0, 28.0, 46.0, 38.0, 33.0, 30.0, 26.0, 24.0, 24.0, 33.0, 21.0, 37.0, 27.0, 22.0, 17.0, 21.0, 8.0, 16.0, 15.0, 11.0, 7.0, 7.0, 12.0, 4.0, 10.0, 6.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.7470293045043945, -7.494931221008301, -7.242832660675049, -6.990734577178955, -6.738636016845703, -6.486537933349609, -6.234439849853516, -5.982341289520264, -5.730242729187012, -5.478144645690918, -5.226046085357666, -4.973948001861572, -4.72184944152832, -4.469751358032227, -4.217653274536133, -3.965554714202881, -3.713456630706787, -3.4613583087921143, -3.2092599868774414, -2.9571619033813477, -2.7050633430480957, -2.452965259552002, -2.200866937637329, -1.9487686157226562, -1.6966702938079834, -1.4445719718933105, -1.1924736499786377, -0.9403754472732544, -0.6882771253585815, -0.4361788034439087, -0.1840806007385254, 0.06801772117614746, 0.3201160430908203, 0.5722143650054932, 0.8243126273155212, 1.0764108896255493, 1.3285092115402222, 1.580607533454895, 1.8327057361602783, 2.084804058074951, 2.336902379989624, 2.589000701904297, 2.8410990238189697, 3.0931973457336426, 3.3452954292297363, 3.5973939895629883, 3.849492073059082, 4.101590156555176, 4.353688716888428, 4.6057868003845215, 4.857885360717773, 5.109983444213867, 5.362082004547119, 5.614180088043213, 5.866278648376465, 6.118376731872559, 6.370474815368652, 6.622572898864746, 6.874671459197998, 7.126769542694092, 7.378868103027344, 7.6309661865234375, 7.883064270019531, 8.135162353515625, 8.387261390686035]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 9.0, 15.0, 24.0, 16.0, 35.0, 60.0, 105.0, 140.0, 185.0, 288.0, 436.0, 702.0, 1042.0, 1504.0, 2253.0, 3457.0, 5248.0, 8057.0, 12418.0, 19338.0, 30988.0, 48624.0, 77116.0, 117845.0, 165195.0, 175182.0, 133826.0, 88560.0, 56631.0, 35251.0, 22583.0, 14343.0, 9237.0, 6051.0, 3940.0, 2525.0, 1789.0, 1167.0, 770.0, 530.0, 348.0, 262.0, 156.0, 103.0, 71.0, 52.0, 23.0, 23.0, 9.0, 9.0, 6.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.28515625, -2.211822509765625, -2.13848876953125, -2.065155029296875, -1.9918212890625, -1.918487548828125, -1.84515380859375, -1.771820068359375, -1.698486328125, -1.625152587890625, -1.55181884765625, -1.478485107421875, -1.4051513671875, -1.331817626953125, -1.25848388671875, -1.185150146484375, -1.11181640625, -1.038482666015625, -0.96514892578125, -0.891815185546875, -0.8184814453125, -0.745147705078125, -0.67181396484375, -0.598480224609375, -0.525146484375, -0.451812744140625, -0.37847900390625, -0.305145263671875, -0.2318115234375, -0.158477783203125, -0.08514404296875, -0.011810302734375, 0.0615234375, 0.134857177734375, 0.20819091796875, 0.281524658203125, 0.3548583984375, 0.428192138671875, 0.50152587890625, 0.574859619140625, 0.648193359375, 0.721527099609375, 0.79486083984375, 0.868194580078125, 0.9415283203125, 1.014862060546875, 1.08819580078125, 1.161529541015625, 1.23486328125, 1.308197021484375, 1.38153076171875, 1.454864501953125, 1.5281982421875, 1.601531982421875, 1.67486572265625, 1.748199462890625, 1.821533203125, 1.894866943359375, 1.96820068359375, 2.041534423828125, 2.1148681640625, 2.188201904296875, 2.26153564453125, 2.334869384765625, 2.408203125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 2.0, 4.0, 11.0, 8.0, 6.0, 3.0, 9.0, 11.0, 21.0, 10.0, 14.0, 19.0, 16.0, 21.0, 27.0, 29.0, 26.0, 37.0, 36.0, 24.0, 34.0, 32.0, 35.0, 32.0, 35.0, 29.0, 36.0, 26.0, 40.0, 27.0, 23.0, 31.0, 30.0, 37.0, 23.0, 19.0, 19.0, 24.0, 22.0, 23.0, 9.0, 13.0, 12.0, 15.0, 9.0, 3.0, 2.0, 7.0, 7.0, 5.0, 1.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9765625, -7.7247314453125, -7.472900390625, -7.2210693359375, -6.96923828125, -6.7174072265625, -6.465576171875, -6.2137451171875, -5.9619140625, -5.7100830078125, -5.458251953125, -5.2064208984375, -4.95458984375, -4.7027587890625, -4.450927734375, -4.1990966796875, -3.947265625, -3.6954345703125, -3.443603515625, -3.1917724609375, -2.93994140625, -2.6881103515625, -2.436279296875, -2.1844482421875, -1.9326171875, -1.6807861328125, -1.428955078125, -1.1771240234375, -0.92529296875, -0.6734619140625, -0.421630859375, -0.1697998046875, 0.08203125, 0.3338623046875, 0.585693359375, 0.8375244140625, 1.08935546875, 1.3411865234375, 1.593017578125, 1.8448486328125, 2.0966796875, 2.3485107421875, 2.600341796875, 2.8521728515625, 3.10400390625, 3.3558349609375, 3.607666015625, 3.8594970703125, 4.111328125, 4.3631591796875, 4.614990234375, 4.8668212890625, 5.11865234375, 5.3704833984375, 5.622314453125, 5.8741455078125, 6.1259765625, 6.3778076171875, 6.629638671875, 6.8814697265625, 7.13330078125, 7.3851318359375, 7.636962890625, 7.8887939453125, 8.140625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 8.0, 5.0, 12.0, 13.0, 12.0, 30.0, 42.0, 40.0, 66.0, 81.0, 117.0, 181.0, 251.0, 348.0, 512.0, 869.0, 1423.0, 2883.0, 6150.0, 15987.0, 51727.0, 911725.0, 33937.0, 11626.0, 4863.0, 2200.0, 1236.0, 693.0, 429.0, 298.0, 216.0, 154.0, 105.0, 92.0, 54.0, 31.0, 40.0, 37.0, 22.0, 11.0, 13.0, 7.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3046875, -9.0169677734375, -8.729248046875, -8.4415283203125, -8.15380859375, -7.8660888671875, -7.578369140625, -7.2906494140625, -7.0029296875, -6.7152099609375, -6.427490234375, -6.1397705078125, -5.85205078125, -5.5643310546875, -5.276611328125, -4.9888916015625, -4.701171875, -4.4134521484375, -4.125732421875, -3.8380126953125, -3.55029296875, -3.2625732421875, -2.974853515625, -2.6871337890625, -2.3994140625, -2.1116943359375, -1.823974609375, -1.5362548828125, -1.24853515625, -0.9608154296875, -0.673095703125, -0.3853759765625, -0.09765625, 0.1900634765625, 0.477783203125, 0.7655029296875, 1.05322265625, 1.3409423828125, 1.628662109375, 1.9163818359375, 2.2041015625, 2.4918212890625, 2.779541015625, 3.0672607421875, 3.35498046875, 3.6427001953125, 3.930419921875, 4.2181396484375, 4.505859375, 4.7935791015625, 5.081298828125, 5.3690185546875, 5.65673828125, 5.9444580078125, 6.232177734375, 6.5198974609375, 6.8076171875, 7.0953369140625, 7.383056640625, 7.6707763671875, 7.95849609375, 8.2462158203125, 8.533935546875, 8.8216552734375, 9.109375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 10.0, 8.0, 13.0, 9.0, 21.0, 16.0, 16.0, 25.0, 20.0, 26.0, 35.0, 40.0, 32.0, 39.0, 48.0, 42.0, 41.0, 50.0, 50.0, 39.0, 54.0, 43.0, 37.0, 37.0, 39.0, 30.0, 34.0, 26.0, 22.0, 16.0, 23.0, 13.0, 15.0, 9.0, 9.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.16796875, -6.93072509765625, -6.6934814453125, -6.45623779296875, -6.218994140625, -5.98175048828125, -5.7445068359375, -5.50726318359375, -5.27001953125, -5.03277587890625, -4.7955322265625, -4.55828857421875, -4.321044921875, -4.08380126953125, -3.8465576171875, -3.60931396484375, -3.3720703125, -3.13482666015625, -2.8975830078125, -2.66033935546875, -2.423095703125, -2.18585205078125, -1.9486083984375, -1.71136474609375, -1.47412109375, -1.23687744140625, -0.9996337890625, -0.76239013671875, -0.525146484375, -0.28790283203125, -0.0506591796875, 0.18658447265625, 0.423828125, 0.66107177734375, 0.8983154296875, 1.13555908203125, 1.372802734375, 1.61004638671875, 1.8472900390625, 2.08453369140625, 2.32177734375, 2.55902099609375, 2.7962646484375, 3.03350830078125, 3.270751953125, 3.50799560546875, 3.7452392578125, 3.98248291015625, 4.2197265625, 4.45697021484375, 4.6942138671875, 4.93145751953125, 5.168701171875, 5.40594482421875, 5.6431884765625, 5.88043212890625, 6.11767578125, 6.35491943359375, 6.5921630859375, 6.82940673828125, 7.066650390625, 7.30389404296875, 7.5411376953125, 7.77838134765625, 8.015625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 5.0, 9.0, 10.0, 14.0, 17.0, 27.0, 43.0, 47.0, 70.0, 78.0, 132.0, 172.0, 275.0, 380.0, 639.0, 997.0, 1758.0, 3338.0, 7220.0, 18708.0, 823115.0, 158018.0, 18450.0, 7059.0, 3255.0, 1750.0, 1027.0, 635.0, 391.0, 256.0, 180.0, 139.0, 89.0, 52.0, 48.0, 43.0, 21.0, 30.0, 12.0, 7.0, 9.0, 4.0, 2.0, 7.0, 2.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7021484375, -1.6454010009765625, -1.588653564453125, -1.5319061279296875, -1.47515869140625, -1.4184112548828125, -1.361663818359375, -1.3049163818359375, -1.2481689453125, -1.1914215087890625, -1.134674072265625, -1.0779266357421875, -1.02117919921875, -0.9644317626953125, -0.907684326171875, -0.8509368896484375, -0.794189453125, -0.7374420166015625, -0.680694580078125, -0.6239471435546875, -0.56719970703125, -0.5104522705078125, -0.453704833984375, -0.3969573974609375, -0.3402099609375, -0.2834625244140625, -0.226715087890625, -0.1699676513671875, -0.11322021484375, -0.0564727783203125, 0.000274658203125, 0.0570220947265625, 0.11376953125, 0.1705169677734375, 0.227264404296875, 0.2840118408203125, 0.34075927734375, 0.3975067138671875, 0.454254150390625, 0.5110015869140625, 0.5677490234375, 0.6244964599609375, 0.681243896484375, 0.7379913330078125, 0.79473876953125, 0.8514862060546875, 0.908233642578125, 0.9649810791015625, 1.021728515625, 1.0784759521484375, 1.135223388671875, 1.1919708251953125, 1.24871826171875, 1.3054656982421875, 1.362213134765625, 1.4189605712890625, 1.4757080078125, 1.5324554443359375, 1.589202880859375, 1.6459503173828125, 1.70269775390625, 1.7594451904296875, 1.816192626953125, 1.8729400634765625, 1.9296875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 1.0, 1.0, 10.0, 15.0, 12.0, 13.0, 23.0, 25.0, 29.0, 31.0, 39.0, 45.0, 50.0, 59.0, 63.0, 54.0, 62.0, 67.0, 59.0, 47.0, 59.0, 46.0, 28.0, 36.0, 23.0, 11.0, 18.0, 20.0, 8.0, 14.0, 4.0, 3.0, 0.0, 4.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1544437408447266e-05, -3.9948150515556335e-05, -3.8351863622665405e-05, -3.6755576729774475e-05, -3.5159289836883545e-05, -3.3563002943992615e-05, -3.1966716051101685e-05, -3.0370429158210754e-05, -2.8774142265319824e-05, -2.7177855372428894e-05, -2.5581568479537964e-05, -2.3985281586647034e-05, -2.2388994693756104e-05, -2.0792707800865173e-05, -1.9196420907974243e-05, -1.7600134015083313e-05, -1.6003847122192383e-05, -1.4407560229301453e-05, -1.2811273336410522e-05, -1.1214986443519592e-05, -9.618699550628662e-06, -8.022412657737732e-06, -6.426125764846802e-06, -4.829838871955872e-06, -3.2335519790649414e-06, -1.6372650861740112e-06, -4.0978193283081055e-08, 1.5553086996078491e-06, 3.1515955924987793e-06, 4.7478824853897095e-06, 6.34416937828064e-06, 7.94045627117157e-06, 9.5367431640625e-06, 1.113303005695343e-05, 1.272931694984436e-05, 1.432560384273529e-05, 1.592189073562622e-05, 1.751817762851715e-05, 1.911446452140808e-05, 2.071075141429901e-05, 2.230703830718994e-05, 2.390332520008087e-05, 2.5499612092971802e-05, 2.7095898985862732e-05, 2.8692185878753662e-05, 3.0288472771644592e-05, 3.188475966453552e-05, 3.348104655742645e-05, 3.507733345031738e-05, 3.667362034320831e-05, 3.826990723609924e-05, 3.986619412899017e-05, 4.1462481021881104e-05, 4.3058767914772034e-05, 4.4655054807662964e-05, 4.6251341700553894e-05, 4.7847628593444824e-05, 4.9443915486335754e-05, 5.1040202379226685e-05, 5.2636489272117615e-05, 5.4232776165008545e-05, 5.5829063057899475e-05, 5.7425349950790405e-05, 5.9021636843681335e-05, 6.0617923736572266e-05]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 7.0, 6.0, 15.0, 17.0, 28.0, 45.0, 67.0, 89.0, 137.0, 245.0, 349.0, 601.0, 920.0, 1570.0, 2769.0, 4797.0, 7835.0, 13716.0, 24931.0, 47697.0, 98400.0, 229996.0, 319192.0, 149473.0, 67562.0, 34540.0, 18152.0, 10451.0, 5921.0, 3569.0, 2194.0, 1232.0, 724.0, 454.0, 297.0, 182.0, 128.0, 86.0, 59.0, 34.0, 24.0, 18.0, 11.0, 7.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50927734375, -0.49298095703125, -0.4766845703125, -0.46038818359375, -0.444091796875, -0.42779541015625, -0.4114990234375, -0.39520263671875, -0.37890625, -0.36260986328125, -0.3463134765625, -0.33001708984375, -0.313720703125, -0.29742431640625, -0.2811279296875, -0.26483154296875, -0.24853515625, -0.23223876953125, -0.2159423828125, -0.19964599609375, -0.183349609375, -0.16705322265625, -0.1507568359375, -0.13446044921875, -0.1181640625, -0.10186767578125, -0.0855712890625, -0.06927490234375, -0.052978515625, -0.03668212890625, -0.0203857421875, -0.00408935546875, 0.01220703125, 0.02850341796875, 0.0447998046875, 0.06109619140625, 0.077392578125, 0.09368896484375, 0.1099853515625, 0.12628173828125, 0.142578125, 0.15887451171875, 0.1751708984375, 0.19146728515625, 0.207763671875, 0.22406005859375, 0.2403564453125, 0.25665283203125, 0.27294921875, 0.28924560546875, 0.3055419921875, 0.32183837890625, 0.338134765625, 0.35443115234375, 0.3707275390625, 0.38702392578125, 0.4033203125, 0.41961669921875, 0.4359130859375, 0.45220947265625, 0.468505859375, 0.48480224609375, 0.5010986328125, 0.51739501953125, 0.53369140625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 9.0, 7.0, 4.0, 12.0, 23.0, 30.0, 34.0, 34.0, 53.0, 56.0, 83.0, 94.0, 94.0, 86.0, 96.0, 56.0, 41.0, 41.0, 41.0, 24.0, 21.0, 15.0, 8.0, 10.0, 3.0, 4.0, 6.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19287109375, -0.1861572265625, -0.179443359375, -0.1727294921875, -0.166015625, -0.1593017578125, -0.152587890625, -0.1458740234375, -0.13916015625, -0.1324462890625, -0.125732421875, -0.1190185546875, -0.1123046875, -0.1055908203125, -0.098876953125, -0.0921630859375, -0.08544921875, -0.0787353515625, -0.072021484375, -0.0653076171875, -0.05859375, -0.0518798828125, -0.045166015625, -0.0384521484375, -0.03173828125, -0.0250244140625, -0.018310546875, -0.0115966796875, -0.0048828125, 0.0018310546875, 0.008544921875, 0.0152587890625, 0.02197265625, 0.0286865234375, 0.035400390625, 0.0421142578125, 0.048828125, 0.0555419921875, 0.062255859375, 0.0689697265625, 0.07568359375, 0.0823974609375, 0.089111328125, 0.0958251953125, 0.1025390625, 0.1092529296875, 0.115966796875, 0.1226806640625, 0.12939453125, 0.1361083984375, 0.142822265625, 0.1495361328125, 0.15625, 0.1629638671875, 0.169677734375, 0.1763916015625, 0.18310546875, 0.1898193359375, 0.196533203125, 0.2032470703125, 0.2099609375, 0.2166748046875, 0.223388671875, 0.2301025390625, 0.23681640625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 8.0, 5.0, 16.0, 16.0, 7.0, 18.0, 29.0, 28.0, 34.0, 34.0, 50.0, 52.0, 65.0, 70.0, 63.0, 60.0, 63.0, 53.0, 67.0, 33.0, 46.0, 32.0, 25.0, 24.0, 26.0, 12.0, 14.0, 13.0, 11.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.939026355743408, -6.6618852615356445, -6.384743690490723, -6.107602596282959, -5.830461502075195, -5.553319931030273, -5.27617883682251, -4.999037742614746, -4.721896171569824, -4.4447550773620605, -4.167613506317139, -3.890472412109375, -3.6133313179016113, -3.3361899852752686, -3.059048652648926, -2.781907558441162, -2.5047664642333984, -2.2276251316070557, -1.950484037399292, -1.6733427047729492, -1.396201491355896, -1.1190602779388428, -0.8419189453125, -0.5647777318954468, -0.28763651847839355, -0.010495275259017944, 0.26664596796035767, 0.5437872409820557, 0.8209284543991089, 1.098069667816162, 1.3752110004425049, 1.652352213859558, 1.9294929504394531, 2.206634283065796, 2.4837753772735596, 2.7609167098999023, 3.038057804107666, 3.315199136734009, 3.5923404693603516, 3.8694815635681152, 4.146622657775879, 4.423763751983643, 4.7009053230285645, 4.978046417236328, 5.255187511444092, 5.5323286056518555, 5.809470176696777, 6.086611270904541, 6.363752841949463, 6.640893936157227, 6.918035507202148, 7.195176601409912, 7.472317695617676, 7.749459266662598, 8.026599884033203, 8.303741455078125, 8.580883026123047, 8.858024597167969, 9.135165214538574, 9.412306785583496, 9.689448356628418, 9.966588973999023, 10.243730545043945, 10.520872116088867, 10.798012733459473]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [5.0, 2.0, 5.0, 2.0, 2.0, 9.0, 6.0, 4.0, 4.0, 4.0, 7.0, 12.0, 10.0, 13.0, 11.0, 11.0, 11.0, 22.0, 20.0, 25.0, 29.0, 28.0, 28.0, 41.0, 29.0, 33.0, 32.0, 34.0, 30.0, 25.0, 36.0, 45.0, 32.0, 34.0, 28.0, 29.0, 21.0, 22.0, 34.0, 28.0, 31.0, 26.0, 21.0, 16.0, 19.0, 10.0, 16.0, 14.0, 12.0, 4.0, 11.0, 7.0, 8.0, 7.0, 7.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.49487829208374, -7.248100757598877, -7.0013227462768555, -6.754545211791992, -6.507767677307129, -6.260990142822266, -6.014212131500244, -5.767434597015381, -5.520656585693359, -5.273879051208496, -5.027101039886475, -4.780323505401611, -4.533545970916748, -4.286767959594727, -4.039990425109863, -3.793212890625, -3.5464353561401367, -3.2996575832366943, -3.052880048751831, -2.8061022758483887, -2.5593247413635254, -2.312546968460083, -2.0657691955566406, -1.8189915418624878, -1.572213888168335, -1.3254362344741821, -1.0786585807800293, -0.8318808078765869, -0.5851031541824341, -0.33832550048828125, -0.09154772758483887, 0.15522992610931396, 0.402008056640625, 0.6487857103347778, 0.8955634236335754, 1.142341136932373, 1.3891187906265259, 1.6358964443206787, 1.882674217224121, 2.1294517517089844, 2.3762295246124268, 2.623007297515869, 2.8697848320007324, 3.116562604904175, 3.363340377807617, 3.6101179122924805, 3.856895685195923, 4.103673458099365, 4.3504509925842285, 4.597228527069092, 4.844006538391113, 5.090784072875977, 5.33756160736084, 5.584339141845703, 5.831117153167725, 6.077894687652588, 6.324672698974609, 6.571450233459473, 6.818228244781494, 7.065005779266357, 7.311783313751221, 7.558561325073242, 7.8053388595581055, 8.052116394042969, 8.298893928527832]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 11.0, 27.0, 32.0, 58.0, 81.0, 113.0, 185.0, 286.0, 406.0, 660.0, 925.0, 1403.0, 2096.0, 2999.0, 4486.0, 6603.0, 9910.0, 14522.0, 21560.0, 31371.0, 44262.0, 61845.0, 81263.0, 101577.0, 115953.0, 118617.0, 108120.0, 89129.0, 68306.0, 50025.0, 35315.0, 24471.0, 16832.0, 11495.0, 7810.0, 5255.0, 3589.0, 2296.0, 1520.0, 1075.0, 702.0, 436.0, 325.0, 236.0, 128.0, 76.0, 57.0, 40.0, 26.0, 21.0, 9.0, 2.0, 7.0, 4.0, 1.0, 2.0], "bins": [-6.65625, -6.45562744140625, -6.2550048828125, -6.05438232421875, -5.853759765625, -5.65313720703125, -5.4525146484375, -5.25189208984375, -5.05126953125, -4.85064697265625, -4.6500244140625, -4.44940185546875, -4.248779296875, -4.04815673828125, -3.8475341796875, -3.64691162109375, -3.4462890625, -3.24566650390625, -3.0450439453125, -2.84442138671875, -2.643798828125, -2.44317626953125, -2.2425537109375, -2.04193115234375, -1.84130859375, -1.64068603515625, -1.4400634765625, -1.23944091796875, -1.038818359375, -0.83819580078125, -0.6375732421875, -0.43695068359375, -0.236328125, -0.03570556640625, 0.1649169921875, 0.36553955078125, 0.566162109375, 0.76678466796875, 0.9674072265625, 1.16802978515625, 1.36865234375, 1.56927490234375, 1.7698974609375, 1.97052001953125, 2.171142578125, 2.37176513671875, 2.5723876953125, 2.77301025390625, 2.9736328125, 3.17425537109375, 3.3748779296875, 3.57550048828125, 3.776123046875, 3.97674560546875, 4.1773681640625, 4.37799072265625, 4.57861328125, 4.77923583984375, 4.9798583984375, 5.18048095703125, 5.381103515625, 5.58172607421875, 5.7823486328125, 5.98297119140625, 6.18359375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 4.0, 9.0, 9.0, 7.0, 8.0, 10.0, 12.0, 11.0, 13.0, 14.0, 17.0, 19.0, 21.0, 18.0, 37.0, 29.0, 28.0, 22.0, 36.0, 41.0, 38.0, 34.0, 32.0, 32.0, 37.0, 42.0, 27.0, 36.0, 32.0, 24.0, 29.0, 27.0, 24.0, 22.0, 30.0, 32.0, 16.0, 17.0, 18.0, 18.0, 11.0, 6.0, 13.0, 3.0, 4.0, 9.0, 5.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.125, -6.886474609375, -6.64794921875, -6.409423828125, -6.1708984375, -5.932373046875, -5.69384765625, -5.455322265625, -5.216796875, -4.978271484375, -4.73974609375, -4.501220703125, -4.2626953125, -4.024169921875, -3.78564453125, -3.547119140625, -3.30859375, -3.070068359375, -2.83154296875, -2.593017578125, -2.3544921875, -2.115966796875, -1.87744140625, -1.638916015625, -1.400390625, -1.161865234375, -0.92333984375, -0.684814453125, -0.4462890625, -0.207763671875, 0.03076171875, 0.269287109375, 0.5078125, 0.746337890625, 0.98486328125, 1.223388671875, 1.4619140625, 1.700439453125, 1.93896484375, 2.177490234375, 2.416015625, 2.654541015625, 2.89306640625, 3.131591796875, 3.3701171875, 3.608642578125, 3.84716796875, 4.085693359375, 4.32421875, 4.562744140625, 4.80126953125, 5.039794921875, 5.2783203125, 5.516845703125, 5.75537109375, 5.993896484375, 6.232421875, 6.470947265625, 6.70947265625, 6.947998046875, 7.1865234375, 7.425048828125, 7.66357421875, 7.902099609375, 8.140625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 7.0, 11.0, 9.0, 15.0, 32.0, 35.0, 30.0, 68.0, 89.0, 136.0, 202.0, 311.0, 474.0, 706.0, 1112.0, 1693.0, 2482.0, 4009.0, 6233.0, 9834.0, 15135.0, 23933.0, 37503.0, 57309.0, 83368.0, 113355.0, 136605.0, 141354.0, 124612.0, 95348.0, 67481.0, 44587.0, 29127.0, 18489.0, 11664.0, 7496.0, 4995.0, 3041.0, 1923.0, 1328.0, 771.0, 564.0, 364.0, 242.0, 162.0, 105.0, 66.0, 46.0, 34.0, 23.0, 14.0, 14.0, 8.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0], "bins": [-7.609375, -7.37310791015625, -7.1368408203125, -6.90057373046875, -6.664306640625, -6.42803955078125, -6.1917724609375, -5.95550537109375, -5.71923828125, -5.48297119140625, -5.2467041015625, -5.01043701171875, -4.774169921875, -4.53790283203125, -4.3016357421875, -4.06536865234375, -3.8291015625, -3.59283447265625, -3.3565673828125, -3.12030029296875, -2.884033203125, -2.64776611328125, -2.4114990234375, -2.17523193359375, -1.93896484375, -1.70269775390625, -1.4664306640625, -1.23016357421875, -0.993896484375, -0.75762939453125, -0.5213623046875, -0.28509521484375, -0.048828125, 0.18743896484375, 0.4237060546875, 0.65997314453125, 0.896240234375, 1.13250732421875, 1.3687744140625, 1.60504150390625, 1.84130859375, 2.07757568359375, 2.3138427734375, 2.55010986328125, 2.786376953125, 3.02264404296875, 3.2589111328125, 3.49517822265625, 3.7314453125, 3.96771240234375, 4.2039794921875, 4.44024658203125, 4.676513671875, 4.91278076171875, 5.1490478515625, 5.38531494140625, 5.62158203125, 5.85784912109375, 6.0941162109375, 6.33038330078125, 6.566650390625, 6.80291748046875, 7.0391845703125, 7.27545166015625, 7.51171875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 11.0, 9.0, 8.0, 13.0, 12.0, 16.0, 11.0, 16.0, 24.0, 20.0, 23.0, 26.0, 21.0, 27.0, 17.0, 34.0, 37.0, 34.0, 44.0, 33.0, 47.0, 34.0, 45.0, 39.0, 32.0, 36.0, 38.0, 29.0, 25.0, 33.0, 33.0, 23.0, 26.0, 29.0, 19.0, 11.0, 14.0, 11.0, 13.0, 11.0, 7.0, 2.0, 2.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.6171875, -5.448974609375, -5.28076171875, -5.112548828125, -4.9443359375, -4.776123046875, -4.60791015625, -4.439697265625, -4.271484375, -4.103271484375, -3.93505859375, -3.766845703125, -3.5986328125, -3.430419921875, -3.26220703125, -3.093994140625, -2.92578125, -2.757568359375, -2.58935546875, -2.421142578125, -2.2529296875, -2.084716796875, -1.91650390625, -1.748291015625, -1.580078125, -1.411865234375, -1.24365234375, -1.075439453125, -0.9072265625, -0.739013671875, -0.57080078125, -0.402587890625, -0.234375, -0.066162109375, 0.10205078125, 0.270263671875, 0.4384765625, 0.606689453125, 0.77490234375, 0.943115234375, 1.111328125, 1.279541015625, 1.44775390625, 1.615966796875, 1.7841796875, 1.952392578125, 2.12060546875, 2.288818359375, 2.45703125, 2.625244140625, 2.79345703125, 2.961669921875, 3.1298828125, 3.298095703125, 3.46630859375, 3.634521484375, 3.802734375, 3.970947265625, 4.13916015625, 4.307373046875, 4.4755859375, 4.643798828125, 4.81201171875, 4.980224609375, 5.1484375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 5.0, 8.0, 15.0, 14.0, 12.0, 30.0, 34.0, 48.0, 67.0, 113.0, 169.0, 236.0, 349.0, 553.0, 782.0, 1184.0, 1755.0, 2828.0, 4445.0, 6837.0, 10619.0, 16579.0, 25979.0, 41040.0, 63454.0, 94084.0, 129811.0, 154427.0, 147138.0, 116387.0, 80976.0, 53607.0, 34190.0, 21611.0, 14019.0, 8825.0, 5592.0, 3665.0, 2444.0, 1567.0, 1009.0, 630.0, 472.0, 301.0, 211.0, 144.0, 83.0, 60.0, 55.0, 31.0, 22.0, 17.0, 9.0, 6.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0], "bins": [-2.056640625, -1.9898681640625, -1.923095703125, -1.8563232421875, -1.78955078125, -1.7227783203125, -1.656005859375, -1.5892333984375, -1.5224609375, -1.4556884765625, -1.388916015625, -1.3221435546875, -1.25537109375, -1.1885986328125, -1.121826171875, -1.0550537109375, -0.98828125, -0.9215087890625, -0.854736328125, -0.7879638671875, -0.72119140625, -0.6544189453125, -0.587646484375, -0.5208740234375, -0.4541015625, -0.3873291015625, -0.320556640625, -0.2537841796875, -0.18701171875, -0.1202392578125, -0.053466796875, 0.0133056640625, 0.080078125, 0.1468505859375, 0.213623046875, 0.2803955078125, 0.34716796875, 0.4139404296875, 0.480712890625, 0.5474853515625, 0.6142578125, 0.6810302734375, 0.747802734375, 0.8145751953125, 0.88134765625, 0.9481201171875, 1.014892578125, 1.0816650390625, 1.1484375, 1.2152099609375, 1.281982421875, 1.3487548828125, 1.41552734375, 1.4822998046875, 1.549072265625, 1.6158447265625, 1.6826171875, 1.7493896484375, 1.816162109375, 1.8829345703125, 1.94970703125, 2.0164794921875, 2.083251953125, 2.1500244140625, 2.216796875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 1.0, 4.0, 4.0, 9.0, 10.0, 14.0, 13.0, 19.0, 33.0, 36.0, 35.0, 46.0, 44.0, 50.0, 55.0, 71.0, 93.0, 60.0, 66.0, 65.0, 43.0, 46.0, 34.0, 40.0, 20.0, 26.0, 14.0, 15.0, 8.0, 7.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021183490753173828, -0.00020458362996578217, -0.00019733235239982605, -0.00019008107483386993, -0.00018282979726791382, -0.0001755785197019577, -0.0001683272421360016, -0.00016107596457004547, -0.00015382468700408936, -0.00014657340943813324, -0.00013932213187217712, -0.000132070854306221, -0.0001248195767402649, -0.00011756829917430878, -0.00011031702160835266, -0.00010306574404239655, -9.581446647644043e-05, -8.856318891048431e-05, -8.13119113445282e-05, -7.406063377857208e-05, -6.680935621261597e-05, -5.955807864665985e-05, -5.2306801080703735e-05, -4.505552351474762e-05, -3.7804245948791504e-05, -3.055296838283539e-05, -2.3301690816879272e-05, -1.6050413250923157e-05, -8.799135684967041e-06, -1.5478581190109253e-06, 5.7034194469451904e-06, 1.2954697012901306e-05, 2.0205974578857422e-05, 2.7457252144813538e-05, 3.470852971076965e-05, 4.195980727672577e-05, 4.9211084842681885e-05, 5.6462362408638e-05, 6.371363997459412e-05, 7.096491754055023e-05, 7.821619510650635e-05, 8.546747267246246e-05, 9.271875023841858e-05, 9.99700278043747e-05, 0.00010722130537033081, 0.00011447258293628693, 0.00012172386050224304, 0.00012897513806819916, 0.00013622641563415527, 0.0001434776932001114, 0.0001507289707660675, 0.00015798024833202362, 0.00016523152589797974, 0.00017248280346393585, 0.00017973408102989197, 0.00018698535859584808, 0.0001942366361618042, 0.00020148791372776031, 0.00020873919129371643, 0.00021599046885967255, 0.00022324174642562866, 0.00023049302399158478, 0.0002377443015575409, 0.000244995579123497, 0.0002522468566894531]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 5.0, 5.0, 10.0, 14.0, 30.0, 31.0, 43.0, 56.0, 126.0, 147.0, 218.0, 346.0, 472.0, 744.0, 1065.0, 1628.0, 2418.0, 3590.0, 5356.0, 7993.0, 12107.0, 18479.0, 27968.0, 42287.0, 63558.0, 90905.0, 121454.0, 141932.0, 139225.0, 114041.0, 83279.0, 56943.0, 37842.0, 24910.0, 16612.0, 10979.0, 7105.0, 4859.0, 3276.0, 2120.0, 1440.0, 1018.0, 615.0, 454.0, 281.0, 177.0, 144.0, 87.0, 61.0, 42.0, 28.0, 12.0, 15.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9287109375, -1.8662261962890625, -1.803741455078125, -1.7412567138671875, -1.67877197265625, -1.6162872314453125, -1.553802490234375, -1.4913177490234375, -1.4288330078125, -1.3663482666015625, -1.303863525390625, -1.2413787841796875, -1.17889404296875, -1.1164093017578125, -1.053924560546875, -0.9914398193359375, -0.928955078125, -0.8664703369140625, -0.803985595703125, -0.7415008544921875, -0.67901611328125, -0.6165313720703125, -0.554046630859375, -0.4915618896484375, -0.4290771484375, -0.3665924072265625, -0.304107666015625, -0.2416229248046875, -0.17913818359375, -0.1166534423828125, -0.054168701171875, 0.0083160400390625, 0.07080078125, 0.1332855224609375, 0.195770263671875, 0.2582550048828125, 0.32073974609375, 0.3832244873046875, 0.445709228515625, 0.5081939697265625, 0.5706787109375, 0.6331634521484375, 0.695648193359375, 0.7581329345703125, 0.82061767578125, 0.8831024169921875, 0.945587158203125, 1.0080718994140625, 1.070556640625, 1.1330413818359375, 1.195526123046875, 1.2580108642578125, 1.32049560546875, 1.3829803466796875, 1.445465087890625, 1.5079498291015625, 1.5704345703125, 1.6329193115234375, 1.695404052734375, 1.7578887939453125, 1.82037353515625, 1.8828582763671875, 1.945343017578125, 2.0078277587890625, 2.0703125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 4.0, 7.0, 5.0, 5.0, 11.0, 14.0, 8.0, 18.0, 17.0, 19.0, 21.0, 24.0, 32.0, 36.0, 38.0, 44.0, 33.0, 54.0, 42.0, 55.0, 51.0, 49.0, 34.0, 43.0, 41.0, 46.0, 38.0, 27.0, 25.0, 29.0, 18.0, 32.0, 10.0, 10.0, 13.0, 12.0, 9.0, 6.0, 10.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.978515625, -0.9498519897460938, -0.9211883544921875, -0.8925247192382812, -0.863861083984375, -0.8351974487304688, -0.8065338134765625, -0.7778701782226562, -0.74920654296875, -0.7205429077148438, -0.6918792724609375, -0.6632156372070312, -0.634552001953125, -0.6058883666992188, -0.5772247314453125, -0.5485610961914062, -0.5198974609375, -0.49123382568359375, -0.4625701904296875, -0.43390655517578125, -0.405242919921875, -0.37657928466796875, -0.3479156494140625, -0.31925201416015625, -0.29058837890625, -0.26192474365234375, -0.2332611083984375, -0.20459747314453125, -0.175933837890625, -0.14727020263671875, -0.1186065673828125, -0.08994293212890625, -0.061279296875, -0.03261566162109375, -0.0039520263671875, 0.02471160888671875, 0.053375244140625, 0.08203887939453125, 0.1107025146484375, 0.13936614990234375, 0.16802978515625, 0.19669342041015625, 0.2253570556640625, 0.25402069091796875, 0.282684326171875, 0.31134796142578125, 0.3400115966796875, 0.36867523193359375, 0.3973388671875, 0.42600250244140625, 0.4546661376953125, 0.48332977294921875, 0.511993408203125, 0.5406570434570312, 0.5693206787109375, 0.5979843139648438, 0.62664794921875, 0.6553115844726562, 0.6839752197265625, 0.7126388549804688, 0.741302490234375, 0.7699661254882812, 0.7986297607421875, 0.8272933959960938, 0.85595703125]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 4.0, 7.0, 6.0, 5.0, 8.0, 10.0, 15.0, 17.0, 14.0, 22.0, 25.0, 30.0, 34.0, 40.0, 41.0, 57.0, 56.0, 59.0, 61.0, 64.0, 57.0, 66.0, 42.0, 40.0, 42.0, 33.0, 36.0, 28.0, 15.0, 13.0, 13.0, 14.0, 5.0, 10.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1952805519104, -5.9445085525512695, -5.693736553192139, -5.442964553833008, -5.192192554473877, -4.941420555114746, -4.690648078918457, -4.439876556396484, -4.189104080200195, -3.9383320808410645, -3.6875600814819336, -3.4367880821228027, -3.186016082763672, -2.935244083404541, -2.684471845626831, -2.4336998462677, -2.1829280853271484, -1.9321560859680176, -1.6813840866088867, -1.4306119680404663, -1.1798399686813354, -0.9290679693222046, -0.6782958507537842, -0.4275238513946533, -0.17675185203552246, 0.07402017712593079, 0.32479220628738403, 0.5755642652511597, 0.8263362646102905, 1.0771082639694214, 1.3278803825378418, 1.5786523818969727, 1.8294248580932617, 2.0801968574523926, 2.3309688568115234, 2.5817408561706543, 2.832512855529785, 3.083284854888916, 3.334057092666626, 3.584829092025757, 3.8356010913848877, 4.086373329162598, 4.3371453285217285, 4.587917327880859, 4.83868932723999, 5.089461326599121, 5.340233325958252, 5.591005325317383, 5.841777324676514, 6.0925493240356445, 6.343321323394775, 6.594093322753906, 6.844865322113037, 7.095637321472168, 7.346409797668457, 7.59718132019043, 7.847953796386719, 8.098726272583008, 8.34949779510498, 8.60027027130127, 8.851041793823242, 9.101814270019531, 9.352585792541504, 9.603358268737793, 9.854129791259766]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 7.0, 5.0, 8.0, 7.0, 10.0, 5.0, 14.0, 13.0, 13.0, 13.0, 23.0, 17.0, 22.0, 25.0, 36.0, 33.0, 32.0, 30.0, 38.0, 38.0, 35.0, 39.0, 33.0, 32.0, 33.0, 34.0, 37.0, 27.0, 36.0, 32.0, 28.0, 33.0, 21.0, 26.0, 18.0, 18.0, 21.0, 12.0, 9.0, 12.0, 10.0, 17.0, 8.0, 8.0, 9.0, 9.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-8.791168212890625, -8.52606201171875, -8.260954856872559, -7.995848655700684, -7.73074197769165, -7.465635299682617, -7.200529098510742, -6.935422420501709, -6.670315742492676, -6.405209064483643, -6.140102863311768, -5.874996185302734, -5.609889507293701, -5.344782829284668, -5.079676628112793, -4.81456995010376, -4.549463748931885, -4.284357070922852, -4.019250869750977, -3.7541441917419434, -3.48903751373291, -3.223931074142456, -2.958824634552002, -2.6937179565429688, -2.4286115169525146, -2.1635050773620605, -1.8983983993530273, -1.6332919597625732, -1.3681854009628296, -1.103078842163086, -0.8379724025726318, -0.5728658437728882, -0.30775928497314453, -0.04265275597572327, 0.222453773021698, 0.4875602722167969, 0.7526668310165405, 1.0177733898162842, 1.2828798294067383, 1.547986388206482, 1.8130929470062256, 2.0781993865966797, 2.343306064605713, 2.608412504196167, 2.873518943786621, 3.1386256217956543, 3.4037320613861084, 3.6688385009765625, 3.9339451789855957, 4.199051856994629, 4.464158058166504, 4.729264736175537, 4.99437141418457, 5.259477615356445, 5.5245842933654785, 5.789690971374512, 6.054797172546387, 6.31990385055542, 6.585010051727295, 6.850116729736328, 7.115223407745361, 7.3803300857543945, 7.6454362869262695, 7.910542964935303, 8.175649642944336]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 18.0, 16.0, 31.0, 58.0, 100.0, 167.0, 264.0, 392.0, 655.0, 1060.0, 1678.0, 2688.0, 4169.0, 6483.0, 10467.0, 16557.0, 27011.0, 44067.0, 71879.0, 118791.0, 199061.0, 331892.0, 534905.0, 725185.0, 721711.0, 530587.0, 332105.0, 199365.0, 119386.0, 72959.0, 44468.0, 27807.0, 17136.0, 11105.0, 6978.0, 4472.0, 2973.0, 1932.0, 1212.0, 833.0, 546.0, 393.0, 264.0, 175.0, 97.0, 75.0, 51.0, 27.0, 7.0, 14.0, 11.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.86328125, -5.6678466796875, -5.472412109375, -5.2769775390625, -5.08154296875, -4.8861083984375, -4.690673828125, -4.4952392578125, -4.2998046875, -4.1043701171875, -3.908935546875, -3.7135009765625, -3.51806640625, -3.3226318359375, -3.127197265625, -2.9317626953125, -2.736328125, -2.5408935546875, -2.345458984375, -2.1500244140625, -1.95458984375, -1.7591552734375, -1.563720703125, -1.3682861328125, -1.1728515625, -0.9774169921875, -0.781982421875, -0.5865478515625, -0.39111328125, -0.1956787109375, -0.000244140625, 0.1951904296875, 0.390625, 0.5860595703125, 0.781494140625, 0.9769287109375, 1.17236328125, 1.3677978515625, 1.563232421875, 1.7586669921875, 1.9541015625, 2.1495361328125, 2.344970703125, 2.5404052734375, 2.73583984375, 2.9312744140625, 3.126708984375, 3.3221435546875, 3.517578125, 3.7130126953125, 3.908447265625, 4.1038818359375, 4.29931640625, 4.4947509765625, 4.690185546875, 4.8856201171875, 5.0810546875, 5.2764892578125, 5.471923828125, 5.6673583984375, 5.86279296875, 6.0582275390625, 6.253662109375, 6.4490966796875, 6.64453125]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 12.0, 17.0, 10.0, 8.0, 10.0, 12.0, 18.0, 19.0, 16.0, 17.0, 35.0, 27.0, 28.0, 35.0, 37.0, 38.0, 43.0, 40.0, 47.0, 33.0, 43.0, 29.0, 41.0, 33.0, 36.0, 34.0, 34.0, 27.0, 24.0, 31.0, 26.0, 14.0, 17.0, 13.0, 10.0, 11.0, 16.0, 12.0, 7.0, 9.0, 9.0, 4.0, 10.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6875, -5.50872802734375, -5.3299560546875, -5.15118408203125, -4.972412109375, -4.79364013671875, -4.6148681640625, -4.43609619140625, -4.25732421875, -4.07855224609375, -3.8997802734375, -3.72100830078125, -3.542236328125, -3.36346435546875, -3.1846923828125, -3.00592041015625, -2.8271484375, -2.64837646484375, -2.4696044921875, -2.29083251953125, -2.112060546875, -1.93328857421875, -1.7545166015625, -1.57574462890625, -1.39697265625, -1.21820068359375, -1.0394287109375, -0.86065673828125, -0.681884765625, -0.50311279296875, -0.3243408203125, -0.14556884765625, 0.033203125, 0.21197509765625, 0.3907470703125, 0.56951904296875, 0.748291015625, 0.92706298828125, 1.1058349609375, 1.28460693359375, 1.46337890625, 1.64215087890625, 1.8209228515625, 1.99969482421875, 2.178466796875, 2.35723876953125, 2.5360107421875, 2.71478271484375, 2.8935546875, 3.07232666015625, 3.2510986328125, 3.42987060546875, 3.608642578125, 3.78741455078125, 3.9661865234375, 4.14495849609375, 4.32373046875, 4.50250244140625, 4.6812744140625, 4.86004638671875, 5.038818359375, 5.21759033203125, 5.3963623046875, 5.57513427734375, 5.75390625]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 13.0, 16.0, 22.0, 38.0, 53.0, 86.0, 107.0, 211.0, 317.0, 506.0, 812.0, 1394.0, 2174.0, 3543.0, 5823.0, 9364.0, 15499.0, 25865.0, 44147.0, 73107.0, 122560.0, 199217.0, 313036.0, 460222.0, 600165.0, 644834.0, 560384.0, 411131.0, 271339.0, 169452.0, 103637.0, 62129.0, 36988.0, 22086.0, 13272.0, 7998.0, 4858.0, 2939.0, 1874.0, 1173.0, 693.0, 411.0, 287.0, 194.0, 113.0, 79.0, 47.0, 31.0, 12.0, 14.0, 11.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-5.4453125, -5.27691650390625, -5.1085205078125, -4.94012451171875, -4.771728515625, -4.60333251953125, -4.4349365234375, -4.26654052734375, -4.09814453125, -3.92974853515625, -3.7613525390625, -3.59295654296875, -3.424560546875, -3.25616455078125, -3.0877685546875, -2.91937255859375, -2.7509765625, -2.58258056640625, -2.4141845703125, -2.24578857421875, -2.077392578125, -1.90899658203125, -1.7406005859375, -1.57220458984375, -1.40380859375, -1.23541259765625, -1.0670166015625, -0.89862060546875, -0.730224609375, -0.56182861328125, -0.3934326171875, -0.22503662109375, -0.056640625, 0.11175537109375, 0.2801513671875, 0.44854736328125, 0.616943359375, 0.78533935546875, 0.9537353515625, 1.12213134765625, 1.29052734375, 1.45892333984375, 1.6273193359375, 1.79571533203125, 1.964111328125, 2.13250732421875, 2.3009033203125, 2.46929931640625, 2.6376953125, 2.80609130859375, 2.9744873046875, 3.14288330078125, 3.311279296875, 3.47967529296875, 3.6480712890625, 3.81646728515625, 3.98486328125, 4.15325927734375, 4.3216552734375, 4.49005126953125, 4.658447265625, 4.82684326171875, 4.9952392578125, 5.16363525390625, 5.33203125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 10.0, 10.0, 13.0, 10.0, 18.0, 23.0, 24.0, 29.0, 26.0, 34.0, 59.0, 65.0, 71.0, 87.0, 102.0, 101.0, 134.0, 132.0, 169.0, 157.0, 186.0, 204.0, 185.0, 200.0, 215.0, 183.0, 201.0, 210.0, 165.0, 143.0, 130.0, 141.0, 135.0, 87.0, 71.0, 65.0, 50.0, 56.0, 33.0, 28.0, 21.0, 26.0, 8.0, 14.0, 16.0, 13.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.578125, -2.498626708984375, -2.41912841796875, -2.339630126953125, -2.2601318359375, -2.180633544921875, -2.10113525390625, -2.021636962890625, -1.942138671875, -1.862640380859375, -1.78314208984375, -1.703643798828125, -1.6241455078125, -1.544647216796875, -1.46514892578125, -1.385650634765625, -1.30615234375, -1.226654052734375, -1.14715576171875, -1.067657470703125, -0.9881591796875, -0.908660888671875, -0.82916259765625, -0.749664306640625, -0.670166015625, -0.590667724609375, -0.51116943359375, -0.431671142578125, -0.3521728515625, -0.272674560546875, -0.19317626953125, -0.113677978515625, -0.0341796875, 0.045318603515625, 0.12481689453125, 0.204315185546875, 0.2838134765625, 0.363311767578125, 0.44281005859375, 0.522308349609375, 0.601806640625, 0.681304931640625, 0.76080322265625, 0.840301513671875, 0.9197998046875, 0.999298095703125, 1.07879638671875, 1.158294677734375, 1.23779296875, 1.317291259765625, 1.39678955078125, 1.476287841796875, 1.5557861328125, 1.635284423828125, 1.71478271484375, 1.794281005859375, 1.873779296875, 1.953277587890625, 2.03277587890625, 2.112274169921875, 2.1917724609375, 2.271270751953125, 2.35076904296875, 2.430267333984375, 2.509765625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 7.0, 11.0, 15.0, 21.0, 19.0, 28.0, 29.0, 36.0, 44.0, 57.0, 51.0, 59.0, 76.0, 66.0, 63.0, 72.0, 50.0, 51.0, 48.0, 43.0, 21.0, 30.0, 23.0, 18.0, 9.0, 13.0, 9.0, 5.0, 4.0, 5.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.956044673919678, -6.724077224731445, -6.492110252380371, -6.260142803192139, -6.028175354003906, -5.796207904815674, -5.564240455627441, -5.332273483276367, -5.100306034088135, -4.868338584899902, -4.636371612548828, -4.404404163360596, -4.172436714172363, -3.940469264984131, -3.7085020542144775, -3.476534843444824, -3.244567394256592, -3.0125999450683594, -2.780632734298706, -2.5486655235290527, -2.3166980743408203, -2.084730625152588, -1.8527634143829346, -1.6207960844039917, -1.3888287544250488, -1.156861424446106, -0.9248940944671631, -0.6929267644882202, -0.46095943450927734, -0.22899210453033447, 0.0029752254486083984, 0.23494255542755127, 0.46691036224365234, 0.6988776922225952, 0.9308450222015381, 1.162812352180481, 1.3947796821594238, 1.6267470121383667, 1.8587143421173096, 2.090681552886963, 2.3226490020751953, 2.5546164512634277, 2.786583662033081, 3.0185508728027344, 3.250518321990967, 3.482485771179199, 3.7144529819488525, 3.946420192718506, 4.178387641906738, 4.410355091094971, 4.642322540283203, 4.874289512634277, 5.10625696182251, 5.338224411010742, 5.570191383361816, 5.802158832550049, 6.034126281738281, 6.266093730926514, 6.498061180114746, 6.73002815246582, 6.961995601654053, 7.193963050842285, 7.425930023193359, 7.657897472381592, 7.889864921569824]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 6.0, 5.0, 3.0, 9.0, 10.0, 5.0, 7.0, 10.0, 6.0, 26.0, 10.0, 19.0, 20.0, 31.0, 25.0, 39.0, 27.0, 46.0, 33.0, 40.0, 34.0, 33.0, 35.0, 34.0, 37.0, 51.0, 37.0, 38.0, 34.0, 35.0, 33.0, 21.0, 20.0, 22.0, 26.0, 22.0, 18.0, 13.0, 16.0, 11.0, 13.0, 12.0, 6.0, 8.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-7.600760459899902, -7.368236541748047, -7.13571310043335, -6.903189182281494, -6.670665740966797, -6.438141822814941, -6.205617904663086, -5.973094463348389, -5.740570545196533, -5.508046627044678, -5.2755231857299805, -5.042999267578125, -4.810475826263428, -4.577951908111572, -4.345428466796875, -4.1129045486450195, -3.880380868911743, -3.647857189178467, -3.4153335094451904, -3.182809829711914, -2.9502859115600586, -2.7177622318267822, -2.485238552093506, -2.2527146339416504, -2.020191192626953, -1.7876675128936768, -1.5551437139511108, -1.3226200342178345, -1.0900962352752686, -0.8575725555419922, -0.6250488758087158, -0.3925250768661499, -0.16000127792358398, 0.07252244651317596, 0.3050461709499359, 0.5375698804855347, 0.7700936198234558, 1.002617359161377, 1.2351410388946533, 1.4676648378372192, 1.7001885175704956, 1.932712197303772, 2.165235996246338, 2.3977596759796143, 2.6302833557128906, 2.862807273864746, 3.0953307151794434, 3.327854633331299, 3.560378313064575, 3.7929019927978516, 4.025425910949707, 4.257949352264404, 4.49047327041626, 4.722996711730957, 4.9555206298828125, 5.188044548034668, 5.420567989349365, 5.653091907501221, 5.885615348815918, 6.118139266967773, 6.350662708282471, 6.583186626434326, 6.815710067749023, 7.048233985900879, 7.280757904052734]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 7.0, 9.0, 13.0, 20.0, 28.0, 41.0, 57.0, 96.0, 131.0, 231.0, 298.0, 404.0, 579.0, 907.0, 1309.0, 2010.0, 2989.0, 4570.0, 6956.0, 10774.0, 16827.0, 25603.0, 40114.0, 62414.0, 95543.0, 139443.0, 173335.0, 152787.0, 108133.0, 71415.0, 46368.0, 29906.0, 19105.0, 12364.0, 7885.0, 5310.0, 3447.0, 2340.0, 1578.0, 1070.0, 707.0, 446.0, 319.0, 230.0, 149.0, 76.0, 85.0, 50.0, 22.0, 17.0, 17.0, 9.0, 6.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.7958984375, -1.7373199462890625, -1.678741455078125, -1.6201629638671875, -1.56158447265625, -1.5030059814453125, -1.444427490234375, -1.3858489990234375, -1.3272705078125, -1.2686920166015625, -1.210113525390625, -1.1515350341796875, -1.09295654296875, -1.0343780517578125, -0.975799560546875, -0.9172210693359375, -0.858642578125, -0.8000640869140625, -0.741485595703125, -0.6829071044921875, -0.62432861328125, -0.5657501220703125, -0.507171630859375, -0.4485931396484375, -0.3900146484375, -0.3314361572265625, -0.272857666015625, -0.2142791748046875, -0.15570068359375, -0.0971221923828125, -0.038543701171875, 0.0200347900390625, 0.07861328125, 0.1371917724609375, 0.195770263671875, 0.2543487548828125, 0.31292724609375, 0.3715057373046875, 0.430084228515625, 0.4886627197265625, 0.5472412109375, 0.6058197021484375, 0.664398193359375, 0.7229766845703125, 0.78155517578125, 0.8401336669921875, 0.898712158203125, 0.9572906494140625, 1.015869140625, 1.0744476318359375, 1.133026123046875, 1.1916046142578125, 1.25018310546875, 1.3087615966796875, 1.367340087890625, 1.4259185791015625, 1.4844970703125, 1.5430755615234375, 1.601654052734375, 1.6602325439453125, 1.71881103515625, 1.7773895263671875, 1.835968017578125, 1.8945465087890625, 1.953125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 7.0, 5.0, 10.0, 6.0, 5.0, 15.0, 13.0, 14.0, 19.0, 22.0, 30.0, 24.0, 31.0, 29.0, 29.0, 40.0, 49.0, 41.0, 35.0, 42.0, 41.0, 33.0, 43.0, 41.0, 41.0, 33.0, 44.0, 20.0, 26.0, 26.0, 23.0, 21.0, 23.0, 14.0, 17.0, 16.0, 12.0, 13.0, 5.0, 9.0, 9.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.1328125, -7.8916015625, -7.650390625, -7.4091796875, -7.16796875, -6.9267578125, -6.685546875, -6.4443359375, -6.203125, -5.9619140625, -5.720703125, -5.4794921875, -5.23828125, -4.9970703125, -4.755859375, -4.5146484375, -4.2734375, -4.0322265625, -3.791015625, -3.5498046875, -3.30859375, -3.0673828125, -2.826171875, -2.5849609375, -2.34375, -2.1025390625, -1.861328125, -1.6201171875, -1.37890625, -1.1376953125, -0.896484375, -0.6552734375, -0.4140625, -0.1728515625, 0.068359375, 0.3095703125, 0.55078125, 0.7919921875, 1.033203125, 1.2744140625, 1.515625, 1.7568359375, 1.998046875, 2.2392578125, 2.48046875, 2.7216796875, 2.962890625, 3.2041015625, 3.4453125, 3.6865234375, 3.927734375, 4.1689453125, 4.41015625, 4.6513671875, 4.892578125, 5.1337890625, 5.375, 5.6162109375, 5.857421875, 6.0986328125, 6.33984375, 6.5810546875, 6.822265625, 7.0634765625, 7.3046875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 7.0, 4.0, 13.0, 11.0, 17.0, 15.0, 20.0, 26.0, 41.0, 50.0, 84.0, 102.0, 135.0, 160.0, 181.0, 297.0, 433.0, 617.0, 1016.0, 1601.0, 2856.0, 5598.0, 11884.0, 28592.0, 883624.0, 68919.0, 21635.0, 9486.0, 4601.0, 2418.0, 1287.0, 828.0, 546.0, 376.0, 248.0, 202.0, 137.0, 126.0, 92.0, 68.0, 43.0, 42.0, 15.0, 21.0, 22.0, 17.0, 15.0, 11.0, 9.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.09765625, -5.9000244140625, -5.702392578125, -5.5047607421875, -5.30712890625, -5.1094970703125, -4.911865234375, -4.7142333984375, -4.5166015625, -4.3189697265625, -4.121337890625, -3.9237060546875, -3.72607421875, -3.5284423828125, -3.330810546875, -3.1331787109375, -2.935546875, -2.7379150390625, -2.540283203125, -2.3426513671875, -2.14501953125, -1.9473876953125, -1.749755859375, -1.5521240234375, -1.3544921875, -1.1568603515625, -0.959228515625, -0.7615966796875, -0.56396484375, -0.3663330078125, -0.168701171875, 0.0289306640625, 0.2265625, 0.4241943359375, 0.621826171875, 0.8194580078125, 1.01708984375, 1.2147216796875, 1.412353515625, 1.6099853515625, 1.8076171875, 2.0052490234375, 2.202880859375, 2.4005126953125, 2.59814453125, 2.7957763671875, 2.993408203125, 3.1910400390625, 3.388671875, 3.5863037109375, 3.783935546875, 3.9815673828125, 4.17919921875, 4.3768310546875, 4.574462890625, 4.7720947265625, 4.9697265625, 5.1673583984375, 5.364990234375, 5.5626220703125, 5.76025390625, 5.9578857421875, 6.155517578125, 6.3531494140625, 6.55078125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 7.0, 6.0, 9.0, 8.0, 12.0, 4.0, 5.0, 12.0, 19.0, 17.0, 18.0, 22.0, 18.0, 25.0, 21.0, 25.0, 36.0, 27.0, 34.0, 33.0, 29.0, 50.0, 44.0, 48.0, 36.0, 43.0, 33.0, 45.0, 35.0, 36.0, 23.0, 34.0, 26.0, 21.0, 16.0, 11.0, 15.0, 19.0, 11.0, 12.0, 8.0, 10.0, 9.0, 8.0, 7.0, 8.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.21484375, -5.05291748046875, -4.8909912109375, -4.72906494140625, -4.567138671875, -4.40521240234375, -4.2432861328125, -4.08135986328125, -3.91943359375, -3.75750732421875, -3.5955810546875, -3.43365478515625, -3.271728515625, -3.10980224609375, -2.9478759765625, -2.78594970703125, -2.6240234375, -2.46209716796875, -2.3001708984375, -2.13824462890625, -1.976318359375, -1.81439208984375, -1.6524658203125, -1.49053955078125, -1.32861328125, -1.16668701171875, -1.0047607421875, -0.84283447265625, -0.680908203125, -0.51898193359375, -0.3570556640625, -0.19512939453125, -0.033203125, 0.12872314453125, 0.2906494140625, 0.45257568359375, 0.614501953125, 0.77642822265625, 0.9383544921875, 1.10028076171875, 1.26220703125, 1.42413330078125, 1.5860595703125, 1.74798583984375, 1.909912109375, 2.07183837890625, 2.2337646484375, 2.39569091796875, 2.5576171875, 2.71954345703125, 2.8814697265625, 3.04339599609375, 3.205322265625, 3.36724853515625, 3.5291748046875, 3.69110107421875, 3.85302734375, 4.01495361328125, 4.1768798828125, 4.33880615234375, 4.500732421875, 4.66265869140625, 4.8245849609375, 4.98651123046875, 5.1484375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 5.0, 12.0, 10.0, 26.0, 22.0, 24.0, 40.0, 46.0, 76.0, 120.0, 179.0, 261.0, 341.0, 577.0, 1030.0, 1845.0, 3651.0, 9000.0, 27507.0, 934265.0, 46894.0, 12452.0, 4623.0, 2308.0, 1232.0, 680.0, 406.0, 281.0, 185.0, 123.0, 94.0, 61.0, 43.0, 27.0, 23.0, 19.0, 13.0, 12.0, 8.0, 6.0, 7.0, 0.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.2529296875, -1.2157135009765625, -1.178497314453125, -1.1412811279296875, -1.10406494140625, -1.0668487548828125, -1.029632568359375, -0.9924163818359375, -0.9552001953125, -0.9179840087890625, -0.880767822265625, -0.8435516357421875, -0.80633544921875, -0.7691192626953125, -0.731903076171875, -0.6946868896484375, -0.657470703125, -0.6202545166015625, -0.583038330078125, -0.5458221435546875, -0.50860595703125, -0.4713897705078125, -0.434173583984375, -0.3969573974609375, -0.3597412109375, -0.3225250244140625, -0.285308837890625, -0.2480926513671875, -0.21087646484375, -0.1736602783203125, -0.136444091796875, -0.0992279052734375, -0.06201171875, -0.0247955322265625, 0.012420654296875, 0.0496368408203125, 0.08685302734375, 0.1240692138671875, 0.161285400390625, 0.1985015869140625, 0.2357177734375, 0.2729339599609375, 0.310150146484375, 0.3473663330078125, 0.38458251953125, 0.4217987060546875, 0.459014892578125, 0.4962310791015625, 0.533447265625, 0.5706634521484375, 0.607879638671875, 0.6450958251953125, 0.68231201171875, 0.7195281982421875, 0.756744384765625, 0.7939605712890625, 0.8311767578125, 0.8683929443359375, 0.905609130859375, 0.9428253173828125, 0.98004150390625, 1.0172576904296875, 1.054473876953125, 1.0916900634765625, 1.12890625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 1.0, 6.0, 6.0, 4.0, 11.0, 10.0, 11.0, 16.0, 22.0, 20.0, 24.0, 25.0, 26.0, 40.0, 46.0, 44.0, 55.0, 41.0, 41.0, 48.0, 44.0, 52.0, 40.0, 37.0, 45.0, 45.0, 37.0, 23.0, 32.0, 13.0, 15.0, 26.0, 26.0, 11.0, 16.0, 8.0, 7.0, 10.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.349781036376953e-05, -3.242865204811096e-05, -3.135949373245239e-05, -3.0290335416793823e-05, -2.9221177101135254e-05, -2.8152018785476685e-05, -2.7082860469818115e-05, -2.6013702154159546e-05, -2.4944543838500977e-05, -2.3875385522842407e-05, -2.2806227207183838e-05, -2.173706889152527e-05, -2.06679105758667e-05, -1.959875226020813e-05, -1.852959394454956e-05, -1.746043562889099e-05, -1.6391277313232422e-05, -1.5322118997573853e-05, -1.4252960681915283e-05, -1.3183802366256714e-05, -1.2114644050598145e-05, -1.1045485734939575e-05, -9.976327419281006e-06, -8.907169103622437e-06, -7.838010787963867e-06, -6.768852472305298e-06, -5.6996941566467285e-06, -4.630535840988159e-06, -3.56137752532959e-06, -2.4922192096710205e-06, -1.4230608940124512e-06, -3.5390257835388184e-07, 7.152557373046875e-07, 1.7844140529632568e-06, 2.853572368621826e-06, 3.9227306842803955e-06, 4.991888999938965e-06, 6.061047315597534e-06, 7.1302056312561035e-06, 8.199363946914673e-06, 9.268522262573242e-06, 1.0337680578231812e-05, 1.1406838893890381e-05, 1.247599720954895e-05, 1.354515552520752e-05, 1.4614313840866089e-05, 1.5683472156524658e-05, 1.6752630472183228e-05, 1.7821788787841797e-05, 1.8890947103500366e-05, 1.9960105419158936e-05, 2.1029263734817505e-05, 2.2098422050476074e-05, 2.3167580366134644e-05, 2.4236738681793213e-05, 2.5305896997451782e-05, 2.637505531311035e-05, 2.744421362876892e-05, 2.851337194442749e-05, 2.958253026008606e-05, 3.065168857574463e-05, 3.17208468914032e-05, 3.279000520706177e-05, 3.385916352272034e-05, 3.4928321838378906e-05]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 8.0, 9.0, 18.0, 25.0, 42.0, 67.0, 93.0, 112.0, 192.0, 327.0, 537.0, 892.0, 1402.0, 2395.0, 4456.0, 7695.0, 13972.0, 25511.0, 46851.0, 89366.0, 176498.0, 286149.0, 187752.0, 94050.0, 49683.0, 26666.0, 14446.0, 8116.0, 4616.0, 2605.0, 1514.0, 939.0, 538.0, 348.0, 221.0, 150.0, 84.0, 71.0, 28.0, 34.0, 22.0, 15.0, 15.0, 8.0, 6.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34423828125, -0.3336601257324219, -0.32308197021484375, -0.3125038146972656, -0.3019256591796875, -0.2913475036621094, -0.28076934814453125, -0.2701911926269531, -0.259613037109375, -0.24903488159179688, -0.23845672607421875, -0.22787857055664062, -0.2173004150390625, -0.20672225952148438, -0.19614410400390625, -0.18556594848632812, -0.17498779296875, -0.16440963745117188, -0.15383148193359375, -0.14325332641601562, -0.1326751708984375, -0.12209701538085938, -0.11151885986328125, -0.10094070434570312, -0.090362548828125, -0.07978439331054688, -0.06920623779296875, -0.058628082275390625, -0.0480499267578125, -0.037471771240234375, -0.02689361572265625, -0.016315460205078125, -0.0057373046875, 0.004840850830078125, 0.01541900634765625, 0.025997161865234375, 0.0365753173828125, 0.047153472900390625, 0.05773162841796875, 0.06830978393554688, 0.078887939453125, 0.08946609497070312, 0.10004425048828125, 0.11062240600585938, 0.1212005615234375, 0.13177871704101562, 0.14235687255859375, 0.15293502807617188, 0.16351318359375, 0.17409133911132812, 0.18466949462890625, 0.19524765014648438, 0.2058258056640625, 0.21640396118164062, 0.22698211669921875, 0.23756027221679688, 0.248138427734375, 0.2587165832519531, 0.26929473876953125, 0.2798728942871094, 0.2904510498046875, 0.3010292053222656, 0.31160736083984375, 0.3221855163574219, 0.332763671875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 11.0, 15.0, 18.0, 24.0, 12.0, 25.0, 29.0, 27.0, 41.0, 39.0, 61.0, 57.0, 59.0, 73.0, 78.0, 73.0, 71.0, 61.0, 44.0, 39.0, 27.0, 23.0, 13.0, 14.0, 9.0, 13.0, 12.0, 6.0, 6.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1068115234375, -0.10299301147460938, -0.09917449951171875, -0.09535598754882812, -0.0915374755859375, -0.08771896362304688, -0.08390045166015625, -0.08008193969726562, -0.076263427734375, -0.07244491577148438, -0.06862640380859375, -0.06480789184570312, -0.0609893798828125, -0.057170867919921875, -0.05335235595703125, -0.049533843994140625, -0.04571533203125, -0.041896820068359375, -0.03807830810546875, -0.034259796142578125, -0.0304412841796875, -0.026622772216796875, -0.02280426025390625, -0.018985748291015625, -0.015167236328125, -0.011348724365234375, -0.00753021240234375, -0.003711700439453125, 0.0001068115234375, 0.003925323486328125, 0.00774383544921875, 0.011562347412109375, 0.015380859375, 0.019199371337890625, 0.02301788330078125, 0.026836395263671875, 0.0306549072265625, 0.034473419189453125, 0.03829193115234375, 0.042110443115234375, 0.045928955078125, 0.049747467041015625, 0.05356597900390625, 0.057384490966796875, 0.0612030029296875, 0.06502151489257812, 0.06884002685546875, 0.07265853881835938, 0.07647705078125, 0.08029556274414062, 0.08411407470703125, 0.08793258666992188, 0.0917510986328125, 0.09556961059570312, 0.09938812255859375, 0.10320663452148438, 0.107025146484375, 0.11084365844726562, 0.11466217041015625, 0.11848068237304688, 0.1222991943359375, 0.12611770629882812, 0.12993621826171875, 0.13375473022460938, 0.1375732421875]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 10.0, 8.0, 14.0, 18.0, 15.0, 22.0, 30.0, 35.0, 40.0, 54.0, 55.0, 56.0, 55.0, 69.0, 65.0, 79.0, 57.0, 51.0, 51.0, 44.0, 39.0, 22.0, 32.0, 13.0, 14.0, 9.0, 12.0, 7.0, 6.0, 7.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.485215663909912, -6.2555952072143555, -6.025975227355957, -5.7963547706604, -5.566734313964844, -5.337114334106445, -5.107493877410889, -4.877873420715332, -4.648253440856934, -4.418632984161377, -4.1890130043029785, -3.959392547607422, -3.7297720909118652, -3.5001518726348877, -3.27053165435791, -3.0409111976623535, -2.811290740966797, -2.5816705226898193, -2.3520500659942627, -2.122429847717285, -1.892809510231018, -1.663189172744751, -1.4335689544677734, -1.2039486169815063, -0.9743282794952393, -0.7447079420089722, -0.5150876641273499, -0.28546738624572754, -0.05584704875946045, 0.17377328872680664, 0.4033935070037842, 0.6330138444900513, 0.8626337051391602, 1.0922540426254272, 1.3218743801116943, 1.5514945983886719, 1.781114935874939, 2.010735273361206, 2.2403554916381836, 2.4699759483337402, 2.6995961666107178, 2.9292163848876953, 3.158836841583252, 3.3884570598602295, 3.618077278137207, 3.8476977348327637, 4.07731819152832, 4.306938171386719, 4.536558628082275, 4.766179084777832, 4.9957990646362305, 5.225419521331787, 5.455039978027344, 5.684659957885742, 5.914280414581299, 6.1439008712768555, 6.373520851135254, 6.6031413078308105, 6.832761287689209, 7.062381744384766, 7.292002201080322, 7.521622657775879, 7.751242637634277, 7.980863094329834, 8.21048355102539]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 6.0, 4.0, 5.0, 12.0, 6.0, 7.0, 8.0, 6.0, 25.0, 13.0, 19.0, 21.0, 30.0, 28.0, 34.0, 30.0, 46.0, 32.0, 42.0, 33.0, 32.0, 36.0, 39.0, 39.0, 45.0, 42.0, 35.0, 30.0, 36.0, 35.0, 19.0, 23.0, 23.0, 24.0, 21.0, 19.0, 11.0, 15.0, 14.0, 13.0, 9.0, 7.0, 8.0, 3.0, 9.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.487278938293457, -7.2565741539001465, -7.025868892669678, -6.795164108276367, -6.564458847045898, -6.333754062652588, -6.103049278259277, -5.872344017028809, -5.64163875579834, -5.410933971405029, -5.1802287101745605, -4.94952392578125, -4.718818664550781, -4.488113880157471, -4.25740909576416, -4.026703834533691, -3.795999050140381, -3.565294027328491, -3.3345890045166016, -3.103884220123291, -2.8731789588928223, -2.6424741744995117, -2.411769151687622, -2.1810641288757324, -1.9503591060638428, -1.7196540832519531, -1.4889490604400635, -1.2582441568374634, -1.0275391340255737, -0.7968341112136841, -0.566129207611084, -0.33542418479919434, -0.10471868515014648, 0.12598630785942078, 0.35669130086898804, 0.5873962640762329, 0.8181012868881226, 1.0488063097000122, 1.2795112133026123, 1.510216236114502, 1.7409212589263916, 1.9716262817382812, 2.202331304550171, 2.4330363273620605, 2.663741111755371, 2.89444637298584, 3.1251511573791504, 3.35585618019104, 3.5865612030029297, 3.8172662258148193, 4.047971248626709, 4.2786760330200195, 4.509381294250488, 4.740086078643799, 4.970790863037109, 5.201496124267578, 5.432201385498047, 5.662906169891357, 5.893611431121826, 6.124316215515137, 6.3550214767456055, 6.585726261138916, 6.816431045532227, 7.047136306762695, 7.277841091156006]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 7.0, 13.0, 24.0, 24.0, 39.0, 55.0, 64.0, 106.0, 149.0, 248.0, 355.0, 534.0, 818.0, 1319.0, 1947.0, 3255.0, 5433.0, 8587.0, 14229.0, 23317.0, 38426.0, 60570.0, 91722.0, 127311.0, 151727.0, 151945.0, 124210.0, 89051.0, 58251.0, 36327.0, 22718.0, 13559.0, 8371.0, 5169.0, 3104.0, 1982.0, 1254.0, 808.0, 495.0, 347.0, 217.0, 141.0, 105.0, 64.0, 46.0, 33.0, 35.0, 15.0, 12.0, 5.0, 9.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-6.71484375, -6.5111083984375, -6.307373046875, -6.1036376953125, -5.89990234375, -5.6961669921875, -5.492431640625, -5.2886962890625, -5.0849609375, -4.8812255859375, -4.677490234375, -4.4737548828125, -4.27001953125, -4.0662841796875, -3.862548828125, -3.6588134765625, -3.455078125, -3.2513427734375, -3.047607421875, -2.8438720703125, -2.64013671875, -2.4364013671875, -2.232666015625, -2.0289306640625, -1.8251953125, -1.6214599609375, -1.417724609375, -1.2139892578125, -1.01025390625, -0.8065185546875, -0.602783203125, -0.3990478515625, -0.1953125, 0.0084228515625, 0.212158203125, 0.4158935546875, 0.61962890625, 0.8233642578125, 1.027099609375, 1.2308349609375, 1.4345703125, 1.6383056640625, 1.842041015625, 2.0457763671875, 2.24951171875, 2.4532470703125, 2.656982421875, 2.8607177734375, 3.064453125, 3.2681884765625, 3.471923828125, 3.6756591796875, 3.87939453125, 4.0831298828125, 4.286865234375, 4.4906005859375, 4.6943359375, 4.8980712890625, 5.101806640625, 5.3055419921875, 5.50927734375, 5.7130126953125, 5.916748046875, 6.1204833984375, 6.32421875]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 5.0, 2.0, 9.0, 9.0, 13.0, 16.0, 12.0, 14.0, 18.0, 24.0, 27.0, 26.0, 24.0, 28.0, 47.0, 35.0, 42.0, 32.0, 48.0, 34.0, 37.0, 38.0, 31.0, 41.0, 40.0, 31.0, 35.0, 33.0, 29.0, 32.0, 27.0, 20.0, 18.0, 16.0, 8.0, 13.0, 14.0, 14.0, 8.0, 8.0, 6.0, 5.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-6.8359375, -6.61920166015625, -6.4024658203125, -6.18572998046875, -5.968994140625, -5.75225830078125, -5.5355224609375, -5.31878662109375, -5.10205078125, -4.88531494140625, -4.6685791015625, -4.45184326171875, -4.235107421875, -4.01837158203125, -3.8016357421875, -3.58489990234375, -3.3681640625, -3.15142822265625, -2.9346923828125, -2.71795654296875, -2.501220703125, -2.28448486328125, -2.0677490234375, -1.85101318359375, -1.63427734375, -1.41754150390625, -1.2008056640625, -0.98406982421875, -0.767333984375, -0.55059814453125, -0.3338623046875, -0.11712646484375, 0.099609375, 0.31634521484375, 0.5330810546875, 0.74981689453125, 0.966552734375, 1.18328857421875, 1.4000244140625, 1.61676025390625, 1.83349609375, 2.05023193359375, 2.2669677734375, 2.48370361328125, 2.700439453125, 2.91717529296875, 3.1339111328125, 3.35064697265625, 3.5673828125, 3.78411865234375, 4.0008544921875, 4.21759033203125, 4.434326171875, 4.65106201171875, 4.8677978515625, 5.08453369140625, 5.30126953125, 5.51800537109375, 5.7347412109375, 5.95147705078125, 6.168212890625, 6.38494873046875, 6.6016845703125, 6.81842041015625, 7.03515625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 6.0, 22.0, 18.0, 39.0, 66.0, 69.0, 138.0, 219.0, 329.0, 514.0, 778.0, 1323.0, 1919.0, 3093.0, 4891.0, 7925.0, 13143.0, 20429.0, 33159.0, 52269.0, 80142.0, 113165.0, 143500.0, 152122.0, 133382.0, 100506.0, 68809.0, 43734.0, 27489.0, 17110.0, 10559.0, 6459.0, 4119.0, 2589.0, 1673.0, 977.0, 670.0, 468.0, 274.0, 161.0, 118.0, 62.0, 41.0, 32.0, 17.0, 14.0, 7.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0], "bins": [-6.234375, -6.03521728515625, -5.8360595703125, -5.63690185546875, -5.437744140625, -5.23858642578125, -5.0394287109375, -4.84027099609375, -4.64111328125, -4.44195556640625, -4.2427978515625, -4.04364013671875, -3.844482421875, -3.64532470703125, -3.4461669921875, -3.24700927734375, -3.0478515625, -2.84869384765625, -2.6495361328125, -2.45037841796875, -2.251220703125, -2.05206298828125, -1.8529052734375, -1.65374755859375, -1.45458984375, -1.25543212890625, -1.0562744140625, -0.85711669921875, -0.657958984375, -0.45880126953125, -0.2596435546875, -0.06048583984375, 0.138671875, 0.33782958984375, 0.5369873046875, 0.73614501953125, 0.935302734375, 1.13446044921875, 1.3336181640625, 1.53277587890625, 1.73193359375, 1.93109130859375, 2.1302490234375, 2.32940673828125, 2.528564453125, 2.72772216796875, 2.9268798828125, 3.12603759765625, 3.3251953125, 3.52435302734375, 3.7235107421875, 3.92266845703125, 4.121826171875, 4.32098388671875, 4.5201416015625, 4.71929931640625, 4.91845703125, 5.11761474609375, 5.3167724609375, 5.51593017578125, 5.715087890625, 5.91424560546875, 6.1134033203125, 6.31256103515625, 6.51171875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 5.0, 6.0, 3.0, 9.0, 8.0, 7.0, 11.0, 13.0, 14.0, 21.0, 17.0, 26.0, 26.0, 34.0, 33.0, 38.0, 25.0, 42.0, 39.0, 35.0, 26.0, 44.0, 43.0, 36.0, 44.0, 34.0, 33.0, 34.0, 43.0, 22.0, 29.0, 22.0, 26.0, 25.0, 18.0, 13.0, 13.0, 19.0, 5.0, 10.0, 10.0, 10.0, 10.0, 5.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0], "bins": [-4.91796875, -4.780548095703125, -4.64312744140625, -4.505706787109375, -4.3682861328125, -4.230865478515625, -4.09344482421875, -3.956024169921875, -3.818603515625, -3.681182861328125, -3.54376220703125, -3.406341552734375, -3.2689208984375, -3.131500244140625, -2.99407958984375, -2.856658935546875, -2.71923828125, -2.581817626953125, -2.44439697265625, -2.306976318359375, -2.1695556640625, -2.032135009765625, -1.89471435546875, -1.757293701171875, -1.619873046875, -1.482452392578125, -1.34503173828125, -1.207611083984375, -1.0701904296875, -0.932769775390625, -0.79534912109375, -0.657928466796875, -0.5205078125, -0.383087158203125, -0.24566650390625, -0.108245849609375, 0.0291748046875, 0.166595458984375, 0.30401611328125, 0.441436767578125, 0.578857421875, 0.716278076171875, 0.85369873046875, 0.991119384765625, 1.1285400390625, 1.265960693359375, 1.40338134765625, 1.540802001953125, 1.67822265625, 1.815643310546875, 1.95306396484375, 2.090484619140625, 2.2279052734375, 2.365325927734375, 2.50274658203125, 2.640167236328125, 2.777587890625, 2.915008544921875, 3.05242919921875, 3.189849853515625, 3.3272705078125, 3.464691162109375, 3.60211181640625, 3.739532470703125, 3.876953125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [6.0, 2.0, 4.0, 5.0, 8.0, 6.0, 11.0, 18.0, 22.0, 39.0, 58.0, 91.0, 98.0, 120.0, 216.0, 270.0, 411.0, 642.0, 856.0, 1353.0, 2012.0, 3109.0, 5072.0, 8225.0, 13843.0, 23330.0, 39177.0, 65800.0, 107022.0, 156748.0, 185014.0, 158526.0, 108637.0, 67191.0, 40239.0, 23480.0, 13890.0, 8518.0, 5056.0, 3172.0, 2002.0, 1292.0, 921.0, 571.0, 427.0, 306.0, 206.0, 141.0, 120.0, 87.0, 52.0, 48.0, 27.0, 24.0, 13.0, 11.0, 12.0, 7.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.169921875, -2.09881591796875, -2.0277099609375, -1.95660400390625, -1.885498046875, -1.81439208984375, -1.7432861328125, -1.67218017578125, -1.60107421875, -1.52996826171875, -1.4588623046875, -1.38775634765625, -1.316650390625, -1.24554443359375, -1.1744384765625, -1.10333251953125, -1.0322265625, -0.96112060546875, -0.8900146484375, -0.81890869140625, -0.747802734375, -0.67669677734375, -0.6055908203125, -0.53448486328125, -0.46337890625, -0.39227294921875, -0.3211669921875, -0.25006103515625, -0.178955078125, -0.10784912109375, -0.0367431640625, 0.03436279296875, 0.10546875, 0.17657470703125, 0.2476806640625, 0.31878662109375, 0.389892578125, 0.46099853515625, 0.5321044921875, 0.60321044921875, 0.67431640625, 0.74542236328125, 0.8165283203125, 0.88763427734375, 0.958740234375, 1.02984619140625, 1.1009521484375, 1.17205810546875, 1.2431640625, 1.31427001953125, 1.3853759765625, 1.45648193359375, 1.527587890625, 1.59869384765625, 1.6697998046875, 1.74090576171875, 1.81201171875, 1.88311767578125, 1.9542236328125, 2.02532958984375, 2.096435546875, 2.16754150390625, 2.2386474609375, 2.30975341796875, 2.380859375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 2.0, 8.0, 9.0, 13.0, 15.0, 13.0, 33.0, 45.0, 44.0, 59.0, 60.0, 88.0, 91.0, 112.0, 81.0, 72.0, 59.0, 49.0, 46.0, 29.0, 18.0, 14.0, 8.0, 9.0, 10.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002734661102294922, -0.00026433542370796204, -0.0002552047371864319, -0.00024607405066490173, -0.00023694336414337158, -0.00022781267762184143, -0.00021868199110031128, -0.00020955130457878113, -0.00020042061805725098, -0.00019128993153572083, -0.00018215924501419067, -0.00017302855849266052, -0.00016389787197113037, -0.00015476718544960022, -0.00014563649892807007, -0.00013650581240653992, -0.00012737512588500977, -0.00011824443936347961, -0.00010911375284194946, -9.998306632041931e-05, -9.085237979888916e-05, -8.172169327735901e-05, -7.259100675582886e-05, -6.34603202342987e-05, -5.4329633712768555e-05, -4.51989471912384e-05, -3.606826066970825e-05, -2.69375741481781e-05, -1.780688762664795e-05, -8.676201105117798e-06, 4.544854164123535e-07, 9.585171937942505e-06, 1.8715858459472656e-05, 2.7846544981002808e-05, 3.697723150253296e-05, 4.610791802406311e-05, 5.523860454559326e-05, 6.436929106712341e-05, 7.349997758865356e-05, 8.263066411018372e-05, 9.176135063171387e-05, 0.00010089203715324402, 0.00011002272367477417, 0.00011915341019630432, 0.00012828409671783447, 0.00013741478323936462, 0.00014654546976089478, 0.00015567615628242493, 0.00016480684280395508, 0.00017393752932548523, 0.00018306821584701538, 0.00019219890236854553, 0.00020132958889007568, 0.00021046027541160583, 0.00021959096193313599, 0.00022872164845466614, 0.0002378523349761963, 0.00024698302149772644, 0.0002561137080192566, 0.00026524439454078674, 0.0002743750810623169, 0.00028350576758384705, 0.0002926364541053772, 0.00030176714062690735, 0.0003108978271484375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 4.0, 10.0, 10.0, 18.0, 40.0, 60.0, 103.0, 161.0, 231.0, 371.0, 600.0, 969.0, 1597.0, 2680.0, 4890.0, 8578.0, 15917.0, 29940.0, 54389.0, 97180.0, 157995.0, 205653.0, 184266.0, 123324.0, 72367.0, 39430.0, 21240.0, 11441.0, 6345.0, 3491.0, 2044.0, 1172.0, 738.0, 471.0, 267.0, 190.0, 139.0, 77.0, 43.0, 36.0, 27.0, 19.0, 11.0, 5.0, 2.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.740234375, -2.65899658203125, -2.5777587890625, -2.49652099609375, -2.415283203125, -2.33404541015625, -2.2528076171875, -2.17156982421875, -2.09033203125, -2.00909423828125, -1.9278564453125, -1.84661865234375, -1.765380859375, -1.68414306640625, -1.6029052734375, -1.52166748046875, -1.4404296875, -1.35919189453125, -1.2779541015625, -1.19671630859375, -1.115478515625, -1.03424072265625, -0.9530029296875, -0.87176513671875, -0.79052734375, -0.70928955078125, -0.6280517578125, -0.54681396484375, -0.465576171875, -0.38433837890625, -0.3031005859375, -0.22186279296875, -0.140625, -0.05938720703125, 0.0218505859375, 0.10308837890625, 0.184326171875, 0.26556396484375, 0.3468017578125, 0.42803955078125, 0.50927734375, 0.59051513671875, 0.6717529296875, 0.75299072265625, 0.834228515625, 0.91546630859375, 0.9967041015625, 1.07794189453125, 1.1591796875, 1.24041748046875, 1.3216552734375, 1.40289306640625, 1.484130859375, 1.56536865234375, 1.6466064453125, 1.72784423828125, 1.80908203125, 1.89031982421875, 1.9715576171875, 2.05279541015625, 2.134033203125, 2.21527099609375, 2.2965087890625, 2.37774658203125, 2.458984375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 2.0, 6.0, 6.0, 8.0, 10.0, 10.0, 14.0, 29.0, 14.0, 23.0, 18.0, 36.0, 40.0, 44.0, 47.0, 62.0, 55.0, 66.0, 67.0, 64.0, 52.0, 44.0, 49.0, 50.0, 36.0, 29.0, 31.0, 17.0, 8.0, 10.0, 17.0, 10.0, 12.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0556640625, -1.02276611328125, -0.9898681640625, -0.95697021484375, -0.924072265625, -0.89117431640625, -0.8582763671875, -0.82537841796875, -0.79248046875, -0.75958251953125, -0.7266845703125, -0.69378662109375, -0.660888671875, -0.62799072265625, -0.5950927734375, -0.56219482421875, -0.529296875, -0.49639892578125, -0.4635009765625, -0.43060302734375, -0.397705078125, -0.36480712890625, -0.3319091796875, -0.29901123046875, -0.26611328125, -0.23321533203125, -0.2003173828125, -0.16741943359375, -0.134521484375, -0.10162353515625, -0.0687255859375, -0.03582763671875, -0.0029296875, 0.02996826171875, 0.0628662109375, 0.09576416015625, 0.128662109375, 0.16156005859375, 0.1944580078125, 0.22735595703125, 0.26025390625, 0.29315185546875, 0.3260498046875, 0.35894775390625, 0.391845703125, 0.42474365234375, 0.4576416015625, 0.49053955078125, 0.5234375, 0.55633544921875, 0.5892333984375, 0.62213134765625, 0.655029296875, 0.68792724609375, 0.7208251953125, 0.75372314453125, 0.78662109375, 0.81951904296875, 0.8524169921875, 0.88531494140625, 0.918212890625, 0.95111083984375, 0.9840087890625, 1.01690673828125, 1.0498046875]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 7.0, 11.0, 9.0, 13.0, 16.0, 26.0, 31.0, 35.0, 32.0, 48.0, 39.0, 49.0, 59.0, 66.0, 73.0, 63.0, 55.0, 43.0, 55.0, 43.0, 41.0, 29.0, 30.0, 18.0, 14.0, 18.0, 17.0, 9.0, 10.0, 7.0, 8.0, 5.0, 2.0, 2.0, 2.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.59161376953125, -5.391201496124268, -5.190789222717285, -4.990377426147461, -4.7899651527404785, -4.589552879333496, -4.389140605926514, -4.188728332519531, -3.988316059112549, -3.7879037857055664, -3.587491750717163, -3.3870794773101807, -3.1866672039031982, -2.986255168914795, -2.7858428955078125, -2.58543062210083, -2.3850185871124268, -2.1846063137054443, -1.9841941595077515, -1.7837820053100586, -1.5833697319030762, -1.3829575777053833, -1.1825454235076904, -0.982133150100708, -0.7817209959030151, -0.5813087821006775, -0.38089659810066223, -0.18048441410064697, 0.019927799701690674, 0.22034001350402832, 0.4207521677017212, 0.6211644411087036, 0.8215765953063965, 1.0219887495040894, 1.2224010229110718, 1.4228131771087646, 1.623225450515747, 1.82363760471344, 2.024049758911133, 2.2244620323181152, 2.4248743057250977, 2.62528657913208, 2.8256986141204834, 3.026110887527466, 3.2265231609344482, 3.4269351959228516, 3.627347469329834, 3.8277597427368164, 4.028171539306641, 4.228583812713623, 4.4289960861206055, 4.62940788269043, 4.829820156097412, 5.0302324295043945, 5.230644702911377, 5.431056976318359, 5.631469249725342, 5.831881523132324, 6.032293796539307, 6.232706069946289, 6.433117866516113, 6.633530139923096, 6.833942413330078, 7.0343546867370605, 7.234766960144043]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 6.0, 4.0, 3.0, 5.0, 6.0, 11.0, 7.0, 11.0, 15.0, 7.0, 14.0, 14.0, 27.0, 23.0, 25.0, 23.0, 29.0, 33.0, 29.0, 24.0, 36.0, 48.0, 37.0, 36.0, 36.0, 34.0, 26.0, 29.0, 32.0, 41.0, 37.0, 27.0, 27.0, 21.0, 24.0, 28.0, 33.0, 21.0, 15.0, 21.0, 11.0, 11.0, 7.0, 10.0, 6.0, 11.0, 6.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-6.834550857543945, -6.621368408203125, -6.408186435699463, -6.195003986358643, -5.9818220138549805, -5.76863956451416, -5.555457592010498, -5.342275142669678, -5.129093170166016, -4.915910720825195, -4.702728748321533, -4.489546298980713, -4.276364326477051, -4.0631818771362305, -3.8499999046325684, -3.636817455291748, -3.423635244369507, -3.2104530334472656, -2.9972708225250244, -2.784088611602783, -2.570906400680542, -2.357724189758301, -2.1445417404174805, -1.9313596487045288, -1.7181774377822876, -1.5049952268600464, -1.2918130159378052, -1.0786306858062744, -0.865448534488678, -0.652266263961792, -0.4390840530395508, -0.22590184211730957, -0.01271963119506836, 0.20046259462833405, 0.41364482045173645, 0.6268270611763, 0.8400092720985413, 1.0531915426254272, 1.2663737535476685, 1.4795559644699097, 1.6927381753921509, 1.905920386314392, 2.119102716445923, 2.332284927368164, 2.5454671382904053, 2.7586493492126465, 2.9718315601348877, 3.185013771057129, 3.39819598197937, 3.6113781929016113, 3.8245604038238525, 4.037742614746094, 4.250925064086914, 4.464107036590576, 4.6772894859313965, 4.890471458435059, 5.103653907775879, 5.316836357116699, 5.530018329620361, 5.743200778961182, 5.956382751464844, 6.169565200805664, 6.382747173309326, 6.5959296226501465, 6.809111595153809]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 7.0, 8.0, 15.0, 21.0, 25.0, 51.0, 53.0, 97.0, 170.0, 233.0, 421.0, 610.0, 967.0, 1485.0, 2346.0, 3910.0, 6424.0, 10888.0, 18040.0, 31316.0, 53517.0, 95558.0, 170958.0, 311902.0, 554198.0, 826352.0, 827858.0, 556923.0, 315237.0, 173567.0, 97092.0, 55396.0, 31738.0, 18489.0, 10886.0, 6494.0, 4056.0, 2442.0, 1581.0, 1018.0, 621.0, 427.0, 293.0, 180.0, 127.0, 95.0, 75.0, 31.0, 33.0, 24.0, 18.0, 6.0, 4.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.42578125, -5.23876953125, -5.0517578125, -4.86474609375, -4.677734375, -4.49072265625, -4.3037109375, -4.11669921875, -3.9296875, -3.74267578125, -3.5556640625, -3.36865234375, -3.181640625, -2.99462890625, -2.8076171875, -2.62060546875, -2.43359375, -2.24658203125, -2.0595703125, -1.87255859375, -1.685546875, -1.49853515625, -1.3115234375, -1.12451171875, -0.9375, -0.75048828125, -0.5634765625, -0.37646484375, -0.189453125, -0.00244140625, 0.1845703125, 0.37158203125, 0.55859375, 0.74560546875, 0.9326171875, 1.11962890625, 1.306640625, 1.49365234375, 1.6806640625, 1.86767578125, 2.0546875, 2.24169921875, 2.4287109375, 2.61572265625, 2.802734375, 2.98974609375, 3.1767578125, 3.36376953125, 3.55078125, 3.73779296875, 3.9248046875, 4.11181640625, 4.298828125, 4.48583984375, 4.6728515625, 4.85986328125, 5.046875, 5.23388671875, 5.4208984375, 5.60791015625, 5.794921875, 5.98193359375, 6.1689453125, 6.35595703125, 6.54296875]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 4.0, 4.0, 6.0, 16.0, 9.0, 10.0, 8.0, 17.0, 11.0, 14.0, 28.0, 31.0, 23.0, 28.0, 34.0, 53.0, 39.0, 37.0, 39.0, 45.0, 34.0, 26.0, 40.0, 39.0, 40.0, 30.0, 31.0, 35.0, 36.0, 25.0, 28.0, 31.0, 22.0, 25.0, 13.0, 19.0, 11.0, 13.0, 7.0, 8.0, 13.0, 3.0, 4.0, 4.0, 5.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6796875, -4.52618408203125, -4.3726806640625, -4.21917724609375, -4.065673828125, -3.91217041015625, -3.7586669921875, -3.60516357421875, -3.45166015625, -3.29815673828125, -3.1446533203125, -2.99114990234375, -2.837646484375, -2.68414306640625, -2.5306396484375, -2.37713623046875, -2.2236328125, -2.07012939453125, -1.9166259765625, -1.76312255859375, -1.609619140625, -1.45611572265625, -1.3026123046875, -1.14910888671875, -0.99560546875, -0.84210205078125, -0.6885986328125, -0.53509521484375, -0.381591796875, -0.22808837890625, -0.0745849609375, 0.07891845703125, 0.232421875, 0.38592529296875, 0.5394287109375, 0.69293212890625, 0.846435546875, 0.99993896484375, 1.1534423828125, 1.30694580078125, 1.46044921875, 1.61395263671875, 1.7674560546875, 1.92095947265625, 2.074462890625, 2.22796630859375, 2.3814697265625, 2.53497314453125, 2.6884765625, 2.84197998046875, 2.9954833984375, 3.14898681640625, 3.302490234375, 3.45599365234375, 3.6094970703125, 3.76300048828125, 3.91650390625, 4.07000732421875, 4.2235107421875, 4.37701416015625, 4.530517578125, 4.68402099609375, 4.8375244140625, 4.99102783203125, 5.14453125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 9.0, 11.0, 13.0, 19.0, 27.0, 48.0, 69.0, 101.0, 144.0, 223.0, 360.0, 590.0, 924.0, 1511.0, 2445.0, 4007.0, 6643.0, 11048.0, 19166.0, 33102.0, 58767.0, 102882.0, 180206.0, 307658.0, 484052.0, 663058.0, 719577.0, 599432.0, 408572.0, 250075.0, 145100.0, 82348.0, 47015.0, 26346.0, 15585.0, 9185.0, 5385.0, 3274.0, 2001.0, 1198.0, 753.0, 464.0, 285.0, 216.0, 145.0, 89.0, 61.0, 33.0, 24.0, 15.0, 11.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-4.90234375, -4.7457275390625, -4.589111328125, -4.4324951171875, -4.27587890625, -4.1192626953125, -3.962646484375, -3.8060302734375, -3.6494140625, -3.4927978515625, -3.336181640625, -3.1795654296875, -3.02294921875, -2.8663330078125, -2.709716796875, -2.5531005859375, -2.396484375, -2.2398681640625, -2.083251953125, -1.9266357421875, -1.77001953125, -1.6134033203125, -1.456787109375, -1.3001708984375, -1.1435546875, -0.9869384765625, -0.830322265625, -0.6737060546875, -0.51708984375, -0.3604736328125, -0.203857421875, -0.0472412109375, 0.109375, 0.2659912109375, 0.422607421875, 0.5792236328125, 0.73583984375, 0.8924560546875, 1.049072265625, 1.2056884765625, 1.3623046875, 1.5189208984375, 1.675537109375, 1.8321533203125, 1.98876953125, 2.1453857421875, 2.302001953125, 2.4586181640625, 2.615234375, 2.7718505859375, 2.928466796875, 3.0850830078125, 3.24169921875, 3.3983154296875, 3.554931640625, 3.7115478515625, 3.8681640625, 4.0247802734375, 4.181396484375, 4.3380126953125, 4.49462890625, 4.6512451171875, 4.807861328125, 4.9644775390625, 5.12109375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 7.0, 5.0, 7.0, 18.0, 15.0, 20.0, 23.0, 30.0, 29.0, 32.0, 65.0, 44.0, 79.0, 88.0, 101.0, 101.0, 139.0, 149.0, 172.0, 168.0, 207.0, 208.0, 203.0, 198.0, 215.0, 217.0, 187.0, 186.0, 171.0, 125.0, 124.0, 124.0, 85.0, 94.0, 84.0, 82.0, 56.0, 48.0, 34.0, 24.0, 23.0, 23.0, 8.0, 13.0, 11.0, 9.0, 3.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.18359375, -2.115509033203125, -2.04742431640625, -1.979339599609375, -1.9112548828125, -1.843170166015625, -1.77508544921875, -1.707000732421875, -1.638916015625, -1.570831298828125, -1.50274658203125, -1.434661865234375, -1.3665771484375, -1.298492431640625, -1.23040771484375, -1.162322998046875, -1.09423828125, -1.026153564453125, -0.95806884765625, -0.889984130859375, -0.8218994140625, -0.753814697265625, -0.68572998046875, -0.617645263671875, -0.549560546875, -0.481475830078125, -0.41339111328125, -0.345306396484375, -0.2772216796875, -0.209136962890625, -0.14105224609375, -0.072967529296875, -0.0048828125, 0.063201904296875, 0.13128662109375, 0.199371337890625, 0.2674560546875, 0.335540771484375, 0.40362548828125, 0.471710205078125, 0.539794921875, 0.607879638671875, 0.67596435546875, 0.744049072265625, 0.8121337890625, 0.880218505859375, 0.94830322265625, 1.016387939453125, 1.08447265625, 1.152557373046875, 1.22064208984375, 1.288726806640625, 1.3568115234375, 1.424896240234375, 1.49298095703125, 1.561065673828125, 1.629150390625, 1.697235107421875, 1.76531982421875, 1.833404541015625, 1.9014892578125, 1.969573974609375, 2.03765869140625, 2.105743408203125, 2.173828125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 12.0, 12.0, 12.0, 17.0, 29.0, 35.0, 36.0, 44.0, 65.0, 43.0, 61.0, 57.0, 70.0, 62.0, 66.0, 62.0, 53.0, 45.0, 43.0, 33.0, 16.0, 27.0, 19.0, 23.0, 12.0, 11.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8961992263793945, -4.701761245727539, -4.507323265075684, -4.312885284423828, -4.118447303771973, -3.924009323120117, -3.729571580886841, -3.5351336002349854, -3.34069561958313, -3.1462576389312744, -2.951819658279419, -2.7573819160461426, -2.562943935394287, -2.3685059547424316, -2.174067974090576, -1.9796299934387207, -1.7851920127868652, -1.5907540321350098, -1.3963160514831543, -1.2018781900405884, -1.007440209388733, -0.8130022287368774, -0.6185643672943115, -0.42412638664245605, -0.22968840599060059, -0.035250455141067505, 0.15918749570846558, 0.35362541675567627, 0.5480633974075317, 0.7425013780593872, 0.9369392395019531, 1.1313772201538086, 1.3258156776428223, 1.5202536582946777, 1.7146916389465332, 1.9091295003890991, 2.103567600250244, 2.2980055809020996, 2.492443323135376, 2.6868813037872314, 2.881319284439087, 3.0757572650909424, 3.270195245742798, 3.464632987976074, 3.6590709686279297, 3.853508949279785, 4.047946929931641, 4.242384910583496, 4.436822891235352, 4.631260871887207, 4.8256988525390625, 5.020136833190918, 5.214574813842773, 5.409012794494629, 5.603450775146484, 5.79788875579834, 5.992326736450195, 6.186764717102051, 6.381202697753906, 6.575640678405762, 6.770078659057617, 6.964516639709473, 7.158954620361328, 7.353392601013184, 7.547830104827881]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 5.0, 12.0, 12.0, 10.0, 14.0, 16.0, 20.0, 13.0, 33.0, 23.0, 33.0, 38.0, 26.0, 34.0, 38.0, 38.0, 35.0, 39.0, 30.0, 34.0, 41.0, 37.0, 33.0, 37.0, 42.0, 45.0, 27.0, 22.0, 27.0, 27.0, 19.0, 18.0, 28.0, 14.0, 19.0, 13.0, 11.0, 5.0, 6.0, 3.0, 7.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.570944786071777, -6.368948459625244, -6.166951656341553, -5.9649553298950195, -5.762958526611328, -5.560962200164795, -5.358965873718262, -5.15696907043457, -4.954972267150879, -4.752975940704346, -4.550979137420654, -4.348982810974121, -4.14698600769043, -3.9449896812438965, -3.742993116378784, -3.540996551513672, -3.3390002250671387, -3.1370036602020264, -2.935007095336914, -2.733010768890381, -2.5310139656066895, -2.3290176391601562, -2.127021074295044, -1.9250245094299316, -1.7230279445648193, -1.521031379699707, -1.3190348148345947, -1.117038369178772, -0.9150418043136597, -0.7130452394485474, -0.5110487937927246, -0.3090522289276123, -0.1070556640625, 0.09494087100028992, 0.29693740606307983, 0.49893391132354736, 0.7009304761886597, 0.902927041053772, 1.1049234867095947, 1.306920051574707, 1.5089166164398193, 1.7109131813049316, 1.912909746170044, 2.1149063110351562, 2.3169026374816895, 2.518899440765381, 2.720895767211914, 2.9228923320770264, 3.1248888969421387, 3.326885461807251, 3.5288820266723633, 3.7308783531188965, 3.932875156402588, 4.134871482849121, 4.3368682861328125, 4.538864612579346, 4.740860939025879, 4.942857265472412, 5.1448540687561035, 5.346850395202637, 5.548847198486328, 5.750843524932861, 5.9528398513793945, 6.154836654663086, 6.356833457946777]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 10.0, 12.0, 14.0, 27.0, 32.0, 58.0, 91.0, 145.0, 177.0, 280.0, 460.0, 611.0, 931.0, 1323.0, 2049.0, 3230.0, 4955.0, 7606.0, 11777.0, 18528.0, 29474.0, 48287.0, 77276.0, 125359.0, 185379.0, 188952.0, 128648.0, 79996.0, 49264.0, 30250.0, 19021.0, 11979.0, 7598.0, 4929.0, 3223.0, 2146.0, 1478.0, 997.0, 630.0, 440.0, 340.0, 186.0, 120.0, 80.0, 60.0, 51.0, 35.0, 16.0, 12.0, 6.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.73828125, -1.6840057373046875, -1.629730224609375, -1.5754547119140625, -1.52117919921875, -1.4669036865234375, -1.412628173828125, -1.3583526611328125, -1.3040771484375, -1.2498016357421875, -1.195526123046875, -1.1412506103515625, -1.08697509765625, -1.0326995849609375, -0.978424072265625, -0.9241485595703125, -0.869873046875, -0.8155975341796875, -0.761322021484375, -0.7070465087890625, -0.65277099609375, -0.5984954833984375, -0.544219970703125, -0.4899444580078125, -0.4356689453125, -0.3813934326171875, -0.327117919921875, -0.2728424072265625, -0.21856689453125, -0.1642913818359375, -0.110015869140625, -0.0557403564453125, -0.00146484375, 0.0528106689453125, 0.107086181640625, 0.1613616943359375, 0.21563720703125, 0.2699127197265625, 0.324188232421875, 0.3784637451171875, 0.4327392578125, 0.4870147705078125, 0.541290283203125, 0.5955657958984375, 0.64984130859375, 0.7041168212890625, 0.758392333984375, 0.8126678466796875, 0.866943359375, 0.9212188720703125, 0.975494384765625, 1.0297698974609375, 1.08404541015625, 1.1383209228515625, 1.192596435546875, 1.2468719482421875, 1.3011474609375, 1.3554229736328125, 1.409698486328125, 1.4639739990234375, 1.51824951171875, 1.5725250244140625, 1.626800537109375, 1.6810760498046875, 1.7353515625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 7.0, 4.0, 6.0, 3.0, 7.0, 15.0, 19.0, 13.0, 19.0, 15.0, 18.0, 26.0, 30.0, 35.0, 34.0, 31.0, 31.0, 31.0, 37.0, 36.0, 42.0, 31.0, 31.0, 34.0, 40.0, 38.0, 29.0, 41.0, 32.0, 30.0, 34.0, 24.0, 21.0, 19.0, 23.0, 14.0, 15.0, 21.0, 15.0, 5.0, 12.0, 8.0, 2.0, 3.0, 4.0, 8.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.15625, -5.96478271484375, -5.7733154296875, -5.58184814453125, -5.390380859375, -5.19891357421875, -5.0074462890625, -4.81597900390625, -4.62451171875, -4.43304443359375, -4.2415771484375, -4.05010986328125, -3.858642578125, -3.66717529296875, -3.4757080078125, -3.28424072265625, -3.0927734375, -2.90130615234375, -2.7098388671875, -2.51837158203125, -2.326904296875, -2.13543701171875, -1.9439697265625, -1.75250244140625, -1.56103515625, -1.36956787109375, -1.1781005859375, -0.98663330078125, -0.795166015625, -0.60369873046875, -0.4122314453125, -0.22076416015625, -0.029296875, 0.16217041015625, 0.3536376953125, 0.54510498046875, 0.736572265625, 0.92803955078125, 1.1195068359375, 1.31097412109375, 1.50244140625, 1.69390869140625, 1.8853759765625, 2.07684326171875, 2.268310546875, 2.45977783203125, 2.6512451171875, 2.84271240234375, 3.0341796875, 3.22564697265625, 3.4171142578125, 3.60858154296875, 3.800048828125, 3.99151611328125, 4.1829833984375, 4.37445068359375, 4.56591796875, 4.75738525390625, 4.9488525390625, 5.14031982421875, 5.331787109375, 5.52325439453125, 5.7147216796875, 5.90618896484375, 6.09765625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 10.0, 9.0, 11.0, 12.0, 16.0, 18.0, 17.0, 27.0, 26.0, 57.0, 70.0, 77.0, 111.0, 149.0, 214.0, 243.0, 383.0, 548.0, 890.0, 1347.0, 2422.0, 4671.0, 9903.0, 23809.0, 90987.0, 864600.0, 25538.0, 10516.0, 4931.0, 2615.0, 1434.0, 844.0, 553.0, 416.0, 267.0, 202.0, 146.0, 133.0, 83.0, 61.0, 39.0, 31.0, 36.0, 18.0, 21.0, 13.0, 6.0, 7.0, 4.0, 6.0, 7.0, 8.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.7890625, -5.60833740234375, -5.4276123046875, -5.24688720703125, -5.066162109375, -4.88543701171875, -4.7047119140625, -4.52398681640625, -4.34326171875, -4.16253662109375, -3.9818115234375, -3.80108642578125, -3.620361328125, -3.43963623046875, -3.2589111328125, -3.07818603515625, -2.8974609375, -2.71673583984375, -2.5360107421875, -2.35528564453125, -2.174560546875, -1.99383544921875, -1.8131103515625, -1.63238525390625, -1.45166015625, -1.27093505859375, -1.0902099609375, -0.90948486328125, -0.728759765625, -0.54803466796875, -0.3673095703125, -0.18658447265625, -0.005859375, 0.17486572265625, 0.3555908203125, 0.53631591796875, 0.717041015625, 0.89776611328125, 1.0784912109375, 1.25921630859375, 1.43994140625, 1.62066650390625, 1.8013916015625, 1.98211669921875, 2.162841796875, 2.34356689453125, 2.5242919921875, 2.70501708984375, 2.8857421875, 3.06646728515625, 3.2471923828125, 3.42791748046875, 3.608642578125, 3.78936767578125, 3.9700927734375, 4.15081787109375, 4.33154296875, 4.51226806640625, 4.6929931640625, 4.87371826171875, 5.054443359375, 5.23516845703125, 5.4158935546875, 5.59661865234375, 5.77734375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 4.0, 3.0, 12.0, 12.0, 9.0, 13.0, 12.0, 23.0, 16.0, 26.0, 34.0, 32.0, 38.0, 33.0, 29.0, 35.0, 42.0, 35.0, 50.0, 43.0, 43.0, 52.0, 33.0, 37.0, 37.0, 35.0, 36.0, 32.0, 23.0, 35.0, 14.0, 10.0, 17.0, 18.0, 13.0, 13.0, 13.0, 8.0, 4.0, 5.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.3203125, -5.16571044921875, -5.0111083984375, -4.85650634765625, -4.701904296875, -4.54730224609375, -4.3927001953125, -4.23809814453125, -4.08349609375, -3.92889404296875, -3.7742919921875, -3.61968994140625, -3.465087890625, -3.31048583984375, -3.1558837890625, -3.00128173828125, -2.8466796875, -2.69207763671875, -2.5374755859375, -2.38287353515625, -2.228271484375, -2.07366943359375, -1.9190673828125, -1.76446533203125, -1.60986328125, -1.45526123046875, -1.3006591796875, -1.14605712890625, -0.991455078125, -0.83685302734375, -0.6822509765625, -0.52764892578125, -0.373046875, -0.21844482421875, -0.0638427734375, 0.09075927734375, 0.245361328125, 0.39996337890625, 0.5545654296875, 0.70916748046875, 0.86376953125, 1.01837158203125, 1.1729736328125, 1.32757568359375, 1.482177734375, 1.63677978515625, 1.7913818359375, 1.94598388671875, 2.1005859375, 2.25518798828125, 2.4097900390625, 2.56439208984375, 2.718994140625, 2.87359619140625, 3.0281982421875, 3.18280029296875, 3.33740234375, 3.49200439453125, 3.6466064453125, 3.80120849609375, 3.955810546875, 4.11041259765625, 4.2650146484375, 4.41961669921875, 4.57421875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 15.0, 7.0, 7.0, 21.0, 20.0, 34.0, 46.0, 82.0, 82.0, 133.0, 191.0, 256.0, 397.0, 539.0, 854.0, 1316.0, 2021.0, 3699.0, 7151.0, 16569.0, 57574.0, 907423.0, 27264.0, 10415.0, 4938.0, 2735.0, 1578.0, 1020.0, 708.0, 423.0, 309.0, 195.0, 144.0, 113.0, 74.0, 52.0, 44.0, 28.0, 20.0, 13.0, 18.0, 7.0, 5.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.6455078125, -0.624847412109375, -0.60418701171875, -0.583526611328125, -0.5628662109375, -0.542205810546875, -0.52154541015625, -0.500885009765625, -0.480224609375, -0.459564208984375, -0.43890380859375, -0.418243408203125, -0.3975830078125, -0.376922607421875, -0.35626220703125, -0.335601806640625, -0.31494140625, -0.294281005859375, -0.27362060546875, -0.252960205078125, -0.2322998046875, -0.211639404296875, -0.19097900390625, -0.170318603515625, -0.149658203125, -0.128997802734375, -0.10833740234375, -0.087677001953125, -0.0670166015625, -0.046356201171875, -0.02569580078125, -0.005035400390625, 0.015625, 0.036285400390625, 0.05694580078125, 0.077606201171875, 0.0982666015625, 0.118927001953125, 0.13958740234375, 0.160247802734375, 0.180908203125, 0.201568603515625, 0.22222900390625, 0.242889404296875, 0.2635498046875, 0.284210205078125, 0.30487060546875, 0.325531005859375, 0.34619140625, 0.366851806640625, 0.38751220703125, 0.408172607421875, 0.4288330078125, 0.449493408203125, 0.47015380859375, 0.490814208984375, 0.511474609375, 0.532135009765625, 0.55279541015625, 0.573455810546875, 0.5941162109375, 0.614776611328125, 0.63543701171875, 0.656097412109375, 0.6767578125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 6.0, 0.0, 1.0, 5.0, 5.0, 12.0, 18.0, 30.0, 51.0, 77.0, 104.0, 139.0, 165.0, 118.0, 92.0, 61.0, 31.0, 15.0, 4.0, 7.0, 6.0, 1.0, 1.0, 6.0, 3.0, 4.0, 1.0, 1.0, 5.0, 1.0, 3.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.816884994506836e-05, -9.453762322664261e-05, -9.090639650821686e-05, -8.727516978979111e-05, -8.364394307136536e-05, -8.00127163529396e-05, -7.638148963451385e-05, -7.27502629160881e-05, -6.911903619766235e-05, -6.54878094792366e-05, -6.185658276081085e-05, -5.82253560423851e-05, -5.459412932395935e-05, -5.09629026055336e-05, -4.733167588710785e-05, -4.37004491686821e-05, -4.006922245025635e-05, -3.64379957318306e-05, -3.2806769013404846e-05, -2.9175542294979095e-05, -2.5544315576553345e-05, -2.1913088858127594e-05, -1.8281862139701843e-05, -1.4650635421276093e-05, -1.1019408702850342e-05, -7.388181984424591e-06, -3.7569552659988403e-06, -1.257285475730896e-07, 3.505498170852661e-06, 7.136724889278412e-06, 1.0767951607704163e-05, 1.4399178326129913e-05, 1.8030405044555664e-05, 2.1661631762981415e-05, 2.5292858481407166e-05, 2.8924085199832916e-05, 3.255531191825867e-05, 3.618653863668442e-05, 3.981776535511017e-05, 4.344899207353592e-05, 4.708021879196167e-05, 5.071144551038742e-05, 5.434267222881317e-05, 5.797389894723892e-05, 6.160512566566467e-05, 6.523635238409042e-05, 6.886757910251617e-05, 7.249880582094193e-05, 7.613003253936768e-05, 7.976125925779343e-05, 8.339248597621918e-05, 8.702371269464493e-05, 9.065493941307068e-05, 9.428616613149643e-05, 9.791739284992218e-05, 0.00010154861956834793, 0.00010517984628677368, 0.00010881107300519943, 0.00011244229972362518, 0.00011607352644205093, 0.00011970475316047668, 0.00012333597987890244, 0.00012696720659732819, 0.00013059843331575394, 0.0001342296600341797]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 6.0, 6.0, 8.0, 21.0, 26.0, 24.0, 37.0, 59.0, 99.0, 117.0, 191.0, 269.0, 358.0, 545.0, 805.0, 1088.0, 1741.0, 2563.0, 3966.0, 5768.0, 8646.0, 13248.0, 20556.0, 32392.0, 52658.0, 89085.0, 151522.0, 217742.0, 174235.0, 104311.0, 61424.0, 36737.0, 23477.0, 15038.0, 9864.0, 6504.0, 4415.0, 2985.0, 1871.0, 1327.0, 848.0, 582.0, 442.0, 273.0, 214.0, 142.0, 113.0, 75.0, 50.0, 26.0, 22.0, 19.0, 10.0, 6.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.1966552734375, -0.19044113159179688, -0.18422698974609375, -0.17801284790039062, -0.1717987060546875, -0.16558456420898438, -0.15937042236328125, -0.15315628051757812, -0.146942138671875, -0.14072799682617188, -0.13451385498046875, -0.12829971313476562, -0.1220855712890625, -0.11587142944335938, -0.10965728759765625, -0.10344314575195312, -0.09722900390625, -0.09101486206054688, -0.08480072021484375, -0.07858657836914062, -0.0723724365234375, -0.06615829467773438, -0.05994415283203125, -0.053730010986328125, -0.047515869140625, -0.041301727294921875, -0.03508758544921875, -0.028873443603515625, -0.0226593017578125, -0.016445159912109375, -0.01023101806640625, -0.004016876220703125, 0.002197265625, 0.008411407470703125, 0.01462554931640625, 0.020839691162109375, 0.0270538330078125, 0.033267974853515625, 0.03948211669921875, 0.045696258544921875, 0.051910400390625, 0.058124542236328125, 0.06433868408203125, 0.07055282592773438, 0.0767669677734375, 0.08298110961914062, 0.08919525146484375, 0.09540939331054688, 0.10162353515625, 0.10783767700195312, 0.11405181884765625, 0.12026596069335938, 0.1264801025390625, 0.13269424438476562, 0.13890838623046875, 0.14512252807617188, 0.151336669921875, 0.15755081176757812, 0.16376495361328125, 0.16997909545898438, 0.1761932373046875, 0.18240737915039062, 0.18862152099609375, 0.19483566284179688, 0.2010498046875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 1.0, 6.0, 1.0, 3.0, 8.0, 10.0, 9.0, 14.0, 13.0, 20.0, 28.0, 11.0, 23.0, 25.0, 38.0, 30.0, 45.0, 42.0, 58.0, 52.0, 41.0, 55.0, 46.0, 50.0, 52.0, 34.0, 46.0, 44.0, 33.0, 25.0, 21.0, 21.0, 22.0, 15.0, 10.0, 12.0, 7.0, 4.0, 9.0, 4.0, 2.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.103515625, -0.10065269470214844, -0.09778976440429688, -0.09492683410644531, -0.09206390380859375, -0.08920097351074219, -0.08633804321289062, -0.08347511291503906, -0.0806121826171875, -0.07774925231933594, -0.07488632202148438, -0.07202339172363281, -0.06916046142578125, -0.06629753112792969, -0.06343460083007812, -0.06057167053222656, -0.057708740234375, -0.05484580993652344, -0.051982879638671875, -0.04911994934082031, -0.04625701904296875, -0.04339408874511719, -0.040531158447265625, -0.03766822814941406, -0.0348052978515625, -0.03194236755371094, -0.029079437255859375, -0.026216506958007812, -0.02335357666015625, -0.020490646362304688, -0.017627716064453125, -0.014764785766601562, -0.01190185546875, -0.009038925170898438, -0.006175994873046875, -0.0033130645751953125, -0.00045013427734375, 0.0024127960205078125, 0.005275726318359375, 0.008138656616210938, 0.0110015869140625, 0.013864517211914062, 0.016727447509765625, 0.019590377807617188, 0.02245330810546875, 0.025316238403320312, 0.028179168701171875, 0.031042098999023438, 0.033905029296875, 0.03676795959472656, 0.039630889892578125, 0.04249382019042969, 0.04535675048828125, 0.04821968078613281, 0.051082611083984375, 0.05394554138183594, 0.0568084716796875, 0.05967140197753906, 0.06253433227539062, 0.06539726257324219, 0.06826019287109375, 0.07112312316894531, 0.07398605346679688, 0.07684898376464844, 0.0797119140625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 8.0, 18.0, 8.0, 15.0, 25.0, 26.0, 37.0, 38.0, 61.0, 54.0, 59.0, 66.0, 60.0, 69.0, 70.0, 55.0, 53.0, 50.0, 47.0, 36.0, 23.0, 22.0, 28.0, 17.0, 13.0, 9.0, 8.0, 8.0, 0.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7851643562316895, -4.588388442993164, -4.391613006591797, -4.19483757019043, -3.9980616569519043, -3.801285982131958, -3.6045103073120117, -3.4077346324920654, -3.210958957672119, -3.014183282852173, -2.8174076080322266, -2.6206319332122803, -2.423856258392334, -2.2270805835723877, -2.0303049087524414, -1.8335292339324951, -1.6367535591125488, -1.4399778842926025, -1.2432022094726562, -1.04642653465271, -0.8496508598327637, -0.6528751850128174, -0.4560995101928711, -0.2593238353729248, -0.06254816055297852, 0.13422751426696777, 0.33100318908691406, 0.5277788639068604, 0.7245545387268066, 0.9213302135467529, 1.1181058883666992, 1.3148815631866455, 1.5116567611694336, 1.7084324359893799, 1.9052081108093262, 2.1019837856292725, 2.2987594604492188, 2.495535135269165, 2.6923108100891113, 2.8890864849090576, 3.085862159729004, 3.28263783454895, 3.4794135093688965, 3.6761891841888428, 3.872964859008789, 4.069740295410156, 4.266516208648682, 4.463292121887207, 4.660067558288574, 4.856842994689941, 5.053618907928467, 5.250394821166992, 5.447170257568359, 5.643945693969727, 5.840721607208252, 6.037497520446777, 6.2342729568481445, 6.431048393249512, 6.627824306488037, 6.8246002197265625, 7.02137565612793, 7.218151092529297, 7.414927005767822, 7.611702919006348, 7.808478355407715]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 8.0, 6.0, 13.0, 11.0, 7.0, 13.0, 21.0, 18.0, 12.0, 32.0, 26.0, 30.0, 35.0, 30.0, 30.0, 38.0, 40.0, 39.0, 33.0, 33.0, 36.0, 36.0, 38.0, 34.0, 38.0, 45.0, 44.0, 27.0, 23.0, 23.0, 30.0, 20.0, 21.0, 23.0, 17.0, 17.0, 14.0, 10.0, 7.0, 5.0, 3.0, 8.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.526854515075684, -6.326322555541992, -6.125790119171143, -5.925258159637451, -5.724725723266602, -5.52419376373291, -5.323661804199219, -5.123129367828369, -4.9225969314575195, -4.722064971923828, -4.5215325355529785, -4.321000576019287, -4.1204681396484375, -3.919936180114746, -3.7194039821624756, -3.518871784210205, -3.3183398246765137, -3.117807626724243, -2.9172754287719727, -2.7167434692382812, -2.5162110328674316, -2.3156790733337402, -2.1151468753814697, -1.9146146774291992, -1.7140824794769287, -1.5135502815246582, -1.3130180835723877, -1.1124860048294067, -0.9119538068771362, -0.7114216089248657, -0.5108895301818848, -0.31035733222961426, -0.10982465744018555, 0.09070751070976257, 0.2912396788597107, 0.4917718172073364, 0.6923040151596069, 0.8928362131118774, 1.0933682918548584, 1.293900489807129, 1.4944326877593994, 1.69496488571167, 1.8954970836639404, 2.096029281616211, 2.2965612411499023, 2.497093677520752, 2.6976256370544434, 2.898157835006714, 3.0986900329589844, 3.299222230911255, 3.4997544288635254, 3.700286388397217, 3.9008188247680664, 4.101350784301758, 4.301882743835449, 4.502415180206299, 4.702947616577148, 4.90347957611084, 5.1040120124816895, 5.304543972015381, 5.5050764083862305, 5.705608367919922, 5.906140327453613, 6.106672763824463, 6.307204723358154]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 9.0, 11.0, 12.0, 27.0, 35.0, 44.0, 92.0, 152.0, 187.0, 315.0, 508.0, 741.0, 1138.0, 1628.0, 2498.0, 3695.0, 5580.0, 8612.0, 13009.0, 19797.0, 29643.0, 43435.0, 62000.0, 85713.0, 109944.0, 126654.0, 127794.0, 112594.0, 88828.0, 65058.0, 45840.0, 31429.0, 20998.0, 13948.0, 9112.0, 5888.0, 3918.0, 2507.0, 1746.0, 1215.0, 731.0, 472.0, 322.0, 228.0, 132.0, 107.0, 77.0, 66.0, 36.0, 19.0, 11.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.36328125, -4.22283935546875, -4.0823974609375, -3.94195556640625, -3.801513671875, -3.66107177734375, -3.5206298828125, -3.38018798828125, -3.23974609375, -3.09930419921875, -2.9588623046875, -2.81842041015625, -2.677978515625, -2.53753662109375, -2.3970947265625, -2.25665283203125, -2.1162109375, -1.97576904296875, -1.8353271484375, -1.69488525390625, -1.554443359375, -1.41400146484375, -1.2735595703125, -1.13311767578125, -0.99267578125, -0.85223388671875, -0.7117919921875, -0.57135009765625, -0.430908203125, -0.29046630859375, -0.1500244140625, -0.00958251953125, 0.130859375, 0.27130126953125, 0.4117431640625, 0.55218505859375, 0.692626953125, 0.83306884765625, 0.9735107421875, 1.11395263671875, 1.25439453125, 1.39483642578125, 1.5352783203125, 1.67572021484375, 1.816162109375, 1.95660400390625, 2.0970458984375, 2.23748779296875, 2.3779296875, 2.51837158203125, 2.6588134765625, 2.79925537109375, 2.939697265625, 3.08013916015625, 3.2205810546875, 3.36102294921875, 3.50146484375, 3.64190673828125, 3.7823486328125, 3.92279052734375, 4.063232421875, 4.20367431640625, 4.3441162109375, 4.48455810546875, 4.625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 6.0, 4.0, 6.0, 4.0, 10.0, 8.0, 16.0, 14.0, 16.0, 14.0, 22.0, 21.0, 23.0, 36.0, 34.0, 23.0, 22.0, 36.0, 32.0, 35.0, 33.0, 28.0, 27.0, 44.0, 30.0, 39.0, 42.0, 35.0, 34.0, 35.0, 33.0, 21.0, 22.0, 27.0, 24.0, 19.0, 21.0, 15.0, 21.0, 6.0, 11.0, 11.0, 9.0, 6.0, 7.0, 6.0, 5.0, 3.0, 3.0, 5.0, 3.0, 2.0, 2.0], "bins": [-6.09375, -5.91748046875, -5.7412109375, -5.56494140625, -5.388671875, -5.21240234375, -5.0361328125, -4.85986328125, -4.68359375, -4.50732421875, -4.3310546875, -4.15478515625, -3.978515625, -3.80224609375, -3.6259765625, -3.44970703125, -3.2734375, -3.09716796875, -2.9208984375, -2.74462890625, -2.568359375, -2.39208984375, -2.2158203125, -2.03955078125, -1.86328125, -1.68701171875, -1.5107421875, -1.33447265625, -1.158203125, -0.98193359375, -0.8056640625, -0.62939453125, -0.453125, -0.27685546875, -0.1005859375, 0.07568359375, 0.251953125, 0.42822265625, 0.6044921875, 0.78076171875, 0.95703125, 1.13330078125, 1.3095703125, 1.48583984375, 1.662109375, 1.83837890625, 2.0146484375, 2.19091796875, 2.3671875, 2.54345703125, 2.7197265625, 2.89599609375, 3.072265625, 3.24853515625, 3.4248046875, 3.60107421875, 3.77734375, 3.95361328125, 4.1298828125, 4.30615234375, 4.482421875, 4.65869140625, 4.8349609375, 5.01123046875, 5.1875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 8.0, 8.0, 11.0, 15.0, 25.0, 35.0, 59.0, 89.0, 145.0, 208.0, 288.0, 446.0, 758.0, 1143.0, 1754.0, 2851.0, 4466.0, 7211.0, 11918.0, 19384.0, 31117.0, 50036.0, 76784.0, 110769.0, 143000.0, 154181.0, 137036.0, 103925.0, 70878.0, 45507.0, 28284.0, 17526.0, 10574.0, 6631.0, 4190.0, 2652.0, 1663.0, 1075.0, 647.0, 438.0, 274.0, 196.0, 123.0, 81.0, 48.0, 32.0, 23.0, 15.0, 11.0, 9.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.375, -5.2091064453125, -5.043212890625, -4.8773193359375, -4.71142578125, -4.5455322265625, -4.379638671875, -4.2137451171875, -4.0478515625, -3.8819580078125, -3.716064453125, -3.5501708984375, -3.38427734375, -3.2183837890625, -3.052490234375, -2.8865966796875, -2.720703125, -2.5548095703125, -2.388916015625, -2.2230224609375, -2.05712890625, -1.8912353515625, -1.725341796875, -1.5594482421875, -1.3935546875, -1.2276611328125, -1.061767578125, -0.8958740234375, -0.72998046875, -0.5640869140625, -0.398193359375, -0.2322998046875, -0.06640625, 0.0994873046875, 0.265380859375, 0.4312744140625, 0.59716796875, 0.7630615234375, 0.928955078125, 1.0948486328125, 1.2607421875, 1.4266357421875, 1.592529296875, 1.7584228515625, 1.92431640625, 2.0902099609375, 2.256103515625, 2.4219970703125, 2.587890625, 2.7537841796875, 2.919677734375, 3.0855712890625, 3.25146484375, 3.4173583984375, 3.583251953125, 3.7491455078125, 3.9150390625, 4.0809326171875, 4.246826171875, 4.4127197265625, 4.57861328125, 4.7445068359375, 4.910400390625, 5.0762939453125, 5.2421875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 1.0, 5.0, 2.0, 4.0, 6.0, 4.0, 8.0, 7.0, 11.0, 14.0, 11.0, 15.0, 20.0, 21.0, 16.0, 32.0, 34.0, 22.0, 29.0, 32.0, 35.0, 37.0, 35.0, 48.0, 46.0, 34.0, 40.0, 31.0, 39.0, 48.0, 30.0, 25.0, 28.0, 32.0, 25.0, 36.0, 25.0, 23.0, 16.0, 13.0, 15.0, 10.0, 9.0, 6.0, 10.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.671875, -3.556488037109375, -3.44110107421875, -3.325714111328125, -3.2103271484375, -3.094940185546875, -2.97955322265625, -2.864166259765625, -2.748779296875, -2.633392333984375, -2.51800537109375, -2.402618408203125, -2.2872314453125, -2.171844482421875, -2.05645751953125, -1.941070556640625, -1.82568359375, -1.710296630859375, -1.59490966796875, -1.479522705078125, -1.3641357421875, -1.248748779296875, -1.13336181640625, -1.017974853515625, -0.902587890625, -0.787200927734375, -0.67181396484375, -0.556427001953125, -0.4410400390625, -0.325653076171875, -0.21026611328125, -0.094879150390625, 0.0205078125, 0.135894775390625, 0.25128173828125, 0.366668701171875, 0.4820556640625, 0.597442626953125, 0.71282958984375, 0.828216552734375, 0.943603515625, 1.058990478515625, 1.17437744140625, 1.289764404296875, 1.4051513671875, 1.520538330078125, 1.63592529296875, 1.751312255859375, 1.86669921875, 1.982086181640625, 2.09747314453125, 2.212860107421875, 2.3282470703125, 2.443634033203125, 2.55902099609375, 2.674407958984375, 2.789794921875, 2.905181884765625, 3.02056884765625, 3.135955810546875, 3.2513427734375, 3.366729736328125, 3.48211669921875, 3.597503662109375, 3.712890625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 11.0, 13.0, 15.0, 22.0, 29.0, 40.0, 41.0, 60.0, 77.0, 111.0, 167.0, 211.0, 348.0, 525.0, 817.0, 1432.0, 2770.0, 5966.0, 13336.0, 33486.0, 86492.0, 208021.0, 321628.0, 217731.0, 92186.0, 35679.0, 14103.0, 6156.0, 2936.0, 1586.0, 867.0, 518.0, 336.0, 230.0, 181.0, 127.0, 80.0, 67.0, 44.0, 43.0, 31.0, 13.0, 8.0, 8.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.25, -3.13995361328125, -3.0299072265625, -2.91986083984375, -2.809814453125, -2.69976806640625, -2.5897216796875, -2.47967529296875, -2.36962890625, -2.25958251953125, -2.1495361328125, -2.03948974609375, -1.929443359375, -1.81939697265625, -1.7093505859375, -1.59930419921875, -1.4892578125, -1.37921142578125, -1.2691650390625, -1.15911865234375, -1.049072265625, -0.93902587890625, -0.8289794921875, -0.71893310546875, -0.60888671875, -0.49884033203125, -0.3887939453125, -0.27874755859375, -0.168701171875, -0.05865478515625, 0.0513916015625, 0.16143798828125, 0.271484375, 0.38153076171875, 0.4915771484375, 0.60162353515625, 0.711669921875, 0.82171630859375, 0.9317626953125, 1.04180908203125, 1.15185546875, 1.26190185546875, 1.3719482421875, 1.48199462890625, 1.592041015625, 1.70208740234375, 1.8121337890625, 1.92218017578125, 2.0322265625, 2.14227294921875, 2.2523193359375, 2.36236572265625, 2.472412109375, 2.58245849609375, 2.6925048828125, 2.80255126953125, 2.91259765625, 3.02264404296875, 3.1326904296875, 3.24273681640625, 3.352783203125, 3.46282958984375, 3.5728759765625, 3.68292236328125, 3.79296875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 4.0, 8.0, 2.0, 3.0, 2.0, 9.0, 8.0, 19.0, 31.0, 31.0, 33.0, 41.0, 45.0, 55.0, 62.0, 77.0, 66.0, 78.0, 60.0, 55.0, 61.0, 56.0, 48.0, 28.0, 24.0, 12.0, 13.0, 17.0, 13.0, 9.0, 2.0, 4.0, 5.0, 5.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015974044799804688, -0.0001542121171951294, -0.00014868378639221191, -0.00014315545558929443, -0.00013762712478637695, -0.00013209879398345947, -0.000126570463180542, -0.00012104213237762451, -0.00011551380157470703, -0.00010998547077178955, -0.00010445713996887207, -9.892880916595459e-05, -9.340047836303711e-05, -8.787214756011963e-05, -8.234381675720215e-05, -7.681548595428467e-05, -7.128715515136719e-05, -6.575882434844971e-05, -6.0230493545532227e-05, -5.4702162742614746e-05, -4.9173831939697266e-05, -4.3645501136779785e-05, -3.8117170333862305e-05, -3.2588839530944824e-05, -2.7060508728027344e-05, -2.1532177925109863e-05, -1.6003847122192383e-05, -1.0475516319274902e-05, -4.947185516357422e-06, 5.811452865600586e-07, 6.109476089477539e-06, 1.163780689239502e-05, 1.71661376953125e-05, 2.269446849822998e-05, 2.822279930114746e-05, 3.375113010406494e-05, 3.927946090698242e-05, 4.48077917098999e-05, 5.033612251281738e-05, 5.586445331573486e-05, 6.139278411865234e-05, 6.692111492156982e-05, 7.24494457244873e-05, 7.797777652740479e-05, 8.350610733032227e-05, 8.903443813323975e-05, 9.456276893615723e-05, 0.00010009109973907471, 0.00010561943054199219, 0.00011114776134490967, 0.00011667609214782715, 0.00012220442295074463, 0.0001277327537536621, 0.0001332610845565796, 0.00013878941535949707, 0.00014431774616241455, 0.00014984607696533203, 0.0001553744077682495, 0.000160902738571167, 0.00016643106937408447, 0.00017195940017700195, 0.00017748773097991943, 0.00018301606178283691, 0.0001885443925857544, 0.00019407272338867188]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 8.0, 4.0, 4.0, 15.0, 11.0, 18.0, 26.0, 44.0, 46.0, 67.0, 83.0, 122.0, 160.0, 235.0, 339.0, 442.0, 665.0, 1121.0, 1699.0, 2796.0, 4591.0, 7816.0, 13937.0, 25048.0, 44852.0, 77260.0, 126382.0, 178030.0, 189997.0, 147720.0, 95295.0, 55975.0, 31331.0, 17414.0, 9910.0, 5715.0, 3335.0, 2051.0, 1313.0, 840.0, 521.0, 373.0, 266.0, 187.0, 134.0, 102.0, 62.0, 46.0, 45.0, 39.0, 23.0, 16.0, 11.0, 12.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-1.9296875, -1.86578369140625, -1.8018798828125, -1.73797607421875, -1.674072265625, -1.61016845703125, -1.5462646484375, -1.48236083984375, -1.41845703125, -1.35455322265625, -1.2906494140625, -1.22674560546875, -1.162841796875, -1.09893798828125, -1.0350341796875, -0.97113037109375, -0.9072265625, -0.84332275390625, -0.7794189453125, -0.71551513671875, -0.651611328125, -0.58770751953125, -0.5238037109375, -0.45989990234375, -0.39599609375, -0.33209228515625, -0.2681884765625, -0.20428466796875, -0.140380859375, -0.07647705078125, -0.0125732421875, 0.05133056640625, 0.115234375, 0.17913818359375, 0.2430419921875, 0.30694580078125, 0.370849609375, 0.43475341796875, 0.4986572265625, 0.56256103515625, 0.62646484375, 0.69036865234375, 0.7542724609375, 0.81817626953125, 0.882080078125, 0.94598388671875, 1.0098876953125, 1.07379150390625, 1.1376953125, 1.20159912109375, 1.2655029296875, 1.32940673828125, 1.393310546875, 1.45721435546875, 1.5211181640625, 1.58502197265625, 1.64892578125, 1.71282958984375, 1.7767333984375, 1.84063720703125, 1.904541015625, 1.96844482421875, 2.0323486328125, 2.09625244140625, 2.16015625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 7.0, 11.0, 14.0, 14.0, 19.0, 19.0, 26.0, 36.0, 44.0, 46.0, 38.0, 46.0, 45.0, 46.0, 57.0, 58.0, 53.0, 52.0, 57.0, 56.0, 34.0, 31.0, 36.0, 32.0, 22.0, 16.0, 21.0, 11.0, 12.0, 11.0, 7.0, 3.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.9365234375, -0.908233642578125, -0.87994384765625, -0.851654052734375, -0.8233642578125, -0.795074462890625, -0.76678466796875, -0.738494873046875, -0.710205078125, -0.681915283203125, -0.65362548828125, -0.625335693359375, -0.5970458984375, -0.568756103515625, -0.54046630859375, -0.512176513671875, -0.48388671875, -0.455596923828125, -0.42730712890625, -0.399017333984375, -0.3707275390625, -0.342437744140625, -0.31414794921875, -0.285858154296875, -0.257568359375, -0.229278564453125, -0.20098876953125, -0.172698974609375, -0.1444091796875, -0.116119384765625, -0.08782958984375, -0.059539794921875, -0.03125, -0.002960205078125, 0.02532958984375, 0.053619384765625, 0.0819091796875, 0.110198974609375, 0.13848876953125, 0.166778564453125, 0.195068359375, 0.223358154296875, 0.25164794921875, 0.279937744140625, 0.3082275390625, 0.336517333984375, 0.36480712890625, 0.393096923828125, 0.42138671875, 0.449676513671875, 0.47796630859375, 0.506256103515625, 0.5345458984375, 0.562835693359375, 0.59112548828125, 0.619415283203125, 0.647705078125, 0.675994873046875, 0.70428466796875, 0.732574462890625, 0.7608642578125, 0.789154052734375, 0.81744384765625, 0.845733642578125, 0.8740234375]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 3.0, 10.0, 10.0, 16.0, 14.0, 33.0, 20.0, 55.0, 38.0, 48.0, 58.0, 73.0, 73.0, 67.0, 50.0, 58.0, 67.0, 50.0, 52.0, 42.0, 35.0, 33.0, 19.0, 20.0, 13.0, 9.0, 5.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.619710922241211, -4.417544364929199, -4.2153778076171875, -4.013211250305176, -3.811044692993164, -3.6088781356811523, -3.4067115783691406, -3.204545021057129, -3.002378463745117, -2.8002119064331055, -2.5980453491210938, -2.395878791809082, -2.1937122344970703, -1.991545557975769, -1.7893790006637573, -1.5872124433517456, -1.3850457668304443, -1.1828792095184326, -0.9807126522064209, -0.7785460352897644, -0.5763794779777527, -0.3742128610610962, -0.17204630374908447, 0.030120253562927246, 0.23228681087493896, 0.4344533681869507, 0.6366199254989624, 0.8387865424156189, 1.0409531593322754, 1.243119716644287, 1.4452862739562988, 1.6474528312683105, 1.8496193885803223, 2.051785945892334, 2.2539525032043457, 2.4561190605163574, 2.658285617828369, 2.860452175140381, 3.0626187324523926, 3.2647852897644043, 3.466951847076416, 3.6691184043884277, 3.8712849617004395, 4.073451519012451, 4.275618076324463, 4.477784633636475, 4.679951190948486, 4.882117748260498, 5.084284782409668, 5.28645133972168, 5.488617897033691, 5.690784454345703, 5.892951011657715, 6.095117568969727, 6.297284126281738, 6.49945068359375, 6.701617240905762, 6.903783798217773, 7.105950355529785, 7.308116912841797, 7.510283470153809, 7.71245002746582, 7.914616584777832, 8.116783142089844, 8.318949699401855]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 5.0, 4.0, 7.0, 3.0, 6.0, 8.0, 15.0, 10.0, 18.0, 16.0, 23.0, 31.0, 23.0, 39.0, 23.0, 39.0, 31.0, 27.0, 25.0, 36.0, 23.0, 24.0, 33.0, 42.0, 46.0, 44.0, 45.0, 39.0, 42.0, 31.0, 22.0, 21.0, 19.0, 20.0, 22.0, 18.0, 15.0, 15.0, 14.0, 13.0, 14.0, 9.0, 8.0, 6.0, 7.0, 10.0, 7.0, 1.0, 3.0, 3.0, 2.0, 1.0], "bins": [-6.532145023345947, -6.346862316131592, -6.161579608917236, -5.976297378540039, -5.791014671325684, -5.605731964111328, -5.420449256896973, -5.235166549682617, -5.049883842468262, -4.864601135253906, -4.679318428039551, -4.494035720825195, -4.308753490447998, -4.123470783233643, -3.938188076019287, -3.7529053688049316, -3.5676229000091553, -3.3823401927948, -3.1970577239990234, -3.011775016784668, -2.8264923095703125, -2.641209602355957, -2.4559271335601807, -2.270644426345825, -2.085361957550049, -1.900079369544983, -1.7147966623306274, -1.5295140743255615, -1.344231367111206, -1.1589487791061401, -0.9736661911010742, -0.7883834838867188, -0.6031007766723633, -0.4178181290626526, -0.23253551125526428, -0.04725289344787598, 0.13802975416183472, 0.3233124017715454, 0.5085949897766113, 0.6938776969909668, 0.8791602849960327, 1.0644428730010986, 1.249725580215454, 1.43500816822052, 1.620290756225586, 1.8055734634399414, 1.9908560514450073, 2.1761388778686523, 2.3614213466644287, 2.546704053878784, 2.7319865226745605, 2.917269229888916, 3.1025519371032715, 3.287834644317627, 3.4731171131134033, 3.658399820327759, 3.843682289123535, 4.028964996337891, 4.214247703552246, 4.399530410766602, 4.584812641143799, 4.770095348358154, 4.95537805557251, 5.140660762786865, 5.325943470001221]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 8.0, 11.0, 16.0, 26.0, 44.0, 52.0, 88.0, 133.0, 218.0, 333.0, 515.0, 846.0, 1348.0, 2010.0, 3336.0, 5591.0, 9542.0, 15930.0, 28196.0, 50051.0, 92575.0, 173427.0, 336127.0, 633438.0, 941305.0, 841593.0, 494002.0, 258276.0, 135303.0, 72534.0, 40131.0, 22482.0, 13325.0, 7844.0, 4804.0, 3076.0, 1873.0, 1312.0, 824.0, 546.0, 374.0, 258.0, 170.0, 109.0, 85.0, 68.0, 36.0, 34.0, 20.0, 17.0, 9.0, 5.0, 2.0, 2.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0], "bins": [-5.03515625, -4.86029052734375, -4.6854248046875, -4.51055908203125, -4.335693359375, -4.16082763671875, -3.9859619140625, -3.81109619140625, -3.63623046875, -3.46136474609375, -3.2864990234375, -3.11163330078125, -2.936767578125, -2.76190185546875, -2.5870361328125, -2.41217041015625, -2.2373046875, -2.06243896484375, -1.8875732421875, -1.71270751953125, -1.537841796875, -1.36297607421875, -1.1881103515625, -1.01324462890625, -0.83837890625, -0.66351318359375, -0.4886474609375, -0.31378173828125, -0.138916015625, 0.03594970703125, 0.2108154296875, 0.38568115234375, 0.560546875, 0.73541259765625, 0.9102783203125, 1.08514404296875, 1.260009765625, 1.43487548828125, 1.6097412109375, 1.78460693359375, 1.95947265625, 2.13433837890625, 2.3092041015625, 2.48406982421875, 2.658935546875, 2.83380126953125, 3.0086669921875, 3.18353271484375, 3.3583984375, 3.53326416015625, 3.7081298828125, 3.88299560546875, 4.057861328125, 4.23272705078125, 4.4075927734375, 4.58245849609375, 4.75732421875, 4.93218994140625, 5.1070556640625, 5.28192138671875, 5.456787109375, 5.63165283203125, 5.8065185546875, 5.98138427734375, 6.15625]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 6.0, 2.0, 5.0, 5.0, 7.0, 15.0, 12.0, 18.0, 14.0, 17.0, 31.0, 26.0, 28.0, 33.0, 28.0, 28.0, 40.0, 37.0, 30.0, 33.0, 31.0, 41.0, 36.0, 41.0, 43.0, 46.0, 37.0, 26.0, 37.0, 35.0, 35.0, 24.0, 19.0, 12.0, 17.0, 15.0, 20.0, 18.0, 9.0, 14.0, 7.0, 6.0, 3.0, 4.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.00390625, -3.87493896484375, -3.7459716796875, -3.61700439453125, -3.488037109375, -3.35906982421875, -3.2301025390625, -3.10113525390625, -2.97216796875, -2.84320068359375, -2.7142333984375, -2.58526611328125, -2.456298828125, -2.32733154296875, -2.1983642578125, -2.06939697265625, -1.9404296875, -1.81146240234375, -1.6824951171875, -1.55352783203125, -1.424560546875, -1.29559326171875, -1.1666259765625, -1.03765869140625, -0.90869140625, -0.77972412109375, -0.6507568359375, -0.52178955078125, -0.392822265625, -0.26385498046875, -0.1348876953125, -0.00592041015625, 0.123046875, 0.25201416015625, 0.3809814453125, 0.50994873046875, 0.638916015625, 0.76788330078125, 0.8968505859375, 1.02581787109375, 1.15478515625, 1.28375244140625, 1.4127197265625, 1.54168701171875, 1.670654296875, 1.79962158203125, 1.9285888671875, 2.05755615234375, 2.1865234375, 2.31549072265625, 2.4444580078125, 2.57342529296875, 2.702392578125, 2.83135986328125, 2.9603271484375, 3.08929443359375, 3.21826171875, 3.34722900390625, 3.4761962890625, 3.60516357421875, 3.734130859375, 3.86309814453125, 3.9920654296875, 4.12103271484375, 4.25]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 6.0, 18.0, 17.0, 17.0, 33.0, 38.0, 79.0, 125.0, 189.0, 262.0, 444.0, 733.0, 1174.0, 1756.0, 3067.0, 5179.0, 9072.0, 15712.0, 28634.0, 53227.0, 98490.0, 183184.0, 332168.0, 557051.0, 779356.0, 789388.0, 572888.0, 344163.0, 190780.0, 102777.0, 54787.0, 29849.0, 16496.0, 9367.0, 5407.0, 3201.0, 1903.0, 1207.0, 741.0, 478.0, 290.0, 195.0, 119.0, 85.0, 45.0, 31.0, 21.0, 13.0, 5.0, 11.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-5.125, -4.9698486328125, -4.814697265625, -4.6595458984375, -4.50439453125, -4.3492431640625, -4.194091796875, -4.0389404296875, -3.8837890625, -3.7286376953125, -3.573486328125, -3.4183349609375, -3.26318359375, -3.1080322265625, -2.952880859375, -2.7977294921875, -2.642578125, -2.4874267578125, -2.332275390625, -2.1771240234375, -2.02197265625, -1.8668212890625, -1.711669921875, -1.5565185546875, -1.4013671875, -1.2462158203125, -1.091064453125, -0.9359130859375, -0.78076171875, -0.6256103515625, -0.470458984375, -0.3153076171875, -0.16015625, -0.0050048828125, 0.150146484375, 0.3052978515625, 0.46044921875, 0.6156005859375, 0.770751953125, 0.9259033203125, 1.0810546875, 1.2362060546875, 1.391357421875, 1.5465087890625, 1.70166015625, 1.8568115234375, 2.011962890625, 2.1671142578125, 2.322265625, 2.4774169921875, 2.632568359375, 2.7877197265625, 2.94287109375, 3.0980224609375, 3.253173828125, 3.4083251953125, 3.5634765625, 3.7186279296875, 3.873779296875, 4.0289306640625, 4.18408203125, 4.3392333984375, 4.494384765625, 4.6495361328125, 4.8046875]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 10.0, 10.0, 13.0, 25.0, 17.0, 23.0, 39.0, 51.0, 74.0, 71.0, 85.0, 91.0, 141.0, 168.0, 193.0, 205.0, 212.0, 270.0, 279.0, 262.0, 264.0, 241.0, 223.0, 212.0, 196.0, 162.0, 124.0, 88.0, 82.0, 61.0, 40.0, 34.0, 27.0, 30.0, 8.0, 13.0, 8.0, 10.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.466796875, -2.390625, -2.314453125, -2.23828125, -2.162109375, -2.0859375, -2.009765625, -1.93359375, -1.857421875, -1.78125, -1.705078125, -1.62890625, -1.552734375, -1.4765625, -1.400390625, -1.32421875, -1.248046875, -1.171875, -1.095703125, -1.01953125, -0.943359375, -0.8671875, -0.791015625, -0.71484375, -0.638671875, -0.5625, -0.486328125, -0.41015625, -0.333984375, -0.2578125, -0.181640625, -0.10546875, -0.029296875, 0.046875, 0.123046875, 0.19921875, 0.275390625, 0.3515625, 0.427734375, 0.50390625, 0.580078125, 0.65625, 0.732421875, 0.80859375, 0.884765625, 0.9609375, 1.037109375, 1.11328125, 1.189453125, 1.265625, 1.341796875, 1.41796875, 1.494140625, 1.5703125, 1.646484375, 1.72265625, 1.798828125, 1.875, 1.951171875, 2.02734375, 2.103515625, 2.1796875, 2.255859375, 2.33203125, 2.408203125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 3.0, 7.0, 9.0, 11.0, 17.0, 23.0, 19.0, 15.0, 35.0, 35.0, 67.0, 56.0, 74.0, 65.0, 85.0, 65.0, 61.0, 74.0, 60.0, 33.0, 36.0, 31.0, 30.0, 14.0, 18.0, 19.0, 12.0, 7.0, 4.0, 1.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.763651371002197, -5.570819854736328, -5.377988338470459, -5.185156345367432, -4.9923248291015625, -4.799493312835693, -4.606661796569824, -4.413829803466797, -4.220998287200928, -4.028166770935059, -3.8353350162506104, -3.642503499984741, -3.449671745300293, -3.256840229034424, -3.0640087127685547, -2.8711769580841064, -2.6783454418182373, -2.485513925552368, -2.29268217086792, -2.099850654602051, -1.9070188999176025, -1.7141873836517334, -1.5213557481765747, -1.328524112701416, -1.1356924772262573, -0.9428608417510986, -0.7500292062759399, -0.557197630405426, -0.36436599493026733, -0.17153435945510864, 0.021297216415405273, 0.21412885189056396, 0.40696048736572266, 0.5997921228408813, 0.79262375831604, 0.985455334186554, 1.1782870292663574, 1.3711185455322266, 1.5639501810073853, 1.756781816482544, 1.9496134519577026, 2.1424450874328613, 2.3352766036987305, 2.5281083583831787, 2.720939874649048, 2.913771629333496, 3.1066031455993652, 3.2994346618652344, 3.4922664165496826, 3.6850979328155518, 3.8779296875, 4.070761203765869, 4.263592720031738, 4.456424713134766, 4.649256229400635, 4.842087745666504, 5.034919261932373, 5.227750778198242, 5.420582294464111, 5.613414287567139, 5.806245803833008, 5.999077320098877, 6.191908836364746, 6.384740829467773, 6.577572345733643]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 6.0, 7.0, 8.0, 10.0, 10.0, 12.0, 11.0, 14.0, 20.0, 21.0, 19.0, 30.0, 30.0, 33.0, 35.0, 31.0, 30.0, 38.0, 26.0, 45.0, 45.0, 53.0, 50.0, 45.0, 32.0, 21.0, 35.0, 30.0, 25.0, 29.0, 26.0, 27.0, 18.0, 16.0, 17.0, 22.0, 12.0, 13.0, 14.0, 14.0, 5.0, 4.0, 7.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.758407115936279, -5.580372333526611, -5.402337074279785, -5.224302291870117, -5.046267509460449, -4.868232727050781, -4.690197467803955, -4.512162685394287, -4.334127426147461, -4.156092643737793, -3.978057622909546, -3.800022602081299, -3.621987819671631, -3.443952798843384, -3.2659177780151367, -3.0878829956054688, -2.909848213195801, -2.7318131923675537, -2.5537784099578857, -2.3757433891296387, -2.1977086067199707, -2.0196735858917236, -1.8416385650634766, -1.663603663444519, -1.4855687618255615, -1.307533860206604, -1.1294989585876465, -0.9514639377593994, -0.7734290361404419, -0.5953941345214844, -0.4173591136932373, -0.23932421207427979, -0.06128883361816406, 0.11674609780311584, 0.29478102922439575, 0.47281599044799805, 0.6508508920669556, 0.8288857936859131, 1.0069208145141602, 1.1849557161331177, 1.3629906177520752, 1.5410255193710327, 1.7190604209899902, 1.8970954418182373, 2.0751304626464844, 2.2531652450561523, 2.4312002658843994, 2.6092352867126465, 2.7872700691223145, 2.9653050899505615, 3.1433398723602295, 3.3213748931884766, 3.4994096755981445, 3.6774446964263916, 3.8554797172546387, 4.033514499664307, 4.211549758911133, 4.389584541320801, 4.567619800567627, 4.745654582977295, 4.923689365386963, 5.101724624633789, 5.279759407043457, 5.457794189453125, 5.635828971862793]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 5.0, 1.0, 5.0, 11.0, 17.0, 28.0, 35.0, 63.0, 93.0, 152.0, 203.0, 315.0, 492.0, 767.0, 1171.0, 1821.0, 2879.0, 4502.0, 7051.0, 11310.0, 18438.0, 30720.0, 52504.0, 93233.0, 161933.0, 233094.0, 178219.0, 103187.0, 58389.0, 33703.0, 20495.0, 12301.0, 7873.0, 4969.0, 3152.0, 1948.0, 1239.0, 786.0, 507.0, 302.0, 215.0, 143.0, 97.0, 52.0, 44.0, 25.0, 16.0, 15.0, 14.0, 9.0, 8.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0], "bins": [-1.8515625, -1.7947540283203125, -1.737945556640625, -1.6811370849609375, -1.62432861328125, -1.5675201416015625, -1.510711669921875, -1.4539031982421875, -1.3970947265625, -1.3402862548828125, -1.283477783203125, -1.2266693115234375, -1.16986083984375, -1.1130523681640625, -1.056243896484375, -0.9994354248046875, -0.942626953125, -0.8858184814453125, -0.829010009765625, -0.7722015380859375, -0.71539306640625, -0.6585845947265625, -0.601776123046875, -0.5449676513671875, -0.4881591796875, -0.4313507080078125, -0.374542236328125, -0.3177337646484375, -0.26092529296875, -0.2041168212890625, -0.147308349609375, -0.0904998779296875, -0.03369140625, 0.0231170654296875, 0.079925537109375, 0.1367340087890625, 0.19354248046875, 0.2503509521484375, 0.307159423828125, 0.3639678955078125, 0.4207763671875, 0.4775848388671875, 0.534393310546875, 0.5912017822265625, 0.64801025390625, 0.7048187255859375, 0.761627197265625, 0.8184356689453125, 0.875244140625, 0.9320526123046875, 0.988861083984375, 1.0456695556640625, 1.10247802734375, 1.1592864990234375, 1.216094970703125, 1.2729034423828125, 1.3297119140625, 1.3865203857421875, 1.443328857421875, 1.5001373291015625, 1.55694580078125, 1.6137542724609375, 1.670562744140625, 1.7273712158203125, 1.7841796875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 5.0, 8.0, 13.0, 12.0, 9.0, 14.0, 18.0, 20.0, 21.0, 19.0, 25.0, 33.0, 34.0, 40.0, 39.0, 41.0, 36.0, 49.0, 33.0, 49.0, 54.0, 40.0, 37.0, 29.0, 32.0, 32.0, 29.0, 26.0, 17.0, 24.0, 25.0, 21.0, 25.0, 21.0, 13.0, 11.0, 12.0, 10.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.03515625, -5.848876953125, -5.66259765625, -5.476318359375, -5.2900390625, -5.103759765625, -4.91748046875, -4.731201171875, -4.544921875, -4.358642578125, -4.17236328125, -3.986083984375, -3.7998046875, -3.613525390625, -3.42724609375, -3.240966796875, -3.0546875, -2.868408203125, -2.68212890625, -2.495849609375, -2.3095703125, -2.123291015625, -1.93701171875, -1.750732421875, -1.564453125, -1.378173828125, -1.19189453125, -1.005615234375, -0.8193359375, -0.633056640625, -0.44677734375, -0.260498046875, -0.07421875, 0.112060546875, 0.29833984375, 0.484619140625, 0.6708984375, 0.857177734375, 1.04345703125, 1.229736328125, 1.416015625, 1.602294921875, 1.78857421875, 1.974853515625, 2.1611328125, 2.347412109375, 2.53369140625, 2.719970703125, 2.90625, 3.092529296875, 3.27880859375, 3.465087890625, 3.6513671875, 3.837646484375, 4.02392578125, 4.210205078125, 4.396484375, 4.582763671875, 4.76904296875, 4.955322265625, 5.1416015625, 5.327880859375, 5.51416015625, 5.700439453125, 5.88671875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 9.0, 10.0, 6.0, 12.0, 12.0, 28.0, 42.0, 51.0, 60.0, 74.0, 122.0, 197.0, 288.0, 386.0, 629.0, 1095.0, 2225.0, 4994.0, 14813.0, 64038.0, 919618.0, 25518.0, 7619.0, 2939.0, 1490.0, 781.0, 523.0, 282.0, 203.0, 149.0, 91.0, 63.0, 56.0, 43.0, 23.0, 24.0, 12.0, 14.0, 10.0, 8.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.953125, -6.72296142578125, -6.4927978515625, -6.26263427734375, -6.032470703125, -5.80230712890625, -5.5721435546875, -5.34197998046875, -5.11181640625, -4.88165283203125, -4.6514892578125, -4.42132568359375, -4.191162109375, -3.96099853515625, -3.7308349609375, -3.50067138671875, -3.2705078125, -3.04034423828125, -2.8101806640625, -2.58001708984375, -2.349853515625, -2.11968994140625, -1.8895263671875, -1.65936279296875, -1.42919921875, -1.19903564453125, -0.9688720703125, -0.73870849609375, -0.508544921875, -0.27838134765625, -0.0482177734375, 0.18194580078125, 0.412109375, 0.64227294921875, 0.8724365234375, 1.10260009765625, 1.332763671875, 1.56292724609375, 1.7930908203125, 2.02325439453125, 2.25341796875, 2.48358154296875, 2.7137451171875, 2.94390869140625, 3.174072265625, 3.40423583984375, 3.6343994140625, 3.86456298828125, 4.0947265625, 4.32489013671875, 4.5550537109375, 4.78521728515625, 5.015380859375, 5.24554443359375, 5.4757080078125, 5.70587158203125, 5.93603515625, 6.16619873046875, 6.3963623046875, 6.62652587890625, 6.856689453125, 7.08685302734375, 7.3170166015625, 7.54718017578125, 7.77734375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 5.0, 14.0, 10.0, 12.0, 19.0, 16.0, 17.0, 25.0, 20.0, 37.0, 42.0, 34.0, 37.0, 42.0, 45.0, 55.0, 36.0, 59.0, 48.0, 46.0, 26.0, 34.0, 33.0, 46.0, 29.0, 30.0, 27.0, 27.0, 22.0, 18.0, 16.0, 9.0, 11.0, 10.0, 2.0, 6.0, 1.0, 6.0, 5.0, 4.0, 3.0, 4.0, 1.0, 3.0], "bins": [-5.234375, -5.094329833984375, -4.95428466796875, -4.814239501953125, -4.6741943359375, -4.534149169921875, -4.39410400390625, -4.254058837890625, -4.114013671875, -3.973968505859375, -3.83392333984375, -3.693878173828125, -3.5538330078125, -3.413787841796875, -3.27374267578125, -3.133697509765625, -2.99365234375, -2.853607177734375, -2.71356201171875, -2.573516845703125, -2.4334716796875, -2.293426513671875, -2.15338134765625, -2.013336181640625, -1.873291015625, -1.733245849609375, -1.59320068359375, -1.453155517578125, -1.3131103515625, -1.173065185546875, -1.03302001953125, -0.892974853515625, -0.7529296875, -0.612884521484375, -0.47283935546875, -0.332794189453125, -0.1927490234375, -0.052703857421875, 0.08734130859375, 0.227386474609375, 0.367431640625, 0.507476806640625, 0.64752197265625, 0.787567138671875, 0.9276123046875, 1.067657470703125, 1.20770263671875, 1.347747802734375, 1.48779296875, 1.627838134765625, 1.76788330078125, 1.907928466796875, 2.0479736328125, 2.188018798828125, 2.32806396484375, 2.468109130859375, 2.608154296875, 2.748199462890625, 2.88824462890625, 3.028289794921875, 3.1683349609375, 3.308380126953125, 3.44842529296875, 3.588470458984375, 3.728515625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 7.0, 11.0, 19.0, 22.0, 55.0, 45.0, 85.0, 108.0, 164.0, 290.0, 449.0, 867.0, 1561.0, 3417.0, 9113.0, 37865.0, 953090.0, 27688.0, 7463.0, 2932.0, 1355.0, 736.0, 448.0, 260.0, 152.0, 108.0, 66.0, 48.0, 29.0, 22.0, 22.0, 17.0, 9.0, 3.0, 6.0, 3.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.724609375, -0.7007827758789062, -0.6769561767578125, -0.6531295776367188, -0.629302978515625, -0.6054763793945312, -0.5816497802734375, -0.5578231811523438, -0.53399658203125, -0.5101699829101562, -0.4863433837890625, -0.46251678466796875, -0.438690185546875, -0.41486358642578125, -0.3910369873046875, -0.36721038818359375, -0.3433837890625, -0.31955718994140625, -0.2957305908203125, -0.27190399169921875, -0.248077392578125, -0.22425079345703125, -0.2004241943359375, -0.17659759521484375, -0.15277099609375, -0.12894439697265625, -0.1051177978515625, -0.08129119873046875, -0.057464599609375, -0.03363800048828125, -0.0098114013671875, 0.01401519775390625, 0.037841796875, 0.06166839599609375, 0.0854949951171875, 0.10932159423828125, 0.133148193359375, 0.15697479248046875, 0.1808013916015625, 0.20462799072265625, 0.22845458984375, 0.25228118896484375, 0.2761077880859375, 0.29993438720703125, 0.323760986328125, 0.34758758544921875, 0.3714141845703125, 0.39524078369140625, 0.4190673828125, 0.44289398193359375, 0.4667205810546875, 0.49054718017578125, 0.514373779296875, 0.5382003784179688, 0.5620269775390625, 0.5858535766601562, 0.60968017578125, 0.6335067749023438, 0.6573333740234375, 0.6811599731445312, 0.704986572265625, 0.7288131713867188, 0.7526397705078125, 0.7764663696289062, 0.80029296875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 8.0, 8.0, 4.0, 9.0, 12.0, 18.0, 15.0, 11.0, 33.0, 26.0, 27.0, 32.0, 46.0, 45.0, 51.0, 51.0, 55.0, 66.0, 44.0, 51.0, 50.0, 33.0, 41.0, 37.0, 30.0, 29.0, 24.0, 23.0, 22.0, 17.0, 14.0, 15.0, 10.0, 8.0, 6.0, 7.0, 7.0, 4.0, 0.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.74913215637207e-05, -3.634113818407059e-05, -3.519095480442047e-05, -3.4040771424770355e-05, -3.289058804512024e-05, -3.174040466547012e-05, -3.059022128582001e-05, -2.944003790616989e-05, -2.8289854526519775e-05, -2.713967114686966e-05, -2.5989487767219543e-05, -2.4839304387569427e-05, -2.368912100791931e-05, -2.2538937628269196e-05, -2.138875424861908e-05, -2.0238570868968964e-05, -1.9088387489318848e-05, -1.793820410966873e-05, -1.6788020730018616e-05, -1.56378373503685e-05, -1.4487653970718384e-05, -1.3337470591068268e-05, -1.2187287211418152e-05, -1.1037103831768036e-05, -9.88692045211792e-06, -8.736737072467804e-06, -7.586553692817688e-06, -6.436370313167572e-06, -5.286186933517456e-06, -4.13600355386734e-06, -2.985820174217224e-06, -1.8356367945671082e-06, -6.854534149169922e-07, 4.647299647331238e-07, 1.6149133443832397e-06, 2.7650967240333557e-06, 3.915280103683472e-06, 5.065463483333588e-06, 6.215646862983704e-06, 7.36583024263382e-06, 8.516013622283936e-06, 9.666197001934052e-06, 1.0816380381584167e-05, 1.1966563761234283e-05, 1.31167471408844e-05, 1.4266930520534515e-05, 1.541711390018463e-05, 1.6567297279834747e-05, 1.7717480659484863e-05, 1.886766403913498e-05, 2.0017847418785095e-05, 2.116803079843521e-05, 2.2318214178085327e-05, 2.3468397557735443e-05, 2.461858093738556e-05, 2.5768764317035675e-05, 2.691894769668579e-05, 2.8069131076335907e-05, 2.9219314455986023e-05, 3.036949783563614e-05, 3.1519681215286255e-05, 3.266986459493637e-05, 3.382004797458649e-05, 3.49702313542366e-05, 3.612041473388672e-05]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 8.0, 9.0, 15.0, 11.0, 22.0, 20.0, 48.0, 58.0, 112.0, 121.0, 195.0, 255.0, 422.0, 650.0, 1067.0, 1682.0, 2780.0, 4666.0, 7925.0, 14429.0, 26801.0, 53625.0, 115044.0, 267700.0, 294778.0, 129738.0, 59480.0, 29590.0, 15678.0, 8676.0, 4986.0, 2989.0, 1790.0, 1120.0, 708.0, 464.0, 303.0, 203.0, 119.0, 86.0, 53.0, 47.0, 25.0, 22.0, 11.0, 13.0, 4.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2208251953125, -0.21393966674804688, -0.20705413818359375, -0.20016860961914062, -0.1932830810546875, -0.18639755249023438, -0.17951202392578125, -0.17262649536132812, -0.165740966796875, -0.15885543823242188, -0.15196990966796875, -0.14508438110351562, -0.1381988525390625, -0.13131332397460938, -0.12442779541015625, -0.11754226684570312, -0.11065673828125, -0.10377120971679688, -0.09688568115234375, -0.09000015258789062, -0.0831146240234375, -0.07622909545898438, -0.06934356689453125, -0.062458038330078125, -0.055572509765625, -0.048686981201171875, -0.04180145263671875, -0.034915924072265625, -0.0280303955078125, -0.021144866943359375, -0.01425933837890625, -0.007373809814453125, -0.00048828125, 0.006397247314453125, 0.01328277587890625, 0.020168304443359375, 0.0270538330078125, 0.033939361572265625, 0.04082489013671875, 0.047710418701171875, 0.054595947265625, 0.061481475830078125, 0.06836700439453125, 0.07525253295898438, 0.0821380615234375, 0.08902359008789062, 0.09590911865234375, 0.10279464721679688, 0.10968017578125, 0.11656570434570312, 0.12345123291015625, 0.13033676147460938, 0.1372222900390625, 0.14410781860351562, 0.15099334716796875, 0.15787887573242188, 0.164764404296875, 0.17164993286132812, 0.17853546142578125, 0.18542098999023438, 0.1923065185546875, 0.19919204711914062, 0.20607757568359375, 0.21296310424804688, 0.2198486328125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 5.0, 3.0, 3.0, 4.0, 5.0, 8.0, 4.0, 10.0, 9.0, 13.0, 13.0, 13.0, 22.0, 22.0, 36.0, 31.0, 39.0, 28.0, 59.0, 42.0, 55.0, 60.0, 63.0, 61.0, 45.0, 59.0, 34.0, 37.0, 30.0, 26.0, 22.0, 18.0, 22.0, 26.0, 12.0, 20.0, 13.0, 5.0, 5.0, 4.0, 4.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.058990478515625, -0.057211875915527344, -0.05543327331542969, -0.05365467071533203, -0.051876068115234375, -0.05009746551513672, -0.04831886291503906, -0.046540260314941406, -0.04476165771484375, -0.042983055114746094, -0.04120445251464844, -0.03942584991455078, -0.037647247314453125, -0.03586864471435547, -0.03409004211425781, -0.032311439514160156, -0.0305328369140625, -0.028754234313964844, -0.026975631713867188, -0.02519702911376953, -0.023418426513671875, -0.02163982391357422, -0.019861221313476562, -0.018082618713378906, -0.01630401611328125, -0.014525413513183594, -0.012746810913085938, -0.010968208312988281, -0.009189605712890625, -0.007411003112792969, -0.0056324005126953125, -0.0038537979125976562, -0.0020751953125, -0.00029659271240234375, 0.0014820098876953125, 0.0032606124877929688, 0.005039215087890625, 0.006817817687988281, 0.008596420288085938, 0.010375022888183594, 0.01215362548828125, 0.013932228088378906, 0.015710830688476562, 0.01748943328857422, 0.019268035888671875, 0.02104663848876953, 0.022825241088867188, 0.024603843688964844, 0.0263824462890625, 0.028161048889160156, 0.029939651489257812, 0.03171825408935547, 0.033496856689453125, 0.03527545928955078, 0.03705406188964844, 0.038832664489746094, 0.04061126708984375, 0.042389869689941406, 0.04416847229003906, 0.04594707489013672, 0.047725677490234375, 0.04950428009033203, 0.05128288269042969, 0.053061485290527344, 0.054840087890625]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 8.0, 8.0, 6.0, 15.0, 19.0, 18.0, 23.0, 30.0, 34.0, 52.0, 64.0, 62.0, 77.0, 73.0, 72.0, 66.0, 70.0, 59.0, 45.0, 31.0, 39.0, 29.0, 23.0, 18.0, 15.0, 18.0, 6.0, 4.0, 4.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.635566234588623, -5.442609786987305, -5.249653339385986, -5.056696891784668, -4.86374044418335, -4.670783996582031, -4.477827548980713, -4.2848711013793945, -4.091914653778076, -3.898958206176758, -3.7060017585754395, -3.513045310974121, -3.3200888633728027, -3.1271324157714844, -2.934175968170166, -2.7412195205688477, -2.5482630729675293, -2.355306625366211, -2.1623501777648926, -1.9693937301635742, -1.7764372825622559, -1.5834808349609375, -1.3905243873596191, -1.1975679397583008, -1.0046114921569824, -0.8116550445556641, -0.6186985969543457, -0.42574214935302734, -0.23278570175170898, -0.039829254150390625, 0.15312719345092773, 0.3460836410522461, 0.5390396118164062, 0.7319960594177246, 0.924952507019043, 1.1179089546203613, 1.3108654022216797, 1.503821849822998, 1.6967782974243164, 1.8897347450256348, 2.082691192626953, 2.2756476402282715, 2.46860408782959, 2.661560535430908, 2.8545169830322266, 3.047473430633545, 3.2404298782348633, 3.4333863258361816, 3.6263427734375, 3.8192992210388184, 4.012255668640137, 4.205212116241455, 4.398168563842773, 4.591125011444092, 4.78408145904541, 4.9770379066467285, 5.169994354248047, 5.362950801849365, 5.555907249450684, 5.748863697052002, 5.94182014465332, 6.134776592254639, 6.327733039855957, 6.520689487457275, 6.713645935058594]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 7.0, 6.0, 8.0, 10.0, 9.0, 14.0, 10.0, 17.0, 19.0, 21.0, 17.0, 35.0, 28.0, 35.0, 27.0, 35.0, 33.0, 36.0, 27.0, 42.0, 48.0, 58.0, 48.0, 43.0, 28.0, 24.0, 32.0, 35.0, 21.0, 35.0, 22.0, 26.0, 17.0, 15.0, 18.0, 23.0, 13.0, 11.0, 13.0, 15.0, 4.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-5.685703277587891, -5.509519577026367, -5.333336353302002, -5.1571526527404785, -4.980969429016113, -4.80478572845459, -4.628602027893066, -4.452418804168701, -4.276235103607178, -4.100051403045654, -3.923868179321289, -3.7476844787597656, -3.5715010166168213, -3.395317554473877, -3.2191340923309326, -3.0429506301879883, -2.866767168045044, -2.6905837059020996, -2.5144002437591553, -2.338216781616211, -2.1620330810546875, -1.9858496189117432, -1.8096661567687988, -1.633482575416565, -1.4572991132736206, -1.2811156511306763, -1.1049320697784424, -0.928748607635498, -0.7525650858879089, -0.5763815641403198, -0.4001981019973755, -0.2240145206451416, -0.047831058502197266, 0.12835244834423065, 0.30453595519065857, 0.4807194471359253, 0.6569029688835144, 0.8330864906311035, 1.0092699527740479, 1.1854535341262817, 1.361636996269226, 1.5378204584121704, 1.7140040397644043, 1.8901875019073486, 2.066370964050293, 2.2425546646118164, 2.4187378883361816, 2.594921588897705, 2.7711050510406494, 2.9472885131835938, 3.123471975326538, 3.2996554374694824, 3.475839138031006, 3.65202260017395, 3.8282060623168945, 4.004389762878418, 4.180572986602783, 4.356756687164307, 4.532939910888672, 4.709123611450195, 4.8853068351745605, 5.061490535736084, 5.237673759460449, 5.413857460021973, 5.590041160583496]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 9.0, 7.0, 14.0, 31.0, 36.0, 71.0, 122.0, 179.0, 255.0, 419.0, 708.0, 1188.0, 1977.0, 3461.0, 6273.0, 11298.0, 20277.0, 37147.0, 66070.0, 112219.0, 168812.0, 196430.0, 166242.0, 109891.0, 64480.0, 35875.0, 20060.0, 10678.0, 6056.0, 3442.0, 1969.0, 1106.0, 632.0, 396.0, 268.0, 168.0, 90.0, 66.0, 41.0, 29.0, 19.0, 14.0, 10.0, 6.0, 3.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4453125, -5.25408935546875, -5.0628662109375, -4.87164306640625, -4.680419921875, -4.48919677734375, -4.2979736328125, -4.10675048828125, -3.91552734375, -3.72430419921875, -3.5330810546875, -3.34185791015625, -3.150634765625, -2.95941162109375, -2.7681884765625, -2.57696533203125, -2.3857421875, -2.19451904296875, -2.0032958984375, -1.81207275390625, -1.620849609375, -1.42962646484375, -1.2384033203125, -1.04718017578125, -0.85595703125, -0.66473388671875, -0.4735107421875, -0.28228759765625, -0.091064453125, 0.10015869140625, 0.2913818359375, 0.48260498046875, 0.673828125, 0.86505126953125, 1.0562744140625, 1.24749755859375, 1.438720703125, 1.62994384765625, 1.8211669921875, 2.01239013671875, 2.20361328125, 2.39483642578125, 2.5860595703125, 2.77728271484375, 2.968505859375, 3.15972900390625, 3.3509521484375, 3.54217529296875, 3.7333984375, 3.92462158203125, 4.1158447265625, 4.30706787109375, 4.498291015625, 4.68951416015625, 4.8807373046875, 5.07196044921875, 5.26318359375, 5.45440673828125, 5.6456298828125, 5.83685302734375, 6.028076171875, 6.21929931640625, 6.4105224609375, 6.60174560546875, 6.79296875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 7.0, 6.0, 4.0, 4.0, 8.0, 6.0, 6.0, 15.0, 18.0, 16.0, 20.0, 22.0, 27.0, 30.0, 34.0, 32.0, 37.0, 33.0, 52.0, 27.0, 32.0, 51.0, 45.0, 47.0, 37.0, 34.0, 41.0, 32.0, 28.0, 30.0, 31.0, 20.0, 22.0, 22.0, 18.0, 18.0, 21.0, 14.0, 13.0, 16.0, 4.0, 7.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-5.68359375, -5.50848388671875, -5.3333740234375, -5.15826416015625, -4.983154296875, -4.80804443359375, -4.6329345703125, -4.45782470703125, -4.28271484375, -4.10760498046875, -3.9324951171875, -3.75738525390625, -3.582275390625, -3.40716552734375, -3.2320556640625, -3.05694580078125, -2.8818359375, -2.70672607421875, -2.5316162109375, -2.35650634765625, -2.181396484375, -2.00628662109375, -1.8311767578125, -1.65606689453125, -1.48095703125, -1.30584716796875, -1.1307373046875, -0.95562744140625, -0.780517578125, -0.60540771484375, -0.4302978515625, -0.25518798828125, -0.080078125, 0.09503173828125, 0.2701416015625, 0.44525146484375, 0.620361328125, 0.79547119140625, 0.9705810546875, 1.14569091796875, 1.32080078125, 1.49591064453125, 1.6710205078125, 1.84613037109375, 2.021240234375, 2.19635009765625, 2.3714599609375, 2.54656982421875, 2.7216796875, 2.89678955078125, 3.0718994140625, 3.24700927734375, 3.422119140625, 3.59722900390625, 3.7723388671875, 3.94744873046875, 4.12255859375, 4.29766845703125, 4.4727783203125, 4.64788818359375, 4.822998046875, 4.99810791015625, 5.1732177734375, 5.34832763671875, 5.5234375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 7.0, 15.0, 21.0, 23.0, 37.0, 63.0, 87.0, 150.0, 260.0, 352.0, 587.0, 981.0, 1576.0, 2523.0, 4156.0, 7007.0, 11609.0, 19166.0, 31613.0, 52045.0, 82590.0, 121891.0, 155677.0, 163658.0, 136025.0, 96389.0, 62493.0, 38535.0, 23312.0, 14075.0, 8474.0, 5157.0, 3007.0, 1845.0, 1159.0, 758.0, 442.0, 291.0, 159.0, 123.0, 76.0, 52.0, 36.0, 19.0, 14.0, 9.0, 7.0, 4.0, 6.0, 2.0, 0.0, 1.0], "bins": [-5.40625, -5.25262451171875, -5.0989990234375, -4.94537353515625, -4.791748046875, -4.63812255859375, -4.4844970703125, -4.33087158203125, -4.17724609375, -4.02362060546875, -3.8699951171875, -3.71636962890625, -3.562744140625, -3.40911865234375, -3.2554931640625, -3.10186767578125, -2.9482421875, -2.79461669921875, -2.6409912109375, -2.48736572265625, -2.333740234375, -2.18011474609375, -2.0264892578125, -1.87286376953125, -1.71923828125, -1.56561279296875, -1.4119873046875, -1.25836181640625, -1.104736328125, -0.95111083984375, -0.7974853515625, -0.64385986328125, -0.490234375, -0.33660888671875, -0.1829833984375, -0.02935791015625, 0.124267578125, 0.27789306640625, 0.4315185546875, 0.58514404296875, 0.73876953125, 0.89239501953125, 1.0460205078125, 1.19964599609375, 1.353271484375, 1.50689697265625, 1.6605224609375, 1.81414794921875, 1.9677734375, 2.12139892578125, 2.2750244140625, 2.42864990234375, 2.582275390625, 2.73590087890625, 2.8895263671875, 3.04315185546875, 3.19677734375, 3.35040283203125, 3.5040283203125, 3.65765380859375, 3.811279296875, 3.96490478515625, 4.1185302734375, 4.27215576171875, 4.42578125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 5.0, 5.0, 7.0, 7.0, 8.0, 3.0, 8.0, 16.0, 12.0, 17.0, 17.0, 33.0, 11.0, 34.0, 32.0, 36.0, 32.0, 31.0, 40.0, 36.0, 37.0, 37.0, 40.0, 37.0, 33.0, 41.0, 42.0, 42.0, 35.0, 22.0, 35.0, 31.0, 22.0, 30.0, 13.0, 19.0, 19.0, 10.0, 8.0, 18.0, 10.0, 6.0, 12.0, 4.0, 1.0, 3.0, 4.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.13671875, -3.034027099609375, -2.93133544921875, -2.828643798828125, -2.7259521484375, -2.623260498046875, -2.52056884765625, -2.417877197265625, -2.315185546875, -2.212493896484375, -2.10980224609375, -2.007110595703125, -1.9044189453125, -1.801727294921875, -1.69903564453125, -1.596343994140625, -1.49365234375, -1.390960693359375, -1.28826904296875, -1.185577392578125, -1.0828857421875, -0.980194091796875, -0.87750244140625, -0.774810791015625, -0.672119140625, -0.569427490234375, -0.46673583984375, -0.364044189453125, -0.2613525390625, -0.158660888671875, -0.05596923828125, 0.046722412109375, 0.1494140625, 0.252105712890625, 0.35479736328125, 0.457489013671875, 0.5601806640625, 0.662872314453125, 0.76556396484375, 0.868255615234375, 0.970947265625, 1.073638916015625, 1.17633056640625, 1.279022216796875, 1.3817138671875, 1.484405517578125, 1.58709716796875, 1.689788818359375, 1.79248046875, 1.895172119140625, 1.99786376953125, 2.100555419921875, 2.2032470703125, 2.305938720703125, 2.40863037109375, 2.511322021484375, 2.614013671875, 2.716705322265625, 2.81939697265625, 2.922088623046875, 3.0247802734375, 3.127471923828125, 3.23016357421875, 3.332855224609375, 3.435546875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 7.0, 5.0, 7.0, 13.0, 17.0, 20.0, 28.0, 41.0, 69.0, 100.0, 160.0, 257.0, 399.0, 638.0, 1103.0, 1816.0, 2979.0, 5301.0, 9360.0, 17483.0, 32549.0, 62478.0, 116713.0, 193874.0, 229331.0, 168509.0, 95312.0, 50633.0, 26593.0, 14051.0, 7788.0, 4350.0, 2543.0, 1547.0, 878.0, 570.0, 362.0, 215.0, 152.0, 96.0, 55.0, 58.0, 33.0, 13.0, 12.0, 10.0, 6.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-2.16796875, -2.098785400390625, -2.02960205078125, -1.960418701171875, -1.8912353515625, -1.822052001953125, -1.75286865234375, -1.683685302734375, -1.614501953125, -1.545318603515625, -1.47613525390625, -1.406951904296875, -1.3377685546875, -1.268585205078125, -1.19940185546875, -1.130218505859375, -1.06103515625, -0.991851806640625, -0.92266845703125, -0.853485107421875, -0.7843017578125, -0.715118408203125, -0.64593505859375, -0.576751708984375, -0.507568359375, -0.438385009765625, -0.36920166015625, -0.300018310546875, -0.2308349609375, -0.161651611328125, -0.09246826171875, -0.023284912109375, 0.0458984375, 0.115081787109375, 0.18426513671875, 0.253448486328125, 0.3226318359375, 0.391815185546875, 0.46099853515625, 0.530181884765625, 0.599365234375, 0.668548583984375, 0.73773193359375, 0.806915283203125, 0.8760986328125, 0.945281982421875, 1.01446533203125, 1.083648681640625, 1.15283203125, 1.222015380859375, 1.29119873046875, 1.360382080078125, 1.4295654296875, 1.498748779296875, 1.56793212890625, 1.637115478515625, 1.706298828125, 1.775482177734375, 1.84466552734375, 1.913848876953125, 1.9830322265625, 2.052215576171875, 2.12139892578125, 2.190582275390625, 2.259765625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 5.0, 21.0, 28.0, 17.0, 38.0, 30.0, 47.0, 62.0, 57.0, 86.0, 89.0, 96.0, 79.0, 73.0, 77.0, 50.0, 31.0, 28.0, 26.0, 14.0, 14.0, 8.0, 8.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014519691467285156, -0.0001389123499393463, -0.00013262778520584106, -0.00012634322047233582, -0.00012005865573883057, -0.00011377409100532532, -0.00010748952627182007, -0.00010120496153831482, -9.492039680480957e-05, -8.863583207130432e-05, -8.235126733779907e-05, -7.606670260429382e-05, -6.978213787078857e-05, -6.349757313728333e-05, -5.7213008403778076e-05, -5.092844367027283e-05, -4.464387893676758e-05, -3.835931420326233e-05, -3.207474946975708e-05, -2.579018473625183e-05, -1.9505620002746582e-05, -1.3221055269241333e-05, -6.936490535736084e-06, -6.51925802230835e-07, 5.632638931274414e-06, 1.1917203664779663e-05, 1.8201768398284912e-05, 2.448633313179016e-05, 3.077089786529541e-05, 3.705546259880066e-05, 4.334002733230591e-05, 4.962459206581116e-05, 5.5909156799316406e-05, 6.219372153282166e-05, 6.84782862663269e-05, 7.476285099983215e-05, 8.10474157333374e-05, 8.733198046684265e-05, 9.36165452003479e-05, 9.990110993385315e-05, 0.0001061856746673584, 0.00011247023940086365, 0.0001187548041343689, 0.00012503936886787415, 0.0001313239336013794, 0.00013760849833488464, 0.0001438930630683899, 0.00015017762780189514, 0.0001564621925354004, 0.00016274675726890564, 0.0001690313220024109, 0.00017531588673591614, 0.0001816004514694214, 0.00018788501620292664, 0.00019416958093643188, 0.00020045414566993713, 0.00020673871040344238, 0.00021302327513694763, 0.00021930783987045288, 0.00022559240460395813, 0.00023187696933746338, 0.00023816153407096863, 0.0002444460988044739, 0.0002507306635379791, 0.0002570152282714844]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 3.0, 17.0, 8.0, 11.0, 11.0, 20.0, 29.0, 46.0, 52.0, 89.0, 133.0, 214.0, 345.0, 651.0, 1235.0, 2532.0, 5114.0, 11445.0, 27362.0, 69901.0, 176917.0, 322729.0, 249614.0, 107372.0, 41267.0, 16861.0, 7314.0, 3347.0, 1729.0, 869.0, 524.0, 260.0, 165.0, 105.0, 70.0, 50.0, 49.0, 19.0, 18.0, 13.0, 8.0, 13.0, 5.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.353515625, -3.25103759765625, -3.1485595703125, -3.04608154296875, -2.943603515625, -2.84112548828125, -2.7386474609375, -2.63616943359375, -2.53369140625, -2.43121337890625, -2.3287353515625, -2.22625732421875, -2.123779296875, -2.02130126953125, -1.9188232421875, -1.81634521484375, -1.7138671875, -1.61138916015625, -1.5089111328125, -1.40643310546875, -1.303955078125, -1.20147705078125, -1.0989990234375, -0.99652099609375, -0.89404296875, -0.79156494140625, -0.6890869140625, -0.58660888671875, -0.484130859375, -0.38165283203125, -0.2791748046875, -0.17669677734375, -0.07421875, 0.02825927734375, 0.1307373046875, 0.23321533203125, 0.335693359375, 0.43817138671875, 0.5406494140625, 0.64312744140625, 0.74560546875, 0.84808349609375, 0.9505615234375, 1.05303955078125, 1.155517578125, 1.25799560546875, 1.3604736328125, 1.46295166015625, 1.5654296875, 1.66790771484375, 1.7703857421875, 1.87286376953125, 1.975341796875, 2.07781982421875, 2.1802978515625, 2.28277587890625, 2.38525390625, 2.48773193359375, 2.5902099609375, 2.69268798828125, 2.795166015625, 2.89764404296875, 3.0001220703125, 3.10260009765625, 3.205078125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 8.0, 7.0, 5.0, 1.0, 7.0, 10.0, 7.0, 13.0, 17.0, 17.0, 27.0, 20.0, 31.0, 34.0, 50.0, 53.0, 46.0, 56.0, 53.0, 52.0, 46.0, 48.0, 64.0, 52.0, 48.0, 48.0, 30.0, 26.0, 21.0, 14.0, 17.0, 11.0, 12.0, 13.0, 10.0, 7.0, 3.0, 6.0, 1.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7998046875, -0.7763748168945312, -0.7529449462890625, -0.7295150756835938, -0.706085205078125, -0.6826553344726562, -0.6592254638671875, -0.6357955932617188, -0.61236572265625, -0.5889358520507812, -0.5655059814453125, -0.5420761108398438, -0.518646240234375, -0.49521636962890625, -0.4717864990234375, -0.44835662841796875, -0.4249267578125, -0.40149688720703125, -0.3780670166015625, -0.35463714599609375, -0.331207275390625, -0.30777740478515625, -0.2843475341796875, -0.26091766357421875, -0.23748779296875, -0.21405792236328125, -0.1906280517578125, -0.16719818115234375, -0.143768310546875, -0.12033843994140625, -0.0969085693359375, -0.07347869873046875, -0.050048828125, -0.02661895751953125, -0.0031890869140625, 0.02024078369140625, 0.043670654296875, 0.06710052490234375, 0.0905303955078125, 0.11396026611328125, 0.13739013671875, 0.16082000732421875, 0.1842498779296875, 0.20767974853515625, 0.231109619140625, 0.25453948974609375, 0.2779693603515625, 0.30139923095703125, 0.3248291015625, 0.34825897216796875, 0.3716888427734375, 0.39511871337890625, 0.418548583984375, 0.44197845458984375, 0.4654083251953125, 0.48883819580078125, 0.51226806640625, 0.5356979370117188, 0.5591278076171875, 0.5825576782226562, 0.605987548828125, 0.6294174194335938, 0.6528472900390625, 0.6762771606445312, 0.69970703125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 4.0, 5.0, 12.0, 11.0, 10.0, 17.0, 19.0, 23.0, 19.0, 41.0, 40.0, 53.0, 56.0, 62.0, 62.0, 65.0, 74.0, 49.0, 53.0, 55.0, 49.0, 37.0, 37.0, 25.0, 22.0, 17.0, 23.0, 8.0, 16.0, 7.0, 5.0, 6.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.84666109085083, -4.678379058837891, -4.510097026824951, -4.341814994812012, -4.173532962799072, -4.005250930786133, -3.8369688987731934, -3.668686866760254, -3.5004048347473145, -3.332122802734375, -3.1638407707214355, -2.995558738708496, -2.8272767066955566, -2.658994674682617, -2.4907126426696777, -2.3224306106567383, -2.154148578643799, -1.9858665466308594, -1.81758451461792, -1.6493024826049805, -1.481020450592041, -1.3127384185791016, -1.144456386566162, -0.9761743545532227, -0.8078923225402832, -0.6396102905273438, -0.4713282585144043, -0.30304622650146484, -0.1347641944885254, 0.03351783752441406, 0.20179986953735352, 0.37008190155029297, 0.5383634567260742, 0.7066454887390137, 0.8749275207519531, 1.0432095527648926, 1.211491584777832, 1.3797736167907715, 1.548055648803711, 1.7163376808166504, 1.8846197128295898, 2.0529017448425293, 2.2211837768554688, 2.389465808868408, 2.5577478408813477, 2.726029872894287, 2.8943119049072266, 3.062593936920166, 3.2308759689331055, 3.399158000946045, 3.5674400329589844, 3.735722064971924, 3.9040040969848633, 4.072286128997803, 4.240568161010742, 4.408850193023682, 4.577132225036621, 4.7454142570495605, 4.9136962890625, 5.0819783210754395, 5.250260353088379, 5.418542385101318, 5.586824417114258, 5.755106449127197, 5.923388481140137]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 6.0, 10.0, 5.0, 5.0, 7.0, 15.0, 13.0, 12.0, 26.0, 20.0, 20.0, 20.0, 21.0, 22.0, 32.0, 32.0, 30.0, 37.0, 36.0, 42.0, 41.0, 48.0, 34.0, 45.0, 43.0, 30.0, 34.0, 37.0, 36.0, 25.0, 30.0, 26.0, 18.0, 13.0, 22.0, 19.0, 24.0, 10.0, 14.0, 13.0, 4.0, 8.0, 5.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.406230449676514, -5.230968475341797, -5.055706977844238, -4.88044548034668, -4.705183506011963, -4.529921531677246, -4.3546600341796875, -4.179398536682129, -4.004136562347412, -3.8288748264312744, -3.6536130905151367, -3.478351354598999, -3.3030896186828613, -3.1278278827667236, -2.952566146850586, -2.7773044109344482, -2.6020426750183105, -2.426780939102173, -2.251519203186035, -2.0762574672698975, -1.9009957313537598, -1.725733995437622, -1.5504722595214844, -1.3752105236053467, -1.199948787689209, -1.0246870517730713, -0.8494253158569336, -0.6741635799407959, -0.4989018440246582, -0.3236401081085205, -0.1483783721923828, 0.026883363723754883, 0.20214462280273438, 0.37740635871887207, 0.5526680946350098, 0.7279298305511475, 0.9031915664672852, 1.0784533023834229, 1.2537150382995605, 1.4289767742156982, 1.604238510131836, 1.7795002460479736, 1.9547619819641113, 2.130023717880249, 2.3052854537963867, 2.4805471897125244, 2.655808925628662, 2.8310706615448, 3.0063323974609375, 3.181594133377075, 3.356855869293213, 3.5321176052093506, 3.7073793411254883, 3.882641077041626, 4.057902812957764, 4.2331647872924805, 4.408426284790039, 4.583687782287598, 4.7589497566223145, 4.934211730957031, 5.10947322845459, 5.284734725952148, 5.459996700286865, 5.635258674621582, 5.810520172119141]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 8.0, 6.0, 7.0, 11.0, 22.0, 25.0, 41.0, 57.0, 89.0, 119.0, 163.0, 250.0, 417.0, 541.0, 780.0, 1287.0, 1855.0, 2765.0, 4295.0, 6919.0, 11123.0, 17843.0, 30360.0, 51670.0, 90716.0, 166685.0, 313049.0, 582446.0, 894511.0, 857343.0, 526942.0, 277951.0, 149107.0, 81780.0, 47014.0, 27711.0, 17118.0, 10741.0, 6770.0, 4398.0, 2995.0, 1991.0, 1331.0, 939.0, 640.0, 405.0, 324.0, 230.0, 157.0, 101.0, 83.0, 47.0, 44.0, 28.0, 20.0, 8.0, 6.0, 10.0, 0.0, 3.0, 1.0, 2.0], "bins": [-4.5546875, -4.40740966796875, -4.2601318359375, -4.11285400390625, -3.965576171875, -3.81829833984375, -3.6710205078125, -3.52374267578125, -3.37646484375, -3.22918701171875, -3.0819091796875, -2.93463134765625, -2.787353515625, -2.64007568359375, -2.4927978515625, -2.34552001953125, -2.1982421875, -2.05096435546875, -1.9036865234375, -1.75640869140625, -1.609130859375, -1.46185302734375, -1.3145751953125, -1.16729736328125, -1.02001953125, -0.87274169921875, -0.7254638671875, -0.57818603515625, -0.430908203125, -0.28363037109375, -0.1363525390625, 0.01092529296875, 0.158203125, 0.30548095703125, 0.4527587890625, 0.60003662109375, 0.747314453125, 0.89459228515625, 1.0418701171875, 1.18914794921875, 1.33642578125, 1.48370361328125, 1.6309814453125, 1.77825927734375, 1.925537109375, 2.07281494140625, 2.2200927734375, 2.36737060546875, 2.5146484375, 2.66192626953125, 2.8092041015625, 2.95648193359375, 3.103759765625, 3.25103759765625, 3.3983154296875, 3.54559326171875, 3.69287109375, 3.84014892578125, 3.9874267578125, 4.13470458984375, 4.281982421875, 4.42926025390625, 4.5765380859375, 4.72381591796875, 4.87109375]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 2.0, 7.0, 11.0, 6.0, 11.0, 7.0, 14.0, 19.0, 23.0, 22.0, 32.0, 16.0, 24.0, 25.0, 40.0, 28.0, 29.0, 37.0, 47.0, 55.0, 48.0, 37.0, 40.0, 45.0, 38.0, 42.0, 40.0, 22.0, 23.0, 22.0, 33.0, 17.0, 22.0, 24.0, 21.0, 16.0, 11.0, 11.0, 5.0, 9.0, 5.0, 5.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.951171875, -3.83184814453125, -3.7125244140625, -3.59320068359375, -3.473876953125, -3.35455322265625, -3.2352294921875, -3.11590576171875, -2.99658203125, -2.87725830078125, -2.7579345703125, -2.63861083984375, -2.519287109375, -2.39996337890625, -2.2806396484375, -2.16131591796875, -2.0419921875, -1.92266845703125, -1.8033447265625, -1.68402099609375, -1.564697265625, -1.44537353515625, -1.3260498046875, -1.20672607421875, -1.08740234375, -0.96807861328125, -0.8487548828125, -0.72943115234375, -0.610107421875, -0.49078369140625, -0.3714599609375, -0.25213623046875, -0.1328125, -0.01348876953125, 0.1058349609375, 0.22515869140625, 0.344482421875, 0.46380615234375, 0.5831298828125, 0.70245361328125, 0.82177734375, 0.94110107421875, 1.0604248046875, 1.17974853515625, 1.299072265625, 1.41839599609375, 1.5377197265625, 1.65704345703125, 1.7763671875, 1.89569091796875, 2.0150146484375, 2.13433837890625, 2.253662109375, 2.37298583984375, 2.4923095703125, 2.61163330078125, 2.73095703125, 2.85028076171875, 2.9696044921875, 3.08892822265625, 3.208251953125, 3.32757568359375, 3.4468994140625, 3.56622314453125, 3.685546875]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 10.0, 13.0, 26.0, 31.0, 41.0, 70.0, 135.0, 170.0, 306.0, 508.0, 868.0, 1574.0, 2729.0, 5213.0, 9951.0, 18702.0, 37002.0, 75418.0, 158695.0, 333176.0, 659872.0, 1002047.0, 893737.0, 512103.0, 249062.0, 116708.0, 56005.0, 28216.0, 14548.0, 7781.0, 4161.0, 2254.0, 1280.0, 716.0, 436.0, 259.0, 159.0, 105.0, 64.0, 43.0, 30.0, 23.0, 10.0, 10.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.109375, -4.93792724609375, -4.7664794921875, -4.59503173828125, -4.423583984375, -4.25213623046875, -4.0806884765625, -3.90924072265625, -3.73779296875, -3.56634521484375, -3.3948974609375, -3.22344970703125, -3.052001953125, -2.88055419921875, -2.7091064453125, -2.53765869140625, -2.3662109375, -2.19476318359375, -2.0233154296875, -1.85186767578125, -1.680419921875, -1.50897216796875, -1.3375244140625, -1.16607666015625, -0.99462890625, -0.82318115234375, -0.6517333984375, -0.48028564453125, -0.308837890625, -0.13739013671875, 0.0340576171875, 0.20550537109375, 0.376953125, 0.54840087890625, 0.7198486328125, 0.89129638671875, 1.062744140625, 1.23419189453125, 1.4056396484375, 1.57708740234375, 1.74853515625, 1.91998291015625, 2.0914306640625, 2.26287841796875, 2.434326171875, 2.60577392578125, 2.7772216796875, 2.94866943359375, 3.1201171875, 3.29156494140625, 3.4630126953125, 3.63446044921875, 3.805908203125, 3.97735595703125, 4.1488037109375, 4.32025146484375, 4.49169921875, 4.66314697265625, 4.8345947265625, 5.00604248046875, 5.177490234375, 5.34893798828125, 5.5203857421875, 5.69183349609375, 5.86328125]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 7.0, 4.0, 9.0, 17.0, 18.0, 19.0, 24.0, 32.0, 43.0, 49.0, 41.0, 63.0, 70.0, 102.0, 103.0, 111.0, 121.0, 139.0, 154.0, 202.0, 192.0, 215.0, 199.0, 202.0, 217.0, 193.0, 177.0, 154.0, 180.0, 147.0, 140.0, 125.0, 117.0, 81.0, 63.0, 64.0, 42.0, 38.0, 35.0, 39.0, 17.0, 21.0, 23.0, 13.0, 10.0, 6.0, 9.0, 8.0, 3.0, 5.0, 2.0, 5.0, 4.0, 1.0, 1.0], "bins": [-1.7451171875, -1.692291259765625, -1.63946533203125, -1.586639404296875, -1.5338134765625, -1.480987548828125, -1.42816162109375, -1.375335693359375, -1.322509765625, -1.269683837890625, -1.21685791015625, -1.164031982421875, -1.1112060546875, -1.058380126953125, -1.00555419921875, -0.952728271484375, -0.89990234375, -0.847076416015625, -0.79425048828125, -0.741424560546875, -0.6885986328125, -0.635772705078125, -0.58294677734375, -0.530120849609375, -0.477294921875, -0.424468994140625, -0.37164306640625, -0.318817138671875, -0.2659912109375, -0.213165283203125, -0.16033935546875, -0.107513427734375, -0.0546875, -0.001861572265625, 0.05096435546875, 0.103790283203125, 0.1566162109375, 0.209442138671875, 0.26226806640625, 0.315093994140625, 0.367919921875, 0.420745849609375, 0.47357177734375, 0.526397705078125, 0.5792236328125, 0.632049560546875, 0.68487548828125, 0.737701416015625, 0.79052734375, 0.843353271484375, 0.89617919921875, 0.949005126953125, 1.0018310546875, 1.054656982421875, 1.10748291015625, 1.160308837890625, 1.213134765625, 1.265960693359375, 1.31878662109375, 1.371612548828125, 1.4244384765625, 1.477264404296875, 1.53009033203125, 1.582916259765625, 1.6357421875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 9.0, 11.0, 14.0, 8.0, 20.0, 26.0, 25.0, 36.0, 47.0, 54.0, 58.0, 81.0, 59.0, 79.0, 74.0, 70.0, 68.0, 55.0, 40.0, 25.0, 32.0, 25.0, 17.0, 14.0, 12.0, 13.0, 4.0, 7.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.859265327453613, -5.679550647735596, -5.499835968017578, -5.3201212882995605, -5.140406608581543, -4.960691928863525, -4.780977249145508, -4.60126256942749, -4.421547889709473, -4.241833209991455, -4.0621185302734375, -3.88240385055542, -3.7026891708374023, -3.5229744911193848, -3.343259811401367, -3.1635451316833496, -2.983830213546753, -2.8041155338287354, -2.6244008541107178, -2.4446861743927, -2.2649714946746826, -2.085256814956665, -1.905542016029358, -1.7258273363113403, -1.5461126565933228, -1.3663979768753052, -1.1866832971572876, -1.0069684982299805, -0.8272538781166077, -0.6475391983985901, -0.46782445907592773, -0.28810977935791016, -0.10839509963989258, 0.0713195949792862, 0.25103428959846497, 0.43074899911880493, 0.6104636788368225, 0.7901783585548401, 0.9698930978775024, 1.14960777759552, 1.3293224573135376, 1.5090371370315552, 1.6887518167495728, 1.8684666156768799, 2.0481812953948975, 2.227895975112915, 2.4076106548309326, 2.58732533454895, 2.7670400142669678, 2.9467546939849854, 3.126469373703003, 3.3061840534210205, 3.485898733139038, 3.6656134128570557, 3.8453283309936523, 4.02504301071167, 4.2047576904296875, 4.384472370147705, 4.564187049865723, 4.74390172958374, 4.923616409301758, 5.103331089019775, 5.283045768737793, 5.4627604484558105, 5.642475128173828]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 11.0, 8.0, 9.0, 6.0, 16.0, 13.0, 13.0, 24.0, 18.0, 20.0, 24.0, 29.0, 22.0, 37.0, 41.0, 29.0, 38.0, 46.0, 44.0, 36.0, 36.0, 41.0, 49.0, 37.0, 33.0, 40.0, 33.0, 35.0, 27.0, 23.0, 19.0, 20.0, 14.0, 21.0, 12.0, 10.0, 19.0, 9.0, 7.0, 5.0, 9.0, 5.0, 6.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.964519023895264, -4.801045894622803, -4.6375732421875, -4.474100112915039, -4.310627460479736, -4.147154331207275, -3.9836814403533936, -3.8202085494995117, -3.656735420227051, -3.493262529373169, -3.329789638519287, -3.166316509246826, -3.0028436183929443, -2.8393707275390625, -2.6758978366851807, -2.512424945831299, -2.348952054977417, -2.185479164123535, -2.0220062732696533, -1.858533263206482, -1.6950602531433105, -1.5315873622894287, -1.3681144714355469, -1.2046414613723755, -1.0411685705184937, -0.877695620059967, -0.7142226696014404, -0.5507497787475586, -0.387276828289032, -0.22380387783050537, -0.060330986976623535, 0.10314202308654785, 0.2666149139404297, 0.4300878643989563, 0.5935608148574829, 0.7570337057113647, 0.9205066561698914, 1.083979606628418, 1.2474524974822998, 1.4109255075454712, 1.574398398399353, 1.7378712892532349, 1.9013442993164062, 2.064817190170288, 2.22829008102417, 2.391763210296631, 2.5552358627319336, 2.7187089920043945, 2.8821818828582764, 3.045654773712158, 3.20912766456604, 3.372600555419922, 3.536073684692383, 3.6995465755462646, 3.8630194664001465, 4.026492595672607, 4.18996524810791, 4.353438377380371, 4.516911029815674, 4.680384159088135, 4.8438568115234375, 5.007329940795898, 5.170803070068359, 5.334275722503662, 5.497748851776123]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 7.0, 4.0, 18.0, 29.0, 31.0, 60.0, 79.0, 102.0, 145.0, 243.0, 347.0, 474.0, 772.0, 1123.0, 1603.0, 2545.0, 3973.0, 6579.0, 10490.0, 17504.0, 30277.0, 55230.0, 104838.0, 200152.0, 258192.0, 161700.0, 83374.0, 44559.0, 25137.0, 14704.0, 8823.0, 5413.0, 3481.0, 2214.0, 1422.0, 920.0, 642.0, 417.0, 309.0, 191.0, 122.0, 88.0, 68.0, 44.0, 31.0, 22.0, 22.0, 10.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.63671875, -1.5827484130859375, -1.528778076171875, -1.4748077392578125, -1.42083740234375, -1.3668670654296875, -1.312896728515625, -1.2589263916015625, -1.2049560546875, -1.1509857177734375, -1.097015380859375, -1.0430450439453125, -0.98907470703125, -0.9351043701171875, -0.881134033203125, -0.8271636962890625, -0.773193359375, -0.7192230224609375, -0.665252685546875, -0.6112823486328125, -0.55731201171875, -0.5033416748046875, -0.449371337890625, -0.3954010009765625, -0.3414306640625, -0.2874603271484375, -0.233489990234375, -0.1795196533203125, -0.12554931640625, -0.0715789794921875, -0.017608642578125, 0.0363616943359375, 0.09033203125, 0.1443023681640625, 0.198272705078125, 0.2522430419921875, 0.30621337890625, 0.3601837158203125, 0.414154052734375, 0.4681243896484375, 0.5220947265625, 0.5760650634765625, 0.630035400390625, 0.6840057373046875, 0.73797607421875, 0.7919464111328125, 0.845916748046875, 0.8998870849609375, 0.953857421875, 1.0078277587890625, 1.061798095703125, 1.1157684326171875, 1.16973876953125, 1.2237091064453125, 1.277679443359375, 1.3316497802734375, 1.3856201171875, 1.4395904541015625, 1.493560791015625, 1.5475311279296875, 1.60150146484375, 1.6554718017578125, 1.709442138671875, 1.7634124755859375, 1.8173828125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 7.0, 5.0, 6.0, 19.0, 12.0, 12.0, 10.0, 19.0, 16.0, 25.0, 24.0, 30.0, 31.0, 38.0, 35.0, 22.0, 43.0, 46.0, 38.0, 38.0, 44.0, 48.0, 39.0, 44.0, 43.0, 42.0, 24.0, 23.0, 38.0, 17.0, 22.0, 23.0, 20.0, 12.0, 14.0, 12.0, 10.0, 13.0, 9.0, 4.0, 4.0, 7.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8984375, -4.73065185546875, -4.5628662109375, -4.39508056640625, -4.227294921875, -4.05950927734375, -3.8917236328125, -3.72393798828125, -3.55615234375, -3.38836669921875, -3.2205810546875, -3.05279541015625, -2.885009765625, -2.71722412109375, -2.5494384765625, -2.38165283203125, -2.2138671875, -2.04608154296875, -1.8782958984375, -1.71051025390625, -1.542724609375, -1.37493896484375, -1.2071533203125, -1.03936767578125, -0.87158203125, -0.70379638671875, -0.5360107421875, -0.36822509765625, -0.200439453125, -0.03265380859375, 0.1351318359375, 0.30291748046875, 0.470703125, 0.63848876953125, 0.8062744140625, 0.97406005859375, 1.141845703125, 1.30963134765625, 1.4774169921875, 1.64520263671875, 1.81298828125, 1.98077392578125, 2.1485595703125, 2.31634521484375, 2.484130859375, 2.65191650390625, 2.8197021484375, 2.98748779296875, 3.1552734375, 3.32305908203125, 3.4908447265625, 3.65863037109375, 3.826416015625, 3.99420166015625, 4.1619873046875, 4.32977294921875, 4.49755859375, 4.66534423828125, 4.8331298828125, 5.00091552734375, 5.168701171875, 5.33648681640625, 5.5042724609375, 5.67205810546875, 5.83984375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 2.0, 9.0, 5.0, 6.0, 8.0, 10.0, 17.0, 24.0, 26.0, 30.0, 43.0, 68.0, 74.0, 97.0, 113.0, 171.0, 247.0, 387.0, 514.0, 774.0, 1271.0, 2286.0, 4402.0, 10649.0, 28366.0, 897319.0, 66387.0, 18983.0, 7632.0, 3503.0, 1801.0, 1047.0, 655.0, 439.0, 309.0, 227.0, 144.0, 123.0, 71.0, 66.0, 68.0, 41.0, 35.0, 22.0, 12.0, 15.0, 12.0, 11.0, 8.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 5.0, 0.0, 3.0], "bins": [-4.78125, -4.6309814453125, -4.480712890625, -4.3304443359375, -4.18017578125, -4.0299072265625, -3.879638671875, -3.7293701171875, -3.5791015625, -3.4288330078125, -3.278564453125, -3.1282958984375, -2.97802734375, -2.8277587890625, -2.677490234375, -2.5272216796875, -2.376953125, -2.2266845703125, -2.076416015625, -1.9261474609375, -1.77587890625, -1.6256103515625, -1.475341796875, -1.3250732421875, -1.1748046875, -1.0245361328125, -0.874267578125, -0.7239990234375, -0.57373046875, -0.4234619140625, -0.273193359375, -0.1229248046875, 0.02734375, 0.1776123046875, 0.327880859375, 0.4781494140625, 0.62841796875, 0.7786865234375, 0.928955078125, 1.0792236328125, 1.2294921875, 1.3797607421875, 1.530029296875, 1.6802978515625, 1.83056640625, 1.9808349609375, 2.131103515625, 2.2813720703125, 2.431640625, 2.5819091796875, 2.732177734375, 2.8824462890625, 3.03271484375, 3.1829833984375, 3.333251953125, 3.4835205078125, 3.6337890625, 3.7840576171875, 3.934326171875, 4.0845947265625, 4.23486328125, 4.3851318359375, 4.535400390625, 4.6856689453125, 4.8359375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 6.0, 4.0, 7.0, 6.0, 5.0, 7.0, 15.0, 12.0, 21.0, 15.0, 27.0, 37.0, 22.0, 30.0, 24.0, 41.0, 27.0, 39.0, 36.0, 45.0, 34.0, 29.0, 37.0, 37.0, 36.0, 41.0, 32.0, 44.0, 36.0, 39.0, 27.0, 29.0, 21.0, 18.0, 22.0, 11.0, 16.0, 11.0, 10.0, 13.0, 4.0, 7.0, 3.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.150390625, -3.047882080078125, -2.94537353515625, -2.842864990234375, -2.7403564453125, -2.637847900390625, -2.53533935546875, -2.432830810546875, -2.330322265625, -2.227813720703125, -2.12530517578125, -2.022796630859375, -1.9202880859375, -1.817779541015625, -1.71527099609375, -1.612762451171875, -1.51025390625, -1.407745361328125, -1.30523681640625, -1.202728271484375, -1.1002197265625, -0.997711181640625, -0.89520263671875, -0.792694091796875, -0.690185546875, -0.587677001953125, -0.48516845703125, -0.382659912109375, -0.2801513671875, -0.177642822265625, -0.07513427734375, 0.027374267578125, 0.1298828125, 0.232391357421875, 0.33489990234375, 0.437408447265625, 0.5399169921875, 0.642425537109375, 0.74493408203125, 0.847442626953125, 0.949951171875, 1.052459716796875, 1.15496826171875, 1.257476806640625, 1.3599853515625, 1.462493896484375, 1.56500244140625, 1.667510986328125, 1.77001953125, 1.872528076171875, 1.97503662109375, 2.077545166015625, 2.1800537109375, 2.282562255859375, 2.38507080078125, 2.487579345703125, 2.590087890625, 2.692596435546875, 2.79510498046875, 2.897613525390625, 3.0001220703125, 3.102630615234375, 3.20513916015625, 3.307647705078125, 3.41015625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 13.0, 10.0, 11.0, 21.0, 15.0, 29.0, 47.0, 53.0, 63.0, 91.0, 139.0, 207.0, 282.0, 352.0, 521.0, 848.0, 1339.0, 2402.0, 4334.0, 9776.0, 28533.0, 926981.0, 46537.0, 12942.0, 5517.0, 2732.0, 1617.0, 981.0, 607.0, 414.0, 321.0, 220.0, 154.0, 112.0, 93.0, 57.0, 55.0, 23.0, 30.0, 20.0, 14.0, 11.0, 10.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.38330078125, -0.36992645263671875, -0.3565521240234375, -0.34317779541015625, -0.329803466796875, -0.31642913818359375, -0.3030548095703125, -0.28968048095703125, -0.27630615234375, -0.26293182373046875, -0.2495574951171875, -0.23618316650390625, -0.222808837890625, -0.20943450927734375, -0.1960601806640625, -0.18268585205078125, -0.1693115234375, -0.15593719482421875, -0.1425628662109375, -0.12918853759765625, -0.115814208984375, -0.10243988037109375, -0.0890655517578125, -0.07569122314453125, -0.06231689453125, -0.04894256591796875, -0.0355682373046875, -0.02219390869140625, -0.008819580078125, 0.00455474853515625, 0.0179290771484375, 0.03130340576171875, 0.044677734375, 0.05805206298828125, 0.0714263916015625, 0.08480072021484375, 0.098175048828125, 0.11154937744140625, 0.1249237060546875, 0.13829803466796875, 0.15167236328125, 0.16504669189453125, 0.1784210205078125, 0.19179534912109375, 0.205169677734375, 0.21854400634765625, 0.2319183349609375, 0.24529266357421875, 0.2586669921875, 0.27204132080078125, 0.2854156494140625, 0.29878997802734375, 0.312164306640625, 0.32553863525390625, 0.3389129638671875, 0.35228729248046875, 0.36566162109375, 0.37903594970703125, 0.3924102783203125, 0.40578460693359375, 0.419158935546875, 0.43253326416015625, 0.4459075927734375, 0.45928192138671875, 0.47265625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 3.0, 6.0, 7.0, 7.0, 16.0, 16.0, 16.0, 18.0, 29.0, 59.0, 58.0, 74.0, 86.0, 105.0, 111.0, 89.0, 59.0, 54.0, 42.0, 36.0, 32.0, 8.0, 13.0, 13.0, 10.0, 5.0, 7.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.749961853027344e-05, -8.490961045026779e-05, -8.231960237026215e-05, -7.97295942902565e-05, -7.713958621025085e-05, -7.454957813024521e-05, -7.195957005023956e-05, -6.936956197023392e-05, -6.677955389022827e-05, -6.418954581022263e-05, -6.159953773021698e-05, -5.9009529650211334e-05, -5.641952157020569e-05, -5.382951349020004e-05, -5.12395054101944e-05, -4.864949733018875e-05, -4.6059489250183105e-05, -4.346948117017746e-05, -4.0879473090171814e-05, -3.828946501016617e-05, -3.569945693016052e-05, -3.310944885015488e-05, -3.051944077014923e-05, -2.7929432690143585e-05, -2.533942461013794e-05, -2.2749416530132294e-05, -2.0159408450126648e-05, -1.7569400370121002e-05, -1.4979392290115356e-05, -1.238938421010971e-05, -9.799376130104065e-06, -7.209368050098419e-06, -4.6193599700927734e-06, -2.0293518900871277e-06, 5.606561899185181e-07, 3.150664269924164e-06, 5.7406723499298096e-06, 8.330680429935455e-06, 1.0920688509941101e-05, 1.3510696589946747e-05, 1.6100704669952393e-05, 1.869071274995804e-05, 2.1280720829963684e-05, 2.387072890996933e-05, 2.6460736989974976e-05, 2.905074506998062e-05, 3.164075314998627e-05, 3.423076122999191e-05, 3.682076930999756e-05, 3.9410777390003204e-05, 4.200078547000885e-05, 4.4590793550014496e-05, 4.718080163002014e-05, 4.977080971002579e-05, 5.236081779003143e-05, 5.495082587003708e-05, 5.7540833950042725e-05, 6.013084203004837e-05, 6.272085011005402e-05, 6.531085819005966e-05, 6.790086627006531e-05, 7.049087435007095e-05, 7.30808824300766e-05, 7.567089051008224e-05, 7.826089859008789e-05]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 4.0, 7.0, 21.0, 22.0, 23.0, 54.0, 97.0, 157.0, 226.0, 369.0, 727.0, 1233.0, 2040.0, 3734.0, 7001.0, 13726.0, 28189.0, 63389.0, 162530.0, 381740.0, 226429.0, 84699.0, 36049.0, 16866.0, 8655.0, 4481.0, 2550.0, 1424.0, 867.0, 481.0, 294.0, 177.0, 97.0, 65.0, 44.0, 32.0, 14.0, 9.0, 11.0, 7.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20263671875, -0.1960277557373047, -0.18941879272460938, -0.18280982971191406, -0.17620086669921875, -0.16959190368652344, -0.16298294067382812, -0.1563739776611328, -0.1497650146484375, -0.1431560516357422, -0.13654708862304688, -0.12993812561035156, -0.12332916259765625, -0.11672019958496094, -0.11011123657226562, -0.10350227355957031, -0.096893310546875, -0.09028434753417969, -0.08367538452148438, -0.07706642150878906, -0.07045745849609375, -0.06384849548339844, -0.057239532470703125, -0.05063056945800781, -0.0440216064453125, -0.03741264343261719, -0.030803680419921875, -0.024194717407226562, -0.01758575439453125, -0.010976791381835938, -0.004367828369140625, 0.0022411346435546875, 0.00885009765625, 0.015459060668945312, 0.022068023681640625, 0.028676986694335938, 0.03528594970703125, 0.04189491271972656, 0.048503875732421875, 0.05511283874511719, 0.0617218017578125, 0.06833076477050781, 0.07493972778320312, 0.08154869079589844, 0.08815765380859375, 0.09476661682128906, 0.10137557983398438, 0.10798454284667969, 0.114593505859375, 0.12120246887207031, 0.12781143188476562, 0.13442039489746094, 0.14102935791015625, 0.14763832092285156, 0.15424728393554688, 0.1608562469482422, 0.1674652099609375, 0.1740741729736328, 0.18068313598632812, 0.18729209899902344, 0.19390106201171875, 0.20051002502441406, 0.20711898803710938, 0.2137279510498047, 0.2203369140625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 0.0, 3.0, 2.0, 7.0, 5.0, 8.0, 8.0, 7.0, 12.0, 19.0, 22.0, 25.0, 22.0, 30.0, 39.0, 46.0, 68.0, 69.0, 80.0, 85.0, 69.0, 83.0, 65.0, 49.0, 36.0, 22.0, 23.0, 19.0, 15.0, 15.0, 19.0, 8.0, 6.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041748046875, -0.04026174545288086, -0.03877544403076172, -0.03728914260864258, -0.03580284118652344, -0.0343165397644043, -0.032830238342285156, -0.031343936920166016, -0.029857635498046875, -0.028371334075927734, -0.026885032653808594, -0.025398731231689453, -0.023912429809570312, -0.022426128387451172, -0.02093982696533203, -0.01945352554321289, -0.01796722412109375, -0.01648092269897461, -0.014994621276855469, -0.013508319854736328, -0.012022018432617188, -0.010535717010498047, -0.009049415588378906, -0.007563114166259766, -0.006076812744140625, -0.004590511322021484, -0.0031042098999023438, -0.0016179084777832031, -0.0001316070556640625, 0.0013546943664550781, 0.0028409957885742188, 0.004327297210693359, 0.0058135986328125, 0.007299900054931641, 0.008786201477050781, 0.010272502899169922, 0.011758804321289062, 0.013245105743408203, 0.014731407165527344, 0.016217708587646484, 0.017704010009765625, 0.019190311431884766, 0.020676612854003906, 0.022162914276123047, 0.023649215698242188, 0.025135517120361328, 0.02662181854248047, 0.02810811996459961, 0.02959442138671875, 0.03108072280883789, 0.03256702423095703, 0.03405332565307617, 0.03553962707519531, 0.03702592849731445, 0.038512229919433594, 0.039998531341552734, 0.041484832763671875, 0.042971134185791016, 0.044457435607910156, 0.0459437370300293, 0.04743003845214844, 0.04891633987426758, 0.05040264129638672, 0.05188894271850586, 0.053375244140625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 9.0, 9.0, 17.0, 12.0, 18.0, 25.0, 28.0, 38.0, 41.0, 48.0, 55.0, 94.0, 64.0, 63.0, 77.0, 77.0, 69.0, 52.0, 36.0, 31.0, 32.0, 23.0, 15.0, 17.0, 11.0, 10.0, 9.0, 6.0, 3.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.624813556671143, -5.446654319763184, -5.268495082855225, -5.090335845947266, -4.912176132202148, -4.7340168952941895, -4.5558576583862305, -4.3776984214782715, -4.1995391845703125, -4.0213799476623535, -3.8432204723358154, -3.6650612354278564, -3.4869017601013184, -3.3087425231933594, -3.1305832862854004, -2.9524240493774414, -2.774264335632324, -2.5961050987243652, -2.417945623397827, -2.239786386489868, -2.06162691116333, -1.883467674255371, -1.705308437347412, -1.5271490812301636, -1.348989725112915, -1.1708303689956665, -0.9926710724830627, -0.814511775970459, -0.6363524198532104, -0.4581930637359619, -0.28003382682800293, -0.1018744707107544, 0.07628536224365234, 0.2544446885585785, 0.43260401487350464, 0.6107633113861084, 0.7889226675033569, 0.9670820236206055, 1.1452412605285645, 1.323400616645813, 1.5015599727630615, 1.67971932888031, 1.8578786849975586, 2.0360379219055176, 2.2141971588134766, 2.3923566341400146, 2.5705158710479736, 2.7486753463745117, 2.9268345832824707, 3.1049938201904297, 3.2831532955169678, 3.4613125324249268, 3.639472007751465, 3.817631244659424, 3.995790481567383, 4.173949718475342, 4.352108955383301, 4.53026819229126, 4.708427429199219, 4.886587142944336, 5.064746379852295, 5.242905616760254, 5.421064853668213, 5.599224090576172, 5.777383804321289]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 6.0, 2.0, 10.0, 11.0, 7.0, 6.0, 17.0, 13.0, 12.0, 24.0, 17.0, 20.0, 25.0, 28.0, 23.0, 37.0, 39.0, 31.0, 35.0, 48.0, 39.0, 41.0, 34.0, 42.0, 47.0, 40.0, 35.0, 36.0, 33.0, 35.0, 29.0, 24.0, 18.0, 20.0, 14.0, 20.0, 14.0, 10.0, 17.0, 11.0, 7.0, 4.0, 10.0, 5.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.920654773712158, -4.75849723815918, -4.596339702606201, -4.434182167053223, -4.272024631500244, -4.109867095947266, -3.947709321975708, -3.7855517864227295, -3.623394250869751, -3.4612367153167725, -3.299079179763794, -3.1369216442108154, -2.974763870239258, -2.8126063346862793, -2.650448799133301, -2.4882912635803223, -2.3261337280273438, -2.1639761924743652, -2.0018186569213867, -1.8396610021591187, -1.6775034666061401, -1.5153459310531616, -1.3531882762908936, -1.191030740737915, -1.0288732051849365, -0.866715669631958, -0.7045580744743347, -0.5424004793167114, -0.3802429437637329, -0.2180854082107544, -0.055927813053131104, 0.10622978210449219, 0.2683873176574707, 0.4305448830127716, 0.5927024483680725, 0.7548600435256958, 0.9170175790786743, 1.0791751146316528, 1.241332769393921, 1.4034903049468994, 1.565647840499878, 1.7278053760528564, 1.889962911605835, 2.0521204471588135, 2.214278221130371, 2.3764357566833496, 2.538593292236328, 2.7007508277893066, 2.862908363342285, 3.0250658988952637, 3.187223434448242, 3.3493809700012207, 3.511538505554199, 3.6736960411071777, 3.8358538150787354, 3.998011350631714, 4.160168647766113, 4.322326183319092, 4.48448371887207, 4.646641254425049, 4.808798789978027, 4.970956325531006, 5.133113861083984, 5.295271873474121, 5.4574294090271]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 7.0, 10.0, 12.0, 27.0, 37.0, 56.0, 63.0, 130.0, 205.0, 293.0, 412.0, 669.0, 1038.0, 1631.0, 2584.0, 3905.0, 6182.0, 10050.0, 16410.0, 26466.0, 42382.0, 66818.0, 101508.0, 139672.0, 160808.0, 148591.0, 112557.0, 76953.0, 48905.0, 30037.0, 18753.0, 11674.0, 7207.0, 4565.0, 2798.0, 1832.0, 1139.0, 721.0, 520.0, 316.0, 229.0, 141.0, 78.0, 58.0, 40.0, 31.0, 14.0, 10.0, 11.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.328125, -4.195556640625, -4.06298828125, -3.930419921875, -3.7978515625, -3.665283203125, -3.53271484375, -3.400146484375, -3.267578125, -3.135009765625, -3.00244140625, -2.869873046875, -2.7373046875, -2.604736328125, -2.47216796875, -2.339599609375, -2.20703125, -2.074462890625, -1.94189453125, -1.809326171875, -1.6767578125, -1.544189453125, -1.41162109375, -1.279052734375, -1.146484375, -1.013916015625, -0.88134765625, -0.748779296875, -0.6162109375, -0.483642578125, -0.35107421875, -0.218505859375, -0.0859375, 0.046630859375, 0.17919921875, 0.311767578125, 0.4443359375, 0.576904296875, 0.70947265625, 0.842041015625, 0.974609375, 1.107177734375, 1.23974609375, 1.372314453125, 1.5048828125, 1.637451171875, 1.77001953125, 1.902587890625, 2.03515625, 2.167724609375, 2.30029296875, 2.432861328125, 2.5654296875, 2.697998046875, 2.83056640625, 2.963134765625, 3.095703125, 3.228271484375, 3.36083984375, 3.493408203125, 3.6259765625, 3.758544921875, 3.89111328125, 4.023681640625, 4.15625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 6.0, 8.0, 5.0, 11.0, 11.0, 10.0, 13.0, 18.0, 11.0, 22.0, 24.0, 20.0, 34.0, 37.0, 47.0, 42.0, 37.0, 45.0, 32.0, 46.0, 51.0, 31.0, 47.0, 37.0, 43.0, 39.0, 46.0, 33.0, 23.0, 21.0, 26.0, 20.0, 17.0, 12.0, 21.0, 12.0, 6.0, 12.0, 8.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.703125, -5.53326416015625, -5.3634033203125, -5.19354248046875, -5.023681640625, -4.85382080078125, -4.6839599609375, -4.51409912109375, -4.34423828125, -4.17437744140625, -4.0045166015625, -3.83465576171875, -3.664794921875, -3.49493408203125, -3.3250732421875, -3.15521240234375, -2.9853515625, -2.81549072265625, -2.6456298828125, -2.47576904296875, -2.305908203125, -2.13604736328125, -1.9661865234375, -1.79632568359375, -1.62646484375, -1.45660400390625, -1.2867431640625, -1.11688232421875, -0.947021484375, -0.77716064453125, -0.6072998046875, -0.43743896484375, -0.267578125, -0.09771728515625, 0.0721435546875, 0.24200439453125, 0.411865234375, 0.58172607421875, 0.7515869140625, 0.92144775390625, 1.09130859375, 1.26116943359375, 1.4310302734375, 1.60089111328125, 1.770751953125, 1.94061279296875, 2.1104736328125, 2.28033447265625, 2.4501953125, 2.62005615234375, 2.7899169921875, 2.95977783203125, 3.129638671875, 3.29949951171875, 3.4693603515625, 3.63922119140625, 3.80908203125, 3.97894287109375, 4.1488037109375, 4.31866455078125, 4.488525390625, 4.65838623046875, 4.8282470703125, 4.99810791015625, 5.16796875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 5.0, 14.0, 18.0, 46.0, 77.0, 113.0, 184.0, 319.0, 547.0, 898.0, 1505.0, 2649.0, 4398.0, 7556.0, 12562.0, 21350.0, 35929.0, 59725.0, 95791.0, 141677.0, 174675.0, 165121.0, 122396.0, 80226.0, 48963.0, 29122.0, 17428.0, 10350.0, 6197.0, 3538.0, 2066.0, 1236.0, 760.0, 447.0, 241.0, 154.0, 93.0, 70.0, 49.0, 25.0, 12.0, 9.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.39453125, -4.25634765625, -4.1181640625, -3.97998046875, -3.841796875, -3.70361328125, -3.5654296875, -3.42724609375, -3.2890625, -3.15087890625, -3.0126953125, -2.87451171875, -2.736328125, -2.59814453125, -2.4599609375, -2.32177734375, -2.18359375, -2.04541015625, -1.9072265625, -1.76904296875, -1.630859375, -1.49267578125, -1.3544921875, -1.21630859375, -1.078125, -0.93994140625, -0.8017578125, -0.66357421875, -0.525390625, -0.38720703125, -0.2490234375, -0.11083984375, 0.02734375, 0.16552734375, 0.3037109375, 0.44189453125, 0.580078125, 0.71826171875, 0.8564453125, 0.99462890625, 1.1328125, 1.27099609375, 1.4091796875, 1.54736328125, 1.685546875, 1.82373046875, 1.9619140625, 2.10009765625, 2.23828125, 2.37646484375, 2.5146484375, 2.65283203125, 2.791015625, 2.92919921875, 3.0673828125, 3.20556640625, 3.34375, 3.48193359375, 3.6201171875, 3.75830078125, 3.896484375, 4.03466796875, 4.1728515625, 4.31103515625, 4.44921875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 5.0, 7.0, 5.0, 8.0, 4.0, 8.0, 14.0, 9.0, 16.0, 22.0, 19.0, 21.0, 19.0, 21.0, 18.0, 27.0, 20.0, 41.0, 36.0, 37.0, 42.0, 45.0, 43.0, 39.0, 37.0, 41.0, 41.0, 37.0, 33.0, 31.0, 24.0, 26.0, 28.0, 18.0, 20.0, 18.0, 20.0, 23.0, 13.0, 20.0, 10.0, 9.0, 4.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.818359375, -2.730743408203125, -2.64312744140625, -2.555511474609375, -2.4678955078125, -2.380279541015625, -2.29266357421875, -2.205047607421875, -2.117431640625, -2.029815673828125, -1.94219970703125, -1.854583740234375, -1.7669677734375, -1.679351806640625, -1.59173583984375, -1.504119873046875, -1.41650390625, -1.328887939453125, -1.24127197265625, -1.153656005859375, -1.0660400390625, -0.978424072265625, -0.89080810546875, -0.803192138671875, -0.715576171875, -0.627960205078125, -0.54034423828125, -0.452728271484375, -0.3651123046875, -0.277496337890625, -0.18988037109375, -0.102264404296875, -0.0146484375, 0.072967529296875, 0.16058349609375, 0.248199462890625, 0.3358154296875, 0.423431396484375, 0.51104736328125, 0.598663330078125, 0.686279296875, 0.773895263671875, 0.86151123046875, 0.949127197265625, 1.0367431640625, 1.124359130859375, 1.21197509765625, 1.299591064453125, 1.38720703125, 1.474822998046875, 1.56243896484375, 1.650054931640625, 1.7376708984375, 1.825286865234375, 1.91290283203125, 2.000518798828125, 2.088134765625, 2.175750732421875, 2.26336669921875, 2.350982666015625, 2.4385986328125, 2.526214599609375, 2.61383056640625, 2.701446533203125, 2.7890625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [5.0, 1.0, 4.0, 1.0, 5.0, 5.0, 9.0, 17.0, 22.0, 38.0, 58.0, 74.0, 90.0, 166.0, 232.0, 355.0, 551.0, 850.0, 1316.0, 2278.0, 3627.0, 6163.0, 10665.0, 18439.0, 33466.0, 59746.0, 106117.0, 170647.0, 209930.0, 173217.0, 108571.0, 61651.0, 34200.0, 18879.0, 10786.0, 6400.0, 3706.0, 2318.0, 1407.0, 902.0, 586.0, 353.0, 231.0, 148.0, 113.0, 70.0, 54.0, 31.0, 25.0, 15.0, 10.0, 11.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.43359375, -1.383331298828125, -1.33306884765625, -1.282806396484375, -1.2325439453125, -1.182281494140625, -1.13201904296875, -1.081756591796875, -1.031494140625, -0.981231689453125, -0.93096923828125, -0.880706787109375, -0.8304443359375, -0.780181884765625, -0.72991943359375, -0.679656982421875, -0.62939453125, -0.579132080078125, -0.52886962890625, -0.478607177734375, -0.4283447265625, -0.378082275390625, -0.32781982421875, -0.277557373046875, -0.227294921875, -0.177032470703125, -0.12677001953125, -0.076507568359375, -0.0262451171875, 0.024017333984375, 0.07427978515625, 0.124542236328125, 0.1748046875, 0.225067138671875, 0.27532958984375, 0.325592041015625, 0.3758544921875, 0.426116943359375, 0.47637939453125, 0.526641845703125, 0.576904296875, 0.627166748046875, 0.67742919921875, 0.727691650390625, 0.7779541015625, 0.828216552734375, 0.87847900390625, 0.928741455078125, 0.97900390625, 1.029266357421875, 1.07952880859375, 1.129791259765625, 1.1800537109375, 1.230316162109375, 1.28057861328125, 1.330841064453125, 1.381103515625, 1.431365966796875, 1.48162841796875, 1.531890869140625, 1.5821533203125, 1.632415771484375, 1.68267822265625, 1.732940673828125, 1.783203125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 10.0, 7.0, 13.0, 13.0, 14.0, 13.0, 23.0, 32.0, 23.0, 33.0, 36.0, 48.0, 44.0, 59.0, 53.0, 58.0, 70.0, 49.0, 36.0, 34.0, 46.0, 39.0, 38.0, 35.0, 29.0, 30.0, 14.0, 21.0, 15.0, 12.0, 6.0, 4.0, 13.0, 5.0, 2.0, 3.0, 2.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.00010508298873901367, -0.00010212883353233337, -9.917467832565308e-05, -9.622052311897278e-05, -9.326636791229248e-05, -9.031221270561218e-05, -8.735805749893188e-05, -8.440390229225159e-05, -8.144974708557129e-05, -7.849559187889099e-05, -7.55414366722107e-05, -7.25872814655304e-05, -6.96331262588501e-05, -6.66789710521698e-05, -6.37248158454895e-05, -6.0770660638809204e-05, -5.7816505432128906e-05, -5.486235022544861e-05, -5.190819501876831e-05, -4.895403981208801e-05, -4.5999884605407715e-05, -4.304572939872742e-05, -4.009157419204712e-05, -3.713741898536682e-05, -3.4183263778686523e-05, -3.1229108572006226e-05, -2.8274953365325928e-05, -2.532079815864563e-05, -2.2366642951965332e-05, -1.9412487745285034e-05, -1.6458332538604736e-05, -1.3504177331924438e-05, -1.055002212524414e-05, -7.595866918563843e-06, -4.641711711883545e-06, -1.687556505203247e-06, 1.2665987014770508e-06, 4.220753908157349e-06, 7.1749091148376465e-06, 1.0129064321517944e-05, 1.3083219528198242e-05, 1.603737473487854e-05, 1.8991529941558838e-05, 2.1945685148239136e-05, 2.4899840354919434e-05, 2.785399556159973e-05, 3.080815076828003e-05, 3.376230597496033e-05, 3.6716461181640625e-05, 3.967061638832092e-05, 4.262477159500122e-05, 4.557892680168152e-05, 4.8533082008361816e-05, 5.1487237215042114e-05, 5.444139242172241e-05, 5.739554762840271e-05, 6.034970283508301e-05, 6.33038580417633e-05, 6.62580132484436e-05, 6.92121684551239e-05, 7.21663236618042e-05, 7.51204788684845e-05, 7.80746340751648e-05, 8.102878928184509e-05, 8.398294448852539e-05]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 15.0, 9.0, 17.0, 22.0, 40.0, 57.0, 76.0, 122.0, 175.0, 303.0, 441.0, 671.0, 1038.0, 1622.0, 2675.0, 4384.0, 7108.0, 11751.0, 19539.0, 32435.0, 53856.0, 87861.0, 134219.0, 175270.0, 172782.0, 128991.0, 83497.0, 51052.0, 30807.0, 18346.0, 11341.0, 6759.0, 4196.0, 2569.0, 1622.0, 1031.0, 653.0, 407.0, 250.0, 193.0, 125.0, 75.0, 53.0, 35.0, 26.0, 11.0, 15.0, 3.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3046875, -1.2611236572265625, -1.217559814453125, -1.1739959716796875, -1.13043212890625, -1.0868682861328125, -1.043304443359375, -0.9997406005859375, -0.9561767578125, -0.9126129150390625, -0.869049072265625, -0.8254852294921875, -0.78192138671875, -0.7383575439453125, -0.694793701171875, -0.6512298583984375, -0.607666015625, -0.5641021728515625, -0.520538330078125, -0.4769744873046875, -0.43341064453125, -0.3898468017578125, -0.346282958984375, -0.3027191162109375, -0.2591552734375, -0.2155914306640625, -0.172027587890625, -0.1284637451171875, -0.08489990234375, -0.0413360595703125, 0.002227783203125, 0.0457916259765625, 0.08935546875, 0.1329193115234375, 0.176483154296875, 0.2200469970703125, 0.26361083984375, 0.3071746826171875, 0.350738525390625, 0.3943023681640625, 0.4378662109375, 0.4814300537109375, 0.524993896484375, 0.5685577392578125, 0.61212158203125, 0.6556854248046875, 0.699249267578125, 0.7428131103515625, 0.786376953125, 0.8299407958984375, 0.873504638671875, 0.9170684814453125, 0.96063232421875, 1.0041961669921875, 1.047760009765625, 1.0913238525390625, 1.1348876953125, 1.1784515380859375, 1.222015380859375, 1.2655792236328125, 1.30914306640625, 1.3527069091796875, 1.396270751953125, 1.4398345947265625, 1.4833984375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 14.0, 12.0, 12.0, 14.0, 19.0, 19.0, 21.0, 24.0, 24.0, 35.0, 39.0, 49.0, 59.0, 57.0, 58.0, 48.0, 64.0, 62.0, 66.0, 52.0, 55.0, 35.0, 31.0, 27.0, 25.0, 19.0, 11.0, 14.0, 8.0, 9.0, 7.0, 6.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.716796875, -0.6960296630859375, -0.675262451171875, -0.6544952392578125, -0.63372802734375, -0.6129608154296875, -0.592193603515625, -0.5714263916015625, -0.5506591796875, -0.5298919677734375, -0.509124755859375, -0.4883575439453125, -0.46759033203125, -0.4468231201171875, -0.426055908203125, -0.4052886962890625, -0.384521484375, -0.3637542724609375, -0.342987060546875, -0.3222198486328125, -0.30145263671875, -0.2806854248046875, -0.259918212890625, -0.2391510009765625, -0.2183837890625, -0.1976165771484375, -0.176849365234375, -0.1560821533203125, -0.13531494140625, -0.1145477294921875, -0.093780517578125, -0.0730133056640625, -0.05224609375, -0.0314788818359375, -0.010711669921875, 0.0100555419921875, 0.03082275390625, 0.0515899658203125, 0.072357177734375, 0.0931243896484375, 0.1138916015625, 0.1346588134765625, 0.155426025390625, 0.1761932373046875, 0.19696044921875, 0.2177276611328125, 0.238494873046875, 0.2592620849609375, 0.280029296875, 0.3007965087890625, 0.321563720703125, 0.3423309326171875, 0.36309814453125, 0.3838653564453125, 0.404632568359375, 0.4253997802734375, 0.4461669921875, 0.4669342041015625, 0.487701416015625, 0.5084686279296875, 0.52923583984375, 0.5500030517578125, 0.570770263671875, 0.5915374755859375, 0.6123046875]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 9.0, 10.0, 13.0, 17.0, 16.0, 20.0, 33.0, 39.0, 41.0, 69.0, 66.0, 77.0, 80.0, 81.0, 71.0, 74.0, 58.0, 53.0, 32.0, 21.0, 28.0, 19.0, 17.0, 11.0, 18.0, 5.0, 9.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.929625988006592, -5.745594024658203, -5.561561584472656, -5.377529144287109, -5.193497180938721, -5.009465217590332, -4.825432777404785, -4.641400337219238, -4.45736837387085, -4.273336410522461, -4.089303970336914, -3.9052717685699463, -3.7212395668029785, -3.5372073650360107, -3.353175163269043, -3.169142961502075, -2.9851107597351074, -2.8010785579681396, -2.617046356201172, -2.433014154434204, -2.2489819526672363, -2.0649497509002686, -1.8809175491333008, -1.696885347366333, -1.5128531455993652, -1.3288209438323975, -1.1447887420654297, -0.9607565402984619, -0.7767243385314941, -0.5926921367645264, -0.4086599349975586, -0.22462773323059082, -0.04059553146362305, 0.14343667030334473, 0.3274688720703125, 0.5115010738372803, 0.695533275604248, 0.8795654773712158, 1.0635976791381836, 1.2476298809051514, 1.4316620826721191, 1.615694284439087, 1.7997264862060547, 1.9837586879730225, 2.1677908897399902, 2.351823091506958, 2.535855293273926, 2.7198874950408936, 2.9039196968078613, 3.087951898574829, 3.271984100341797, 3.4560163021087646, 3.6400485038757324, 3.8240807056427, 4.008112907409668, 4.192145347595215, 4.3761773109436035, 4.560209274291992, 4.744241714477539, 4.928274154663086, 5.112306118011475, 5.296338081359863, 5.48037052154541, 5.664402961730957, 5.848434925079346]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 6.0, 6.0, 3.0, 5.0, 5.0, 12.0, 12.0, 15.0, 13.0, 15.0, 13.0, 22.0, 28.0, 20.0, 31.0, 31.0, 31.0, 38.0, 31.0, 40.0, 54.0, 54.0, 41.0, 38.0, 61.0, 46.0, 36.0, 32.0, 32.0, 34.0, 31.0, 27.0, 18.0, 21.0, 20.0, 18.0, 16.0, 13.0, 10.0, 9.0, 3.0, 7.0, 4.0, 1.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.866006851196289, -4.689187526702881, -4.512368202209473, -4.335548400878906, -4.158729076385498, -3.98190975189209, -3.8050901889801025, -3.6282706260681152, -3.451451301574707, -3.274631977081299, -3.0978124141693115, -2.920992851257324, -2.744173526763916, -2.567354202270508, -2.3905346393585205, -2.213715076446533, -2.036895751953125, -1.8600763082504272, -1.6832568645477295, -1.5064374208450317, -1.329617977142334, -1.1527985334396362, -0.9759790897369385, -0.7991596460342407, -0.622340202331543, -0.4455207586288452, -0.26870131492614746, -0.09188187122344971, 0.08493757247924805, 0.2617570161819458, 0.43857645988464355, 0.6153959035873413, 0.7922148704528809, 0.9690343141555786, 1.1458537578582764, 1.3226732015609741, 1.4994926452636719, 1.6763120889663696, 1.8531315326690674, 2.0299510955810547, 2.206770420074463, 2.383589744567871, 2.5604093074798584, 2.7372288703918457, 2.914048194885254, 3.090867519378662, 3.2676870822906494, 3.4445066452026367, 3.621325969696045, 3.798145294189453, 3.9749648571014404, 4.151784420013428, 4.328603744506836, 4.505423069000244, 4.682242393493652, 4.859062194824219, 5.035881519317627, 5.212700843811035, 5.389520645141602, 5.56633996963501, 5.743159294128418, 5.919978618621826, 6.096797943115234, 6.273617744445801, 6.450437068939209]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 9.0, 7.0, 17.0, 26.0, 45.0, 60.0, 89.0, 118.0, 204.0, 353.0, 581.0, 965.0, 1496.0, 2631.0, 4351.0, 7612.0, 14271.0, 26367.0, 52293.0, 110715.0, 251501.0, 605039.0, 1200422.0, 1059469.0, 475018.0, 197651.0, 89060.0, 42641.0, 21989.0, 12144.0, 6711.0, 3966.0, 2393.0, 1509.0, 935.0, 570.0, 415.0, 225.0, 142.0, 100.0, 78.0, 43.0, 17.0, 17.0, 10.0, 6.0, 6.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-6.46875, -6.283203125, -6.09765625, -5.912109375, -5.7265625, -5.541015625, -5.35546875, -5.169921875, -4.984375, -4.798828125, -4.61328125, -4.427734375, -4.2421875, -4.056640625, -3.87109375, -3.685546875, -3.5, -3.314453125, -3.12890625, -2.943359375, -2.7578125, -2.572265625, -2.38671875, -2.201171875, -2.015625, -1.830078125, -1.64453125, -1.458984375, -1.2734375, -1.087890625, -0.90234375, -0.716796875, -0.53125, -0.345703125, -0.16015625, 0.025390625, 0.2109375, 0.396484375, 0.58203125, 0.767578125, 0.953125, 1.138671875, 1.32421875, 1.509765625, 1.6953125, 1.880859375, 2.06640625, 2.251953125, 2.4375, 2.623046875, 2.80859375, 2.994140625, 3.1796875, 3.365234375, 3.55078125, 3.736328125, 3.921875, 4.107421875, 4.29296875, 4.478515625, 4.6640625, 4.849609375, 5.03515625, 5.220703125, 5.40625]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 6.0, 8.0, 9.0, 9.0, 9.0, 15.0, 14.0, 14.0, 24.0, 24.0, 24.0, 32.0, 16.0, 39.0, 39.0, 32.0, 42.0, 37.0, 57.0, 47.0, 39.0, 51.0, 39.0, 42.0, 36.0, 31.0, 33.0, 34.0, 25.0, 18.0, 27.0, 14.0, 27.0, 16.0, 14.0, 10.0, 10.0, 8.0, 6.0, 1.0, 4.0, 6.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2421875, -3.1302490234375, -3.018310546875, -2.9063720703125, -2.79443359375, -2.6824951171875, -2.570556640625, -2.4586181640625, -2.3466796875, -2.2347412109375, -2.122802734375, -2.0108642578125, -1.89892578125, -1.7869873046875, -1.675048828125, -1.5631103515625, -1.451171875, -1.3392333984375, -1.227294921875, -1.1153564453125, -1.00341796875, -0.8914794921875, -0.779541015625, -0.6676025390625, -0.5556640625, -0.4437255859375, -0.331787109375, -0.2198486328125, -0.10791015625, 0.0040283203125, 0.115966796875, 0.2279052734375, 0.33984375, 0.4517822265625, 0.563720703125, 0.6756591796875, 0.78759765625, 0.8995361328125, 1.011474609375, 1.1234130859375, 1.2353515625, 1.3472900390625, 1.459228515625, 1.5711669921875, 1.68310546875, 1.7950439453125, 1.906982421875, 2.0189208984375, 2.130859375, 2.2427978515625, 2.354736328125, 2.4666748046875, 2.57861328125, 2.6905517578125, 2.802490234375, 2.9144287109375, 3.0263671875, 3.1383056640625, 3.250244140625, 3.3621826171875, 3.47412109375, 3.5860595703125, 3.697998046875, 3.8099365234375, 3.921875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 5.0, 5.0, 12.0, 23.0, 22.0, 15.0, 43.0, 69.0, 125.0, 159.0, 297.0, 446.0, 758.0, 1404.0, 2601.0, 4993.0, 9798.0, 19530.0, 41976.0, 94150.0, 217689.0, 504562.0, 1002728.0, 1133963.0, 644760.0, 286099.0, 123140.0, 54753.0, 25043.0, 11893.0, 6162.0, 3132.0, 1627.0, 910.0, 554.0, 301.0, 190.0, 115.0, 66.0, 63.0, 30.0, 20.0, 17.0, 14.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.33203125, -5.149169921875, -4.96630859375, -4.783447265625, -4.6005859375, -4.417724609375, -4.23486328125, -4.052001953125, -3.869140625, -3.686279296875, -3.50341796875, -3.320556640625, -3.1376953125, -2.954833984375, -2.77197265625, -2.589111328125, -2.40625, -2.223388671875, -2.04052734375, -1.857666015625, -1.6748046875, -1.491943359375, -1.30908203125, -1.126220703125, -0.943359375, -0.760498046875, -0.57763671875, -0.394775390625, -0.2119140625, -0.029052734375, 0.15380859375, 0.336669921875, 0.51953125, 0.702392578125, 0.88525390625, 1.068115234375, 1.2509765625, 1.433837890625, 1.61669921875, 1.799560546875, 1.982421875, 2.165283203125, 2.34814453125, 2.531005859375, 2.7138671875, 2.896728515625, 3.07958984375, 3.262451171875, 3.4453125, 3.628173828125, 3.81103515625, 3.993896484375, 4.1767578125, 4.359619140625, 4.54248046875, 4.725341796875, 4.908203125, 5.091064453125, 5.27392578125, 5.456787109375, 5.6396484375, 5.822509765625, 6.00537109375, 6.188232421875, 6.37109375]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 7.0, 10.0, 9.0, 9.0, 25.0, 24.0, 26.0, 37.0, 31.0, 51.0, 71.0, 73.0, 103.0, 117.0, 154.0, 154.0, 184.0, 203.0, 231.0, 249.0, 254.0, 229.0, 230.0, 238.0, 203.0, 193.0, 172.0, 129.0, 131.0, 106.0, 81.0, 68.0, 65.0, 57.0, 41.0, 25.0, 19.0, 19.0, 14.0, 6.0, 6.0, 3.0, 10.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.7568359375, -1.6990509033203125, -1.641265869140625, -1.5834808349609375, -1.52569580078125, -1.4679107666015625, -1.410125732421875, -1.3523406982421875, -1.2945556640625, -1.2367706298828125, -1.178985595703125, -1.1212005615234375, -1.06341552734375, -1.0056304931640625, -0.947845458984375, -0.8900604248046875, -0.832275390625, -0.7744903564453125, -0.716705322265625, -0.6589202880859375, -0.60113525390625, -0.5433502197265625, -0.485565185546875, -0.4277801513671875, -0.3699951171875, -0.3122100830078125, -0.254425048828125, -0.1966400146484375, -0.13885498046875, -0.0810699462890625, -0.023284912109375, 0.0345001220703125, 0.09228515625, 0.1500701904296875, 0.207855224609375, 0.2656402587890625, 0.32342529296875, 0.3812103271484375, 0.438995361328125, 0.4967803955078125, 0.5545654296875, 0.6123504638671875, 0.670135498046875, 0.7279205322265625, 0.78570556640625, 0.8434906005859375, 0.901275634765625, 0.9590606689453125, 1.016845703125, 1.0746307373046875, 1.132415771484375, 1.1902008056640625, 1.24798583984375, 1.3057708740234375, 1.363555908203125, 1.4213409423828125, 1.4791259765625, 1.5369110107421875, 1.594696044921875, 1.6524810791015625, 1.71026611328125, 1.7680511474609375, 1.825836181640625, 1.8836212158203125, 1.94140625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 12.0, 9.0, 13.0, 15.0, 21.0, 25.0, 37.0, 50.0, 42.0, 68.0, 68.0, 84.0, 85.0, 85.0, 80.0, 63.0, 41.0, 43.0, 28.0, 28.0, 27.0, 17.0, 8.0, 10.0, 7.0, 5.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.055538177490234, -4.87870979309082, -4.7018818855285645, -4.52505350112915, -4.348225116729736, -4.171396732330322, -3.9945688247680664, -3.8177404403686523, -3.6409120559692383, -3.4640839099884033, -3.2872555255889893, -3.1104273796081543, -2.9335989952087402, -2.7567708492279053, -2.5799427032470703, -2.4031143188476562, -2.2262861728668213, -2.0494580268859863, -1.8726296424865723, -1.6958014965057373, -1.5189731121063232, -1.3421449661254883, -1.1653167009353638, -0.9884884357452393, -0.8116601705551147, -0.6348319053649902, -0.4580036699771881, -0.281175434589386, -0.10434716939926147, 0.07248109579086304, 0.24930930137634277, 0.4261375665664673, 0.6029658317565918, 0.7797940969467163, 0.9566223621368408, 1.1334505081176758, 1.3102788925170898, 1.4871070384979248, 1.6639353036880493, 1.8407635688781738, 2.017591953277588, 2.194420099258423, 2.371248483657837, 2.548076629638672, 2.724905014038086, 2.901733160018921, 3.078561305999756, 3.25538969039917, 3.432217836380005, 3.60904598236084, 3.785874366760254, 3.962702512741089, 4.139530658721924, 4.316359043121338, 4.493187427520752, 4.670015335083008, 4.846843719482422, 5.023672103881836, 5.200500011444092, 5.377328395843506, 5.55415678024292, 5.730985164642334, 5.90781307220459, 6.084641456604004, 6.261469841003418]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 6.0, 8.0, 2.0, 12.0, 5.0, 9.0, 16.0, 23.0, 19.0, 18.0, 27.0, 41.0, 26.0, 33.0, 27.0, 41.0, 46.0, 34.0, 45.0, 46.0, 52.0, 55.0, 50.0, 47.0, 45.0, 44.0, 30.0, 28.0, 31.0, 20.0, 19.0, 21.0, 17.0, 16.0, 11.0, 5.0, 9.0, 9.0, 5.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.728874206542969, -4.554924964904785, -4.38097620010376, -4.207026958465576, -4.033078193664551, -3.859128952026367, -3.6851797103881836, -3.511230707168579, -3.3372817039489746, -3.16333270072937, -2.9893836975097656, -2.815434455871582, -2.6414854526519775, -2.467536449432373, -2.2935872077941895, -2.119638204574585, -1.9456892013549805, -1.771740198135376, -1.597791075706482, -1.423841953277588, -1.2498929500579834, -1.075943946838379, -0.9019948244094849, -0.7280457019805908, -0.5540966987609863, -0.38014763593673706, -0.2061985731124878, -0.032249510288238525, 0.14169955253601074, 0.31564861536026, 0.4895976781845093, 0.6635468006134033, 0.8374953269958496, 1.011444330215454, 1.1853934526443481, 1.3593425750732422, 1.5332915782928467, 1.7072405815124512, 1.8811897039413452, 2.0551388263702393, 2.2290878295898438, 2.4030368328094482, 2.5769858360290527, 2.7509350776672363, 2.924884080886841, 3.0988330841064453, 3.272782325744629, 3.4467313289642334, 3.620680332183838, 3.7946293354034424, 3.968578338623047, 4.1425275802612305, 4.316476821899414, 4.4904255867004395, 4.664374828338623, 4.838323593139648, 5.012272834777832, 5.186222076416016, 5.360170841217041, 5.534120082855225, 5.70806884765625, 5.882018089294434, 6.055967330932617, 6.229916572570801, 6.403865337371826]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 9.0, 11.0, 18.0, 20.0, 38.0, 52.0, 85.0, 156.0, 230.0, 328.0, 530.0, 826.0, 1384.0, 2154.0, 3520.0, 6163.0, 10556.0, 18448.0, 34862.0, 68146.0, 142363.0, 275596.0, 241399.0, 116778.0, 57168.0, 29265.0, 15762.0, 9080.0, 5198.0, 3190.0, 1899.0, 1210.0, 804.0, 473.0, 295.0, 197.0, 137.0, 65.0, 45.0, 34.0, 24.0, 9.0, 11.0, 8.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.8759765625, -1.820587158203125, -1.76519775390625, -1.709808349609375, -1.6544189453125, -1.599029541015625, -1.54364013671875, -1.488250732421875, -1.432861328125, -1.377471923828125, -1.32208251953125, -1.266693115234375, -1.2113037109375, -1.155914306640625, -1.10052490234375, -1.045135498046875, -0.98974609375, -0.934356689453125, -0.87896728515625, -0.823577880859375, -0.7681884765625, -0.712799072265625, -0.65740966796875, -0.602020263671875, -0.546630859375, -0.491241455078125, -0.43585205078125, -0.380462646484375, -0.3250732421875, -0.269683837890625, -0.21429443359375, -0.158905029296875, -0.103515625, -0.048126220703125, 0.00726318359375, 0.062652587890625, 0.1180419921875, 0.173431396484375, 0.22882080078125, 0.284210205078125, 0.339599609375, 0.394989013671875, 0.45037841796875, 0.505767822265625, 0.5611572265625, 0.616546630859375, 0.67193603515625, 0.727325439453125, 0.78271484375, 0.838104248046875, 0.89349365234375, 0.948883056640625, 1.0042724609375, 1.059661865234375, 1.11505126953125, 1.170440673828125, 1.225830078125, 1.281219482421875, 1.33660888671875, 1.391998291015625, 1.4473876953125, 1.502777099609375, 1.55816650390625, 1.613555908203125, 1.6689453125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 5.0, 2.0, 10.0, 9.0, 13.0, 12.0, 21.0, 20.0, 27.0, 22.0, 33.0, 36.0, 31.0, 39.0, 45.0, 44.0, 53.0, 50.0, 45.0, 71.0, 51.0, 43.0, 43.0, 45.0, 42.0, 28.0, 30.0, 26.0, 13.0, 19.0, 22.0, 15.0, 10.0, 4.0, 10.0, 2.0, 6.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5703125, -5.38116455078125, -5.1920166015625, -5.00286865234375, -4.813720703125, -4.62457275390625, -4.4354248046875, -4.24627685546875, -4.05712890625, -3.86798095703125, -3.6788330078125, -3.48968505859375, -3.300537109375, -3.11138916015625, -2.9222412109375, -2.73309326171875, -2.5439453125, -2.35479736328125, -2.1656494140625, -1.97650146484375, -1.787353515625, -1.59820556640625, -1.4090576171875, -1.21990966796875, -1.03076171875, -0.84161376953125, -0.6524658203125, -0.46331787109375, -0.274169921875, -0.08502197265625, 0.1041259765625, 0.29327392578125, 0.482421875, 0.67156982421875, 0.8607177734375, 1.04986572265625, 1.239013671875, 1.42816162109375, 1.6173095703125, 1.80645751953125, 1.99560546875, 2.18475341796875, 2.3739013671875, 2.56304931640625, 2.752197265625, 2.94134521484375, 3.1304931640625, 3.31964111328125, 3.5087890625, 3.69793701171875, 3.8870849609375, 4.07623291015625, 4.265380859375, 4.45452880859375, 4.6436767578125, 4.83282470703125, 5.02197265625, 5.21112060546875, 5.4002685546875, 5.58941650390625, 5.778564453125, 5.96771240234375, 6.1568603515625, 6.34600830078125, 6.53515625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 7.0, 5.0, 2.0, 4.0, 1.0, 6.0, 5.0, 5.0, 6.0, 9.0, 14.0, 20.0, 20.0, 29.0, 46.0, 47.0, 64.0, 94.0, 109.0, 173.0, 216.0, 322.0, 422.0, 683.0, 983.0, 1792.0, 3324.0, 6956.0, 17097.0, 51741.0, 904729.0, 34464.0, 12608.0, 5376.0, 2725.0, 1505.0, 900.0, 539.0, 411.0, 294.0, 226.0, 138.0, 88.0, 88.0, 79.0, 45.0, 35.0, 32.0, 25.0, 16.0, 11.0, 5.0, 9.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0], "bins": [-4.265625, -4.13372802734375, -4.0018310546875, -3.86993408203125, -3.738037109375, -3.60614013671875, -3.4742431640625, -3.34234619140625, -3.21044921875, -3.07855224609375, -2.9466552734375, -2.81475830078125, -2.682861328125, -2.55096435546875, -2.4190673828125, -2.28717041015625, -2.1552734375, -2.02337646484375, -1.8914794921875, -1.75958251953125, -1.627685546875, -1.49578857421875, -1.3638916015625, -1.23199462890625, -1.10009765625, -0.96820068359375, -0.8363037109375, -0.70440673828125, -0.572509765625, -0.44061279296875, -0.3087158203125, -0.17681884765625, -0.044921875, 0.08697509765625, 0.2188720703125, 0.35076904296875, 0.482666015625, 0.61456298828125, 0.7464599609375, 0.87835693359375, 1.01025390625, 1.14215087890625, 1.2740478515625, 1.40594482421875, 1.537841796875, 1.66973876953125, 1.8016357421875, 1.93353271484375, 2.0654296875, 2.19732666015625, 2.3292236328125, 2.46112060546875, 2.593017578125, 2.72491455078125, 2.8568115234375, 2.98870849609375, 3.12060546875, 3.25250244140625, 3.3843994140625, 3.51629638671875, 3.648193359375, 3.78009033203125, 3.9119873046875, 4.04388427734375, 4.17578125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 1.0, 5.0, 8.0, 5.0, 14.0, 14.0, 9.0, 15.0, 15.0, 20.0, 15.0, 20.0, 39.0, 38.0, 28.0, 33.0, 38.0, 31.0, 27.0, 35.0, 39.0, 39.0, 46.0, 51.0, 29.0, 31.0, 44.0, 40.0, 35.0, 31.0, 27.0, 27.0, 22.0, 23.0, 31.0, 9.0, 8.0, 8.0, 7.0, 11.0, 5.0, 8.0, 3.0, 4.0, 5.0, 6.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.1640625, -3.0638427734375, -2.963623046875, -2.8634033203125, -2.76318359375, -2.6629638671875, -2.562744140625, -2.4625244140625, -2.3623046875, -2.2620849609375, -2.161865234375, -2.0616455078125, -1.96142578125, -1.8612060546875, -1.760986328125, -1.6607666015625, -1.560546875, -1.4603271484375, -1.360107421875, -1.2598876953125, -1.15966796875, -1.0594482421875, -0.959228515625, -0.8590087890625, -0.7587890625, -0.6585693359375, -0.558349609375, -0.4581298828125, -0.35791015625, -0.2576904296875, -0.157470703125, -0.0572509765625, 0.04296875, 0.1431884765625, 0.243408203125, 0.3436279296875, 0.44384765625, 0.5440673828125, 0.644287109375, 0.7445068359375, 0.8447265625, 0.9449462890625, 1.045166015625, 1.1453857421875, 1.24560546875, 1.3458251953125, 1.446044921875, 1.5462646484375, 1.646484375, 1.7467041015625, 1.846923828125, 1.9471435546875, 2.04736328125, 2.1475830078125, 2.247802734375, 2.3480224609375, 2.4482421875, 2.5484619140625, 2.648681640625, 2.7489013671875, 2.84912109375, 2.9493408203125, 3.049560546875, 3.1497802734375, 3.25]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 10.0, 6.0, 14.0, 13.0, 7.0, 23.0, 30.0, 54.0, 80.0, 138.0, 236.0, 342.0, 611.0, 1197.0, 2320.0, 5188.0, 15075.0, 87505.0, 905756.0, 18206.0, 6112.0, 2609.0, 1305.0, 680.0, 378.0, 231.0, 149.0, 102.0, 60.0, 35.0, 23.0, 12.0, 13.0, 10.0, 3.0, 7.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.51123046875, -0.4957733154296875, -0.480316162109375, -0.4648590087890625, -0.44940185546875, -0.4339447021484375, -0.418487548828125, -0.4030303955078125, -0.3875732421875, -0.3721160888671875, -0.356658935546875, -0.3412017822265625, -0.32574462890625, -0.3102874755859375, -0.294830322265625, -0.2793731689453125, -0.263916015625, -0.2484588623046875, -0.233001708984375, -0.2175445556640625, -0.20208740234375, -0.1866302490234375, -0.171173095703125, -0.1557159423828125, -0.1402587890625, -0.1248016357421875, -0.109344482421875, -0.0938873291015625, -0.07843017578125, -0.0629730224609375, -0.047515869140625, -0.0320587158203125, -0.0166015625, -0.0011444091796875, 0.014312744140625, 0.0297698974609375, 0.04522705078125, 0.0606842041015625, 0.076141357421875, 0.0915985107421875, 0.1070556640625, 0.1225128173828125, 0.137969970703125, 0.1534271240234375, 0.16888427734375, 0.1843414306640625, 0.199798583984375, 0.2152557373046875, 0.230712890625, 0.2461700439453125, 0.261627197265625, 0.2770843505859375, 0.29254150390625, 0.3079986572265625, 0.323455810546875, 0.3389129638671875, 0.3543701171875, 0.3698272705078125, 0.385284423828125, 0.4007415771484375, 0.41619873046875, 0.4316558837890625, 0.447113037109375, 0.4625701904296875, 0.47802734375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 8.0, 3.0, 6.0, 5.0, 4.0, 11.0, 14.0, 15.0, 18.0, 18.0, 27.0, 23.0, 24.0, 51.0, 56.0, 57.0, 61.0, 59.0, 53.0, 66.0, 72.0, 46.0, 57.0, 47.0, 37.0, 27.0, 33.0, 27.0, 20.0, 16.0, 16.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.060434341430664e-05, -4.91337850689888e-05, -4.766322672367096e-05, -4.619266837835312e-05, -4.472211003303528e-05, -4.325155168771744e-05, -4.17809933423996e-05, -4.0310434997081757e-05, -3.8839876651763916e-05, -3.7369318306446075e-05, -3.5898759961128235e-05, -3.4428201615810394e-05, -3.2957643270492554e-05, -3.148708492517471e-05, -3.0016526579856873e-05, -2.8545968234539032e-05, -2.707540988922119e-05, -2.560485154390335e-05, -2.413429319858551e-05, -2.266373485326767e-05, -2.119317650794983e-05, -1.972261816263199e-05, -1.8252059817314148e-05, -1.6781501471996307e-05, -1.5310943126678467e-05, -1.3840384781360626e-05, -1.2369826436042786e-05, -1.0899268090724945e-05, -9.428709745407104e-06, -7.958151400089264e-06, -6.487593054771423e-06, -5.017034709453583e-06, -3.546476364135742e-06, -2.0759180188179016e-06, -6.05359673500061e-07, 8.651986718177795e-07, 2.33575701713562e-06, 3.8063153624534607e-06, 5.276873707771301e-06, 6.747432053089142e-06, 8.217990398406982e-06, 9.688548743724823e-06, 1.1159107089042664e-05, 1.2629665434360504e-05, 1.4100223779678345e-05, 1.5570782124996185e-05, 1.7041340470314026e-05, 1.8511898815631866e-05, 1.9982457160949707e-05, 2.1453015506267548e-05, 2.2923573851585388e-05, 2.439413219690323e-05, 2.586469054222107e-05, 2.733524888753891e-05, 2.880580723285675e-05, 3.027636557817459e-05, 3.174692392349243e-05, 3.321748226881027e-05, 3.468804061412811e-05, 3.615859895944595e-05, 3.7629157304763794e-05, 3.9099715650081635e-05, 4.0570273995399475e-05, 4.2040832340717316e-05, 4.3511390686035156e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 8.0, 6.0, 6.0, 15.0, 10.0, 19.0, 24.0, 28.0, 43.0, 86.0, 119.0, 168.0, 307.0, 383.0, 596.0, 969.0, 1466.0, 2458.0, 4084.0, 6991.0, 12662.0, 24063.0, 48233.0, 104705.0, 245823.0, 314765.0, 146378.0, 64469.0, 31461.0, 16122.0, 9026.0, 5068.0, 2933.0, 1767.0, 1155.0, 723.0, 455.0, 323.0, 214.0, 136.0, 94.0, 66.0, 36.0, 24.0, 23.0, 12.0, 13.0, 7.0, 5.0, 5.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1422119140625, -0.13765335083007812, -0.13309478759765625, -0.12853622436523438, -0.1239776611328125, -0.11941909790039062, -0.11486053466796875, -0.11030197143554688, -0.105743408203125, -0.10118484497070312, -0.09662628173828125, -0.09206771850585938, -0.0875091552734375, -0.08295059204101562, -0.07839202880859375, -0.07383346557617188, -0.06927490234375, -0.06471633911132812, -0.06015777587890625, -0.055599212646484375, -0.0510406494140625, -0.046482086181640625, -0.04192352294921875, -0.037364959716796875, -0.032806396484375, -0.028247833251953125, -0.02368927001953125, -0.019130706787109375, -0.0145721435546875, -0.010013580322265625, -0.00545501708984375, -0.000896453857421875, 0.003662109375, 0.008220672607421875, 0.01277923583984375, 0.017337799072265625, 0.0218963623046875, 0.026454925537109375, 0.03101348876953125, 0.035572052001953125, 0.040130615234375, 0.044689178466796875, 0.04924774169921875, 0.053806304931640625, 0.0583648681640625, 0.06292343139648438, 0.06748199462890625, 0.07204055786132812, 0.07659912109375, 0.08115768432617188, 0.08571624755859375, 0.09027481079101562, 0.0948333740234375, 0.09939193725585938, 0.10395050048828125, 0.10850906372070312, 0.113067626953125, 0.11762619018554688, 0.12218475341796875, 0.12674331665039062, 0.1313018798828125, 0.13586044311523438, 0.14041900634765625, 0.14497756958007812, 0.1495361328125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 5.0, 10.0, 16.0, 12.0, 26.0, 25.0, 32.0, 41.0, 61.0, 88.0, 64.0, 76.0, 68.0, 76.0, 54.0, 58.0, 57.0, 38.0, 45.0, 41.0, 16.0, 28.0, 14.0, 11.0, 5.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.056060791015625, -0.05428791046142578, -0.05251502990722656, -0.050742149353027344, -0.048969268798828125, -0.047196388244628906, -0.04542350769042969, -0.04365062713623047, -0.04187774658203125, -0.04010486602783203, -0.03833198547363281, -0.036559104919433594, -0.034786224365234375, -0.033013343811035156, -0.031240463256835938, -0.02946758270263672, -0.0276947021484375, -0.02592182159423828, -0.024148941040039062, -0.022376060485839844, -0.020603179931640625, -0.018830299377441406, -0.017057418823242188, -0.015284538269042969, -0.01351165771484375, -0.011738777160644531, -0.009965896606445312, -0.008193016052246094, -0.006420135498046875, -0.004647254943847656, -0.0028743743896484375, -0.0011014938354492188, 0.00067138671875, 0.0024442672729492188, 0.0042171478271484375, 0.005990028381347656, 0.007762908935546875, 0.009535789489746094, 0.011308670043945312, 0.013081550598144531, 0.01485443115234375, 0.01662731170654297, 0.018400192260742188, 0.020173072814941406, 0.021945953369140625, 0.023718833923339844, 0.025491714477539062, 0.02726459503173828, 0.0290374755859375, 0.03081035614013672, 0.03258323669433594, 0.034356117248535156, 0.036128997802734375, 0.037901878356933594, 0.03967475891113281, 0.04144763946533203, 0.04322052001953125, 0.04499340057373047, 0.04676628112792969, 0.048539161682128906, 0.050312042236328125, 0.052084922790527344, 0.05385780334472656, 0.05563068389892578, 0.057403564453125]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 7.0, 3.0, 10.0, 9.0, 14.0, 15.0, 17.0, 30.0, 23.0, 39.0, 53.0, 53.0, 61.0, 75.0, 96.0, 80.0, 76.0, 72.0, 50.0, 47.0, 30.0, 30.0, 29.0, 25.0, 14.0, 10.0, 6.0, 8.0, 3.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.992961406707764, -4.8208160400390625, -4.648670196533203, -4.476524829864502, -4.304379463195801, -4.1322340965271, -3.9600882530212402, -3.787942886352539, -3.615797519683838, -3.4436519145965576, -3.2715065479278564, -3.099360942840576, -2.927215576171875, -2.7550699710845947, -2.5829243659973145, -2.4107789993286133, -2.238633394241333, -2.0664877891540527, -1.8943424224853516, -1.7221968173980713, -1.5500514507293701, -1.3779058456420898, -1.2057603597640991, -1.0336148738861084, -0.8614693880081177, -0.689323902130127, -0.5171784162521362, -0.34503287076950073, -0.17288738489151, -0.0007418990135192871, 0.1714036464691162, 0.34354913234710693, 0.5156946182250977, 0.6878401041030884, 0.8599855899810791, 1.0321311950683594, 1.2042765617370605, 1.3764221668243408, 1.5485676527023315, 1.7207131385803223, 1.892858624458313, 2.0650041103363037, 2.237149715423584, 2.409295082092285, 2.5814406871795654, 2.7535860538482666, 2.925731658935547, 3.097877025604248, 3.2700226306915283, 3.4421682357788086, 3.6143136024475098, 3.78645920753479, 3.958604574203491, 4.1307501792907715, 4.302895545959473, 4.475041389465332, 4.647186756134033, 4.819332122802734, 4.991477966308594, 5.163623332977295, 5.335768699645996, 5.507914066314697, 5.680059909820557, 5.852205276489258, 6.024350643157959]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 6.0, 7.0, 2.0, 12.0, 5.0, 10.0, 16.0, 23.0, 19.0, 19.0, 26.0, 42.0, 27.0, 31.0, 28.0, 42.0, 44.0, 36.0, 44.0, 47.0, 51.0, 52.0, 53.0, 46.0, 48.0, 41.0, 30.0, 30.0, 28.0, 20.0, 18.0, 22.0, 17.0, 16.0, 11.0, 5.0, 9.0, 9.0, 5.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.674624443054199, -4.501932621002197, -4.329240798950195, -4.156548976898193, -3.9838571548461914, -3.8111653327941895, -3.6384737491607666, -3.4657819271087646, -3.2930901050567627, -3.1203982830047607, -2.947706460952759, -2.775014877319336, -2.602323055267334, -2.429631233215332, -2.25693941116333, -2.084247589111328, -1.9115557670593262, -1.7388639450073242, -1.5661721229553223, -1.3934804201126099, -1.220788598060608, -1.048096776008606, -0.8754050731658936, -0.7027132511138916, -0.5300214290618896, -0.3573296368122101, -0.18463784456253052, -0.01194608211517334, 0.1607457399368286, 0.33343756198883057, 0.506129264831543, 0.6788210868835449, 0.8515133857727051, 1.024205207824707, 1.196897029876709, 1.3695887327194214, 1.5422805547714233, 1.7149723768234253, 1.8876640796661377, 2.0603559017181396, 2.2330477237701416, 2.4057395458221436, 2.5784313678741455, 2.7511229515075684, 2.9238147735595703, 3.0965065956115723, 3.269198417663574, 3.441890239715576, 3.614582061767578, 3.78727388381958, 3.959965705871582, 4.132657527923584, 4.305349349975586, 4.478041172027588, 4.65073299407959, 4.823424339294434, 4.996116638183594, 5.168808460235596, 5.341500282287598, 5.5141921043396, 5.686883926391602, 5.8595757484436035, 6.0322675704956055, 6.204958915710449, 6.377650737762451]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 6.0, 2.0, 6.0, 10.0, 10.0, 9.0, 21.0, 36.0, 57.0, 68.0, 127.0, 203.0, 244.0, 394.0, 588.0, 947.0, 1401.0, 2220.0, 3380.0, 5148.0, 8553.0, 13320.0, 21234.0, 33803.0, 54029.0, 83455.0, 121242.0, 154564.0, 159210.0, 130077.0, 91709.0, 60188.0, 37921.0, 23752.0, 14775.0, 9187.0, 5949.0, 3758.0, 2369.0, 1538.0, 1066.0, 668.0, 419.0, 315.0, 217.0, 140.0, 78.0, 47.0, 48.0, 22.0, 16.0, 7.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.6796875, -3.561431884765625, -3.44317626953125, -3.324920654296875, -3.2066650390625, -3.088409423828125, -2.97015380859375, -2.851898193359375, -2.733642578125, -2.615386962890625, -2.49713134765625, -2.378875732421875, -2.2606201171875, -2.142364501953125, -2.02410888671875, -1.905853271484375, -1.78759765625, -1.669342041015625, -1.55108642578125, -1.432830810546875, -1.3145751953125, -1.196319580078125, -1.07806396484375, -0.959808349609375, -0.841552734375, -0.723297119140625, -0.60504150390625, -0.486785888671875, -0.3685302734375, -0.250274658203125, -0.13201904296875, -0.013763427734375, 0.1044921875, 0.222747802734375, 0.34100341796875, 0.459259033203125, 0.5775146484375, 0.695770263671875, 0.81402587890625, 0.932281494140625, 1.050537109375, 1.168792724609375, 1.28704833984375, 1.405303955078125, 1.5235595703125, 1.641815185546875, 1.76007080078125, 1.878326416015625, 1.99658203125, 2.114837646484375, 2.23309326171875, 2.351348876953125, 2.4696044921875, 2.587860107421875, 2.70611572265625, 2.824371337890625, 2.942626953125, 3.060882568359375, 3.17913818359375, 3.297393798828125, 3.4156494140625, 3.533905029296875, 3.65216064453125, 3.770416259765625, 3.888671875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 7.0, 8.0, 6.0, 7.0, 15.0, 13.0, 14.0, 17.0, 27.0, 26.0, 29.0, 31.0, 33.0, 30.0, 39.0, 47.0, 49.0, 48.0, 50.0, 56.0, 40.0, 57.0, 42.0, 32.0, 40.0, 45.0, 44.0, 20.0, 14.0, 21.0, 16.0, 15.0, 17.0, 15.0, 10.0, 3.0, 9.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.11328125, -4.93756103515625, -4.7618408203125, -4.58612060546875, -4.410400390625, -4.23468017578125, -4.0589599609375, -3.88323974609375, -3.70751953125, -3.53179931640625, -3.3560791015625, -3.18035888671875, -3.004638671875, -2.82891845703125, -2.6531982421875, -2.47747802734375, -2.3017578125, -2.12603759765625, -1.9503173828125, -1.77459716796875, -1.598876953125, -1.42315673828125, -1.2474365234375, -1.07171630859375, -0.89599609375, -0.72027587890625, -0.5445556640625, -0.36883544921875, -0.193115234375, -0.01739501953125, 0.1583251953125, 0.33404541015625, 0.509765625, 0.68548583984375, 0.8612060546875, 1.03692626953125, 1.212646484375, 1.38836669921875, 1.5640869140625, 1.73980712890625, 1.91552734375, 2.09124755859375, 2.2669677734375, 2.44268798828125, 2.618408203125, 2.79412841796875, 2.9698486328125, 3.14556884765625, 3.3212890625, 3.49700927734375, 3.6727294921875, 3.84844970703125, 4.024169921875, 4.19989013671875, 4.3756103515625, 4.55133056640625, 4.72705078125, 4.90277099609375, 5.0784912109375, 5.25421142578125, 5.429931640625, 5.60565185546875, 5.7813720703125, 5.95709228515625, 6.1328125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 12.0, 8.0, 21.0, 21.0, 36.0, 55.0, 89.0, 135.0, 199.0, 333.0, 544.0, 799.0, 1254.0, 2093.0, 3283.0, 5419.0, 8768.0, 14708.0, 24558.0, 40697.0, 67203.0, 105777.0, 150462.0, 174239.0, 154996.0, 111536.0, 71215.0, 43740.0, 26201.0, 15689.0, 9398.0, 5649.0, 3506.0, 2067.0, 1379.0, 870.0, 536.0, 367.0, 259.0, 167.0, 88.0, 55.0, 47.0, 29.0, 20.0, 11.0, 10.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8203125, -3.6953125, -3.5703125, -3.4453125, -3.3203125, -3.1953125, -3.0703125, -2.9453125, -2.8203125, -2.6953125, -2.5703125, -2.4453125, -2.3203125, -2.1953125, -2.0703125, -1.9453125, -1.8203125, -1.6953125, -1.5703125, -1.4453125, -1.3203125, -1.1953125, -1.0703125, -0.9453125, -0.8203125, -0.6953125, -0.5703125, -0.4453125, -0.3203125, -0.1953125, -0.0703125, 0.0546875, 0.1796875, 0.3046875, 0.4296875, 0.5546875, 0.6796875, 0.8046875, 0.9296875, 1.0546875, 1.1796875, 1.3046875, 1.4296875, 1.5546875, 1.6796875, 1.8046875, 1.9296875, 2.0546875, 2.1796875, 2.3046875, 2.4296875, 2.5546875, 2.6796875, 2.8046875, 2.9296875, 3.0546875, 3.1796875, 3.3046875, 3.4296875, 3.5546875, 3.6796875, 3.8046875, 3.9296875, 4.0546875, 4.1796875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 8.0, 8.0, 6.0, 13.0, 11.0, 16.0, 17.0, 16.0, 16.0, 21.0, 18.0, 21.0, 25.0, 30.0, 30.0, 24.0, 23.0, 27.0, 28.0, 38.0, 35.0, 46.0, 28.0, 35.0, 35.0, 36.0, 37.0, 22.0, 38.0, 40.0, 23.0, 21.0, 27.0, 28.0, 23.0, 22.0, 13.0, 11.0, 11.0, 10.0, 11.0, 10.0, 7.0, 6.0, 4.0, 7.0, 2.0, 8.0, 3.0, 3.0, 3.0, 1.0, 1.0], "bins": [-2.552734375, -2.47552490234375, -2.3983154296875, -2.32110595703125, -2.243896484375, -2.16668701171875, -2.0894775390625, -2.01226806640625, -1.93505859375, -1.85784912109375, -1.7806396484375, -1.70343017578125, -1.626220703125, -1.54901123046875, -1.4718017578125, -1.39459228515625, -1.3173828125, -1.24017333984375, -1.1629638671875, -1.08575439453125, -1.008544921875, -0.93133544921875, -0.8541259765625, -0.77691650390625, -0.69970703125, -0.62249755859375, -0.5452880859375, -0.46807861328125, -0.390869140625, -0.31365966796875, -0.2364501953125, -0.15924072265625, -0.08203125, -0.00482177734375, 0.0723876953125, 0.14959716796875, 0.226806640625, 0.30401611328125, 0.3812255859375, 0.45843505859375, 0.53564453125, 0.61285400390625, 0.6900634765625, 0.76727294921875, 0.844482421875, 0.92169189453125, 0.9989013671875, 1.07611083984375, 1.1533203125, 1.23052978515625, 1.3077392578125, 1.38494873046875, 1.462158203125, 1.53936767578125, 1.6165771484375, 1.69378662109375, 1.77099609375, 1.84820556640625, 1.9254150390625, 2.00262451171875, 2.079833984375, 2.15704345703125, 2.2342529296875, 2.31146240234375, 2.388671875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 8.0, 16.0, 17.0, 23.0, 34.0, 63.0, 80.0, 146.0, 203.0, 289.0, 413.0, 696.0, 1093.0, 1693.0, 2521.0, 3881.0, 5953.0, 9349.0, 14991.0, 24420.0, 40331.0, 65845.0, 106530.0, 158642.0, 186702.0, 154890.0, 103016.0, 63826.0, 38625.0, 23762.0, 14576.0, 9137.0, 5827.0, 3697.0, 2517.0, 1660.0, 1035.0, 686.0, 451.0, 337.0, 195.0, 119.0, 89.0, 47.0, 38.0, 23.0, 19.0, 18.0, 8.0, 5.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0], "bins": [-1.22265625, -1.18499755859375, -1.1473388671875, -1.10968017578125, -1.072021484375, -1.03436279296875, -0.9967041015625, -0.95904541015625, -0.92138671875, -0.88372802734375, -0.8460693359375, -0.80841064453125, -0.770751953125, -0.73309326171875, -0.6954345703125, -0.65777587890625, -0.6201171875, -0.58245849609375, -0.5447998046875, -0.50714111328125, -0.469482421875, -0.43182373046875, -0.3941650390625, -0.35650634765625, -0.31884765625, -0.28118896484375, -0.2435302734375, -0.20587158203125, -0.168212890625, -0.13055419921875, -0.0928955078125, -0.05523681640625, -0.017578125, 0.02008056640625, 0.0577392578125, 0.09539794921875, 0.133056640625, 0.17071533203125, 0.2083740234375, 0.24603271484375, 0.28369140625, 0.32135009765625, 0.3590087890625, 0.39666748046875, 0.434326171875, 0.47198486328125, 0.5096435546875, 0.54730224609375, 0.5849609375, 0.62261962890625, 0.6602783203125, 0.69793701171875, 0.735595703125, 0.77325439453125, 0.8109130859375, 0.84857177734375, 0.88623046875, 0.92388916015625, 0.9615478515625, 0.99920654296875, 1.036865234375, 1.07452392578125, 1.1121826171875, 1.14984130859375, 1.1875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 8.0, 5.0, 6.0, 2.0, 8.0, 9.0, 21.0, 11.0, 26.0, 24.0, 30.0, 42.0, 58.0, 42.0, 51.0, 62.0, 54.0, 63.0, 63.0, 83.0, 52.0, 46.0, 39.0, 33.0, 24.0, 28.0, 32.0, 18.0, 11.0, 11.0, 10.0, 4.0, 7.0, 7.0, 7.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00010025501251220703, -9.735021740198135e-05, -9.444542229175568e-05, -9.154062718153e-05, -8.863583207130432e-05, -8.573103696107864e-05, -8.282624185085297e-05, -7.992144674062729e-05, -7.701665163040161e-05, -7.411185652017593e-05, -7.120706140995026e-05, -6.830226629972458e-05, -6.53974711894989e-05, -6.249267607927322e-05, -5.9587880969047546e-05, -5.668308585882187e-05, -5.377829074859619e-05, -5.0873495638370514e-05, -4.7968700528144836e-05, -4.506390541791916e-05, -4.215911030769348e-05, -3.9254315197467804e-05, -3.6349520087242126e-05, -3.344472497701645e-05, -3.053992986679077e-05, -2.7635134756565094e-05, -2.4730339646339417e-05, -2.182554453611374e-05, -1.892074942588806e-05, -1.6015954315662384e-05, -1.3111159205436707e-05, -1.0206364095211029e-05, -7.3015689849853516e-06, -4.396773874759674e-06, -1.4919787645339966e-06, 1.412816345691681e-06, 4.317611455917358e-06, 7.222406566143036e-06, 1.0127201676368713e-05, 1.3031996786594391e-05, 1.593679189682007e-05, 1.8841587007045746e-05, 2.1746382117271423e-05, 2.46511772274971e-05, 2.755597233772278e-05, 3.0460767447948456e-05, 3.336556255817413e-05, 3.627035766839981e-05, 3.917515277862549e-05, 4.2079947888851166e-05, 4.498474299907684e-05, 4.788953810930252e-05, 5.07943332195282e-05, 5.3699128329753876e-05, 5.660392343997955e-05, 5.950871855020523e-05, 6.241351366043091e-05, 6.531830877065659e-05, 6.822310388088226e-05, 7.112789899110794e-05, 7.403269410133362e-05, 7.69374892115593e-05, 7.984228432178497e-05, 8.274707943201065e-05, 8.565187454223633e-05]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 6.0, 19.0, 17.0, 30.0, 57.0, 52.0, 113.0, 197.0, 356.0, 667.0, 1209.0, 2348.0, 4269.0, 7957.0, 15751.0, 31659.0, 65797.0, 134890.0, 233931.0, 247803.0, 151796.0, 75418.0, 36765.0, 18031.0, 8966.0, 4835.0, 2416.0, 1402.0, 723.0, 435.0, 252.0, 140.0, 80.0, 52.0, 45.0, 20.0, 16.0, 10.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5595703125, -1.5059661865234375, -1.452362060546875, -1.3987579345703125, -1.34515380859375, -1.2915496826171875, -1.237945556640625, -1.1843414306640625, -1.1307373046875, -1.0771331787109375, -1.023529052734375, -0.9699249267578125, -0.91632080078125, -0.8627166748046875, -0.809112548828125, -0.7555084228515625, -0.701904296875, -0.6483001708984375, -0.594696044921875, -0.5410919189453125, -0.48748779296875, -0.4338836669921875, -0.380279541015625, -0.3266754150390625, -0.2730712890625, -0.2194671630859375, -0.165863037109375, -0.1122589111328125, -0.05865478515625, -0.0050506591796875, 0.048553466796875, 0.1021575927734375, 0.15576171875, 0.2093658447265625, 0.262969970703125, 0.3165740966796875, 0.37017822265625, 0.4237823486328125, 0.477386474609375, 0.5309906005859375, 0.5845947265625, 0.6381988525390625, 0.691802978515625, 0.7454071044921875, 0.79901123046875, 0.8526153564453125, 0.906219482421875, 0.9598236083984375, 1.013427734375, 1.0670318603515625, 1.120635986328125, 1.1742401123046875, 1.22784423828125, 1.2814483642578125, 1.335052490234375, 1.3886566162109375, 1.4422607421875, 1.4958648681640625, 1.549468994140625, 1.6030731201171875, 1.65667724609375, 1.7102813720703125, 1.763885498046875, 1.8174896240234375, 1.87109375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 6.0, 8.0, 7.0, 13.0, 15.0, 19.0, 18.0, 27.0, 37.0, 29.0, 33.0, 41.0, 41.0, 58.0, 52.0, 59.0, 70.0, 53.0, 60.0, 55.0, 39.0, 48.0, 34.0, 33.0, 29.0, 22.0, 16.0, 16.0, 8.0, 7.0, 10.0, 8.0, 4.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76123046875, -0.7384567260742188, -0.7156829833984375, -0.6929092407226562, -0.670135498046875, -0.6473617553710938, -0.6245880126953125, -0.6018142700195312, -0.57904052734375, -0.5562667846679688, -0.5334930419921875, -0.5107192993164062, -0.487945556640625, -0.46517181396484375, -0.4423980712890625, -0.41962432861328125, -0.3968505859375, -0.37407684326171875, -0.3513031005859375, -0.32852935791015625, -0.305755615234375, -0.28298187255859375, -0.2602081298828125, -0.23743438720703125, -0.21466064453125, -0.19188690185546875, -0.1691131591796875, -0.14633941650390625, -0.123565673828125, -0.10079193115234375, -0.0780181884765625, -0.05524444580078125, -0.032470703125, -0.00969696044921875, 0.0130767822265625, 0.03585052490234375, 0.058624267578125, 0.08139801025390625, 0.1041717529296875, 0.12694549560546875, 0.14971923828125, 0.17249298095703125, 0.1952667236328125, 0.21804046630859375, 0.240814208984375, 0.26358795166015625, 0.2863616943359375, 0.30913543701171875, 0.3319091796875, 0.35468292236328125, 0.3774566650390625, 0.40023040771484375, 0.423004150390625, 0.44577789306640625, 0.4685516357421875, 0.49132537841796875, 0.51409912109375, 0.5368728637695312, 0.5596466064453125, 0.5824203491210938, 0.605194091796875, 0.6279678344726562, 0.6507415771484375, 0.6735153198242188, 0.6962890625]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 13.0, 11.0, 22.0, 20.0, 30.0, 33.0, 42.0, 70.0, 72.0, 98.0, 81.0, 86.0, 79.0, 82.0, 43.0, 49.0, 35.0, 31.0, 22.0, 19.0, 11.0, 3.0, 13.0, 4.0, 7.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2118754386901855, -5.025350570678711, -4.8388261795043945, -4.65230131149292, -4.465776443481445, -4.279252052307129, -4.092727184295654, -3.9062023162841797, -3.719677686691284, -3.5331530570983887, -3.346628189086914, -3.1601035594940186, -2.973578929901123, -2.7870540618896484, -2.600529432296753, -2.4140048027038574, -2.227479934692383, -2.0409553050994873, -1.8544304370880127, -1.6679058074951172, -1.4813810586929321, -1.294856309890747, -1.1083316802978516, -0.9218069314956665, -0.7352821826934814, -0.5487574338912964, -0.3622327446937561, -0.17570805549621582, 0.010816693305969238, 0.1973414421081543, 0.3838660717010498, 0.5703908205032349, 0.7569150924682617, 0.9434398412704468, 1.1299645900726318, 1.3164892196655273, 1.5030139684677124, 1.6895387172698975, 1.876063346862793, 2.0625882148742676, 2.249112844467163, 2.4356374740600586, 2.622162342071533, 2.8086869716644287, 2.995211601257324, 3.181736469268799, 3.3682610988616943, 3.55478572845459, 3.7413105964660645, 3.92783522605896, 4.1143598556518555, 4.30088472366333, 4.487409591674805, 4.673933982849121, 4.860458850860596, 5.04698371887207, 5.233508110046387, 5.420032978057861, 5.606557369232178, 5.793082237243652, 5.979607105255127, 6.166131973266602, 6.352656364440918, 6.539181232452393, 6.725706100463867]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 4.0, 5.0, 4.0, 8.0, 7.0, 6.0, 8.0, 10.0, 18.0, 16.0, 21.0, 15.0, 24.0, 21.0, 23.0, 30.0, 30.0, 36.0, 23.0, 30.0, 38.0, 47.0, 50.0, 41.0, 51.0, 49.0, 53.0, 38.0, 36.0, 30.0, 27.0, 19.0, 29.0, 20.0, 28.0, 26.0, 10.0, 21.0, 11.0, 10.0, 4.0, 3.0, 4.0, 5.0, 3.0, 8.0, 5.0, 1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.061321258544922, -3.908433437347412, -3.7555456161499023, -3.6026580333709717, -3.449770212173462, -3.296882390975952, -3.1439948081970215, -2.9911069869995117, -2.838219165802002, -2.685331344604492, -2.5324435234069824, -2.3795559406280518, -2.226668119430542, -2.0737802982330322, -1.920892596244812, -1.7680048942565918, -1.615117073059082, -1.4622292518615723, -1.309341549873352, -1.1564538478851318, -1.003566026687622, -0.8506782650947571, -0.6977905035018921, -0.5449028015136719, -0.3920149803161621, -0.23912721872329712, -0.08623945713043213, 0.06664830446243286, 0.21953606605529785, 0.37242382764816284, 0.5253115892410278, 0.678199291229248, 0.831087589263916, 0.983975350856781, 1.136863112449646, 1.2897508144378662, 1.442638635635376, 1.5955264568328857, 1.748414158821106, 1.9013018608093262, 2.054189682006836, 2.2070775032043457, 2.3599653244018555, 2.512852907180786, 2.665740728378296, 2.8186285495758057, 2.9715161323547363, 3.124403953552246, 3.277291774749756, 3.4301795959472656, 3.5830674171447754, 3.735954999923706, 3.888842821121216, 4.0417304039001465, 4.194618225097656, 4.347506046295166, 4.500393867492676, 4.6532816886901855, 4.806169509887695, 4.959057331085205, 5.111945152282715, 5.264832496643066, 5.417720317840576, 5.570608139038086, 5.723495960235596]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 6.0, 13.0, 10.0, 17.0, 35.0, 48.0, 60.0, 100.0, 150.0, 219.0, 322.0, 493.0, 653.0, 1055.0, 1568.0, 2341.0, 3776.0, 5988.0, 9676.0, 16640.0, 30403.0, 58047.0, 119266.0, 270006.0, 651804.0, 1222497.0, 990234.0, 441517.0, 185696.0, 84057.0, 41843.0, 22025.0, 12476.0, 7308.0, 4565.0, 2990.0, 1888.0, 1349.0, 987.0, 635.0, 422.0, 301.0, 224.0, 153.0, 129.0, 97.0, 57.0, 40.0, 33.0, 24.0, 16.0, 5.0, 9.0, 8.0, 4.0, 0.0, 4.0, 2.0, 4.0, 4.0], "bins": [-4.875, -4.71124267578125, -4.5474853515625, -4.38372802734375, -4.219970703125, -4.05621337890625, -3.8924560546875, -3.72869873046875, -3.56494140625, -3.40118408203125, -3.2374267578125, -3.07366943359375, -2.909912109375, -2.74615478515625, -2.5823974609375, -2.41864013671875, -2.2548828125, -2.09112548828125, -1.9273681640625, -1.76361083984375, -1.599853515625, -1.43609619140625, -1.2723388671875, -1.10858154296875, -0.94482421875, -0.78106689453125, -0.6173095703125, -0.45355224609375, -0.289794921875, -0.12603759765625, 0.0377197265625, 0.20147705078125, 0.365234375, 0.52899169921875, 0.6927490234375, 0.85650634765625, 1.020263671875, 1.18402099609375, 1.3477783203125, 1.51153564453125, 1.67529296875, 1.83905029296875, 2.0028076171875, 2.16656494140625, 2.330322265625, 2.49407958984375, 2.6578369140625, 2.82159423828125, 2.9853515625, 3.14910888671875, 3.3128662109375, 3.47662353515625, 3.640380859375, 3.80413818359375, 3.9678955078125, 4.13165283203125, 4.29541015625, 4.45916748046875, 4.6229248046875, 4.78668212890625, 4.950439453125, 5.11419677734375, 5.2779541015625, 5.44171142578125, 5.60546875]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 6.0, 3.0, 4.0, 2.0, 8.0, 8.0, 10.0, 12.0, 15.0, 19.0, 20.0, 25.0, 23.0, 18.0, 29.0, 38.0, 24.0, 39.0, 37.0, 46.0, 42.0, 41.0, 40.0, 48.0, 56.0, 53.0, 37.0, 46.0, 29.0, 34.0, 28.0, 21.0, 28.0, 19.0, 18.0, 20.0, 12.0, 9.0, 9.0, 9.0, 5.0, 5.0, 2.0, 4.0, 0.0, 5.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.666015625, -2.561737060546875, -2.45745849609375, -2.353179931640625, -2.2489013671875, -2.144622802734375, -2.04034423828125, -1.936065673828125, -1.831787109375, -1.727508544921875, -1.62322998046875, -1.518951416015625, -1.4146728515625, -1.310394287109375, -1.20611572265625, -1.101837158203125, -0.99755859375, -0.893280029296875, -0.78900146484375, -0.684722900390625, -0.5804443359375, -0.476165771484375, -0.37188720703125, -0.267608642578125, -0.163330078125, -0.059051513671875, 0.04522705078125, 0.149505615234375, 0.2537841796875, 0.358062744140625, 0.46234130859375, 0.566619873046875, 0.6708984375, 0.775177001953125, 0.87945556640625, 0.983734130859375, 1.0880126953125, 1.192291259765625, 1.29656982421875, 1.400848388671875, 1.505126953125, 1.609405517578125, 1.71368408203125, 1.817962646484375, 1.9222412109375, 2.026519775390625, 2.13079833984375, 2.235076904296875, 2.33935546875, 2.443634033203125, 2.54791259765625, 2.652191162109375, 2.7564697265625, 2.860748291015625, 2.96502685546875, 3.069305419921875, 3.173583984375, 3.277862548828125, 3.38214111328125, 3.486419677734375, 3.5906982421875, 3.694976806640625, 3.79925537109375, 3.903533935546875, 4.0078125]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 9.0, 10.0, 24.0, 29.0, 30.0, 65.0, 94.0, 190.0, 288.0, 462.0, 917.0, 1597.0, 2954.0, 5812.0, 11540.0, 24907.0, 55848.0, 134067.0, 336429.0, 808352.0, 1290981.0, 882447.0, 372921.0, 148379.0, 62014.0, 27655.0, 12901.0, 6220.0, 3152.0, 1720.0, 964.0, 514.0, 328.0, 169.0, 121.0, 52.0, 46.0, 25.0, 13.0, 13.0, 9.0, 5.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.4609375, -6.27923583984375, -6.0975341796875, -5.91583251953125, -5.734130859375, -5.55242919921875, -5.3707275390625, -5.18902587890625, -5.00732421875, -4.82562255859375, -4.6439208984375, -4.46221923828125, -4.280517578125, -4.09881591796875, -3.9171142578125, -3.73541259765625, -3.5537109375, -3.37200927734375, -3.1903076171875, -3.00860595703125, -2.826904296875, -2.64520263671875, -2.4635009765625, -2.28179931640625, -2.10009765625, -1.91839599609375, -1.7366943359375, -1.55499267578125, -1.373291015625, -1.19158935546875, -1.0098876953125, -0.82818603515625, -0.646484375, -0.46478271484375, -0.2830810546875, -0.10137939453125, 0.080322265625, 0.26202392578125, 0.4437255859375, 0.62542724609375, 0.80712890625, 0.98883056640625, 1.1705322265625, 1.35223388671875, 1.533935546875, 1.71563720703125, 1.8973388671875, 2.07904052734375, 2.2607421875, 2.44244384765625, 2.6241455078125, 2.80584716796875, 2.987548828125, 3.16925048828125, 3.3509521484375, 3.53265380859375, 3.71435546875, 3.89605712890625, 4.0777587890625, 4.25946044921875, 4.441162109375, 4.62286376953125, 4.8045654296875, 4.98626708984375, 5.16796875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 6.0, 6.0, 5.0, 14.0, 27.0, 20.0, 33.0, 33.0, 46.0, 65.0, 70.0, 66.0, 108.0, 134.0, 132.0, 159.0, 204.0, 190.0, 245.0, 254.0, 247.0, 271.0, 239.0, 236.0, 211.0, 176.0, 155.0, 130.0, 106.0, 82.0, 73.0, 69.0, 53.0, 45.0, 32.0, 25.0, 30.0, 18.0, 7.0, 7.0, 7.0, 7.0, 8.0, 3.0, 0.0, 5.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.6923828125, -1.64129638671875, -1.5902099609375, -1.53912353515625, -1.488037109375, -1.43695068359375, -1.3858642578125, -1.33477783203125, -1.28369140625, -1.23260498046875, -1.1815185546875, -1.13043212890625, -1.079345703125, -1.02825927734375, -0.9771728515625, -0.92608642578125, -0.875, -0.82391357421875, -0.7728271484375, -0.72174072265625, -0.670654296875, -0.61956787109375, -0.5684814453125, -0.51739501953125, -0.46630859375, -0.41522216796875, -0.3641357421875, -0.31304931640625, -0.261962890625, -0.21087646484375, -0.1597900390625, -0.10870361328125, -0.0576171875, -0.00653076171875, 0.0445556640625, 0.09564208984375, 0.146728515625, 0.19781494140625, 0.2489013671875, 0.29998779296875, 0.35107421875, 0.40216064453125, 0.4532470703125, 0.50433349609375, 0.555419921875, 0.60650634765625, 0.6575927734375, 0.70867919921875, 0.759765625, 0.81085205078125, 0.8619384765625, 0.91302490234375, 0.964111328125, 1.01519775390625, 1.0662841796875, 1.11737060546875, 1.16845703125, 1.21954345703125, 1.2706298828125, 1.32171630859375, 1.372802734375, 1.42388916015625, 1.4749755859375, 1.52606201171875, 1.5771484375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 2.0, 9.0, 5.0, 16.0, 22.0, 22.0, 31.0, 39.0, 53.0, 49.0, 72.0, 80.0, 85.0, 85.0, 81.0, 83.0, 55.0, 51.0, 46.0, 25.0, 23.0, 17.0, 12.0, 6.0, 9.0, 8.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.294277191162109, -4.1091084480285645, -3.9239397048950195, -3.7387712001800537, -3.553602457046509, -3.368433713912964, -3.183265209197998, -2.998096466064453, -2.812927722930908, -2.6277589797973633, -2.4425902366638184, -2.2574217319488525, -2.0722529888153076, -1.8870842456817627, -1.7019156217575073, -1.516746997833252, -1.331578254699707, -1.146409511566162, -0.9612408876419067, -0.7760722041130066, -0.5909035205841064, -0.4057348370552063, -0.22056615352630615, -0.03539752960205078, 0.14977121353149414, 0.3349398970603943, 0.5201085805892944, 0.7052772641181946, 0.8904459476470947, 1.0756146907806396, 1.260783314704895, 1.4459519386291504, 1.6311206817626953, 1.8162894248962402, 2.001458168029785, 2.186626672744751, 2.371795415878296, 2.556964159011841, 2.7421326637268066, 2.9273014068603516, 3.1124701499938965, 3.2976388931274414, 3.4828076362609863, 3.667976140975952, 3.853144884109497, 4.038313388824463, 4.223482131958008, 4.408650875091553, 4.593819618225098, 4.778988361358643, 4.9641571044921875, 5.149325847625732, 5.334494590759277, 5.519662857055664, 5.704831600189209, 5.890000343322754, 6.075169086456299, 6.260337829589844, 6.445506572723389, 6.630675315856934, 6.81584358215332, 7.001012325286865, 7.18618106842041, 7.371349811553955, 7.5565185546875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 6.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 9.0, 10.0, 9.0, 13.0, 9.0, 13.0, 8.0, 21.0, 21.0, 32.0, 16.0, 27.0, 38.0, 36.0, 25.0, 35.0, 38.0, 38.0, 42.0, 50.0, 39.0, 40.0, 42.0, 36.0, 42.0, 33.0, 31.0, 31.0, 31.0, 32.0, 23.0, 16.0, 20.0, 10.0, 9.0, 9.0, 10.0, 9.0, 11.0, 5.0, 4.0, 2.0, 3.0, 4.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.8116629123687744, -3.676187515258789, -3.5407118797302246, -3.4052364826202393, -3.269761085510254, -3.1342854499816895, -2.998810052871704, -2.8633346557617188, -2.7278590202331543, -2.592383623123169, -2.4569079875946045, -2.321432590484619, -2.185957193374634, -2.0504817962646484, -1.915006160736084, -1.7795307636260986, -1.6440553665161133, -1.5085798501968384, -1.373104453086853, -1.2376289367675781, -1.1021535396575928, -0.9666780233383179, -0.831202507019043, -0.6957270503044128, -0.5602515935897827, -0.4247761368751526, -0.2893006503582001, -0.15382516384124756, -0.01834970712661743, 0.1171257495880127, 0.2526012659072876, 0.3880767226219177, 0.523552417755127, 0.6590278744697571, 0.7945033311843872, 0.9299788475036621, 1.0654542446136475, 1.2009297609329224, 1.3364052772521973, 1.4718806743621826, 1.6073561906814575, 1.7428317070007324, 1.8783071041107178, 2.013782501220703, 2.1492581367492676, 2.284733533859253, 2.4202089309692383, 2.5556845664978027, 2.691159963607788, 2.8266353607177734, 2.962110996246338, 3.0975863933563232, 3.2330617904663086, 3.368537425994873, 3.5040128231048584, 3.6394882202148438, 3.774963855743408, 3.9104392528533936, 4.045914649963379, 4.181390285491943, 4.316865921020508, 4.452341079711914, 4.5878167152404785, 4.723292350769043, 4.858767509460449]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 3.0, 2.0, 7.0, 7.0, 12.0, 24.0, 26.0, 43.0, 63.0, 62.0, 99.0, 186.0, 301.0, 442.0, 729.0, 1333.0, 2276.0, 4054.0, 7967.0, 15844.0, 34005.0, 82440.0, 222934.0, 381447.0, 172608.0, 65612.0, 27838.0, 13110.0, 6663.0, 3627.0, 1921.0, 1057.0, 692.0, 388.0, 248.0, 142.0, 110.0, 66.0, 54.0, 36.0, 16.0, 20.0, 11.0, 11.0, 6.0, 5.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7744140625, -1.7071380615234375, -1.639862060546875, -1.5725860595703125, -1.50531005859375, -1.4380340576171875, -1.370758056640625, -1.3034820556640625, -1.2362060546875, -1.1689300537109375, -1.101654052734375, -1.0343780517578125, -0.96710205078125, -0.8998260498046875, -0.832550048828125, -0.7652740478515625, -0.697998046875, -0.6307220458984375, -0.563446044921875, -0.4961700439453125, -0.42889404296875, -0.3616180419921875, -0.294342041015625, -0.2270660400390625, -0.1597900390625, -0.0925140380859375, -0.025238037109375, 0.0420379638671875, 0.10931396484375, 0.1765899658203125, 0.243865966796875, 0.3111419677734375, 0.37841796875, 0.4456939697265625, 0.512969970703125, 0.5802459716796875, 0.64752197265625, 0.7147979736328125, 0.782073974609375, 0.8493499755859375, 0.9166259765625, 0.9839019775390625, 1.051177978515625, 1.1184539794921875, 1.18572998046875, 1.2530059814453125, 1.320281982421875, 1.3875579833984375, 1.454833984375, 1.5221099853515625, 1.589385986328125, 1.6566619873046875, 1.72393798828125, 1.7912139892578125, 1.858489990234375, 1.9257659912109375, 1.9930419921875, 2.0603179931640625, 2.127593994140625, 2.1948699951171875, 2.26214599609375, 2.3294219970703125, 2.396697998046875, 2.4639739990234375, 2.53125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 7.0, 6.0, 5.0, 9.0, 12.0, 9.0, 11.0, 13.0, 18.0, 12.0, 34.0, 19.0, 29.0, 32.0, 34.0, 39.0, 42.0, 35.0, 31.0, 53.0, 63.0, 39.0, 46.0, 32.0, 47.0, 50.0, 38.0, 29.0, 39.0, 27.0, 22.0, 22.0, 16.0, 12.0, 11.0, 10.0, 12.0, 8.0, 4.0, 8.0, 8.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.17578125, -4.02606201171875, -3.8763427734375, -3.72662353515625, -3.576904296875, -3.42718505859375, -3.2774658203125, -3.12774658203125, -2.97802734375, -2.82830810546875, -2.6785888671875, -2.52886962890625, -2.379150390625, -2.22943115234375, -2.0797119140625, -1.92999267578125, -1.7802734375, -1.63055419921875, -1.4808349609375, -1.33111572265625, -1.181396484375, -1.03167724609375, -0.8819580078125, -0.73223876953125, -0.58251953125, -0.43280029296875, -0.2830810546875, -0.13336181640625, 0.016357421875, 0.16607666015625, 0.3157958984375, 0.46551513671875, 0.615234375, 0.76495361328125, 0.9146728515625, 1.06439208984375, 1.214111328125, 1.36383056640625, 1.5135498046875, 1.66326904296875, 1.81298828125, 1.96270751953125, 2.1124267578125, 2.26214599609375, 2.411865234375, 2.56158447265625, 2.7113037109375, 2.86102294921875, 3.0107421875, 3.16046142578125, 3.3101806640625, 3.45989990234375, 3.609619140625, 3.75933837890625, 3.9090576171875, 4.05877685546875, 4.20849609375, 4.35821533203125, 4.5079345703125, 4.65765380859375, 4.807373046875, 4.95709228515625, 5.1068115234375, 5.25653076171875, 5.40625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 7.0, 13.0, 12.0, 23.0, 16.0, 20.0, 32.0, 55.0, 53.0, 94.0, 105.0, 159.0, 225.0, 288.0, 425.0, 649.0, 1131.0, 1934.0, 3965.0, 9353.0, 26607.0, 903022.0, 68126.0, 17956.0, 6780.0, 3041.0, 1610.0, 886.0, 603.0, 373.0, 242.0, 178.0, 164.0, 97.0, 71.0, 54.0, 51.0, 29.0, 25.0, 18.0, 17.0, 13.0, 15.0, 6.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.32421875, -4.1839599609375, -4.043701171875, -3.9034423828125, -3.76318359375, -3.6229248046875, -3.482666015625, -3.3424072265625, -3.2021484375, -3.0618896484375, -2.921630859375, -2.7813720703125, -2.64111328125, -2.5008544921875, -2.360595703125, -2.2203369140625, -2.080078125, -1.9398193359375, -1.799560546875, -1.6593017578125, -1.51904296875, -1.3787841796875, -1.238525390625, -1.0982666015625, -0.9580078125, -0.8177490234375, -0.677490234375, -0.5372314453125, -0.39697265625, -0.2567138671875, -0.116455078125, 0.0238037109375, 0.1640625, 0.3043212890625, 0.444580078125, 0.5848388671875, 0.72509765625, 0.8653564453125, 1.005615234375, 1.1458740234375, 1.2861328125, 1.4263916015625, 1.566650390625, 1.7069091796875, 1.84716796875, 1.9874267578125, 2.127685546875, 2.2679443359375, 2.408203125, 2.5484619140625, 2.688720703125, 2.8289794921875, 2.96923828125, 3.1094970703125, 3.249755859375, 3.3900146484375, 3.5302734375, 3.6705322265625, 3.810791015625, 3.9510498046875, 4.09130859375, 4.2315673828125, 4.371826171875, 4.5120849609375, 4.65234375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 4.0, 7.0, 5.0, 10.0, 11.0, 8.0, 19.0, 20.0, 15.0, 21.0, 20.0, 31.0, 38.0, 28.0, 43.0, 43.0, 32.0, 49.0, 29.0, 43.0, 46.0, 50.0, 48.0, 33.0, 39.0, 28.0, 34.0, 38.0, 32.0, 31.0, 20.0, 21.0, 19.0, 17.0, 15.0, 13.0, 3.0, 10.0, 6.0, 4.0, 7.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.875, -2.78125, -2.6875, -2.59375, -2.5, -2.40625, -2.3125, -2.21875, -2.125, -2.03125, -1.9375, -1.84375, -1.75, -1.65625, -1.5625, -1.46875, -1.375, -1.28125, -1.1875, -1.09375, -1.0, -0.90625, -0.8125, -0.71875, -0.625, -0.53125, -0.4375, -0.34375, -0.25, -0.15625, -0.0625, 0.03125, 0.125, 0.21875, 0.3125, 0.40625, 0.5, 0.59375, 0.6875, 0.78125, 0.875, 0.96875, 1.0625, 1.15625, 1.25, 1.34375, 1.4375, 1.53125, 1.625, 1.71875, 1.8125, 1.90625, 2.0, 2.09375, 2.1875, 2.28125, 2.375, 2.46875, 2.5625, 2.65625, 2.75, 2.84375, 2.9375, 3.03125, 3.125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 5.0, 4.0, 10.0, 11.0, 11.0, 14.0, 21.0, 36.0, 34.0, 76.0, 81.0, 94.0, 143.0, 216.0, 305.0, 412.0, 625.0, 1013.0, 1636.0, 3007.0, 6158.0, 15560.0, 70609.0, 910404.0, 21369.0, 7777.0, 3540.0, 1883.0, 1142.0, 718.0, 457.0, 366.0, 222.0, 133.0, 122.0, 84.0, 70.0, 47.0, 40.0, 24.0, 16.0, 10.0, 12.0, 8.0, 6.0, 8.0, 2.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.341064453125, -0.33045196533203125, -0.3198394775390625, -0.30922698974609375, -0.298614501953125, -0.28800201416015625, -0.2773895263671875, -0.26677703857421875, -0.25616455078125, -0.24555206298828125, -0.2349395751953125, -0.22432708740234375, -0.213714599609375, -0.20310211181640625, -0.1924896240234375, -0.18187713623046875, -0.1712646484375, -0.16065216064453125, -0.1500396728515625, -0.13942718505859375, -0.128814697265625, -0.11820220947265625, -0.1075897216796875, -0.09697723388671875, -0.08636474609375, -0.07575225830078125, -0.0651397705078125, -0.05452728271484375, -0.043914794921875, -0.03330230712890625, -0.0226898193359375, -0.01207733154296875, -0.00146484375, 0.00914764404296875, 0.0197601318359375, 0.03037261962890625, 0.040985107421875, 0.05159759521484375, 0.0622100830078125, 0.07282257080078125, 0.08343505859375, 0.09404754638671875, 0.1046600341796875, 0.11527252197265625, 0.125885009765625, 0.13649749755859375, 0.1471099853515625, 0.15772247314453125, 0.1683349609375, 0.17894744873046875, 0.1895599365234375, 0.20017242431640625, 0.210784912109375, 0.22139739990234375, 0.2320098876953125, 0.24262237548828125, 0.25323486328125, 0.26384735107421875, 0.2744598388671875, 0.28507232666015625, 0.295684814453125, 0.30629730224609375, 0.3169097900390625, 0.32752227783203125, 0.338134765625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 3.0, 6.0, 2.0, 6.0, 9.0, 9.0, 7.0, 8.0, 9.0, 15.0, 22.0, 23.0, 12.0, 30.0, 39.0, 14.0, 36.0, 40.0, 47.0, 34.0, 45.0, 43.0, 59.0, 51.0, 50.0, 40.0, 38.0, 51.0, 33.0, 29.0, 30.0, 26.0, 14.0, 21.0, 22.0, 12.0, 13.0, 15.0, 4.0, 11.0, 7.0, 6.0, 2.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.528594970703125e-05, -3.4195370972156525e-05, -3.31047922372818e-05, -3.2014213502407074e-05, -3.092363476753235e-05, -2.9833056032657623e-05, -2.8742477297782898e-05, -2.7651898562908173e-05, -2.6561319828033447e-05, -2.5470741093158722e-05, -2.4380162358283997e-05, -2.328958362340927e-05, -2.2199004888534546e-05, -2.110842615365982e-05, -2.0017847418785095e-05, -1.892726868391037e-05, -1.7836689949035645e-05, -1.674611121416092e-05, -1.5655532479286194e-05, -1.4564953744411469e-05, -1.3474375009536743e-05, -1.2383796274662018e-05, -1.1293217539787292e-05, -1.0202638804912567e-05, -9.112060070037842e-06, -8.021481335163116e-06, -6.930902600288391e-06, -5.840323865413666e-06, -4.7497451305389404e-06, -3.659166395664215e-06, -2.5685876607894897e-06, -1.4780089259147644e-06, -3.8743019104003906e-07, 7.031485438346863e-07, 1.7937272787094116e-06, 2.884306013584137e-06, 3.974884748458862e-06, 5.065463483333588e-06, 6.156042218208313e-06, 7.246620953083038e-06, 8.337199687957764e-06, 9.427778422832489e-06, 1.0518357157707214e-05, 1.160893589258194e-05, 1.2699514627456665e-05, 1.379009336233139e-05, 1.4880672097206116e-05, 1.597125083208084e-05, 1.7061829566955566e-05, 1.8152408301830292e-05, 1.9242987036705017e-05, 2.0333565771579742e-05, 2.1424144506454468e-05, 2.2514723241329193e-05, 2.360530197620392e-05, 2.4695880711078644e-05, 2.578645944595337e-05, 2.6877038180828094e-05, 2.796761691570282e-05, 2.9058195650577545e-05, 3.014877438545227e-05, 3.1239353120326996e-05, 3.232993185520172e-05, 3.3420510590076447e-05, 3.451108932495117e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 7.0, 4.0, 6.0, 15.0, 21.0, 22.0, 28.0, 45.0, 61.0, 101.0, 158.0, 222.0, 319.0, 473.0, 666.0, 924.0, 1536.0, 2420.0, 3756.0, 5921.0, 10267.0, 18015.0, 33885.0, 73410.0, 203557.0, 413586.0, 151600.0, 59333.0, 28864.0, 15529.0, 8851.0, 5253.0, 3287.0, 2086.0, 1451.0, 933.0, 625.0, 419.0, 287.0, 226.0, 126.0, 77.0, 54.0, 43.0, 40.0, 19.0, 10.0, 4.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.1571044921875, -0.15239715576171875, -0.1476898193359375, -0.14298248291015625, -0.138275146484375, -0.13356781005859375, -0.1288604736328125, -0.12415313720703125, -0.11944580078125, -0.11473846435546875, -0.1100311279296875, -0.10532379150390625, -0.100616455078125, -0.09590911865234375, -0.0912017822265625, -0.08649444580078125, -0.081787109375, -0.07707977294921875, -0.0723724365234375, -0.06766510009765625, -0.062957763671875, -0.05825042724609375, -0.0535430908203125, -0.04883575439453125, -0.04412841796875, -0.03942108154296875, -0.0347137451171875, -0.03000640869140625, -0.025299072265625, -0.02059173583984375, -0.0158843994140625, -0.01117706298828125, -0.0064697265625, -0.00176239013671875, 0.0029449462890625, 0.00765228271484375, 0.012359619140625, 0.01706695556640625, 0.0217742919921875, 0.02648162841796875, 0.03118896484375, 0.03589630126953125, 0.0406036376953125, 0.04531097412109375, 0.050018310546875, 0.05472564697265625, 0.0594329833984375, 0.06414031982421875, 0.06884765625, 0.07355499267578125, 0.0782623291015625, 0.08296966552734375, 0.087677001953125, 0.09238433837890625, 0.0970916748046875, 0.10179901123046875, 0.10650634765625, 0.11121368408203125, 0.1159210205078125, 0.12062835693359375, 0.125335693359375, 0.13004302978515625, 0.1347503662109375, 0.13945770263671875, 0.1441650390625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 9.0, 7.0, 13.0, 15.0, 29.0, 40.0, 51.0, 82.0, 143.0, 177.0, 153.0, 105.0, 65.0, 37.0, 18.0, 15.0, 11.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09051513671875, -0.08803653717041016, -0.08555793762207031, -0.08307933807373047, -0.08060073852539062, -0.07812213897705078, -0.07564353942871094, -0.0731649398803711, -0.07068634033203125, -0.0682077407836914, -0.06572914123535156, -0.06325054168701172, -0.060771942138671875, -0.05829334259033203, -0.05581474304199219, -0.053336143493652344, -0.0508575439453125, -0.048378944396972656, -0.04590034484863281, -0.04342174530029297, -0.040943145751953125, -0.03846454620361328, -0.03598594665527344, -0.033507347106933594, -0.03102874755859375, -0.028550148010253906, -0.026071548461914062, -0.02359294891357422, -0.021114349365234375, -0.01863574981689453, -0.016157150268554688, -0.013678550720214844, -0.011199951171875, -0.008721351623535156, -0.0062427520751953125, -0.0037641525268554688, -0.001285552978515625, 0.0011930465698242188, 0.0036716461181640625, 0.006150245666503906, 0.00862884521484375, 0.011107444763183594, 0.013586044311523438, 0.01606464385986328, 0.018543243408203125, 0.02102184295654297, 0.023500442504882812, 0.025979042053222656, 0.0284576416015625, 0.030936241149902344, 0.03341484069824219, 0.03589344024658203, 0.038372039794921875, 0.04085063934326172, 0.04332923889160156, 0.045807838439941406, 0.04828643798828125, 0.050765037536621094, 0.05324363708496094, 0.05572223663330078, 0.058200836181640625, 0.06067943572998047, 0.06315803527832031, 0.06563663482666016, 0.068115234375]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 6.0, 8.0, 8.0, 10.0, 24.0, 24.0, 29.0, 31.0, 53.0, 60.0, 62.0, 88.0, 85.0, 80.0, 86.0, 81.0, 57.0, 42.0, 50.0, 34.0, 16.0, 16.0, 13.0, 10.0, 6.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.220959663391113, -4.0385003089904785, -3.8560404777526855, -3.673581123352051, -3.491121292114258, -3.308661937713623, -3.126202344894409, -2.9437427520751953, -2.7612831592559814, -2.5788235664367676, -2.3963639736175537, -2.21390438079834, -2.031445026397705, -1.8489853143692017, -1.6665258407592773, -1.4840662479400635, -1.3016066551208496, -1.1191470623016357, -0.9366875290870667, -0.7542279958724976, -0.5717684030532837, -0.3893088102340698, -0.2068493366241455, -0.02438974380493164, 0.15806984901428223, 0.3405294120311737, 0.5229889750480652, 0.7054485082626343, 0.8879081010818481, 1.070367693901062, 1.2528271675109863, 1.4352867603302002, 1.6177458763122559, 1.8002054691314697, 1.9826650619506836, 2.1651244163513184, 2.3475842475891113, 2.530043601989746, 2.71250319480896, 2.894962787628174, 3.0774223804473877, 3.2598819732666016, 3.4423415660858154, 3.6248011589050293, 3.807260513305664, 3.989720344543457, 4.172179698944092, 4.354639053344727, 4.5370988845825195, 4.719558238983154, 4.902018070220947, 5.084477424621582, 5.266937255859375, 5.44939661026001, 5.6318559646606445, 5.8143157958984375, 5.9967756271362305, 6.179234981536865, 6.361694812774658, 6.544154167175293, 6.726613998413086, 6.909073352813721, 7.0915327072143555, 7.273992538452148, 7.456451892852783]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 3.0, 4.0, 2.0, 3.0, 5.0, 8.0, 10.0, 9.0, 13.0, 11.0, 11.0, 8.0, 21.0, 22.0, 31.0, 17.0, 30.0, 35.0, 36.0, 25.0, 35.0, 38.0, 36.0, 46.0, 47.0, 40.0, 40.0, 42.0, 35.0, 43.0, 34.0, 29.0, 32.0, 31.0, 33.0, 23.0, 15.0, 18.0, 11.0, 8.0, 11.0, 9.0, 10.0, 11.0, 5.0, 3.0, 3.0, 2.0, 4.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.7671401500701904, -3.632723331451416, -3.4983067512512207, -3.3638899326324463, -3.229473352432251, -3.0950565338134766, -2.9606399536132812, -2.826223134994507, -2.6918063163757324, -2.557389497756958, -2.4229729175567627, -2.2885560989379883, -2.154139518737793, -2.0197227001190186, -1.8853060007095337, -1.7508893013000488, -1.6164727210998535, -1.4820560216903687, -1.3476393222808838, -1.2132225036621094, -1.078805923461914, -0.9443891644477844, -0.8099724054336548, -0.6755557060241699, -0.5411390066146851, -0.4067223072052002, -0.27230557799339294, -0.1378888487815857, -0.00347214937210083, 0.13094455003738403, 0.26536130905151367, 0.39977800846099854, 0.5341944694519043, 0.6686111688613892, 0.803027868270874, 0.9374446272850037, 1.0718612670898438, 1.2062780857086182, 1.340694785118103, 1.475111484527588, 1.6095281839370728, 1.7439448833465576, 1.8783615827560425, 2.0127782821655273, 2.1471951007843018, 2.281611680984497, 2.4160284996032715, 2.550445079803467, 2.684861898422241, 2.8192787170410156, 2.953695297241211, 3.0881121158599854, 3.2225286960601807, 3.356945514678955, 3.4913620948791504, 3.625778913497925, 3.760195732116699, 3.8946125507354736, 4.029029369354248, 4.163445949554443, 4.297862529754639, 4.432279109954834, 4.5666961669921875, 4.701112747192383, 4.835529327392578]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 10.0, 8.0, 17.0, 18.0, 27.0, 57.0, 90.0, 124.0, 208.0, 310.0, 488.0, 703.0, 1126.0, 1714.0, 2842.0, 4606.0, 7568.0, 12760.0, 21946.0, 37274.0, 64826.0, 108521.0, 165230.0, 194523.0, 162872.0, 107222.0, 63476.0, 36474.0, 21409.0, 12393.0, 7455.0, 4554.0, 2845.0, 1770.0, 1095.0, 709.0, 417.0, 294.0, 193.0, 119.0, 80.0, 62.0, 40.0, 26.0, 18.0, 9.0, 15.0, 6.0, 2.0, 1.0, 2.0, 3.0], "bins": [-4.6171875, -4.487060546875, -4.35693359375, -4.226806640625, -4.0966796875, -3.966552734375, -3.83642578125, -3.706298828125, -3.576171875, -3.446044921875, -3.31591796875, -3.185791015625, -3.0556640625, -2.925537109375, -2.79541015625, -2.665283203125, -2.53515625, -2.405029296875, -2.27490234375, -2.144775390625, -2.0146484375, -1.884521484375, -1.75439453125, -1.624267578125, -1.494140625, -1.364013671875, -1.23388671875, -1.103759765625, -0.9736328125, -0.843505859375, -0.71337890625, -0.583251953125, -0.453125, -0.322998046875, -0.19287109375, -0.062744140625, 0.0673828125, 0.197509765625, 0.32763671875, 0.457763671875, 0.587890625, 0.718017578125, 0.84814453125, 0.978271484375, 1.1083984375, 1.238525390625, 1.36865234375, 1.498779296875, 1.62890625, 1.759033203125, 1.88916015625, 2.019287109375, 2.1494140625, 2.279541015625, 2.40966796875, 2.539794921875, 2.669921875, 2.800048828125, 2.93017578125, 3.060302734375, 3.1904296875, 3.320556640625, 3.45068359375, 3.580810546875, 3.7109375]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 11.0, 5.0, 10.0, 18.0, 6.0, 10.0, 19.0, 12.0, 27.0, 28.0, 30.0, 26.0, 28.0, 34.0, 30.0, 43.0, 36.0, 40.0, 47.0, 41.0, 42.0, 48.0, 37.0, 35.0, 34.0, 47.0, 28.0, 41.0, 27.0, 28.0, 19.0, 11.0, 11.0, 14.0, 9.0, 7.0, 11.0, 8.0, 6.0, 5.0, 5.0, 2.0, 1.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.89453125, -3.75836181640625, -3.6221923828125, -3.48602294921875, -3.349853515625, -3.21368408203125, -3.0775146484375, -2.94134521484375, -2.80517578125, -2.66900634765625, -2.5328369140625, -2.39666748046875, -2.260498046875, -2.12432861328125, -1.9881591796875, -1.85198974609375, -1.7158203125, -1.57965087890625, -1.4434814453125, -1.30731201171875, -1.171142578125, -1.03497314453125, -0.8988037109375, -0.76263427734375, -0.62646484375, -0.49029541015625, -0.3541259765625, -0.21795654296875, -0.081787109375, 0.05438232421875, 0.1905517578125, 0.32672119140625, 0.462890625, 0.59906005859375, 0.7352294921875, 0.87139892578125, 1.007568359375, 1.14373779296875, 1.2799072265625, 1.41607666015625, 1.55224609375, 1.68841552734375, 1.8245849609375, 1.96075439453125, 2.096923828125, 2.23309326171875, 2.3692626953125, 2.50543212890625, 2.6416015625, 2.77777099609375, 2.9139404296875, 3.05010986328125, 3.186279296875, 3.32244873046875, 3.4586181640625, 3.59478759765625, 3.73095703125, 3.86712646484375, 4.0032958984375, 4.13946533203125, 4.275634765625, 4.41180419921875, 4.5479736328125, 4.68414306640625, 4.8203125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 10.0, 8.0, 29.0, 39.0, 62.0, 75.0, 106.0, 214.0, 299.0, 616.0, 1033.0, 1984.0, 3723.0, 7140.0, 14522.0, 29081.0, 58421.0, 113524.0, 197207.0, 239111.0, 179437.0, 99700.0, 50948.0, 25172.0, 12686.0, 6192.0, 3259.0, 1762.0, 916.0, 494.0, 295.0, 193.0, 95.0, 72.0, 44.0, 31.0, 14.0, 12.0, 12.0, 3.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.2265625, -5.070068359375, -4.91357421875, -4.757080078125, -4.6005859375, -4.444091796875, -4.28759765625, -4.131103515625, -3.974609375, -3.818115234375, -3.66162109375, -3.505126953125, -3.3486328125, -3.192138671875, -3.03564453125, -2.879150390625, -2.72265625, -2.566162109375, -2.40966796875, -2.253173828125, -2.0966796875, -1.940185546875, -1.78369140625, -1.627197265625, -1.470703125, -1.314208984375, -1.15771484375, -1.001220703125, -0.8447265625, -0.688232421875, -0.53173828125, -0.375244140625, -0.21875, -0.062255859375, 0.09423828125, 0.250732421875, 0.4072265625, 0.563720703125, 0.72021484375, 0.876708984375, 1.033203125, 1.189697265625, 1.34619140625, 1.502685546875, 1.6591796875, 1.815673828125, 1.97216796875, 2.128662109375, 2.28515625, 2.441650390625, 2.59814453125, 2.754638671875, 2.9111328125, 3.067626953125, 3.22412109375, 3.380615234375, 3.537109375, 3.693603515625, 3.85009765625, 4.006591796875, 4.1630859375, 4.319580078125, 4.47607421875, 4.632568359375, 4.7890625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 7.0, 7.0, 7.0, 11.0, 11.0, 22.0, 21.0, 22.0, 25.0, 37.0, 34.0, 41.0, 29.0, 37.0, 40.0, 55.0, 55.0, 47.0, 43.0, 50.0, 53.0, 46.0, 42.0, 47.0, 37.0, 34.0, 20.0, 29.0, 29.0, 12.0, 18.0, 7.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1015625, -3.0064697265625, -2.911376953125, -2.8162841796875, -2.72119140625, -2.6260986328125, -2.531005859375, -2.4359130859375, -2.3408203125, -2.2457275390625, -2.150634765625, -2.0555419921875, -1.96044921875, -1.8653564453125, -1.770263671875, -1.6751708984375, -1.580078125, -1.4849853515625, -1.389892578125, -1.2947998046875, -1.19970703125, -1.1046142578125, -1.009521484375, -0.9144287109375, -0.8193359375, -0.7242431640625, -0.629150390625, -0.5340576171875, -0.43896484375, -0.3438720703125, -0.248779296875, -0.1536865234375, -0.05859375, 0.0364990234375, 0.131591796875, 0.2266845703125, 0.32177734375, 0.4168701171875, 0.511962890625, 0.6070556640625, 0.7021484375, 0.7972412109375, 0.892333984375, 0.9874267578125, 1.08251953125, 1.1776123046875, 1.272705078125, 1.3677978515625, 1.462890625, 1.5579833984375, 1.653076171875, 1.7481689453125, 1.84326171875, 1.9383544921875, 2.033447265625, 2.1285400390625, 2.2236328125, 2.3187255859375, 2.413818359375, 2.5089111328125, 2.60400390625, 2.6990966796875, 2.794189453125, 2.8892822265625, 2.984375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 2.0, 6.0, 2.0, 13.0, 9.0, 21.0, 21.0, 27.0, 38.0, 47.0, 74.0, 111.0, 163.0, 238.0, 363.0, 554.0, 789.0, 1192.0, 1937.0, 2927.0, 4982.0, 8415.0, 14458.0, 25520.0, 45039.0, 82159.0, 143384.0, 210707.0, 201895.0, 131613.0, 74175.0, 41352.0, 23143.0, 12911.0, 7644.0, 4675.0, 2757.0, 1773.0, 1144.0, 727.0, 488.0, 305.0, 213.0, 176.0, 107.0, 105.0, 46.0, 35.0, 18.0, 17.0, 17.0, 10.0, 3.0, 8.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0], "bins": [-1.3037109375, -1.2628631591796875, -1.222015380859375, -1.1811676025390625, -1.14031982421875, -1.0994720458984375, -1.058624267578125, -1.0177764892578125, -0.9769287109375, -0.9360809326171875, -0.895233154296875, -0.8543853759765625, -0.81353759765625, -0.7726898193359375, -0.731842041015625, -0.6909942626953125, -0.650146484375, -0.6092987060546875, -0.568450927734375, -0.5276031494140625, -0.48675537109375, -0.4459075927734375, -0.405059814453125, -0.3642120361328125, -0.3233642578125, -0.2825164794921875, -0.241668701171875, -0.2008209228515625, -0.15997314453125, -0.1191253662109375, -0.078277587890625, -0.0374298095703125, 0.00341796875, 0.0442657470703125, 0.085113525390625, 0.1259613037109375, 0.16680908203125, 0.2076568603515625, 0.248504638671875, 0.2893524169921875, 0.3302001953125, 0.3710479736328125, 0.411895751953125, 0.4527435302734375, 0.49359130859375, 0.5344390869140625, 0.575286865234375, 0.6161346435546875, 0.656982421875, 0.6978302001953125, 0.738677978515625, 0.7795257568359375, 0.82037353515625, 0.8612213134765625, 0.902069091796875, 0.9429168701171875, 0.9837646484375, 1.0246124267578125, 1.065460205078125, 1.1063079833984375, 1.14715576171875, 1.1880035400390625, 1.228851318359375, 1.2696990966796875, 1.310546875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 6.0, 8.0, 14.0, 7.0, 19.0, 7.0, 24.0, 21.0, 27.0, 33.0, 45.0, 49.0, 46.0, 50.0, 52.0, 49.0, 62.0, 65.0, 69.0, 65.0, 50.0, 37.0, 40.0, 34.0, 23.0, 21.0, 15.0, 16.0, 10.0, 7.0, 7.0, 8.0, 7.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.189678192138672e-05, -7.918942719697952e-05, -7.648207247257233e-05, -7.377471774816513e-05, -7.106736302375793e-05, -6.836000829935074e-05, -6.565265357494354e-05, -6.294529885053635e-05, -6.023794412612915e-05, -5.7530589401721954e-05, -5.482323467731476e-05, -5.211587995290756e-05, -4.9408525228500366e-05, -4.670117050409317e-05, -4.3993815779685974e-05, -4.128646105527878e-05, -3.857910633087158e-05, -3.5871751606464386e-05, -3.316439688205719e-05, -3.0457042157649994e-05, -2.7749687433242798e-05, -2.5042332708835602e-05, -2.2334977984428406e-05, -1.962762326002121e-05, -1.6920268535614014e-05, -1.4212913811206818e-05, -1.1505559086799622e-05, -8.798204362392426e-06, -6.0908496379852295e-06, -3.3834949135780334e-06, -6.761401891708374e-07, 2.0312145352363586e-06, 4.738569259643555e-06, 7.445923984050751e-06, 1.0153278708457947e-05, 1.2860633432865143e-05, 1.556798815727234e-05, 1.8275342881679535e-05, 2.098269760608673e-05, 2.3690052330493927e-05, 2.6397407054901123e-05, 2.910476177930832e-05, 3.1812116503715515e-05, 3.451947122812271e-05, 3.722682595252991e-05, 3.99341806769371e-05, 4.26415354013443e-05, 4.5348890125751495e-05, 4.805624485015869e-05, 5.076359957456589e-05, 5.3470954298973083e-05, 5.617830902338028e-05, 5.8885663747787476e-05, 6.159301847219467e-05, 6.430037319660187e-05, 6.700772792100906e-05, 6.971508264541626e-05, 7.242243736982346e-05, 7.512979209423065e-05, 7.783714681863785e-05, 8.054450154304504e-05, 8.325185626745224e-05, 8.595921099185944e-05, 8.866656571626663e-05, 9.137392044067383e-05]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 11.0, 20.0, 21.0, 39.0, 50.0, 91.0, 140.0, 219.0, 343.0, 513.0, 906.0, 1466.0, 2489.0, 4408.0, 7462.0, 13457.0, 24065.0, 44296.0, 81737.0, 146635.0, 217432.0, 207142.0, 132734.0, 73403.0, 39405.0, 21664.0, 11880.0, 6886.0, 3921.0, 2272.0, 1305.0, 838.0, 487.0, 320.0, 179.0, 111.0, 75.0, 49.0, 25.0, 23.0, 9.0, 10.0, 8.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2978515625, -1.25445556640625, -1.2110595703125, -1.16766357421875, -1.124267578125, -1.08087158203125, -1.0374755859375, -0.99407958984375, -0.95068359375, -0.90728759765625, -0.8638916015625, -0.82049560546875, -0.777099609375, -0.73370361328125, -0.6903076171875, -0.64691162109375, -0.603515625, -0.56011962890625, -0.5167236328125, -0.47332763671875, -0.429931640625, -0.38653564453125, -0.3431396484375, -0.29974365234375, -0.25634765625, -0.21295166015625, -0.1695556640625, -0.12615966796875, -0.082763671875, -0.03936767578125, 0.0040283203125, 0.04742431640625, 0.0908203125, 0.13421630859375, 0.1776123046875, 0.22100830078125, 0.264404296875, 0.30780029296875, 0.3511962890625, 0.39459228515625, 0.43798828125, 0.48138427734375, 0.5247802734375, 0.56817626953125, 0.611572265625, 0.65496826171875, 0.6983642578125, 0.74176025390625, 0.78515625, 0.82855224609375, 0.8719482421875, 0.91534423828125, 0.958740234375, 1.00213623046875, 1.0455322265625, 1.08892822265625, 1.13232421875, 1.17572021484375, 1.2191162109375, 1.26251220703125, 1.305908203125, 1.34930419921875, 1.3927001953125, 1.43609619140625, 1.4794921875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 7.0, 6.0, 13.0, 14.0, 17.0, 21.0, 21.0, 25.0, 33.0, 35.0, 42.0, 46.0, 38.0, 43.0, 58.0, 66.0, 56.0, 57.0, 49.0, 49.0, 46.0, 52.0, 25.0, 30.0, 19.0, 15.0, 18.0, 12.0, 15.0, 18.0, 10.0, 6.0, 6.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.53564453125, -0.5198326110839844, -0.5040206909179688, -0.4882087707519531, -0.4723968505859375, -0.4565849304199219, -0.44077301025390625, -0.4249610900878906, -0.409149169921875, -0.3933372497558594, -0.37752532958984375, -0.3617134094238281, -0.3459014892578125, -0.3300895690917969, -0.31427764892578125, -0.2984657287597656, -0.28265380859375, -0.2668418884277344, -0.25102996826171875, -0.23521804809570312, -0.2194061279296875, -0.20359420776367188, -0.18778228759765625, -0.17197036743164062, -0.156158447265625, -0.14034652709960938, -0.12453460693359375, -0.10872268676757812, -0.0929107666015625, -0.07709884643554688, -0.06128692626953125, -0.045475006103515625, -0.0296630859375, -0.013851165771484375, 0.00196075439453125, 0.017772674560546875, 0.0335845947265625, 0.049396514892578125, 0.06520843505859375, 0.08102035522460938, 0.096832275390625, 0.11264419555664062, 0.12845611572265625, 0.14426803588867188, 0.1600799560546875, 0.17589187622070312, 0.19170379638671875, 0.20751571655273438, 0.22332763671875, 0.23913955688476562, 0.25495147705078125, 0.2707633972167969, 0.2865753173828125, 0.3023872375488281, 0.31819915771484375, 0.3340110778808594, 0.349822998046875, 0.3656349182128906, 0.38144683837890625, 0.3972587585449219, 0.4130706787109375, 0.4288825988769531, 0.44469451904296875, 0.4605064392089844, 0.476318359375]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 3.0, 13.0, 11.0, 13.0, 30.0, 20.0, 25.0, 35.0, 59.0, 58.0, 68.0, 83.0, 80.0, 82.0, 87.0, 74.0, 38.0, 55.0, 33.0, 41.0, 16.0, 17.0, 19.0, 6.0, 7.0, 8.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.585756301879883, -4.415316104888916, -4.244875431060791, -4.074435234069824, -3.903994560241699, -3.7335543632507324, -3.5631139278411865, -3.3926734924316406, -3.2222330570220947, -3.051792621612549, -2.881352186203003, -2.710911750793457, -2.5404715538024902, -2.3700308799743652, -2.1995906829833984, -2.0291502475738525, -1.8587098121643066, -1.6882693767547607, -1.5178289413452148, -1.3473886251449585, -1.1769481897354126, -1.0065077543258667, -0.8360674381256104, -0.6656270027160645, -0.49518656730651855, -0.32474616169929504, -0.15430575609207153, 0.01613461971282959, 0.1865750551223755, 0.3570154905319214, 0.5274558067321777, 0.6978962421417236, 0.8683371543884277, 1.0387775897979736, 1.2092180252075195, 1.3796583414077759, 1.5500987768173218, 1.7205392122268677, 1.890979528427124, 2.06141996383667, 2.231860399246216, 2.4023008346557617, 2.5727412700653076, 2.7431817054748535, 2.9136219024658203, 3.0840625762939453, 3.254502773284912, 3.424943208694458, 3.595383644104004, 3.76582407951355, 3.9362645149230957, 4.1067047119140625, 4.2771453857421875, 4.447585582733154, 4.618025779724121, 4.788466453552246, 4.958907127380371, 5.129347324371338, 5.299787998199463, 5.47022819519043, 5.640668869018555, 5.8111090660095215, 5.981549263000488, 6.151989936828613, 6.32243013381958]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 3.0, 4.0, 6.0, 1.0, 1.0, 8.0, 9.0, 7.0, 9.0, 13.0, 22.0, 14.0, 14.0, 30.0, 24.0, 27.0, 36.0, 34.0, 43.0, 54.0, 31.0, 46.0, 40.0, 47.0, 37.0, 44.0, 34.0, 49.0, 42.0, 31.0, 30.0, 26.0, 29.0, 24.0, 25.0, 25.0, 16.0, 9.0, 13.0, 13.0, 4.0, 6.0, 5.0, 6.0, 4.0, 4.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8674609661102295, -3.7244491577148438, -3.581437587738037, -3.4384257793426514, -3.2954139709472656, -3.15240216255188, -3.009390354156494, -2.8663787841796875, -2.7233669757843018, -2.580355167388916, -2.4373435974121094, -2.2943317890167236, -2.151319980621338, -2.008308172225952, -1.865296483039856, -1.7222847938537598, -1.579272985458374, -1.4362611770629883, -1.293249487876892, -1.150237798690796, -1.0072259902954102, -0.8642142415046692, -0.7212024927139282, -0.578190803527832, -0.4351789951324463, -0.2921672463417053, -0.14915549755096436, -0.006143748760223389, 0.13686800003051758, 0.27987974882125854, 0.4228914976119995, 0.5659031867980957, 0.7089152336120605, 0.8519269824028015, 0.9949387311935425, 1.1379504203796387, 1.2809622287750244, 1.4239740371704102, 1.5669857263565063, 1.7099974155426025, 1.8530092239379883, 1.996021032333374, 2.1390328407287598, 2.2820444107055664, 2.425056219100952, 2.568068027496338, 2.7110795974731445, 2.8540914058685303, 2.997103214263916, 3.1401150226593018, 3.2831268310546875, 3.426138401031494, 3.56915020942688, 3.7121620178222656, 3.8551735877990723, 3.998185396194458, 4.141197204589844, 4.28420877456665, 4.427220821380615, 4.570232391357422, 4.713244438171387, 4.856256008148193, 4.999267578125, 5.142279624938965, 5.2852911949157715]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 6.0, 6.0, 14.0, 17.0, 38.0, 64.0, 85.0, 114.0, 177.0, 283.0, 390.0, 561.0, 709.0, 1188.0, 1792.0, 2737.0, 4188.0, 6454.0, 10605.0, 17690.0, 30245.0, 55117.0, 104952.0, 212314.0, 443668.0, 861235.0, 1063835.0, 690789.0, 335550.0, 160656.0, 80792.0, 43019.0, 24454.0, 14041.0, 8786.0, 5684.0, 3663.0, 2558.0, 1672.0, 1166.0, 848.0, 621.0, 457.0, 310.0, 219.0, 148.0, 114.0, 82.0, 61.0, 37.0, 21.0, 25.0, 20.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-3.94921875, -3.81451416015625, -3.6798095703125, -3.54510498046875, -3.410400390625, -3.27569580078125, -3.1409912109375, -3.00628662109375, -2.87158203125, -2.73687744140625, -2.6021728515625, -2.46746826171875, -2.332763671875, -2.19805908203125, -2.0633544921875, -1.92864990234375, -1.7939453125, -1.65924072265625, -1.5245361328125, -1.38983154296875, -1.255126953125, -1.12042236328125, -0.9857177734375, -0.85101318359375, -0.71630859375, -0.58160400390625, -0.4468994140625, -0.31219482421875, -0.177490234375, -0.04278564453125, 0.0919189453125, 0.22662353515625, 0.361328125, 0.49603271484375, 0.6307373046875, 0.76544189453125, 0.900146484375, 1.03485107421875, 1.1695556640625, 1.30426025390625, 1.43896484375, 1.57366943359375, 1.7083740234375, 1.84307861328125, 1.977783203125, 2.11248779296875, 2.2471923828125, 2.38189697265625, 2.5166015625, 2.65130615234375, 2.7860107421875, 2.92071533203125, 3.055419921875, 3.19012451171875, 3.3248291015625, 3.45953369140625, 3.59423828125, 3.72894287109375, 3.8636474609375, 3.99835205078125, 4.133056640625, 4.26776123046875, 4.4024658203125, 4.53717041015625, 4.671875]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 5.0, 4.0, 12.0, 6.0, 3.0, 11.0, 14.0, 11.0, 16.0, 17.0, 21.0, 20.0, 34.0, 44.0, 45.0, 38.0, 42.0, 31.0, 44.0, 38.0, 44.0, 37.0, 40.0, 31.0, 54.0, 44.0, 36.0, 26.0, 35.0, 29.0, 27.0, 17.0, 21.0, 16.0, 15.0, 17.0, 9.0, 8.0, 6.0, 6.0, 5.0, 7.0, 3.0, 2.0, 1.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.546875, -2.453216552734375, -2.35955810546875, -2.265899658203125, -2.1722412109375, -2.078582763671875, -1.98492431640625, -1.891265869140625, -1.797607421875, -1.703948974609375, -1.61029052734375, -1.516632080078125, -1.4229736328125, -1.329315185546875, -1.23565673828125, -1.141998291015625, -1.04833984375, -0.954681396484375, -0.86102294921875, -0.767364501953125, -0.6737060546875, -0.580047607421875, -0.48638916015625, -0.392730712890625, -0.299072265625, -0.205413818359375, -0.11175537109375, -0.018096923828125, 0.0755615234375, 0.169219970703125, 0.26287841796875, 0.356536865234375, 0.4501953125, 0.543853759765625, 0.63751220703125, 0.731170654296875, 0.8248291015625, 0.918487548828125, 1.01214599609375, 1.105804443359375, 1.199462890625, 1.293121337890625, 1.38677978515625, 1.480438232421875, 1.5740966796875, 1.667755126953125, 1.76141357421875, 1.855072021484375, 1.94873046875, 2.042388916015625, 2.13604736328125, 2.229705810546875, 2.3233642578125, 2.417022705078125, 2.51068115234375, 2.604339599609375, 2.697998046875, 2.791656494140625, 2.88531494140625, 2.978973388671875, 3.0726318359375, 3.166290283203125, 3.25994873046875, 3.353607177734375, 3.447265625]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 2.0, 1.0, 4.0, 5.0, 7.0, 5.0, 8.0, 8.0, 15.0, 26.0, 37.0, 45.0, 77.0, 107.0, 165.0, 284.0, 497.0, 806.0, 1345.0, 2394.0, 4234.0, 7925.0, 14940.0, 29377.0, 60102.0, 129022.0, 282652.0, 607417.0, 1046867.0, 989285.0, 541136.0, 250424.0, 114805.0, 54002.0, 26245.0, 13648.0, 7073.0, 3998.0, 2270.0, 1235.0, 721.0, 415.0, 255.0, 149.0, 79.0, 58.0, 36.0, 29.0, 25.0, 15.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0], "bins": [-4.7734375, -4.6239013671875, -4.474365234375, -4.3248291015625, -4.17529296875, -4.0257568359375, -3.876220703125, -3.7266845703125, -3.5771484375, -3.4276123046875, -3.278076171875, -3.1285400390625, -2.97900390625, -2.8294677734375, -2.679931640625, -2.5303955078125, -2.380859375, -2.2313232421875, -2.081787109375, -1.9322509765625, -1.78271484375, -1.6331787109375, -1.483642578125, -1.3341064453125, -1.1845703125, -1.0350341796875, -0.885498046875, -0.7359619140625, -0.58642578125, -0.4368896484375, -0.287353515625, -0.1378173828125, 0.01171875, 0.1612548828125, 0.310791015625, 0.4603271484375, 0.60986328125, 0.7593994140625, 0.908935546875, 1.0584716796875, 1.2080078125, 1.3575439453125, 1.507080078125, 1.6566162109375, 1.80615234375, 1.9556884765625, 2.105224609375, 2.2547607421875, 2.404296875, 2.5538330078125, 2.703369140625, 2.8529052734375, 3.00244140625, 3.1519775390625, 3.301513671875, 3.4510498046875, 3.6005859375, 3.7501220703125, 3.899658203125, 4.0491943359375, 4.19873046875, 4.3482666015625, 4.497802734375, 4.6473388671875, 4.796875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 7.0, 9.0, 8.0, 11.0, 18.0, 17.0, 15.0, 24.0, 27.0, 48.0, 48.0, 49.0, 86.0, 100.0, 108.0, 127.0, 146.0, 183.0, 184.0, 229.0, 237.0, 212.0, 259.0, 203.0, 226.0, 222.0, 222.0, 178.0, 156.0, 104.0, 117.0, 88.0, 85.0, 62.0, 60.0, 43.0, 47.0, 29.0, 19.0, 8.0, 14.0, 7.0, 7.0, 8.0, 6.0, 5.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4228515625, -1.377105712890625, -1.33135986328125, -1.285614013671875, -1.2398681640625, -1.194122314453125, -1.14837646484375, -1.102630615234375, -1.056884765625, -1.011138916015625, -0.96539306640625, -0.919647216796875, -0.8739013671875, -0.828155517578125, -0.78240966796875, -0.736663818359375, -0.69091796875, -0.645172119140625, -0.59942626953125, -0.553680419921875, -0.5079345703125, -0.462188720703125, -0.41644287109375, -0.370697021484375, -0.324951171875, -0.279205322265625, -0.23345947265625, -0.187713623046875, -0.1419677734375, -0.096221923828125, -0.05047607421875, -0.004730224609375, 0.041015625, 0.086761474609375, 0.13250732421875, 0.178253173828125, 0.2239990234375, 0.269744873046875, 0.31549072265625, 0.361236572265625, 0.406982421875, 0.452728271484375, 0.49847412109375, 0.544219970703125, 0.5899658203125, 0.635711669921875, 0.68145751953125, 0.727203369140625, 0.77294921875, 0.818695068359375, 0.86444091796875, 0.910186767578125, 0.9559326171875, 1.001678466796875, 1.04742431640625, 1.093170166015625, 1.138916015625, 1.184661865234375, 1.23040771484375, 1.276153564453125, 1.3218994140625, 1.367645263671875, 1.41339111328125, 1.459136962890625, 1.5048828125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 6.0, 4.0, 9.0, 9.0, 7.0, 19.0, 24.0, 30.0, 26.0, 21.0, 30.0, 40.0, 45.0, 52.0, 58.0, 50.0, 76.0, 61.0, 55.0, 55.0, 68.0, 33.0, 40.0, 27.0, 27.0, 20.0, 21.0, 11.0, 9.0, 11.0, 11.0, 6.0, 6.0, 6.0, 7.0, 8.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.546537160873413, -3.423889636993408, -3.301241874694824, -3.1785943508148193, -3.0559465885162354, -2.9332990646362305, -2.8106513023376465, -2.6880037784576416, -2.5653562545776367, -2.442708730697632, -2.320060968399048, -2.197413444519043, -2.074765682220459, -1.952118158340454, -1.8294705152511597, -1.7068228721618652, -1.5841751098632812, -1.4615274667739868, -1.3388798236846924, -1.2162322998046875, -1.0935845375061035, -0.9709369540214539, -0.8482893705368042, -0.7256417274475098, -0.6029940843582153, -0.4803464412689209, -0.35769882798194885, -0.2350512146949768, -0.11240357160568237, 0.01024407148361206, 0.13289165496826172, 0.25553929805755615, 0.3781867027282715, 0.5008343458175659, 0.6234819889068604, 0.74612957239151, 0.8687772154808044, 0.9914248585700989, 1.1140724420547485, 1.236720085144043, 1.3593677282333374, 1.4820153713226318, 1.6046630144119263, 1.7273106575012207, 1.8499581813812256, 1.9726059436798096, 2.0952534675598145, 2.2179012298583984, 2.3405487537384033, 2.463196277618408, 2.585844039916992, 2.708491563796997, 2.831139326095581, 2.953786849975586, 3.07643461227417, 3.199082136154175, 3.3217296600341797, 3.4443771839141846, 3.5670249462127686, 3.6896724700927734, 3.8123202323913574, 3.9349677562713623, 4.057615280151367, 4.180263042449951, 4.302910804748535]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 6.0, 8.0, 13.0, 12.0, 13.0, 21.0, 29.0, 24.0, 18.0, 30.0, 33.0, 38.0, 37.0, 47.0, 54.0, 50.0, 52.0, 61.0, 44.0, 51.0, 36.0, 42.0, 40.0, 31.0, 37.0, 27.0, 18.0, 25.0, 20.0, 18.0, 9.0, 13.0, 4.0, 14.0, 12.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.3004560470581055, -5.145878791809082, -4.991302013397217, -4.836724758148193, -4.68214750289917, -4.527570724487305, -4.372993469238281, -4.218416213989258, -4.063838958740234, -3.90926194190979, -3.7546846866607666, -3.6001076698303223, -3.445530414581299, -3.2909533977508545, -3.13637638092041, -2.9817991256713867, -2.8272223472595215, -2.672645330429077, -2.5180680751800537, -2.3634910583496094, -2.208913803100586, -2.0543367862701416, -1.8997597694396973, -1.7451826333999634, -1.5906054973602295, -1.4360283613204956, -1.2814512252807617, -1.1268742084503174, -0.9722970724105835, -0.8177199363708496, -0.6631428599357605, -0.5085657835006714, -0.3539886474609375, -0.199411541223526, -0.0448344349861145, 0.109742671251297, 0.2643197774887085, 0.4188969135284424, 0.5734739899635315, 0.7280510663986206, 0.8826282024383545, 1.0372053384780884, 1.1917824745178223, 1.3463594913482666, 1.5009366273880005, 1.6555137634277344, 1.8100907802581787, 1.9646679162979126, 2.1192450523376465, 2.273822069168091, 2.4283993244171143, 2.5829763412475586, 2.737553596496582, 2.8921306133270264, 3.0467076301574707, 3.201284885406494, 3.3558619022369385, 3.510438919067383, 3.6650161743164062, 3.8195931911468506, 3.974170207977295, 4.128747463226318, 4.283324718475342, 4.437901496887207, 4.5924787521362305]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 2.0, 4.0, 6.0, 11.0, 18.0, 15.0, 30.0, 34.0, 72.0, 82.0, 154.0, 175.0, 322.0, 432.0, 639.0, 944.0, 1508.0, 2294.0, 3608.0, 5726.0, 9190.0, 15339.0, 26979.0, 48177.0, 92075.0, 179836.0, 273591.0, 179508.0, 91700.0, 48324.0, 26886.0, 15595.0, 9229.0, 5751.0, 3537.0, 2372.0, 1491.0, 939.0, 670.0, 416.0, 281.0, 184.0, 139.0, 89.0, 73.0, 35.0, 25.0, 23.0, 6.0, 10.0, 10.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2724609375, -1.233306884765625, -1.19415283203125, -1.154998779296875, -1.1158447265625, -1.076690673828125, -1.03753662109375, -0.998382568359375, -0.959228515625, -0.920074462890625, -0.88092041015625, -0.841766357421875, -0.8026123046875, -0.763458251953125, -0.72430419921875, -0.685150146484375, -0.64599609375, -0.606842041015625, -0.56768798828125, -0.528533935546875, -0.4893798828125, -0.450225830078125, -0.41107177734375, -0.371917724609375, -0.332763671875, -0.293609619140625, -0.25445556640625, -0.215301513671875, -0.1761474609375, -0.136993408203125, -0.09783935546875, -0.058685302734375, -0.01953125, 0.019622802734375, 0.05877685546875, 0.097930908203125, 0.1370849609375, 0.176239013671875, 0.21539306640625, 0.254547119140625, 0.293701171875, 0.332855224609375, 0.37200927734375, 0.411163330078125, 0.4503173828125, 0.489471435546875, 0.52862548828125, 0.567779541015625, 0.60693359375, 0.646087646484375, 0.68524169921875, 0.724395751953125, 0.7635498046875, 0.802703857421875, 0.84185791015625, 0.881011962890625, 0.920166015625, 0.959320068359375, 0.99847412109375, 1.037628173828125, 1.0767822265625, 1.115936279296875, 1.15509033203125, 1.194244384765625, 1.2333984375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 9.0, 5.0, 9.0, 9.0, 13.0, 16.0, 19.0, 21.0, 16.0, 26.0, 31.0, 34.0, 27.0, 45.0, 25.0, 43.0, 46.0, 52.0, 43.0, 40.0, 46.0, 43.0, 36.0, 39.0, 43.0, 31.0, 33.0, 32.0, 24.0, 18.0, 17.0, 25.0, 24.0, 8.0, 8.0, 8.0, 6.0, 9.0, 4.0, 5.0, 7.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.70703125, -4.5662841796875, -4.425537109375, -4.2847900390625, -4.14404296875, -4.0032958984375, -3.862548828125, -3.7218017578125, -3.5810546875, -3.4403076171875, -3.299560546875, -3.1588134765625, -3.01806640625, -2.8773193359375, -2.736572265625, -2.5958251953125, -2.455078125, -2.3143310546875, -2.173583984375, -2.0328369140625, -1.89208984375, -1.7513427734375, -1.610595703125, -1.4698486328125, -1.3291015625, -1.1883544921875, -1.047607421875, -0.9068603515625, -0.76611328125, -0.6253662109375, -0.484619140625, -0.3438720703125, -0.203125, -0.0623779296875, 0.078369140625, 0.2191162109375, 0.35986328125, 0.5006103515625, 0.641357421875, 0.7821044921875, 0.9228515625, 1.0635986328125, 1.204345703125, 1.3450927734375, 1.48583984375, 1.6265869140625, 1.767333984375, 1.9080810546875, 2.048828125, 2.1895751953125, 2.330322265625, 2.4710693359375, 2.61181640625, 2.7525634765625, 2.893310546875, 3.0340576171875, 3.1748046875, 3.3155517578125, 3.456298828125, 3.5970458984375, 3.73779296875, 3.8785400390625, 4.019287109375, 4.1600341796875, 4.30078125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 11.0, 9.0, 8.0, 16.0, 18.0, 22.0, 30.0, 38.0, 50.0, 81.0, 68.0, 111.0, 137.0, 193.0, 265.0, 338.0, 526.0, 754.0, 1243.0, 2139.0, 4470.0, 10123.0, 26368.0, 884626.0, 77228.0, 21629.0, 8476.0, 3808.0, 2058.0, 1158.0, 725.0, 499.0, 348.0, 225.0, 173.0, 142.0, 116.0, 57.0, 60.0, 52.0, 42.0, 28.0, 27.0, 14.0, 13.0, 5.0, 7.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0], "bins": [-3.521484375, -3.414459228515625, -3.30743408203125, -3.200408935546875, -3.0933837890625, -2.986358642578125, -2.87933349609375, -2.772308349609375, -2.665283203125, -2.558258056640625, -2.45123291015625, -2.344207763671875, -2.2371826171875, -2.130157470703125, -2.02313232421875, -1.916107177734375, -1.80908203125, -1.702056884765625, -1.59503173828125, -1.488006591796875, -1.3809814453125, -1.273956298828125, -1.16693115234375, -1.059906005859375, -0.952880859375, -0.845855712890625, -0.73883056640625, -0.631805419921875, -0.5247802734375, -0.417755126953125, -0.31072998046875, -0.203704833984375, -0.0966796875, 0.010345458984375, 0.11737060546875, 0.224395751953125, 0.3314208984375, 0.438446044921875, 0.54547119140625, 0.652496337890625, 0.759521484375, 0.866546630859375, 0.97357177734375, 1.080596923828125, 1.1876220703125, 1.294647216796875, 1.40167236328125, 1.508697509765625, 1.61572265625, 1.722747802734375, 1.82977294921875, 1.936798095703125, 2.0438232421875, 2.150848388671875, 2.25787353515625, 2.364898681640625, 2.471923828125, 2.578948974609375, 2.68597412109375, 2.792999267578125, 2.9000244140625, 3.007049560546875, 3.11407470703125, 3.221099853515625, 3.328125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 6.0, 16.0, 14.0, 12.0, 10.0, 14.0, 16.0, 22.0, 23.0, 20.0, 27.0, 34.0, 34.0, 32.0, 25.0, 27.0, 44.0, 35.0, 44.0, 42.0, 27.0, 33.0, 37.0, 27.0, 32.0, 42.0, 31.0, 30.0, 25.0, 26.0, 22.0, 22.0, 22.0, 21.0, 13.0, 14.0, 16.0, 8.0, 4.0, 13.0, 6.0, 7.0, 3.0, 5.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-2.529296875, -2.453643798828125, -2.37799072265625, -2.302337646484375, -2.2266845703125, -2.151031494140625, -2.07537841796875, -1.999725341796875, -1.924072265625, -1.848419189453125, -1.77276611328125, -1.697113037109375, -1.6214599609375, -1.545806884765625, -1.47015380859375, -1.394500732421875, -1.31884765625, -1.243194580078125, -1.16754150390625, -1.091888427734375, -1.0162353515625, -0.940582275390625, -0.86492919921875, -0.789276123046875, -0.713623046875, -0.637969970703125, -0.56231689453125, -0.486663818359375, -0.4110107421875, -0.335357666015625, -0.25970458984375, -0.184051513671875, -0.1083984375, -0.032745361328125, 0.04290771484375, 0.118560791015625, 0.1942138671875, 0.269866943359375, 0.34552001953125, 0.421173095703125, 0.496826171875, 0.572479248046875, 0.64813232421875, 0.723785400390625, 0.7994384765625, 0.875091552734375, 0.95074462890625, 1.026397705078125, 1.10205078125, 1.177703857421875, 1.25335693359375, 1.329010009765625, 1.4046630859375, 1.480316162109375, 1.55596923828125, 1.631622314453125, 1.707275390625, 1.782928466796875, 1.85858154296875, 1.934234619140625, 2.0098876953125, 2.085540771484375, 2.16119384765625, 2.236846923828125, 2.3125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 8.0, 9.0, 14.0, 19.0, 32.0, 36.0, 48.0, 93.0, 163.0, 282.0, 550.0, 1159.0, 2726.0, 8875.0, 58834.0, 952760.0, 15642.0, 4157.0, 1542.0, 689.0, 381.0, 217.0, 108.0, 72.0, 42.0, 31.0, 21.0, 9.0, 14.0, 9.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4716796875, -0.4560546875, -0.4404296875, -0.4248046875, -0.4091796875, -0.3935546875, -0.3779296875, -0.3623046875, -0.3466796875, -0.3310546875, -0.3154296875, -0.2998046875, -0.2841796875, -0.2685546875, -0.2529296875, -0.2373046875, -0.2216796875, -0.2060546875, -0.1904296875, -0.1748046875, -0.1591796875, -0.1435546875, -0.1279296875, -0.1123046875, -0.0966796875, -0.0810546875, -0.0654296875, -0.0498046875, -0.0341796875, -0.0185546875, -0.0029296875, 0.0126953125, 0.0283203125, 0.0439453125, 0.0595703125, 0.0751953125, 0.0908203125, 0.1064453125, 0.1220703125, 0.1376953125, 0.1533203125, 0.1689453125, 0.1845703125, 0.2001953125, 0.2158203125, 0.2314453125, 0.2470703125, 0.2626953125, 0.2783203125, 0.2939453125, 0.3095703125, 0.3251953125, 0.3408203125, 0.3564453125, 0.3720703125, 0.3876953125, 0.4033203125, 0.4189453125, 0.4345703125, 0.4501953125, 0.4658203125, 0.4814453125, 0.4970703125, 0.5126953125, 0.5283203125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 2.0, 3.0, 5.0, 9.0, 11.0, 8.0, 11.0, 14.0, 22.0, 14.0, 27.0, 22.0, 29.0, 43.0, 42.0, 46.0, 52.0, 38.0, 49.0, 59.0, 52.0, 48.0, 60.0, 30.0, 46.0, 34.0, 38.0, 31.0, 24.0, 24.0, 17.0, 21.0, 14.0, 13.0, 10.0, 4.0, 4.0, 5.0, 7.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.534555435180664e-05, -3.4232623875141144e-05, -3.311969339847565e-05, -3.200676292181015e-05, -3.089383244514465e-05, -2.9780901968479156e-05, -2.866797149181366e-05, -2.7555041015148163e-05, -2.6442110538482666e-05, -2.532918006181717e-05, -2.4216249585151672e-05, -2.3103319108486176e-05, -2.199038863182068e-05, -2.0877458155155182e-05, -1.9764527678489685e-05, -1.8651597201824188e-05, -1.753866672515869e-05, -1.6425736248493195e-05, -1.5312805771827698e-05, -1.4199875295162201e-05, -1.3086944818496704e-05, -1.1974014341831207e-05, -1.086108386516571e-05, -9.748153388500214e-06, -8.635222911834717e-06, -7.52229243516922e-06, -6.409361958503723e-06, -5.296431481838226e-06, -4.1835010051727295e-06, -3.0705705285072327e-06, -1.957640051841736e-06, -8.44709575176239e-07, 2.682209014892578e-07, 1.3811513781547546e-06, 2.4940818548202515e-06, 3.6070123314857483e-06, 4.719942808151245e-06, 5.832873284816742e-06, 6.945803761482239e-06, 8.058734238147736e-06, 9.171664714813232e-06, 1.028459519147873e-05, 1.1397525668144226e-05, 1.2510456144809723e-05, 1.362338662147522e-05, 1.4736317098140717e-05, 1.5849247574806213e-05, 1.696217805147171e-05, 1.8075108528137207e-05, 1.9188039004802704e-05, 2.03009694814682e-05, 2.1413899958133698e-05, 2.2526830434799194e-05, 2.363976091146469e-05, 2.4752691388130188e-05, 2.5865621864795685e-05, 2.697855234146118e-05, 2.809148281812668e-05, 2.9204413294792175e-05, 3.0317343771457672e-05, 3.143027424812317e-05, 3.2543204724788666e-05, 3.365613520145416e-05, 3.476906567811966e-05, 3.5881996154785156e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 8.0, 6.0, 9.0, 20.0, 21.0, 35.0, 54.0, 93.0, 156.0, 301.0, 510.0, 981.0, 1785.0, 3403.0, 7019.0, 15730.0, 40425.0, 120668.0, 445777.0, 283100.0, 78035.0, 27795.0, 11491.0, 5305.0, 2623.0, 1433.0, 723.0, 440.0, 263.0, 138.0, 80.0, 45.0, 29.0, 26.0, 9.0, 7.0, 8.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1409912109375, -0.13573265075683594, -0.13047409057617188, -0.1252155303955078, -0.11995697021484375, -0.11469841003417969, -0.10943984985351562, -0.10418128967285156, -0.0989227294921875, -0.09366416931152344, -0.08840560913085938, -0.08314704895019531, -0.07788848876953125, -0.07262992858886719, -0.06737136840820312, -0.06211280822753906, -0.056854248046875, -0.05159568786621094, -0.046337127685546875, -0.04107856750488281, -0.03582000732421875, -0.030561447143554688, -0.025302886962890625, -0.020044326782226562, -0.0147857666015625, -0.009527206420898438, -0.004268646240234375, 0.0009899139404296875, 0.00624847412109375, 0.011507034301757812, 0.016765594482421875, 0.022024154663085938, 0.02728271484375, 0.03254127502441406, 0.037799835205078125, 0.04305839538574219, 0.04831695556640625, 0.05357551574707031, 0.058834075927734375, 0.06409263610839844, 0.0693511962890625, 0.07460975646972656, 0.07986831665039062, 0.08512687683105469, 0.09038543701171875, 0.09564399719238281, 0.10090255737304688, 0.10616111755371094, 0.111419677734375, 0.11667823791503906, 0.12193679809570312, 0.1271953582763672, 0.13245391845703125, 0.1377124786376953, 0.14297103881835938, 0.14822959899902344, 0.1534881591796875, 0.15874671936035156, 0.16400527954101562, 0.1692638397216797, 0.17452239990234375, 0.1797809600830078, 0.18503952026367188, 0.19029808044433594, 0.195556640625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 4.0, 12.0, 6.0, 3.0, 5.0, 11.0, 13.0, 17.0, 31.0, 28.0, 44.0, 44.0, 86.0, 92.0, 93.0, 114.0, 94.0, 68.0, 53.0, 39.0, 26.0, 16.0, 14.0, 16.0, 7.0, 10.0, 11.0, 7.0, 9.0, 5.0, 4.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.04388427734375, -0.04254913330078125, -0.0412139892578125, -0.03987884521484375, -0.038543701171875, -0.03720855712890625, -0.0358734130859375, -0.03453826904296875, -0.033203125, -0.03186798095703125, -0.0305328369140625, -0.02919769287109375, -0.027862548828125, -0.02652740478515625, -0.0251922607421875, -0.02385711669921875, -0.02252197265625, -0.02118682861328125, -0.0198516845703125, -0.01851654052734375, -0.017181396484375, -0.01584625244140625, -0.0145111083984375, -0.01317596435546875, -0.0118408203125, -0.01050567626953125, -0.0091705322265625, -0.00783538818359375, -0.006500244140625, -0.00516510009765625, -0.0038299560546875, -0.00249481201171875, -0.00115966796875, 0.00017547607421875, 0.0015106201171875, 0.00284576416015625, 0.004180908203125, 0.00551605224609375, 0.0068511962890625, 0.00818634033203125, 0.009521484375, 0.01085662841796875, 0.0121917724609375, 0.01352691650390625, 0.014862060546875, 0.01619720458984375, 0.0175323486328125, 0.01886749267578125, 0.02020263671875, 0.02153778076171875, 0.0228729248046875, 0.02420806884765625, 0.025543212890625, 0.02687835693359375, 0.0282135009765625, 0.02954864501953125, 0.0308837890625, 0.03221893310546875, 0.0335540771484375, 0.03488922119140625, 0.036224365234375, 0.03755950927734375, 0.0388946533203125, 0.04022979736328125, 0.04156494140625]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 5.0, 4.0, 7.0, 7.0, 9.0, 11.0, 18.0, 27.0, 24.0, 29.0, 24.0, 38.0, 33.0, 50.0, 55.0, 51.0, 71.0, 59.0, 68.0, 59.0, 65.0, 50.0, 30.0, 33.0, 28.0, 28.0, 18.0, 18.0, 11.0, 11.0, 8.0, 8.0, 6.0, 7.0, 4.0, 11.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.50710391998291, -3.3838088512420654, -3.2605140209198, -3.137218952178955, -3.0139241218566895, -2.8906290531158447, -2.767334222793579, -2.6440391540527344, -2.5207443237304688, -2.397449254989624, -2.2741544246673584, -2.1508593559265137, -2.027564525604248, -1.9042694568634033, -1.7809746265411377, -1.657679557800293, -1.5343846082687378, -1.4110896587371826, -1.2877947092056274, -1.1644997596740723, -1.041204810142517, -0.9179098010063171, -0.794614851474762, -0.6713199019432068, -0.5480249524116516, -0.42473000288009644, -0.30143505334854126, -0.1781400740146637, -0.05484512448310852, 0.06844985485076904, 0.19174480438232422, 0.3150397539138794, 0.43833470344543457, 0.5616296529769897, 0.6849246025085449, 0.8082195520401001, 0.9315145015716553, 1.0548095703125, 1.1781044006347656, 1.3013994693756104, 1.424694299697876, 1.5479892492294312, 1.6712841987609863, 1.7945791482925415, 1.9178740978240967, 2.0411691665649414, 2.164463996887207, 2.2877590656280518, 2.4110541343688965, 2.534349203109741, 2.657644033432007, 2.7809391021728516, 2.904233932495117, 3.027529001235962, 3.1508238315582275, 3.2741189002990723, 3.397413730621338, 3.5207087993621826, 3.6440036296844482, 3.767298698425293, 3.8905935287475586, 4.013888359069824, 4.137183666229248, 4.260478496551514, 4.383773326873779]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 6.0, 8.0, 13.0, 13.0, 13.0, 23.0, 25.0, 25.0, 19.0, 28.0, 34.0, 39.0, 41.0, 43.0, 53.0, 53.0, 51.0, 56.0, 49.0, 51.0, 39.0, 38.0, 38.0, 35.0, 34.0, 29.0, 18.0, 23.0, 22.0, 16.0, 9.0, 14.0, 3.0, 16.0, 11.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.310791015625, -5.156094551086426, -5.001398086547852, -4.846701622009277, -4.692005157470703, -4.537308216094971, -4.3826117515563965, -4.227915287017822, -4.073218822479248, -3.918522357940674, -3.7638258934020996, -3.6091291904449463, -3.454432725906372, -3.299736261367798, -3.1450395584106445, -2.9903430938720703, -2.835646629333496, -2.680950164794922, -2.5262537002563477, -2.3715569972991943, -2.21686053276062, -2.062164068222046, -1.9074674844741821, -1.7527709007263184, -1.5980744361877441, -1.44337797164917, -1.2886813879013062, -1.1339848041534424, -0.9792883396148682, -0.8245918154716492, -0.6698952913284302, -0.5151987075805664, -0.3605027198791504, -0.2058061957359314, -0.0511096715927124, 0.10358685255050659, 0.2582833766937256, 0.4129799008369446, 0.5676764249801636, 0.7223730087280273, 0.8770694732666016, 1.0317659378051758, 1.1864625215530396, 1.3411591053009033, 1.4958555698394775, 1.6505520343780518, 1.8052486181259155, 1.9599452018737793, 2.1146416664123535, 2.2693381309509277, 2.424034595489502, 2.5787312984466553, 2.7334277629852295, 2.8881242275238037, 3.042820930480957, 3.1975173950195312, 3.3522138595581055, 3.5069103240966797, 3.661606788635254, 3.8163034915924072, 3.9709999561309814, 4.125696659088135, 4.280393123626709, 4.435089588165283, 4.589786052703857]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 3.0, 2.0, 6.0, 14.0, 15.0, 18.0, 30.0, 59.0, 68.0, 149.0, 204.0, 325.0, 551.0, 905.0, 1503.0, 2765.0, 4809.0, 8891.0, 16603.0, 31472.0, 61023.0, 115989.0, 194392.0, 229875.0, 172612.0, 97695.0, 51209.0, 26282.0, 13646.0, 7578.0, 4186.0, 2320.0, 1298.0, 787.0, 494.0, 308.0, 147.0, 119.0, 57.0, 42.0, 37.0, 20.0, 18.0, 17.0, 7.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.3046875, -4.1580810546875, -4.011474609375, -3.8648681640625, -3.71826171875, -3.5716552734375, -3.425048828125, -3.2784423828125, -3.1318359375, -2.9852294921875, -2.838623046875, -2.6920166015625, -2.54541015625, -2.3988037109375, -2.252197265625, -2.1055908203125, -1.958984375, -1.8123779296875, -1.665771484375, -1.5191650390625, -1.37255859375, -1.2259521484375, -1.079345703125, -0.9327392578125, -0.7861328125, -0.6395263671875, -0.492919921875, -0.3463134765625, -0.19970703125, -0.0531005859375, 0.093505859375, 0.2401123046875, 0.38671875, 0.5333251953125, 0.679931640625, 0.8265380859375, 0.97314453125, 1.1197509765625, 1.266357421875, 1.4129638671875, 1.5595703125, 1.7061767578125, 1.852783203125, 1.9993896484375, 2.14599609375, 2.2926025390625, 2.439208984375, 2.5858154296875, 2.732421875, 2.8790283203125, 3.025634765625, 3.1722412109375, 3.31884765625, 3.4654541015625, 3.612060546875, 3.7586669921875, 3.9052734375, 4.0518798828125, 4.198486328125, 4.3450927734375, 4.49169921875, 4.6383056640625, 4.784912109375, 4.9315185546875, 5.078125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 1.0, 8.0, 6.0, 5.0, 10.0, 16.0, 22.0, 23.0, 16.0, 24.0, 32.0, 31.0, 45.0, 49.0, 41.0, 47.0, 53.0, 54.0, 51.0, 59.0, 52.0, 48.0, 50.0, 41.0, 31.0, 30.0, 20.0, 22.0, 27.0, 21.0, 17.0, 12.0, 17.0, 7.0, 9.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.8671875, -5.70135498046875, -5.5355224609375, -5.36968994140625, -5.203857421875, -5.03802490234375, -4.8721923828125, -4.70635986328125, -4.54052734375, -4.37469482421875, -4.2088623046875, -4.04302978515625, -3.877197265625, -3.71136474609375, -3.5455322265625, -3.37969970703125, -3.2138671875, -3.04803466796875, -2.8822021484375, -2.71636962890625, -2.550537109375, -2.38470458984375, -2.2188720703125, -2.05303955078125, -1.88720703125, -1.72137451171875, -1.5555419921875, -1.38970947265625, -1.223876953125, -1.05804443359375, -0.8922119140625, -0.72637939453125, -0.560546875, -0.39471435546875, -0.2288818359375, -0.06304931640625, 0.102783203125, 0.26861572265625, 0.4344482421875, 0.60028076171875, 0.76611328125, 0.93194580078125, 1.0977783203125, 1.26361083984375, 1.429443359375, 1.59527587890625, 1.7611083984375, 1.92694091796875, 2.0927734375, 2.25860595703125, 2.4244384765625, 2.59027099609375, 2.756103515625, 2.92193603515625, 3.0877685546875, 3.25360107421875, 3.41943359375, 3.58526611328125, 3.7510986328125, 3.91693115234375, 4.082763671875, 4.24859619140625, 4.4144287109375, 4.58026123046875, 4.74609375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 10.0, 15.0, 22.0, 28.0, 39.0, 58.0, 108.0, 149.0, 267.0, 405.0, 658.0, 1039.0, 1618.0, 2709.0, 4327.0, 6873.0, 11395.0, 18199.0, 29286.0, 47723.0, 75825.0, 115753.0, 157107.0, 170326.0, 141664.0, 98445.0, 62667.0, 38889.0, 23891.0, 14679.0, 9203.0, 5735.0, 3595.0, 2205.0, 1345.0, 864.0, 559.0, 312.0, 180.0, 135.0, 74.0, 49.0, 36.0, 30.0, 17.0, 10.0, 4.0, 8.0, 4.0, 4.0, 2.0, 3.0, 4.0, 1.0], "bins": [-3.400390625, -3.298248291015625, -3.19610595703125, -3.093963623046875, -2.9918212890625, -2.889678955078125, -2.78753662109375, -2.685394287109375, -2.583251953125, -2.481109619140625, -2.37896728515625, -2.276824951171875, -2.1746826171875, -2.072540283203125, -1.97039794921875, -1.868255615234375, -1.76611328125, -1.663970947265625, -1.56182861328125, -1.459686279296875, -1.3575439453125, -1.255401611328125, -1.15325927734375, -1.051116943359375, -0.948974609375, -0.846832275390625, -0.74468994140625, -0.642547607421875, -0.5404052734375, -0.438262939453125, -0.33612060546875, -0.233978271484375, -0.1318359375, -0.029693603515625, 0.07244873046875, 0.174591064453125, 0.2767333984375, 0.378875732421875, 0.48101806640625, 0.583160400390625, 0.685302734375, 0.787445068359375, 0.88958740234375, 0.991729736328125, 1.0938720703125, 1.196014404296875, 1.29815673828125, 1.400299072265625, 1.50244140625, 1.604583740234375, 1.70672607421875, 1.808868408203125, 1.9110107421875, 2.013153076171875, 2.11529541015625, 2.217437744140625, 2.319580078125, 2.421722412109375, 2.52386474609375, 2.626007080078125, 2.7281494140625, 2.830291748046875, 2.93243408203125, 3.034576416015625, 3.13671875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 9.0, 10.0, 10.0, 10.0, 7.0, 12.0, 16.0, 24.0, 21.0, 24.0, 26.0, 26.0, 33.0, 30.0, 30.0, 41.0, 33.0, 40.0, 43.0, 46.0, 53.0, 29.0, 45.0, 34.0, 45.0, 48.0, 27.0, 23.0, 26.0, 20.0, 23.0, 29.0, 10.0, 16.0, 18.0, 17.0, 10.0, 11.0, 11.0, 9.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.361328125, -2.287261962890625, -2.21319580078125, -2.139129638671875, -2.0650634765625, -1.990997314453125, -1.91693115234375, -1.842864990234375, -1.768798828125, -1.694732666015625, -1.62066650390625, -1.546600341796875, -1.4725341796875, -1.398468017578125, -1.32440185546875, -1.250335693359375, -1.17626953125, -1.102203369140625, -1.02813720703125, -0.954071044921875, -0.8800048828125, -0.805938720703125, -0.73187255859375, -0.657806396484375, -0.583740234375, -0.509674072265625, -0.43560791015625, -0.361541748046875, -0.2874755859375, -0.213409423828125, -0.13934326171875, -0.065277099609375, 0.0087890625, 0.082855224609375, 0.15692138671875, 0.230987548828125, 0.3050537109375, 0.379119873046875, 0.45318603515625, 0.527252197265625, 0.601318359375, 0.675384521484375, 0.74945068359375, 0.823516845703125, 0.8975830078125, 0.971649169921875, 1.04571533203125, 1.119781494140625, 1.19384765625, 1.267913818359375, 1.34197998046875, 1.416046142578125, 1.4901123046875, 1.564178466796875, 1.63824462890625, 1.712310791015625, 1.786376953125, 1.860443115234375, 1.93450927734375, 2.008575439453125, 2.0826416015625, 2.156707763671875, 2.23077392578125, 2.304840087890625, 2.37890625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 13.0, 9.0, 20.0, 28.0, 53.0, 86.0, 126.0, 219.0, 418.0, 746.0, 1380.0, 2528.0, 4896.0, 10111.0, 20176.0, 41490.0, 82684.0, 158606.0, 243666.0, 219721.0, 129972.0, 65940.0, 32998.0, 16110.0, 7962.0, 3997.0, 2111.0, 1092.0, 573.0, 320.0, 188.0, 115.0, 71.0, 47.0, 22.0, 18.0, 12.0, 6.0, 6.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7470703125, -1.6983184814453125, -1.649566650390625, -1.6008148193359375, -1.55206298828125, -1.5033111572265625, -1.454559326171875, -1.4058074951171875, -1.3570556640625, -1.3083038330078125, -1.259552001953125, -1.2108001708984375, -1.16204833984375, -1.1132965087890625, -1.064544677734375, -1.0157928466796875, -0.967041015625, -0.9182891845703125, -0.869537353515625, -0.8207855224609375, -0.77203369140625, -0.7232818603515625, -0.674530029296875, -0.6257781982421875, -0.5770263671875, -0.5282745361328125, -0.479522705078125, -0.4307708740234375, -0.38201904296875, -0.3332672119140625, -0.284515380859375, -0.2357635498046875, -0.18701171875, -0.1382598876953125, -0.089508056640625, -0.0407562255859375, 0.00799560546875, 0.0567474365234375, 0.105499267578125, 0.1542510986328125, 0.2030029296875, 0.2517547607421875, 0.300506591796875, 0.3492584228515625, 0.39801025390625, 0.4467620849609375, 0.495513916015625, 0.5442657470703125, 0.593017578125, 0.6417694091796875, 0.690521240234375, 0.7392730712890625, 0.78802490234375, 0.8367767333984375, 0.885528564453125, 0.9342803955078125, 0.9830322265625, 1.0317840576171875, 1.080535888671875, 1.1292877197265625, 1.17803955078125, 1.2267913818359375, 1.275543212890625, 1.3242950439453125, 1.373046875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 5.0, 2.0, 4.0, 5.0, 8.0, 7.0, 5.0, 8.0, 10.0, 21.0, 19.0, 26.0, 26.0, 35.0, 44.0, 36.0, 57.0, 55.0, 57.0, 52.0, 53.0, 70.0, 57.0, 68.0, 50.0, 40.0, 36.0, 20.0, 36.0, 11.0, 20.0, 8.0, 17.0, 6.0, 6.0, 3.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.194280624389648e-05, -6.944779306650162e-05, -6.695277988910675e-05, -6.445776671171188e-05, -6.196275353431702e-05, -5.946774035692215e-05, -5.697272717952728e-05, -5.4477714002132416e-05, -5.198270082473755e-05, -4.948768764734268e-05, -4.6992674469947815e-05, -4.449766129255295e-05, -4.200264811515808e-05, -3.9507634937763214e-05, -3.701262176036835e-05, -3.451760858297348e-05, -3.202259540557861e-05, -2.9527582228183746e-05, -2.703256905078888e-05, -2.4537555873394012e-05, -2.2042542695999146e-05, -1.954752951860428e-05, -1.705251634120941e-05, -1.4557503163814545e-05, -1.2062489986419678e-05, -9.56747680902481e-06, -7.072463631629944e-06, -4.577450454235077e-06, -2.08243727684021e-06, 4.12575900554657e-07, 2.907589077949524e-06, 5.402602255344391e-06, 7.897615432739258e-06, 1.0392628610134125e-05, 1.2887641787528992e-05, 1.538265496492386e-05, 1.7877668142318726e-05, 2.0372681319713593e-05, 2.286769449710846e-05, 2.5362707674503326e-05, 2.7857720851898193e-05, 3.035273402929306e-05, 3.284774720668793e-05, 3.5342760384082794e-05, 3.783777356147766e-05, 4.033278673887253e-05, 4.2827799916267395e-05, 4.532281309366226e-05, 4.781782627105713e-05, 5.0312839448451996e-05, 5.280785262584686e-05, 5.530286580324173e-05, 5.77978789806366e-05, 6.0292892158031464e-05, 6.278790533542633e-05, 6.52829185128212e-05, 6.777793169021606e-05, 7.027294486761093e-05, 7.27679580450058e-05, 7.526297122240067e-05, 7.775798439979553e-05, 8.02529975771904e-05, 8.274801075458527e-05, 8.524302393198013e-05, 8.7738037109375e-05]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 2.0, 3.0, 14.0, 17.0, 21.0, 33.0, 53.0, 97.0, 140.0, 276.0, 536.0, 1013.0, 2078.0, 4257.0, 8787.0, 19443.0, 42372.0, 91718.0, 186545.0, 276924.0, 212103.0, 108336.0, 50209.0, 23090.0, 10691.0, 4891.0, 2352.0, 1144.0, 639.0, 308.0, 202.0, 92.0, 64.0, 44.0, 22.0, 14.0, 14.0, 9.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6552734375, -1.6011962890625, -1.547119140625, -1.4930419921875, -1.43896484375, -1.3848876953125, -1.330810546875, -1.2767333984375, -1.22265625, -1.1685791015625, -1.114501953125, -1.0604248046875, -1.00634765625, -0.9522705078125, -0.898193359375, -0.8441162109375, -0.7900390625, -0.7359619140625, -0.681884765625, -0.6278076171875, -0.57373046875, -0.5196533203125, -0.465576171875, -0.4114990234375, -0.357421875, -0.3033447265625, -0.249267578125, -0.1951904296875, -0.14111328125, -0.0870361328125, -0.032958984375, 0.0211181640625, 0.0751953125, 0.1292724609375, 0.183349609375, 0.2374267578125, 0.29150390625, 0.3455810546875, 0.399658203125, 0.4537353515625, 0.5078125, 0.5618896484375, 0.615966796875, 0.6700439453125, 0.72412109375, 0.7781982421875, 0.832275390625, 0.8863525390625, 0.9404296875, 0.9945068359375, 1.048583984375, 1.1026611328125, 1.15673828125, 1.2108154296875, 1.264892578125, 1.3189697265625, 1.373046875, 1.4271240234375, 1.481201171875, 1.5352783203125, 1.58935546875, 1.6434326171875, 1.697509765625, 1.7515869140625, 1.8056640625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 16.0, 17.0, 18.0, 24.0, 26.0, 31.0, 33.0, 35.0, 40.0, 56.0, 47.0, 51.0, 59.0, 61.0, 50.0, 59.0, 46.0, 51.0, 46.0, 34.0, 41.0, 39.0, 23.0, 17.0, 18.0, 6.0, 9.0, 6.0, 11.0, 4.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.58984375, -0.5730705261230469, -0.5562973022460938, -0.5395240783691406, -0.5227508544921875, -0.5059776306152344, -0.48920440673828125, -0.4724311828613281, -0.455657958984375, -0.4388847351074219, -0.42211151123046875, -0.4053382873535156, -0.3885650634765625, -0.3717918395996094, -0.35501861572265625, -0.3382453918457031, -0.32147216796875, -0.3046989440917969, -0.28792572021484375, -0.2711524963378906, -0.2543792724609375, -0.23760604858398438, -0.22083282470703125, -0.20405960083007812, -0.187286376953125, -0.17051315307617188, -0.15373992919921875, -0.13696670532226562, -0.1201934814453125, -0.10342025756835938, -0.08664703369140625, -0.06987380981445312, -0.0531005859375, -0.036327362060546875, -0.01955413818359375, -0.002780914306640625, 0.0139923095703125, 0.030765533447265625, 0.04753875732421875, 0.06431198120117188, 0.081085205078125, 0.09785842895507812, 0.11463165283203125, 0.13140487670898438, 0.1481781005859375, 0.16495132446289062, 0.18172454833984375, 0.19849777221679688, 0.21527099609375, 0.23204421997070312, 0.24881744384765625, 0.2655906677246094, 0.2823638916015625, 0.2991371154785156, 0.31591033935546875, 0.3326835632324219, 0.349456787109375, 0.3662300109863281, 0.38300323486328125, 0.3997764587402344, 0.4165496826171875, 0.4333229064941406, 0.45009613037109375, 0.4668693542480469, 0.483642578125]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 5.0, 11.0, 14.0, 15.0, 10.0, 20.0, 34.0, 38.0, 37.0, 47.0, 42.0, 50.0, 56.0, 62.0, 74.0, 72.0, 81.0, 62.0, 42.0, 44.0, 32.0, 24.0, 32.0, 16.0, 11.0, 13.0, 13.0, 11.0, 7.0, 5.0, 5.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0058674812316895, -3.8648617267608643, -3.72385573387146, -3.5828499794006348, -3.4418442249298096, -3.3008384704589844, -3.15983247756958, -3.018826723098755, -2.8778209686279297, -2.7368152141571045, -2.5958092212677, -2.454803466796875, -2.31379771232605, -2.1727919578552246, -2.0317859649658203, -1.8907802104949951, -1.7497742176055908, -1.608768343925476, -1.4677625894546509, -1.3267567157745361, -1.185750961303711, -1.0447450876235962, -0.9037392139434814, -0.7627333998680115, -0.6217275857925415, -0.48072177171707153, -0.3397159278392792, -0.19871008396148682, -0.057704269886016846, 0.08330154418945312, 0.22430741786956787, 0.36531323194503784, 0.5063190460205078, 0.6473248600959778, 0.7883306741714478, 0.9293365478515625, 1.0703423023223877, 1.2113481760025024, 1.3523540496826172, 1.4933598041534424, 1.6343656778335571, 1.7753715515136719, 1.916377305984497, 2.0573830604553223, 2.1983890533447266, 2.3393948078155518, 2.480400562286377, 2.6214065551757812, 2.7624123096466064, 2.9034180641174316, 3.044424057006836, 3.185429811477661, 3.3264355659484863, 3.4674415588378906, 3.608447313308716, 3.749453067779541, 3.8904590606689453, 4.03146505355835, 4.172470569610596, 4.3134765625, 4.454482555389404, 4.59548807144165, 4.736494064331055, 4.877500057220459, 5.018505573272705]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 2.0, 4.0, 10.0, 10.0, 16.0, 12.0, 13.0, 21.0, 35.0, 25.0, 34.0, 24.0, 37.0, 48.0, 48.0, 44.0, 64.0, 52.0, 47.0, 46.0, 40.0, 57.0, 41.0, 34.0, 42.0, 30.0, 30.0, 26.0, 19.0, 10.0, 18.0, 18.0, 7.0, 13.0, 7.0, 7.0, 2.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.557457447052002, -4.400729656219482, -4.244002342224121, -4.087274551391602, -3.9305472373962402, -3.7738194465637207, -3.6170918941497803, -3.46036434173584, -3.3036367893218994, -3.146909236907959, -2.9901816844940186, -2.833454132080078, -2.6767263412475586, -2.5199990272521973, -2.3632712364196777, -2.2065436840057373, -2.049816131591797, -1.8930885791778564, -1.736361026763916, -1.579633355140686, -1.4229058027267456, -1.2661782503128052, -1.1094505786895752, -0.9527230262756348, -0.7959954738616943, -0.6392679214477539, -0.4825403094291687, -0.3258127272129059, -0.16908514499664307, -0.012357592582702637, 0.14437001943588257, 0.3010976314544678, 0.45782470703125, 0.6145522594451904, 0.7712798714637756, 0.9280074834823608, 1.0847350358963013, 1.2414625883102417, 1.3981902599334717, 1.554917812347412, 1.7116453647613525, 1.868372917175293, 2.0251004695892334, 2.181828022003174, 2.3385558128356934, 2.4952831268310547, 2.652010917663574, 2.8087384700775146, 2.965466022491455, 3.1221935749053955, 3.278921127319336, 3.4356486797332764, 3.592376232147217, 3.7491040229797363, 3.9058315753936768, 4.062559127807617, 4.219286918640137, 4.376014709472656, 4.532742023468018, 4.689469814300537, 4.846197128295898, 5.002924919128418, 5.159652233123779, 5.316380023956299, 5.47310733795166]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 11.0, 15.0, 25.0, 36.0, 54.0, 56.0, 105.0, 163.0, 306.0, 492.0, 818.0, 1349.0, 2344.0, 4498.0, 8753.0, 17868.0, 40490.0, 104570.0, 315966.0, 1037466.0, 1642091.0, 676516.0, 206314.0, 73858.0, 30348.0, 14033.0, 6946.0, 3670.0, 2070.0, 1185.0, 712.0, 437.0, 261.0, 170.0, 102.0, 62.0, 44.0, 23.0, 20.0, 10.0, 11.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.78125, -6.5714111328125, -6.361572265625, -6.1517333984375, -5.94189453125, -5.7320556640625, -5.522216796875, -5.3123779296875, -5.1025390625, -4.8927001953125, -4.682861328125, -4.4730224609375, -4.26318359375, -4.0533447265625, -3.843505859375, -3.6336669921875, -3.423828125, -3.2139892578125, -3.004150390625, -2.7943115234375, -2.58447265625, -2.3746337890625, -2.164794921875, -1.9549560546875, -1.7451171875, -1.5352783203125, -1.325439453125, -1.1156005859375, -0.90576171875, -0.6959228515625, -0.486083984375, -0.2762451171875, -0.06640625, 0.1434326171875, 0.353271484375, 0.5631103515625, 0.77294921875, 0.9827880859375, 1.192626953125, 1.4024658203125, 1.6123046875, 1.8221435546875, 2.031982421875, 2.2418212890625, 2.45166015625, 2.6614990234375, 2.871337890625, 3.0811767578125, 3.291015625, 3.5008544921875, 3.710693359375, 3.9205322265625, 4.13037109375, 4.3402099609375, 4.550048828125, 4.7598876953125, 4.9697265625, 5.1795654296875, 5.389404296875, 5.5992431640625, 5.80908203125, 6.0189208984375, 6.228759765625, 6.4385986328125, 6.6484375]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 2.0, 5.0, 7.0, 12.0, 13.0, 16.0, 17.0, 22.0, 27.0, 30.0, 26.0, 45.0, 39.0, 45.0, 65.0, 50.0, 55.0, 55.0, 45.0, 60.0, 40.0, 47.0, 47.0, 50.0, 26.0, 25.0, 27.0, 20.0, 17.0, 11.0, 14.0, 11.0, 7.0, 7.0, 3.0, 4.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.33984375, -3.23028564453125, -3.1207275390625, -3.01116943359375, -2.901611328125, -2.79205322265625, -2.6824951171875, -2.57293701171875, -2.46337890625, -2.35382080078125, -2.2442626953125, -2.13470458984375, -2.025146484375, -1.91558837890625, -1.8060302734375, -1.69647216796875, -1.5869140625, -1.47735595703125, -1.3677978515625, -1.25823974609375, -1.148681640625, -1.03912353515625, -0.9295654296875, -0.82000732421875, -0.71044921875, -0.60089111328125, -0.4913330078125, -0.38177490234375, -0.272216796875, -0.16265869140625, -0.0531005859375, 0.05645751953125, 0.166015625, 0.27557373046875, 0.3851318359375, 0.49468994140625, 0.604248046875, 0.71380615234375, 0.8233642578125, 0.93292236328125, 1.04248046875, 1.15203857421875, 1.2615966796875, 1.37115478515625, 1.480712890625, 1.59027099609375, 1.6998291015625, 1.80938720703125, 1.9189453125, 2.02850341796875, 2.1380615234375, 2.24761962890625, 2.357177734375, 2.46673583984375, 2.5762939453125, 2.68585205078125, 2.79541015625, 2.90496826171875, 3.0145263671875, 3.12408447265625, 3.233642578125, 3.34320068359375, 3.4527587890625, 3.56231689453125, 3.671875]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 7.0, 16.0, 22.0, 41.0, 48.0, 84.0, 145.0, 266.0, 448.0, 786.0, 1424.0, 2616.0, 4878.0, 9381.0, 19169.0, 40669.0, 92175.0, 219164.0, 532554.0, 1092680.0, 1151045.0, 592773.0, 245036.0, 102182.0, 44631.0, 20385.0, 10133.0, 5202.0, 2809.0, 1587.0, 789.0, 461.0, 264.0, 160.0, 96.0, 60.0, 42.0, 21.0, 12.0, 9.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.75, -4.5865478515625, -4.423095703125, -4.2596435546875, -4.09619140625, -3.9327392578125, -3.769287109375, -3.6058349609375, -3.4423828125, -3.2789306640625, -3.115478515625, -2.9520263671875, -2.78857421875, -2.6251220703125, -2.461669921875, -2.2982177734375, -2.134765625, -1.9713134765625, -1.807861328125, -1.6444091796875, -1.48095703125, -1.3175048828125, -1.154052734375, -0.9906005859375, -0.8271484375, -0.6636962890625, -0.500244140625, -0.3367919921875, -0.17333984375, -0.0098876953125, 0.153564453125, 0.3170166015625, 0.48046875, 0.6439208984375, 0.807373046875, 0.9708251953125, 1.13427734375, 1.2977294921875, 1.461181640625, 1.6246337890625, 1.7880859375, 1.9515380859375, 2.114990234375, 2.2784423828125, 2.44189453125, 2.6053466796875, 2.768798828125, 2.9322509765625, 3.095703125, 3.2591552734375, 3.422607421875, 3.5860595703125, 3.74951171875, 3.9129638671875, 4.076416015625, 4.2398681640625, 4.4033203125, 4.5667724609375, 4.730224609375, 4.8936767578125, 5.05712890625, 5.2205810546875, 5.384033203125, 5.5474853515625, 5.7109375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 4.0, 5.0, 2.0, 6.0, 9.0, 17.0, 15.0, 25.0, 43.0, 47.0, 57.0, 87.0, 81.0, 121.0, 141.0, 211.0, 212.0, 268.0, 259.0, 328.0, 306.0, 304.0, 251.0, 244.0, 193.0, 189.0, 145.0, 106.0, 68.0, 70.0, 66.0, 52.0, 40.0, 26.0, 27.0, 11.0, 13.0, 10.0, 12.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5947265625, -1.5405731201171875, -1.486419677734375, -1.4322662353515625, -1.37811279296875, -1.3239593505859375, -1.269805908203125, -1.2156524658203125, -1.1614990234375, -1.1073455810546875, -1.053192138671875, -0.9990386962890625, -0.94488525390625, -0.8907318115234375, -0.836578369140625, -0.7824249267578125, -0.728271484375, -0.6741180419921875, -0.619964599609375, -0.5658111572265625, -0.51165771484375, -0.4575042724609375, -0.403350830078125, -0.3491973876953125, -0.2950439453125, -0.2408905029296875, -0.186737060546875, -0.1325836181640625, -0.07843017578125, -0.0242767333984375, 0.029876708984375, 0.0840301513671875, 0.13818359375, 0.1923370361328125, 0.246490478515625, 0.3006439208984375, 0.35479736328125, 0.4089508056640625, 0.463104248046875, 0.5172576904296875, 0.5714111328125, 0.6255645751953125, 0.679718017578125, 0.7338714599609375, 0.78802490234375, 0.8421783447265625, 0.896331787109375, 0.9504852294921875, 1.004638671875, 1.0587921142578125, 1.112945556640625, 1.1670989990234375, 1.22125244140625, 1.2754058837890625, 1.329559326171875, 1.3837127685546875, 1.4378662109375, 1.4920196533203125, 1.546173095703125, 1.6003265380859375, 1.65447998046875, 1.7086334228515625, 1.762786865234375, 1.8169403076171875, 1.87109375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 11.0, 9.0, 10.0, 14.0, 32.0, 30.0, 38.0, 36.0, 34.0, 52.0, 53.0, 88.0, 93.0, 74.0, 71.0, 59.0, 65.0, 48.0, 33.0, 29.0, 33.0, 11.0, 16.0, 14.0, 9.0, 13.0, 8.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9060957431793213, -3.756324529647827, -3.606553077697754, -3.4567818641662598, -3.3070106506347656, -3.1572394371032715, -3.0074682235717773, -2.857696771621704, -2.70792555809021, -2.558154344558716, -2.4083828926086426, -2.2586116790771484, -2.1088404655456543, -1.9590692520141602, -1.8092979192733765, -1.6595265865325928, -1.5097553730010986, -1.3599841594696045, -1.2102128267288208, -1.060441493988037, -0.910670280456543, -0.760899007320404, -0.6111277341842651, -0.46135640144348145, -0.3115851879119873, -0.1618139147758484, -0.012042641639709473, 0.13772863149642944, 0.28749990463256836, 0.4372711777687073, 0.5870424509048462, 0.7368137836456299, 0.8865852355957031, 1.0363564491271973, 1.186127781867981, 1.3358991146087646, 1.4856703281402588, 1.635441541671753, 1.7852128744125366, 1.9349842071533203, 2.0847554206848145, 2.2345266342163086, 2.3842978477478027, 2.534069299697876, 2.68384051322937, 2.8336117267608643, 2.9833831787109375, 3.1331543922424316, 3.282925605773926, 3.43269681930542, 3.582468032836914, 3.7322394847869873, 3.8820106983184814, 4.031782150268555, 4.181553363800049, 4.331324577331543, 4.481095790863037, 4.630867004394531, 4.780638217926025, 4.9304094314575195, 5.080181121826172, 5.229952335357666, 5.37972354888916, 5.529494762420654, 5.679265975952148]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 9.0, 10.0, 11.0, 12.0, 15.0, 16.0, 15.0, 22.0, 29.0, 32.0, 31.0, 38.0, 37.0, 49.0, 49.0, 50.0, 51.0, 31.0, 51.0, 46.0, 37.0, 45.0, 33.0, 40.0, 37.0, 26.0, 27.0, 26.0, 18.0, 18.0, 11.0, 19.0, 15.0, 12.0, 7.0, 7.0, 7.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.755153179168701, -3.6149749755859375, -3.4747965335845947, -3.334618330001831, -3.1944401264190674, -3.0542616844177246, -2.914083480834961, -2.7739052772521973, -2.6337270736694336, -2.49354887008667, -2.353370428085327, -2.2131922245025635, -2.0730140209198, -1.9328356981277466, -1.7926573753356934, -1.6524791717529297, -1.512300729751587, -1.3721224069595337, -1.23194420337677, -1.0917658805847168, -0.9515876173973083, -0.8114093542098999, -0.6712310314178467, -0.5310527682304382, -0.3908745050430298, -0.25069624185562134, -0.1105179488658905, 0.029660344123840332, 0.16983860731124878, 0.3100168704986572, 0.45019519329071045, 0.5903734564781189, 0.7305517196655273, 0.8707299828529358, 1.0109082460403442, 1.1510865688323975, 1.2912647724151611, 1.4314430952072144, 1.5716214179992676, 1.7117996215820312, 1.8519779443740845, 1.9921562671661377, 2.1323344707489014, 2.272512912750244, 2.412691116333008, 2.5528693199157715, 2.693047523498535, 2.833225965499878, 2.9734041690826416, 3.1135823726654053, 3.253760814666748, 3.3939390182495117, 3.5341172218322754, 3.674295425415039, 3.814473867416382, 3.9546520709991455, 4.094830513000488, 4.235008716583252, 4.375186920166016, 4.5153656005859375, 4.655543804168701, 4.795722007751465, 4.9359002113342285, 5.076078414916992, 5.216256618499756]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 2.0, 8.0, 6.0, 12.0, 20.0, 24.0, 42.0, 60.0, 89.0, 145.0, 255.0, 454.0, 717.0, 1207.0, 2183.0, 3481.0, 6086.0, 10371.0, 18878.0, 34946.0, 71847.0, 164537.0, 321744.0, 219390.0, 94270.0, 44261.0, 22890.0, 12700.0, 7388.0, 4344.0, 2421.0, 1497.0, 876.0, 523.0, 337.0, 192.0, 131.0, 73.0, 51.0, 37.0, 19.0, 19.0, 9.0, 10.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3291015625, -1.282745361328125, -1.23638916015625, -1.190032958984375, -1.1436767578125, -1.097320556640625, -1.05096435546875, -1.004608154296875, -0.958251953125, -0.911895751953125, -0.86553955078125, -0.819183349609375, -0.7728271484375, -0.726470947265625, -0.68011474609375, -0.633758544921875, -0.58740234375, -0.541046142578125, -0.49468994140625, -0.448333740234375, -0.4019775390625, -0.355621337890625, -0.30926513671875, -0.262908935546875, -0.216552734375, -0.170196533203125, -0.12384033203125, -0.077484130859375, -0.0311279296875, 0.015228271484375, 0.06158447265625, 0.107940673828125, 0.154296875, 0.200653076171875, 0.24700927734375, 0.293365478515625, 0.3397216796875, 0.386077880859375, 0.43243408203125, 0.478790283203125, 0.525146484375, 0.571502685546875, 0.61785888671875, 0.664215087890625, 0.7105712890625, 0.756927490234375, 0.80328369140625, 0.849639892578125, 0.89599609375, 0.942352294921875, 0.98870849609375, 1.035064697265625, 1.0814208984375, 1.127777099609375, 1.17413330078125, 1.220489501953125, 1.266845703125, 1.313201904296875, 1.35955810546875, 1.405914306640625, 1.4522705078125, 1.498626708984375, 1.54498291015625, 1.591339111328125, 1.6376953125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 8.0, 9.0, 3.0, 10.0, 15.0, 13.0, 14.0, 22.0, 20.0, 28.0, 38.0, 39.0, 40.0, 41.0, 52.0, 54.0, 59.0, 51.0, 47.0, 42.0, 53.0, 42.0, 39.0, 49.0, 33.0, 35.0, 24.0, 26.0, 16.0, 16.0, 18.0, 11.0, 16.0, 5.0, 9.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12890625, -3.9705810546875, -3.812255859375, -3.6539306640625, -3.49560546875, -3.3372802734375, -3.178955078125, -3.0206298828125, -2.8623046875, -2.7039794921875, -2.545654296875, -2.3873291015625, -2.22900390625, -2.0706787109375, -1.912353515625, -1.7540283203125, -1.595703125, -1.4373779296875, -1.279052734375, -1.1207275390625, -0.96240234375, -0.8040771484375, -0.645751953125, -0.4874267578125, -0.3291015625, -0.1707763671875, -0.012451171875, 0.1458740234375, 0.30419921875, 0.4625244140625, 0.620849609375, 0.7791748046875, 0.9375, 1.0958251953125, 1.254150390625, 1.4124755859375, 1.57080078125, 1.7291259765625, 1.887451171875, 2.0457763671875, 2.2041015625, 2.3624267578125, 2.520751953125, 2.6790771484375, 2.83740234375, 2.9957275390625, 3.154052734375, 3.3123779296875, 3.470703125, 3.6290283203125, 3.787353515625, 3.9456787109375, 4.10400390625, 4.2623291015625, 4.420654296875, 4.5789794921875, 4.7373046875, 4.8956298828125, 5.053955078125, 5.2122802734375, 5.37060546875, 5.5289306640625, 5.687255859375, 5.8455810546875, 6.00390625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 7.0, 4.0, 12.0, 6.0, 12.0, 25.0, 25.0, 32.0, 25.0, 50.0, 62.0, 90.0, 125.0, 164.0, 229.0, 349.0, 468.0, 776.0, 1351.0, 2463.0, 5298.0, 13575.0, 45155.0, 919528.0, 36449.0, 11809.0, 4669.0, 2224.0, 1217.0, 745.0, 464.0, 333.0, 208.0, 161.0, 114.0, 88.0, 65.0, 40.0, 41.0, 27.0, 21.0, 13.0, 19.0, 7.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.787109375, -3.666595458984375, -3.54608154296875, -3.425567626953125, -3.3050537109375, -3.184539794921875, -3.06402587890625, -2.943511962890625, -2.822998046875, -2.702484130859375, -2.58197021484375, -2.461456298828125, -2.3409423828125, -2.220428466796875, -2.09991455078125, -1.979400634765625, -1.85888671875, -1.738372802734375, -1.61785888671875, -1.497344970703125, -1.3768310546875, -1.256317138671875, -1.13580322265625, -1.015289306640625, -0.894775390625, -0.774261474609375, -0.65374755859375, -0.533233642578125, -0.4127197265625, -0.292205810546875, -0.17169189453125, -0.051177978515625, 0.0693359375, 0.189849853515625, 0.31036376953125, 0.430877685546875, 0.5513916015625, 0.671905517578125, 0.79241943359375, 0.912933349609375, 1.033447265625, 1.153961181640625, 1.27447509765625, 1.394989013671875, 1.5155029296875, 1.636016845703125, 1.75653076171875, 1.877044677734375, 1.99755859375, 2.118072509765625, 2.23858642578125, 2.359100341796875, 2.4796142578125, 2.600128173828125, 2.72064208984375, 2.841156005859375, 2.961669921875, 3.082183837890625, 3.20269775390625, 3.323211669921875, 3.4437255859375, 3.564239501953125, 3.68475341796875, 3.805267333984375, 3.92578125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 8.0, 3.0, 5.0, 10.0, 9.0, 14.0, 12.0, 10.0, 22.0, 20.0, 19.0, 23.0, 28.0, 25.0, 30.0, 34.0, 34.0, 45.0, 32.0, 41.0, 41.0, 41.0, 48.0, 46.0, 52.0, 37.0, 27.0, 41.0, 29.0, 32.0, 24.0, 24.0, 26.0, 13.0, 22.0, 13.0, 18.0, 12.0, 8.0, 5.0, 7.0, 3.0, 5.0, 9.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.27734375, -2.193145751953125, -2.10894775390625, -2.024749755859375, -1.9405517578125, -1.856353759765625, -1.77215576171875, -1.687957763671875, -1.603759765625, -1.519561767578125, -1.43536376953125, -1.351165771484375, -1.2669677734375, -1.182769775390625, -1.09857177734375, -1.014373779296875, -0.93017578125, -0.845977783203125, -0.76177978515625, -0.677581787109375, -0.5933837890625, -0.509185791015625, -0.42498779296875, -0.340789794921875, -0.256591796875, -0.172393798828125, -0.08819580078125, -0.003997802734375, 0.0802001953125, 0.164398193359375, 0.24859619140625, 0.332794189453125, 0.4169921875, 0.501190185546875, 0.58538818359375, 0.669586181640625, 0.7537841796875, 0.837982177734375, 0.92218017578125, 1.006378173828125, 1.090576171875, 1.174774169921875, 1.25897216796875, 1.343170166015625, 1.4273681640625, 1.511566162109375, 1.59576416015625, 1.679962158203125, 1.76416015625, 1.848358154296875, 1.93255615234375, 2.016754150390625, 2.1009521484375, 2.185150146484375, 2.26934814453125, 2.353546142578125, 2.437744140625, 2.521942138671875, 2.60614013671875, 2.690338134765625, 2.7745361328125, 2.858734130859375, 2.94293212890625, 3.027130126953125, 3.111328125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 10.0, 8.0, 9.0, 19.0, 21.0, 23.0, 47.0, 61.0, 76.0, 99.0, 169.0, 297.0, 479.0, 713.0, 1373.0, 2688.0, 6183.0, 17842.0, 897476.0, 93730.0, 15807.0, 5725.0, 2550.0, 1198.0, 753.0, 404.0, 249.0, 160.0, 111.0, 78.0, 54.0, 39.0, 38.0, 18.0, 15.0, 8.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.3564453125, -0.345947265625, -0.33544921875, -0.324951171875, -0.314453125, -0.303955078125, -0.29345703125, -0.282958984375, -0.2724609375, -0.261962890625, -0.25146484375, -0.240966796875, -0.23046875, -0.219970703125, -0.20947265625, -0.198974609375, -0.1884765625, -0.177978515625, -0.16748046875, -0.156982421875, -0.146484375, -0.135986328125, -0.12548828125, -0.114990234375, -0.1044921875, -0.093994140625, -0.08349609375, -0.072998046875, -0.0625, -0.052001953125, -0.04150390625, -0.031005859375, -0.0205078125, -0.010009765625, 0.00048828125, 0.010986328125, 0.021484375, 0.031982421875, 0.04248046875, 0.052978515625, 0.0634765625, 0.073974609375, 0.08447265625, 0.094970703125, 0.10546875, 0.115966796875, 0.12646484375, 0.136962890625, 0.1474609375, 0.157958984375, 0.16845703125, 0.178955078125, 0.189453125, 0.199951171875, 0.21044921875, 0.220947265625, 0.2314453125, 0.241943359375, 0.25244140625, 0.262939453125, 0.2734375, 0.283935546875, 0.29443359375, 0.304931640625, 0.3154296875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 2.0, 2.0, 6.0, 3.0, 2.0, 1.0, 6.0, 10.0, 15.0, 21.0, 35.0, 51.0, 69.0, 79.0, 118.0, 117.0, 106.0, 97.0, 64.0, 48.0, 42.0, 18.0, 17.0, 12.0, 10.0, 6.0, 9.0, 7.0, 6.0, 3.0, 2.0, 6.0, 0.0, 0.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.761882781982422e-05, -8.457247167825699e-05, -8.152611553668976e-05, -7.847975939512253e-05, -7.54334032535553e-05, -7.238704711198807e-05, -6.934069097042084e-05, -6.629433482885361e-05, -6.324797868728638e-05, -6.020162254571915e-05, -5.7155266404151917e-05, -5.4108910262584686e-05, -5.1062554121017456e-05, -4.8016197979450226e-05, -4.4969841837882996e-05, -4.1923485696315765e-05, -3.8877129554748535e-05, -3.5830773413181305e-05, -3.2784417271614075e-05, -2.9738061130046844e-05, -2.6691704988479614e-05, -2.3645348846912384e-05, -2.0598992705345154e-05, -1.7552636563777924e-05, -1.4506280422210693e-05, -1.1459924280643463e-05, -8.413568139076233e-06, -5.367211997509003e-06, -2.3208558559417725e-06, 7.255002856254578e-07, 3.771856427192688e-06, 6.818212568759918e-06, 9.864568710327148e-06, 1.2910924851894379e-05, 1.595728099346161e-05, 1.900363713502884e-05, 2.204999327659607e-05, 2.50963494181633e-05, 2.814270555973053e-05, 3.118906170129776e-05, 3.423541784286499e-05, 3.728177398443222e-05, 4.032813012599945e-05, 4.337448626756668e-05, 4.642084240913391e-05, 4.946719855070114e-05, 5.251355469226837e-05, 5.55599108338356e-05, 5.860626697540283e-05, 6.165262311697006e-05, 6.469897925853729e-05, 6.774533540010452e-05, 7.079169154167175e-05, 7.383804768323898e-05, 7.688440382480621e-05, 7.993075996637344e-05, 8.297711610794067e-05, 8.60234722495079e-05, 8.906982839107513e-05, 9.211618453264236e-05, 9.51625406742096e-05, 9.820889681577682e-05, 0.00010125525295734406, 0.00010430160909891129, 0.00010734796524047852]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 7.0, 19.0, 13.0, 21.0, 39.0, 60.0, 133.0, 217.0, 387.0, 732.0, 1817.0, 4749.0, 13611.0, 43039.0, 173058.0, 575322.0, 171123.0, 42489.0, 13379.0, 4864.0, 1762.0, 769.0, 398.0, 206.0, 137.0, 69.0, 43.0, 17.0, 16.0, 20.0, 10.0, 7.0, 4.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2366943359375, -0.2300262451171875, -0.223358154296875, -0.2166900634765625, -0.21002197265625, -0.2033538818359375, -0.196685791015625, -0.1900177001953125, -0.183349609375, -0.1766815185546875, -0.170013427734375, -0.1633453369140625, -0.15667724609375, -0.1500091552734375, -0.143341064453125, -0.1366729736328125, -0.1300048828125, -0.1233367919921875, -0.116668701171875, -0.1100006103515625, -0.10333251953125, -0.0966644287109375, -0.089996337890625, -0.0833282470703125, -0.07666015625, -0.0699920654296875, -0.063323974609375, -0.0566558837890625, -0.04998779296875, -0.0433197021484375, -0.036651611328125, -0.0299835205078125, -0.0233154296875, -0.0166473388671875, -0.009979248046875, -0.0033111572265625, 0.00335693359375, 0.0100250244140625, 0.016693115234375, 0.0233612060546875, 0.030029296875, 0.0366973876953125, 0.043365478515625, 0.0500335693359375, 0.05670166015625, 0.0633697509765625, 0.070037841796875, 0.0767059326171875, 0.0833740234375, 0.0900421142578125, 0.096710205078125, 0.1033782958984375, 0.11004638671875, 0.1167144775390625, 0.123382568359375, 0.1300506591796875, 0.13671875, 0.1433868408203125, 0.150054931640625, 0.1567230224609375, 0.16339111328125, 0.1700592041015625, 0.176727294921875, 0.1833953857421875, 0.1900634765625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 7.0, 11.0, 10.0, 8.0, 6.0, 17.0, 14.0, 23.0, 31.0, 43.0, 63.0, 88.0, 117.0, 126.0, 120.0, 81.0, 66.0, 41.0, 37.0, 30.0, 17.0, 25.0, 10.0, 6.0, 5.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03521728515625, -0.03358268737792969, -0.031948089599609375, -0.030313491821289062, -0.02867889404296875, -0.027044296264648438, -0.025409698486328125, -0.023775100708007812, -0.0221405029296875, -0.020505905151367188, -0.018871307373046875, -0.017236709594726562, -0.01560211181640625, -0.013967514038085938, -0.012332916259765625, -0.010698318481445312, -0.009063720703125, -0.0074291229248046875, -0.005794525146484375, -0.0041599273681640625, -0.00252532958984375, -0.0008907318115234375, 0.000743865966796875, 0.0023784637451171875, 0.0040130615234375, 0.0056476593017578125, 0.007282257080078125, 0.008916854858398438, 0.01055145263671875, 0.012186050415039062, 0.013820648193359375, 0.015455245971679688, 0.01708984375, 0.018724441528320312, 0.020359039306640625, 0.021993637084960938, 0.02362823486328125, 0.025262832641601562, 0.026897430419921875, 0.028532028198242188, 0.0301666259765625, 0.03180122375488281, 0.033435821533203125, 0.03507041931152344, 0.03670501708984375, 0.03833961486816406, 0.039974212646484375, 0.04160881042480469, 0.043243408203125, 0.04487800598144531, 0.046512603759765625, 0.04814720153808594, 0.04978179931640625, 0.05141639709472656, 0.053050994873046875, 0.05468559265136719, 0.0563201904296875, 0.05795478820800781, 0.059589385986328125, 0.06122398376464844, 0.06285858154296875, 0.06449317932128906, 0.06612777709960938, 0.06776237487792969, 0.06939697265625]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 6.0, 13.0, 6.0, 12.0, 24.0, 25.0, 39.0, 38.0, 34.0, 35.0, 54.0, 69.0, 85.0, 84.0, 77.0, 63.0, 64.0, 55.0, 44.0, 33.0, 29.0, 20.0, 19.0, 15.0, 14.0, 7.0, 15.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9245996475219727, -3.7775754928588867, -3.6305510997772217, -3.4835267066955566, -3.3365025520324707, -3.1894783973693848, -3.0424540042877197, -2.8954296112060547, -2.7484054565429688, -2.601381301879883, -2.4543569087982178, -2.3073325157165527, -2.160308361053467, -2.013284206390381, -1.8662598133087158, -1.7192355394363403, -1.5722112655639648, -1.4251869916915894, -1.2781627178192139, -1.1311384439468384, -0.9841141700744629, -0.8370898962020874, -0.6900656223297119, -0.5430413484573364, -0.39601707458496094, -0.24899280071258545, -0.10196852684020996, 0.04505574703216553, 0.19208002090454102, 0.3391042947769165, 0.486128568649292, 0.6331528425216675, 0.7801775932312012, 0.9272018671035767, 1.0742261409759521, 1.2212504148483276, 1.3682746887207031, 1.5152989625930786, 1.662323236465454, 1.8093475103378296, 1.956371784210205, 2.103395938873291, 2.250420331954956, 2.397444725036621, 2.544468879699707, 2.691493034362793, 2.838517427444458, 2.985541820526123, 3.132565975189209, 3.279590129852295, 3.42661452293396, 3.573638916015625, 3.720663070678711, 3.867687225341797, 4.014711380004883, 4.161736011505127, 4.308760166168213, 4.455784320831299, 4.602808952331543, 4.749833106994629, 4.896857261657715, 5.043881416320801, 5.190905570983887, 5.337930202484131, 5.484954357147217]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 9.0, 10.0, 11.0, 12.0, 16.0, 16.0, 16.0, 20.0, 31.0, 31.0, 31.0, 38.0, 39.0, 51.0, 46.0, 48.0, 52.0, 33.0, 51.0, 44.0, 37.0, 47.0, 31.0, 42.0, 34.0, 31.0, 23.0, 27.0, 16.0, 19.0, 11.0, 20.0, 14.0, 12.0, 6.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7296736240386963, -3.5901713371276855, -3.450669288635254, -3.311167001724243, -3.1716649532318115, -3.032162666320801, -2.892660617828369, -2.7531583309173584, -2.6136560440063477, -2.474153757095337, -2.3346517086029053, -2.1951494216918945, -2.055647373199463, -1.9161450862884521, -1.776642918586731, -1.6371407508850098, -1.4976387023925781, -1.358136534690857, -1.2186343669891357, -1.079132080078125, -0.9396299719810486, -0.8001278042793274, -0.6606255769729614, -0.5211234092712402, -0.38162124156951904, -0.24211905896663666, -0.10261687636375427, 0.03688532114028931, 0.1763874888420105, 0.3158896565437317, 0.45539188385009766, 0.5948940515518188, 0.7343964576721191, 0.8738986253738403, 1.0134007930755615, 1.1529030799865723, 1.292405128479004, 1.4319074153900146, 1.5714095830917358, 1.710911750793457, 1.8504139184951782, 1.9899160861968994, 2.12941837310791, 2.268920421600342, 2.4084227085113525, 2.547924757003784, 2.687427043914795, 2.8269290924072266, 2.9664313793182373, 3.105933666229248, 3.2454357147216797, 3.3849380016326904, 3.524440050125122, 3.663942337036133, 3.8034443855285645, 3.942946672439575, 4.082448959350586, 4.221951007843018, 4.361453533172607, 4.500955581665039, 4.640457630157471, 4.779959678649902, 4.919462203979492, 5.058964252471924, 5.1984663009643555]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 17.0, 15.0, 13.0, 26.0, 47.0, 51.0, 88.0, 126.0, 207.0, 296.0, 365.0, 604.0, 958.0, 1454.0, 2183.0, 3358.0, 5138.0, 8022.0, 12628.0, 20080.0, 32709.0, 53116.0, 83924.0, 126823.0, 167109.0, 167398.0, 130304.0, 86551.0, 54085.0, 33140.0, 21116.0, 13191.0, 8148.0, 5332.0, 3390.0, 2256.0, 1411.0, 946.0, 607.0, 443.0, 291.0, 184.0, 146.0, 92.0, 58.0, 34.0, 23.0, 16.0, 10.0, 11.0, 3.0, 4.0, 3.0, 2.0, 4.0], "bins": [-3.474609375, -3.37249755859375, -3.2703857421875, -3.16827392578125, -3.066162109375, -2.96405029296875, -2.8619384765625, -2.75982666015625, -2.65771484375, -2.55560302734375, -2.4534912109375, -2.35137939453125, -2.249267578125, -2.14715576171875, -2.0450439453125, -1.94293212890625, -1.8408203125, -1.73870849609375, -1.6365966796875, -1.53448486328125, -1.432373046875, -1.33026123046875, -1.2281494140625, -1.12603759765625, -1.02392578125, -0.92181396484375, -0.8197021484375, -0.71759033203125, -0.615478515625, -0.51336669921875, -0.4112548828125, -0.30914306640625, -0.20703125, -0.10491943359375, -0.0028076171875, 0.09930419921875, 0.201416015625, 0.30352783203125, 0.4056396484375, 0.50775146484375, 0.60986328125, 0.71197509765625, 0.8140869140625, 0.91619873046875, 1.018310546875, 1.12042236328125, 1.2225341796875, 1.32464599609375, 1.4267578125, 1.52886962890625, 1.6309814453125, 1.73309326171875, 1.835205078125, 1.93731689453125, 2.0394287109375, 2.14154052734375, 2.24365234375, 2.34576416015625, 2.4478759765625, 2.54998779296875, 2.652099609375, 2.75421142578125, 2.8563232421875, 2.95843505859375, 3.060546875]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 5.0, 6.0, 11.0, 12.0, 11.0, 8.0, 8.0, 13.0, 20.0, 17.0, 24.0, 30.0, 32.0, 34.0, 39.0, 43.0, 37.0, 38.0, 50.0, 55.0, 37.0, 40.0, 46.0, 40.0, 35.0, 36.0, 32.0, 31.0, 36.0, 38.0, 21.0, 12.0, 14.0, 15.0, 17.0, 13.0, 15.0, 8.0, 10.0, 6.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.78515625, -3.6527099609375, -3.520263671875, -3.3878173828125, -3.25537109375, -3.1229248046875, -2.990478515625, -2.8580322265625, -2.7255859375, -2.5931396484375, -2.460693359375, -2.3282470703125, -2.19580078125, -2.0633544921875, -1.930908203125, -1.7984619140625, -1.666015625, -1.5335693359375, -1.401123046875, -1.2686767578125, -1.13623046875, -1.0037841796875, -0.871337890625, -0.7388916015625, -0.6064453125, -0.4739990234375, -0.341552734375, -0.2091064453125, -0.07666015625, 0.0557861328125, 0.188232421875, 0.3206787109375, 0.453125, 0.5855712890625, 0.718017578125, 0.8504638671875, 0.98291015625, 1.1153564453125, 1.247802734375, 1.3802490234375, 1.5126953125, 1.6451416015625, 1.777587890625, 1.9100341796875, 2.04248046875, 2.1749267578125, 2.307373046875, 2.4398193359375, 2.572265625, 2.7047119140625, 2.837158203125, 2.9696044921875, 3.10205078125, 3.2344970703125, 3.366943359375, 3.4993896484375, 3.6318359375, 3.7642822265625, 3.896728515625, 4.0291748046875, 4.16162109375, 4.2940673828125, 4.426513671875, 4.5589599609375, 4.69140625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 9.0, 18.0, 23.0, 43.0, 92.0, 114.0, 188.0, 284.0, 511.0, 819.0, 1416.0, 2407.0, 4280.0, 7597.0, 14025.0, 25484.0, 48260.0, 88861.0, 151586.0, 209724.0, 196636.0, 132484.0, 74727.0, 40310.0, 21626.0, 11694.0, 6570.0, 3678.0, 2100.0, 1254.0, 686.0, 403.0, 252.0, 146.0, 90.0, 52.0, 39.0, 21.0, 9.0, 13.0, 14.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.94921875, -3.82525634765625, -3.7012939453125, -3.57733154296875, -3.453369140625, -3.32940673828125, -3.2054443359375, -3.08148193359375, -2.95751953125, -2.83355712890625, -2.7095947265625, -2.58563232421875, -2.461669921875, -2.33770751953125, -2.2137451171875, -2.08978271484375, -1.9658203125, -1.84185791015625, -1.7178955078125, -1.59393310546875, -1.469970703125, -1.34600830078125, -1.2220458984375, -1.09808349609375, -0.97412109375, -0.85015869140625, -0.7261962890625, -0.60223388671875, -0.478271484375, -0.35430908203125, -0.2303466796875, -0.10638427734375, 0.017578125, 0.14154052734375, 0.2655029296875, 0.38946533203125, 0.513427734375, 0.63739013671875, 0.7613525390625, 0.88531494140625, 1.00927734375, 1.13323974609375, 1.2572021484375, 1.38116455078125, 1.505126953125, 1.62908935546875, 1.7530517578125, 1.87701416015625, 2.0009765625, 2.12493896484375, 2.2489013671875, 2.37286376953125, 2.496826171875, 2.62078857421875, 2.7447509765625, 2.86871337890625, 2.99267578125, 3.11663818359375, 3.2406005859375, 3.36456298828125, 3.488525390625, 3.61248779296875, 3.7364501953125, 3.86041259765625, 3.984375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 0.0, 5.0, 6.0, 7.0, 6.0, 9.0, 8.0, 12.0, 8.0, 10.0, 16.0, 21.0, 16.0, 37.0, 29.0, 35.0, 37.0, 46.0, 22.0, 31.0, 43.0, 39.0, 28.0, 40.0, 40.0, 41.0, 29.0, 44.0, 36.0, 34.0, 35.0, 35.0, 27.0, 26.0, 20.0, 20.0, 17.0, 20.0, 12.0, 7.0, 9.0, 8.0, 3.0, 10.0, 6.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.06640625, -1.99853515625, -1.9306640625, -1.86279296875, -1.794921875, -1.72705078125, -1.6591796875, -1.59130859375, -1.5234375, -1.45556640625, -1.3876953125, -1.31982421875, -1.251953125, -1.18408203125, -1.1162109375, -1.04833984375, -0.98046875, -0.91259765625, -0.8447265625, -0.77685546875, -0.708984375, -0.64111328125, -0.5732421875, -0.50537109375, -0.4375, -0.36962890625, -0.3017578125, -0.23388671875, -0.166015625, -0.09814453125, -0.0302734375, 0.03759765625, 0.10546875, 0.17333984375, 0.2412109375, 0.30908203125, 0.376953125, 0.44482421875, 0.5126953125, 0.58056640625, 0.6484375, 0.71630859375, 0.7841796875, 0.85205078125, 0.919921875, 0.98779296875, 1.0556640625, 1.12353515625, 1.19140625, 1.25927734375, 1.3271484375, 1.39501953125, 1.462890625, 1.53076171875, 1.5986328125, 1.66650390625, 1.734375, 1.80224609375, 1.8701171875, 1.93798828125, 2.005859375, 2.07373046875, 2.1416015625, 2.20947265625, 2.27734375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 2.0, 9.0, 9.0, 11.0, 21.0, 24.0, 42.0, 66.0, 85.0, 160.0, 215.0, 341.0, 538.0, 919.0, 1486.0, 2396.0, 4049.0, 7176.0, 12279.0, 21788.0, 38415.0, 67312.0, 113781.0, 172719.0, 200386.0, 160724.0, 103096.0, 60123.0, 34285.0, 19454.0, 10963.0, 6344.0, 3577.0, 2217.0, 1308.0, 829.0, 541.0, 284.0, 187.0, 139.0, 86.0, 55.0, 36.0, 15.0, 20.0, 19.0, 6.0, 6.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.0693359375, -1.0352783203125, -1.001220703125, -0.9671630859375, -0.93310546875, -0.8990478515625, -0.864990234375, -0.8309326171875, -0.796875, -0.7628173828125, -0.728759765625, -0.6947021484375, -0.66064453125, -0.6265869140625, -0.592529296875, -0.5584716796875, -0.5244140625, -0.4903564453125, -0.456298828125, -0.4222412109375, -0.38818359375, -0.3541259765625, -0.320068359375, -0.2860107421875, -0.251953125, -0.2178955078125, -0.183837890625, -0.1497802734375, -0.11572265625, -0.0816650390625, -0.047607421875, -0.0135498046875, 0.0205078125, 0.0545654296875, 0.088623046875, 0.1226806640625, 0.15673828125, 0.1907958984375, 0.224853515625, 0.2589111328125, 0.29296875, 0.3270263671875, 0.361083984375, 0.3951416015625, 0.42919921875, 0.4632568359375, 0.497314453125, 0.5313720703125, 0.5654296875, 0.5994873046875, 0.633544921875, 0.6676025390625, 0.70166015625, 0.7357177734375, 0.769775390625, 0.8038330078125, 0.837890625, 0.8719482421875, 0.906005859375, 0.9400634765625, 0.97412109375, 1.0081787109375, 1.042236328125, 1.0762939453125, 1.1103515625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 5.0, 6.0, 15.0, 17.0, 19.0, 25.0, 34.0, 36.0, 44.0, 55.0, 63.0, 79.0, 72.0, 64.0, 81.0, 78.0, 66.0, 54.0, 48.0, 31.0, 30.0, 23.0, 19.0, 14.0, 12.0, 8.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.626150131225586e-05, -9.336695075035095e-05, -9.047240018844604e-05, -8.757784962654114e-05, -8.468329906463623e-05, -8.178874850273132e-05, -7.889419794082642e-05, -7.599964737892151e-05, -7.31050968170166e-05, -7.02105462551117e-05, -6.731599569320679e-05, -6.442144513130188e-05, -6.152689456939697e-05, -5.8632344007492065e-05, -5.573779344558716e-05, -5.284324288368225e-05, -4.9948692321777344e-05, -4.7054141759872437e-05, -4.415959119796753e-05, -4.126504063606262e-05, -3.8370490074157715e-05, -3.547593951225281e-05, -3.25813889503479e-05, -2.9686838388442993e-05, -2.6792287826538086e-05, -2.389773726463318e-05, -2.100318670272827e-05, -1.8108636140823364e-05, -1.5214085578918457e-05, -1.231953501701355e-05, -9.424984455108643e-06, -6.530433893203735e-06, -3.635883331298828e-06, -7.413327693939209e-07, 2.1532177925109863e-06, 5.0477683544158936e-06, 7.9423189163208e-06, 1.0836869478225708e-05, 1.3731420040130615e-05, 1.6625970602035522e-05, 1.952052116394043e-05, 2.2415071725845337e-05, 2.5309622287750244e-05, 2.820417284965515e-05, 3.109872341156006e-05, 3.3993273973464966e-05, 3.688782453536987e-05, 3.978237509727478e-05, 4.267692565917969e-05, 4.5571476221084595e-05, 4.84660267829895e-05, 5.136057734489441e-05, 5.4255127906799316e-05, 5.7149678468704224e-05, 6.004422903060913e-05, 6.293877959251404e-05, 6.583333015441895e-05, 6.872788071632385e-05, 7.162243127822876e-05, 7.451698184013367e-05, 7.741153240203857e-05, 8.030608296394348e-05, 8.320063352584839e-05, 8.60951840877533e-05, 8.89897346496582e-05]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 18.0, 22.0, 37.0, 63.0, 114.0, 224.0, 352.0, 675.0, 1460.0, 2651.0, 5589.0, 11907.0, 25932.0, 57491.0, 125436.0, 237053.0, 268876.0, 165715.0, 78339.0, 35330.0, 16220.0, 7569.0, 3589.0, 1855.0, 886.0, 531.0, 274.0, 143.0, 74.0, 44.0, 30.0, 16.0, 13.0, 5.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.677734375, -1.63006591796875, -1.5823974609375, -1.53472900390625, -1.487060546875, -1.43939208984375, -1.3917236328125, -1.34405517578125, -1.29638671875, -1.24871826171875, -1.2010498046875, -1.15338134765625, -1.105712890625, -1.05804443359375, -1.0103759765625, -0.96270751953125, -0.9150390625, -0.86737060546875, -0.8197021484375, -0.77203369140625, -0.724365234375, -0.67669677734375, -0.6290283203125, -0.58135986328125, -0.53369140625, -0.48602294921875, -0.4383544921875, -0.39068603515625, -0.343017578125, -0.29534912109375, -0.2476806640625, -0.20001220703125, -0.15234375, -0.10467529296875, -0.0570068359375, -0.00933837890625, 0.038330078125, 0.08599853515625, 0.1336669921875, 0.18133544921875, 0.22900390625, 0.27667236328125, 0.3243408203125, 0.37200927734375, 0.419677734375, 0.46734619140625, 0.5150146484375, 0.56268310546875, 0.6103515625, 0.65802001953125, 0.7056884765625, 0.75335693359375, 0.801025390625, 0.84869384765625, 0.8963623046875, 0.94403076171875, 0.99169921875, 1.03936767578125, 1.0870361328125, 1.13470458984375, 1.182373046875, 1.23004150390625, 1.2777099609375, 1.32537841796875, 1.373046875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 6.0, 11.0, 12.0, 9.0, 9.0, 17.0, 18.0, 16.0, 32.0, 34.0, 27.0, 40.0, 41.0, 61.0, 58.0, 49.0, 47.0, 59.0, 55.0, 62.0, 55.0, 53.0, 50.0, 31.0, 31.0, 25.0, 17.0, 18.0, 13.0, 16.0, 8.0, 11.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.52783203125, -0.5130996704101562, -0.4983673095703125, -0.48363494873046875, -0.468902587890625, -0.45417022705078125, -0.4394378662109375, -0.42470550537109375, -0.40997314453125, -0.39524078369140625, -0.3805084228515625, -0.36577606201171875, -0.351043701171875, -0.33631134033203125, -0.3215789794921875, -0.30684661865234375, -0.2921142578125, -0.27738189697265625, -0.2626495361328125, -0.24791717529296875, -0.233184814453125, -0.21845245361328125, -0.2037200927734375, -0.18898773193359375, -0.17425537109375, -0.15952301025390625, -0.1447906494140625, -0.13005828857421875, -0.115325927734375, -0.10059356689453125, -0.0858612060546875, -0.07112884521484375, -0.056396484375, -0.04166412353515625, -0.0269317626953125, -0.01219940185546875, 0.002532958984375, 0.01726531982421875, 0.0319976806640625, 0.04673004150390625, 0.06146240234375, 0.07619476318359375, 0.0909271240234375, 0.10565948486328125, 0.120391845703125, 0.13512420654296875, 0.1498565673828125, 0.16458892822265625, 0.1793212890625, 0.19405364990234375, 0.2087860107421875, 0.22351837158203125, 0.238250732421875, 0.25298309326171875, 0.2677154541015625, 0.28244781494140625, 0.29718017578125, 0.31191253662109375, 0.3266448974609375, 0.34137725830078125, 0.356109619140625, 0.37084197998046875, 0.3855743408203125, 0.40030670166015625, 0.4150390625]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 3.0, 5.0, 4.0, 11.0, 6.0, 19.0, 22.0, 34.0, 34.0, 35.0, 45.0, 66.0, 74.0, 86.0, 75.0, 86.0, 81.0, 61.0, 67.0, 39.0, 35.0, 29.0, 22.0, 14.0, 7.0, 11.0, 7.0, 12.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9126126766204834, -3.7540371417999268, -3.59546160697937, -3.4368858337402344, -3.2783102989196777, -3.119734764099121, -2.9611592292785645, -2.802583694458008, -2.644008159637451, -2.4854326248168945, -2.326857089996338, -2.1682815551757812, -2.0097057819366455, -1.8511302471160889, -1.6925547122955322, -1.533979058265686, -1.3754034042358398, -1.2168278694152832, -1.058252215385437, -0.8996766805648804, -0.741101086139679, -0.5825254917144775, -0.4239499568939209, -0.2653743028640747, -0.10679876804351807, 0.051776811480522156, 0.21035239100456238, 0.3689279556274414, 0.5275035500526428, 0.6860791444778442, 0.8446546792984009, 1.003230333328247, 1.1618056297302246, 1.3203811645507812, 1.4789568185806274, 1.637532353401184, 1.7961080074310303, 1.954683542251587, 2.1132590770721436, 2.2718348503112793, 2.430410385131836, 2.5889859199523926, 2.747561454772949, 2.906136989593506, 3.0647127628326416, 3.2232882976531982, 3.381863832473755, 3.5404396057128906, 3.699014902114868, 3.857590436935425, 4.0161662101745605, 4.174741744995117, 4.333317279815674, 4.4918928146362305, 4.650468349456787, 4.809043884277344, 4.9676194190979, 5.126194953918457, 5.284770488739014, 5.44334602355957, 5.601921558380127, 5.760497093200684, 5.919073104858398, 6.077648639678955, 6.236224174499512]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 7.0, 9.0, 13.0, 9.0, 17.0, 20.0, 17.0, 25.0, 21.0, 39.0, 51.0, 42.0, 34.0, 46.0, 42.0, 60.0, 43.0, 35.0, 45.0, 44.0, 42.0, 52.0, 35.0, 40.0, 24.0, 37.0, 30.0, 16.0, 12.0, 28.0, 16.0, 8.0, 17.0, 9.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.346937656402588, -4.203651428222656, -4.060365200042725, -3.917079210281372, -3.7737929821014404, -3.630506753921509, -3.4872207641601562, -3.3439345359802246, -3.200648307800293, -3.0573620796203613, -2.9140758514404297, -2.770789861679077, -2.6275036334991455, -2.484217405319214, -2.3409314155578613, -2.1976451873779297, -2.054358959197998, -1.9110727310180664, -1.7677866220474243, -1.6245005130767822, -1.4812142848968506, -1.337928056716919, -1.1946419477462769, -1.0513558387756348, -0.9080696105957031, -0.7647834420204163, -0.6214972734451294, -0.47821110486984253, -0.33492493629455566, -0.1916387677192688, -0.048352599143981934, 0.09493350982666016, 0.23822021484375, 0.38150638341903687, 0.5247925519943237, 0.6680787205696106, 0.8113648891448975, 0.9546510577201843, 1.0979372262954712, 1.2412233352661133, 1.384509563446045, 1.5277957916259766, 1.6710819005966187, 1.8143680095672607, 1.9576542377471924, 2.100940465927124, 2.2442264556884766, 2.387512683868408, 2.53079891204834, 2.6740851402282715, 2.817371368408203, 2.9606573581695557, 3.1039435863494873, 3.247229814529419, 3.3905158042907715, 3.533802032470703, 3.6770882606506348, 3.8203744888305664, 3.963660717010498, 4.10694694519043, 4.250232696533203, 4.393518924713135, 4.536805152893066, 4.680091381072998, 4.82337760925293]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 5.0, 6.0, 5.0, 7.0, 9.0, 26.0, 19.0, 36.0, 64.0, 70.0, 112.0, 164.0, 256.0, 369.0, 541.0, 878.0, 1341.0, 2069.0, 3467.0, 5566.0, 9256.0, 16480.0, 29907.0, 58737.0, 122964.0, 279674.0, 666601.0, 1219235.0, 974967.0, 435615.0, 184783.0, 84682.0, 42368.0, 22175.0, 12390.0, 7200.0, 4353.0, 2721.0, 1684.0, 1135.0, 751.0, 489.0, 335.0, 238.0, 176.0, 119.0, 79.0, 45.0, 30.0, 38.0, 22.0, 14.0, 6.0, 8.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.1796875, -4.0343017578125, -3.888916015625, -3.7435302734375, -3.59814453125, -3.4527587890625, -3.307373046875, -3.1619873046875, -3.0166015625, -2.8712158203125, -2.725830078125, -2.5804443359375, -2.43505859375, -2.2896728515625, -2.144287109375, -1.9989013671875, -1.853515625, -1.7081298828125, -1.562744140625, -1.4173583984375, -1.27197265625, -1.1265869140625, -0.981201171875, -0.8358154296875, -0.6904296875, -0.5450439453125, -0.399658203125, -0.2542724609375, -0.10888671875, 0.0364990234375, 0.181884765625, 0.3272705078125, 0.47265625, 0.6180419921875, 0.763427734375, 0.9088134765625, 1.05419921875, 1.1995849609375, 1.344970703125, 1.4903564453125, 1.6357421875, 1.7811279296875, 1.926513671875, 2.0718994140625, 2.21728515625, 2.3626708984375, 2.508056640625, 2.6534423828125, 2.798828125, 2.9442138671875, 3.089599609375, 3.2349853515625, 3.38037109375, 3.5257568359375, 3.671142578125, 3.8165283203125, 3.9619140625, 4.1072998046875, 4.252685546875, 4.3980712890625, 4.54345703125, 4.6888427734375, 4.834228515625, 4.9796142578125, 5.125]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 8.0, 4.0, 10.0, 10.0, 12.0, 9.0, 16.0, 23.0, 22.0, 25.0, 33.0, 33.0, 40.0, 50.0, 37.0, 45.0, 52.0, 53.0, 40.0, 49.0, 31.0, 49.0, 54.0, 34.0, 34.0, 39.0, 27.0, 32.0, 27.0, 24.0, 16.0, 13.0, 13.0, 15.0, 10.0, 7.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.873046875, -2.776275634765625, -2.67950439453125, -2.582733154296875, -2.4859619140625, -2.389190673828125, -2.29241943359375, -2.195648193359375, -2.098876953125, -2.002105712890625, -1.90533447265625, -1.808563232421875, -1.7117919921875, -1.615020751953125, -1.51824951171875, -1.421478271484375, -1.32470703125, -1.227935791015625, -1.13116455078125, -1.034393310546875, -0.9376220703125, -0.840850830078125, -0.74407958984375, -0.647308349609375, -0.550537109375, -0.453765869140625, -0.35699462890625, -0.260223388671875, -0.1634521484375, -0.066680908203125, 0.03009033203125, 0.126861572265625, 0.2236328125, 0.320404052734375, 0.41717529296875, 0.513946533203125, 0.6107177734375, 0.707489013671875, 0.80426025390625, 0.901031494140625, 0.997802734375, 1.094573974609375, 1.19134521484375, 1.288116455078125, 1.3848876953125, 1.481658935546875, 1.57843017578125, 1.675201416015625, 1.77197265625, 1.868743896484375, 1.96551513671875, 2.062286376953125, 2.1590576171875, 2.255828857421875, 2.35260009765625, 2.449371337890625, 2.546142578125, 2.642913818359375, 2.73968505859375, 2.836456298828125, 2.9332275390625, 3.029998779296875, 3.12677001953125, 3.223541259765625, 3.3203125]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 9.0, 5.0, 12.0, 21.0, 35.0, 35.0, 67.0, 86.0, 140.0, 207.0, 319.0, 541.0, 828.0, 1211.0, 2038.0, 3299.0, 5287.0, 8861.0, 14884.0, 26075.0, 46734.0, 86307.0, 166180.0, 320350.0, 600111.0, 917352.0, 865495.0, 530032.0, 279434.0, 144577.0, 75922.0, 41155.0, 22996.0, 13237.0, 7884.0, 4675.0, 2819.0, 1819.0, 1135.0, 759.0, 471.0, 274.0, 227.0, 109.0, 97.0, 68.0, 39.0, 27.0, 19.0, 7.0, 6.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-3.814453125, -3.694854736328125, -3.57525634765625, -3.455657958984375, -3.3360595703125, -3.216461181640625, -3.09686279296875, -2.977264404296875, -2.857666015625, -2.738067626953125, -2.61846923828125, -2.498870849609375, -2.3792724609375, -2.259674072265625, -2.14007568359375, -2.020477294921875, -1.90087890625, -1.781280517578125, -1.66168212890625, -1.542083740234375, -1.4224853515625, -1.302886962890625, -1.18328857421875, -1.063690185546875, -0.944091796875, -0.824493408203125, -0.70489501953125, -0.585296630859375, -0.4656982421875, -0.346099853515625, -0.22650146484375, -0.106903076171875, 0.0126953125, 0.132293701171875, 0.25189208984375, 0.371490478515625, 0.4910888671875, 0.610687255859375, 0.73028564453125, 0.849884033203125, 0.969482421875, 1.089080810546875, 1.20867919921875, 1.328277587890625, 1.4478759765625, 1.567474365234375, 1.68707275390625, 1.806671142578125, 1.92626953125, 2.045867919921875, 2.16546630859375, 2.285064697265625, 2.4046630859375, 2.524261474609375, 2.64385986328125, 2.763458251953125, 2.883056640625, 3.002655029296875, 3.12225341796875, 3.241851806640625, 3.3614501953125, 3.481048583984375, 3.60064697265625, 3.720245361328125, 3.83984375]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 11.0, 11.0, 10.0, 20.0, 22.0, 41.0, 47.0, 52.0, 67.0, 68.0, 95.0, 108.0, 109.0, 141.0, 198.0, 228.0, 259.0, 206.0, 268.0, 243.0, 253.0, 240.0, 208.0, 177.0, 180.0, 139.0, 114.0, 109.0, 94.0, 67.0, 55.0, 59.0, 31.0, 19.0, 21.0, 17.0, 14.0, 19.0, 14.0, 3.0, 8.0, 3.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.3388671875, -1.2947845458984375, -1.250701904296875, -1.2066192626953125, -1.16253662109375, -1.1184539794921875, -1.074371337890625, -1.0302886962890625, -0.9862060546875, -0.9421234130859375, -0.898040771484375, -0.8539581298828125, -0.80987548828125, -0.7657928466796875, -0.721710205078125, -0.6776275634765625, -0.633544921875, -0.5894622802734375, -0.545379638671875, -0.5012969970703125, -0.45721435546875, -0.4131317138671875, -0.369049072265625, -0.3249664306640625, -0.2808837890625, -0.2368011474609375, -0.192718505859375, -0.1486358642578125, -0.10455322265625, -0.0604705810546875, -0.016387939453125, 0.0276947021484375, 0.07177734375, 0.1158599853515625, 0.159942626953125, 0.2040252685546875, 0.24810791015625, 0.2921905517578125, 0.336273193359375, 0.3803558349609375, 0.4244384765625, 0.4685211181640625, 0.512603759765625, 0.5566864013671875, 0.60076904296875, 0.6448516845703125, 0.688934326171875, 0.7330169677734375, 0.777099609375, 0.8211822509765625, 0.865264892578125, 0.9093475341796875, 0.95343017578125, 0.9975128173828125, 1.041595458984375, 1.0856781005859375, 1.1297607421875, 1.1738433837890625, 1.217926025390625, 1.2620086669921875, 1.30609130859375, 1.3501739501953125, 1.394256591796875, 1.4383392333984375, 1.482421875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 9.0, 10.0, 15.0, 13.0, 25.0, 25.0, 35.0, 31.0, 64.0, 69.0, 83.0, 62.0, 70.0, 84.0, 64.0, 71.0, 43.0, 39.0, 40.0, 28.0, 25.0, 20.0, 11.0, 15.0, 8.0, 12.0, 6.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7482481002807617, -3.602992057800293, -3.457735776901245, -3.3124794960021973, -3.1672234535217285, -3.0219674110412598, -2.876711130142212, -2.731454849243164, -2.5861988067626953, -2.4409427642822266, -2.2956864833831787, -2.150430202484131, -2.005174160003662, -1.8599179983139038, -1.7146618366241455, -1.5694056749343872, -1.424149513244629, -1.2788933515548706, -1.1336371898651123, -0.988381028175354, -0.8431248664855957, -0.6978687047958374, -0.5526125431060791, -0.4073563814163208, -0.2621002197265625, -0.1168440580368042, 0.0284121036529541, 0.1736682653427124, 0.3189244270324707, 0.464180588722229, 0.6094367504119873, 0.7546929121017456, 0.8999495506286621, 1.0452057123184204, 1.1904618740081787, 1.335718035697937, 1.4809741973876953, 1.6262303590774536, 1.771486520767212, 1.9167426824569702, 2.0619988441467285, 2.2072548866271973, 2.352511167526245, 2.497767448425293, 2.6430234909057617, 2.7882795333862305, 2.9335358142852783, 3.078792095184326, 3.224048137664795, 3.3693041801452637, 3.5145604610443115, 3.6598167419433594, 3.805072784423828, 3.950328826904297, 4.095584869384766, 4.240841388702393, 4.386097431182861, 4.53135347366333, 4.676609992980957, 4.821866035461426, 4.9671220779418945, 5.112378120422363, 5.257634162902832, 5.402890682220459, 5.548146724700928]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 12.0, 6.0, 5.0, 9.0, 16.0, 23.0, 22.0, 26.0, 37.0, 38.0, 49.0, 42.0, 35.0, 48.0, 40.0, 45.0, 66.0, 38.0, 43.0, 55.0, 38.0, 45.0, 45.0, 32.0, 27.0, 36.0, 23.0, 18.0, 16.0, 14.0, 10.0, 13.0, 7.0, 8.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.070130825042725, -3.9240877628326416, -3.7780447006225586, -3.6320016384124756, -3.4859585762023926, -3.3399152755737305, -3.1938722133636475, -3.0478291511535645, -2.9017860889434814, -2.7557430267333984, -2.6096999645233154, -2.4636569023132324, -2.3176136016845703, -2.1715707778930664, -2.0255274772644043, -1.8794844150543213, -1.7334413528442383, -1.5873982906341553, -1.4413552284240723, -1.2953120470046997, -1.1492689847946167, -1.0032259225845337, -0.8571828007698059, -0.7111396789550781, -0.5650966167449951, -0.4190535247325897, -0.2730104327201843, -0.12696734070777893, 0.019075751304626465, 0.16511881351470947, 0.31116193532943726, 0.45720505714416504, 0.6032476425170898, 0.7492907047271729, 0.8953338265419006, 1.0413769483566284, 1.1874200105667114, 1.3334630727767944, 1.479506254196167, 1.62554931640625, 1.771592378616333, 1.917635440826416, 2.063678503036499, 2.209721565246582, 2.355764865875244, 2.501807689666748, 2.64785099029541, 2.793894052505493, 2.939937114715576, 3.085980176925659, 3.232023239135742, 3.378066301345825, 3.524109363555908, 3.6701526641845703, 3.8161957263946533, 3.9622387886047363, 4.108282089233398, 4.2543253898620605, 4.4003682136535645, 4.546411514282227, 4.6924543380737305, 4.838497638702393, 4.9845404624938965, 5.130583763122559, 5.2766265869140625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 8.0, 20.0, 25.0, 33.0, 39.0, 63.0, 80.0, 122.0, 174.0, 269.0, 370.0, 548.0, 778.0, 1267.0, 1854.0, 2925.0, 4779.0, 7535.0, 11985.0, 19596.0, 33539.0, 58974.0, 112510.0, 221812.0, 257555.0, 139120.0, 72041.0, 39741.0, 22891.0, 13980.0, 8653.0, 5355.0, 3547.0, 2179.0, 1316.0, 889.0, 658.0, 425.0, 271.0, 194.0, 128.0, 99.0, 58.0, 46.0, 34.0, 27.0, 18.0, 12.0, 8.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.2216796875, -1.183685302734375, -1.14569091796875, -1.107696533203125, -1.0697021484375, -1.031707763671875, -0.99371337890625, -0.955718994140625, -0.917724609375, -0.879730224609375, -0.84173583984375, -0.803741455078125, -0.7657470703125, -0.727752685546875, -0.68975830078125, -0.651763916015625, -0.61376953125, -0.575775146484375, -0.53778076171875, -0.499786376953125, -0.4617919921875, -0.423797607421875, -0.38580322265625, -0.347808837890625, -0.309814453125, -0.271820068359375, -0.23382568359375, -0.195831298828125, -0.1578369140625, -0.119842529296875, -0.08184814453125, -0.043853759765625, -0.005859375, 0.032135009765625, 0.07012939453125, 0.108123779296875, 0.1461181640625, 0.184112548828125, 0.22210693359375, 0.260101318359375, 0.298095703125, 0.336090087890625, 0.37408447265625, 0.412078857421875, 0.4500732421875, 0.488067626953125, 0.52606201171875, 0.564056396484375, 0.60205078125, 0.640045166015625, 0.67803955078125, 0.716033935546875, 0.7540283203125, 0.792022705078125, 0.83001708984375, 0.868011474609375, 0.906005859375, 0.944000244140625, 0.98199462890625, 1.019989013671875, 1.0579833984375, 1.095977783203125, 1.13397216796875, 1.171966552734375, 1.2099609375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 6.0, 7.0, 6.0, 11.0, 9.0, 15.0, 23.0, 22.0, 33.0, 35.0, 38.0, 45.0, 40.0, 37.0, 54.0, 46.0, 47.0, 45.0, 53.0, 48.0, 50.0, 40.0, 31.0, 42.0, 40.0, 33.0, 22.0, 22.0, 20.0, 19.0, 7.0, 11.0, 14.0, 10.0, 8.0, 3.0, 5.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.48828125, -4.341552734375, -4.19482421875, -4.048095703125, -3.9013671875, -3.754638671875, -3.60791015625, -3.461181640625, -3.314453125, -3.167724609375, -3.02099609375, -2.874267578125, -2.7275390625, -2.580810546875, -2.43408203125, -2.287353515625, -2.140625, -1.993896484375, -1.84716796875, -1.700439453125, -1.5537109375, -1.406982421875, -1.26025390625, -1.113525390625, -0.966796875, -0.820068359375, -0.67333984375, -0.526611328125, -0.3798828125, -0.233154296875, -0.08642578125, 0.060302734375, 0.20703125, 0.353759765625, 0.50048828125, 0.647216796875, 0.7939453125, 0.940673828125, 1.08740234375, 1.234130859375, 1.380859375, 1.527587890625, 1.67431640625, 1.821044921875, 1.9677734375, 2.114501953125, 2.26123046875, 2.407958984375, 2.5546875, 2.701416015625, 2.84814453125, 2.994873046875, 3.1416015625, 3.288330078125, 3.43505859375, 3.581787109375, 3.728515625, 3.875244140625, 4.02197265625, 4.168701171875, 4.3154296875, 4.462158203125, 4.60888671875, 4.755615234375, 4.90234375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 15.0, 8.0, 13.0, 12.0, 16.0, 26.0, 33.0, 28.0, 38.0, 77.0, 82.0, 96.0, 148.0, 196.0, 303.0, 393.0, 625.0, 860.0, 1527.0, 2868.0, 5970.0, 14852.0, 45207.0, 913227.0, 37109.0, 12793.0, 5184.0, 2563.0, 1422.0, 840.0, 584.0, 372.0, 267.0, 177.0, 150.0, 126.0, 72.0, 69.0, 52.0, 36.0, 20.0, 21.0, 18.0, 12.0, 11.0, 5.0, 10.0, 6.0, 2.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-3.39453125, -3.2864990234375, -3.178466796875, -3.0704345703125, -2.96240234375, -2.8543701171875, -2.746337890625, -2.6383056640625, -2.5302734375, -2.4222412109375, -2.314208984375, -2.2061767578125, -2.09814453125, -1.9901123046875, -1.882080078125, -1.7740478515625, -1.666015625, -1.5579833984375, -1.449951171875, -1.3419189453125, -1.23388671875, -1.1258544921875, -1.017822265625, -0.9097900390625, -0.8017578125, -0.6937255859375, -0.585693359375, -0.4776611328125, -0.36962890625, -0.2615966796875, -0.153564453125, -0.0455322265625, 0.0625, 0.1705322265625, 0.278564453125, 0.3865966796875, 0.49462890625, 0.6026611328125, 0.710693359375, 0.8187255859375, 0.9267578125, 1.0347900390625, 1.142822265625, 1.2508544921875, 1.35888671875, 1.4669189453125, 1.574951171875, 1.6829833984375, 1.791015625, 1.8990478515625, 2.007080078125, 2.1151123046875, 2.22314453125, 2.3311767578125, 2.439208984375, 2.5472412109375, 2.6552734375, 2.7633056640625, 2.871337890625, 2.9793701171875, 3.08740234375, 3.1954345703125, 3.303466796875, 3.4114990234375, 3.51953125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 3.0, 8.0, 11.0, 16.0, 11.0, 16.0, 22.0, 23.0, 16.0, 13.0, 26.0, 33.0, 37.0, 34.0, 45.0, 41.0, 45.0, 43.0, 59.0, 36.0, 41.0, 41.0, 37.0, 35.0, 35.0, 28.0, 30.0, 31.0, 35.0, 30.0, 20.0, 13.0, 11.0, 14.0, 14.0, 10.0, 11.0, 4.0, 7.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0], "bins": [-2.873046875, -2.791656494140625, -2.71026611328125, -2.628875732421875, -2.5474853515625, -2.466094970703125, -2.38470458984375, -2.303314208984375, -2.221923828125, -2.140533447265625, -2.05914306640625, -1.977752685546875, -1.8963623046875, -1.814971923828125, -1.73358154296875, -1.652191162109375, -1.57080078125, -1.489410400390625, -1.40802001953125, -1.326629638671875, -1.2452392578125, -1.163848876953125, -1.08245849609375, -1.001068115234375, -0.919677734375, -0.838287353515625, -0.75689697265625, -0.675506591796875, -0.5941162109375, -0.512725830078125, -0.43133544921875, -0.349945068359375, -0.2685546875, -0.187164306640625, -0.10577392578125, -0.024383544921875, 0.0570068359375, 0.138397216796875, 0.21978759765625, 0.301177978515625, 0.382568359375, 0.463958740234375, 0.54534912109375, 0.626739501953125, 0.7081298828125, 0.789520263671875, 0.87091064453125, 0.952301025390625, 1.03369140625, 1.115081787109375, 1.19647216796875, 1.277862548828125, 1.3592529296875, 1.440643310546875, 1.52203369140625, 1.603424072265625, 1.684814453125, 1.766204833984375, 1.84759521484375, 1.928985595703125, 2.0103759765625, 2.091766357421875, 2.17315673828125, 2.254547119140625, 2.3359375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 11.0, 9.0, 17.0, 15.0, 22.0, 29.0, 46.0, 59.0, 69.0, 120.0, 157.0, 239.0, 327.0, 481.0, 695.0, 1101.0, 1932.0, 3494.0, 7146.0, 18011.0, 74786.0, 898606.0, 22426.0, 8655.0, 4154.0, 2173.0, 1305.0, 816.0, 486.0, 347.0, 227.0, 154.0, 107.0, 89.0, 66.0, 39.0, 40.0, 25.0, 18.0, 16.0, 13.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20361328125, -0.19661903381347656, -0.18962478637695312, -0.1826305389404297, -0.17563629150390625, -0.1686420440673828, -0.16164779663085938, -0.15465354919433594, -0.1476593017578125, -0.14066505432128906, -0.13367080688476562, -0.1266765594482422, -0.11968231201171875, -0.11268806457519531, -0.10569381713867188, -0.09869956970214844, -0.091705322265625, -0.08471107482910156, -0.07771682739257812, -0.07072257995605469, -0.06372833251953125, -0.05673408508300781, -0.049739837646484375, -0.04274559020996094, -0.0357513427734375, -0.028757095336914062, -0.021762847900390625, -0.014768600463867188, -0.00777435302734375, -0.0007801055908203125, 0.006214141845703125, 0.013208389282226562, 0.02020263671875, 0.027196884155273438, 0.034191131591796875, 0.04118537902832031, 0.04817962646484375, 0.05517387390136719, 0.062168121337890625, 0.06916236877441406, 0.0761566162109375, 0.08315086364746094, 0.09014511108398438, 0.09713935852050781, 0.10413360595703125, 0.11112785339355469, 0.11812210083007812, 0.12511634826660156, 0.132110595703125, 0.13910484313964844, 0.14609909057617188, 0.1530933380126953, 0.16008758544921875, 0.1670818328857422, 0.17407608032226562, 0.18107032775878906, 0.1880645751953125, 0.19505882263183594, 0.20205307006835938, 0.2090473175048828, 0.21604156494140625, 0.2230358123779297, 0.23003005981445312, 0.23702430725097656, 0.2440185546875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 3.0, 3.0, 5.0, 11.0, 3.0, 12.0, 17.0, 17.0, 21.0, 30.0, 37.0, 42.0, 41.0, 37.0, 43.0, 59.0, 56.0, 83.0, 55.0, 53.0, 55.0, 42.0, 37.0, 37.0, 34.0, 29.0, 31.0, 19.0, 17.0, 14.0, 13.0, 9.0, 12.0, 6.0, 4.0, 5.0, 0.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.869699478149414e-05, -4.728604108095169e-05, -4.587508738040924e-05, -4.446413367986679e-05, -4.305317997932434e-05, -4.164222627878189e-05, -4.023127257823944e-05, -3.882031887769699e-05, -3.740936517715454e-05, -3.599841147661209e-05, -3.458745777606964e-05, -3.317650407552719e-05, -3.176555037498474e-05, -3.035459667444229e-05, -2.894364297389984e-05, -2.753268927335739e-05, -2.612173557281494e-05, -2.471078187227249e-05, -2.329982817173004e-05, -2.188887447118759e-05, -2.047792077064514e-05, -1.906696707010269e-05, -1.7656013369560242e-05, -1.6245059669017792e-05, -1.4834105968475342e-05, -1.3423152267932892e-05, -1.2012198567390442e-05, -1.0601244866847992e-05, -9.190291166305542e-06, -7.779337465763092e-06, -6.368383765220642e-06, -4.957430064678192e-06, -3.546476364135742e-06, -2.1355226635932922e-06, -7.245689630508423e-07, 6.863847374916077e-07, 2.0973384380340576e-06, 3.5082921385765076e-06, 4.9192458391189575e-06, 6.3301995396614075e-06, 7.741153240203857e-06, 9.152106940746307e-06, 1.0563060641288757e-05, 1.1974014341831207e-05, 1.3384968042373657e-05, 1.4795921742916107e-05, 1.6206875443458557e-05, 1.7617829144001007e-05, 1.9028782844543457e-05, 2.0439736545085907e-05, 2.1850690245628357e-05, 2.3261643946170807e-05, 2.4672597646713257e-05, 2.6083551347255707e-05, 2.7494505047798157e-05, 2.8905458748340607e-05, 3.0316412448883057e-05, 3.1727366149425507e-05, 3.3138319849967957e-05, 3.4549273550510406e-05, 3.5960227251052856e-05, 3.7371180951595306e-05, 3.8782134652137756e-05, 4.0193088352680206e-05, 4.1604042053222656e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 9.0, 10.0, 8.0, 29.0, 28.0, 33.0, 59.0, 81.0, 115.0, 140.0, 276.0, 365.0, 598.0, 912.0, 1254.0, 1962.0, 3065.0, 4801.0, 7545.0, 12485.0, 21336.0, 38383.0, 76220.0, 168670.0, 323483.0, 195923.0, 87057.0, 43481.0, 23565.0, 13579.0, 8375.0, 5115.0, 3278.0, 2119.0, 1402.0, 938.0, 624.0, 403.0, 253.0, 195.0, 121.0, 92.0, 49.0, 37.0, 26.0, 15.0, 20.0, 7.0, 6.0, 8.0, 4.0, 2.0, 0.0, 3.0], "bins": [-0.08807373046875, -0.08552742004394531, -0.08298110961914062, -0.08043479919433594, -0.07788848876953125, -0.07534217834472656, -0.07279586791992188, -0.07024955749511719, -0.0677032470703125, -0.06515693664550781, -0.06261062622070312, -0.06006431579589844, -0.05751800537109375, -0.05497169494628906, -0.052425384521484375, -0.04987907409667969, -0.047332763671875, -0.04478645324707031, -0.042240142822265625, -0.03969383239746094, -0.03714752197265625, -0.03460121154785156, -0.032054901123046875, -0.029508590698242188, -0.0269622802734375, -0.024415969848632812, -0.021869659423828125, -0.019323348999023438, -0.01677703857421875, -0.014230728149414062, -0.011684417724609375, -0.009138107299804688, -0.006591796875, -0.0040454864501953125, -0.001499176025390625, 0.0010471343994140625, 0.00359344482421875, 0.0061397552490234375, 0.008686065673828125, 0.011232376098632812, 0.0137786865234375, 0.016324996948242188, 0.018871307373046875, 0.021417617797851562, 0.02396392822265625, 0.026510238647460938, 0.029056549072265625, 0.03160285949707031, 0.034149169921875, 0.03669548034667969, 0.039241790771484375, 0.04178810119628906, 0.04433441162109375, 0.04688072204589844, 0.049427032470703125, 0.05197334289550781, 0.0545196533203125, 0.05706596374511719, 0.059612274169921875, 0.06215858459472656, 0.06470489501953125, 0.06725120544433594, 0.06979751586914062, 0.07234382629394531, 0.07489013671875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 4.0, 3.0, 3.0, 6.0, 3.0, 6.0, 8.0, 11.0, 19.0, 26.0, 28.0, 43.0, 50.0, 68.0, 76.0, 120.0, 108.0, 90.0, 74.0, 70.0, 37.0, 31.0, 25.0, 16.0, 14.0, 3.0, 6.0, 10.0, 10.0, 5.0, 7.0, 3.0, 4.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0234222412109375, -0.022532224655151367, -0.021642208099365234, -0.0207521915435791, -0.01986217498779297, -0.018972158432006836, -0.018082141876220703, -0.01719212532043457, -0.016302108764648438, -0.015412092208862305, -0.014522075653076172, -0.013632059097290039, -0.012742042541503906, -0.011852025985717773, -0.01096200942993164, -0.010071992874145508, -0.009181976318359375, -0.008291959762573242, -0.007401943206787109, -0.0065119266510009766, -0.005621910095214844, -0.004731893539428711, -0.003841876983642578, -0.0029518604278564453, -0.0020618438720703125, -0.0011718273162841797, -0.0002818107604980469, 0.0006082057952880859, 0.0014982223510742188, 0.0023882389068603516, 0.0032782554626464844, 0.004168272018432617, 0.00505828857421875, 0.005948305130004883, 0.006838321685791016, 0.0077283382415771484, 0.008618354797363281, 0.009508371353149414, 0.010398387908935547, 0.01128840446472168, 0.012178421020507812, 0.013068437576293945, 0.013958454132080078, 0.014848470687866211, 0.015738487243652344, 0.016628503799438477, 0.01751852035522461, 0.018408536911010742, 0.019298553466796875, 0.020188570022583008, 0.02107858657836914, 0.021968603134155273, 0.022858619689941406, 0.02374863624572754, 0.024638652801513672, 0.025528669357299805, 0.026418685913085938, 0.02730870246887207, 0.028198719024658203, 0.029088735580444336, 0.02997875213623047, 0.0308687686920166, 0.031758785247802734, 0.03264880180358887, 0.033538818359375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 7.0, 12.0, 9.0, 18.0, 14.0, 22.0, 34.0, 24.0, 39.0, 66.0, 70.0, 78.0, 59.0, 72.0, 75.0, 65.0, 67.0, 48.0, 39.0, 39.0, 29.0, 24.0, 21.0, 12.0, 11.0, 9.0, 10.0, 4.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.647355556488037, -3.5052900314331055, -3.363224506378174, -3.221158981323242, -3.0790934562683105, -2.937027931213379, -2.7949624061584473, -2.6528968811035156, -2.510831356048584, -2.3687658309936523, -2.2267003059387207, -2.084634780883789, -1.9425692558288574, -1.8005037307739258, -1.6584383249282837, -1.516372799873352, -1.37430739402771, -1.2322418689727783, -1.0901763439178467, -0.9481108784675598, -0.8060453534126282, -0.6639798283576965, -0.5219143629074097, -0.379848837852478, -0.2377833127975464, -0.09571780264377594, 0.04634770750999451, 0.18841320276260376, 0.3304787278175354, 0.47254425287246704, 0.6146097183227539, 0.7566752433776855, 0.8987407684326172, 1.0408062934875488, 1.1828718185424805, 1.324937343597412, 1.4670028686523438, 1.6090683937072754, 1.7511337995529175, 1.8931993246078491, 2.0352649688720703, 2.177330493927002, 2.3193960189819336, 2.4614615440368652, 2.603527069091797, 2.7455925941467285, 2.88765811920166, 3.029723644256592, 3.1717889308929443, 3.313854455947876, 3.4559199810028076, 3.5979855060577393, 3.740051031112671, 3.8821165561676025, 4.024181842803955, 4.166247367858887, 4.308312892913818, 4.45037841796875, 4.592443943023682, 4.734509468078613, 4.876574993133545, 5.018640518188477, 5.160706043243408, 5.30277156829834, 5.4448370933532715]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 9.0, 10.0, 7.0, 4.0, 10.0, 16.0, 23.0, 21.0, 29.0, 36.0, 38.0, 52.0, 40.0, 35.0, 46.0, 43.0, 43.0, 70.0, 35.0, 44.0, 53.0, 40.0, 42.0, 51.0, 27.0, 29.0, 35.0, 23.0, 16.0, 16.0, 14.0, 9.0, 14.0, 7.0, 7.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0280022621154785, -3.8825244903564453, -3.737046718597412, -3.591569185256958, -3.446091413497925, -3.3006136417388916, -3.1551361083984375, -3.0096583366394043, -2.864180564880371, -2.718702793121338, -2.5732250213623047, -2.4277474880218506, -2.2822697162628174, -2.136791944503784, -1.9913142919540405, -1.8458366394042969, -1.7003588676452637, -1.5548810958862305, -1.4094034433364868, -1.2639257907867432, -1.11844801902771, -0.9729703068733215, -0.8274925947189331, -0.6820149421691895, -0.5365371704101562, -0.3910594582557678, -0.2455817461013794, -0.10010403394699097, 0.04537367820739746, 0.1908513903617859, 0.3363291025161743, 0.48180675506591797, 0.627284049987793, 0.7727617621421814, 0.9182394742965698, 1.0637171268463135, 1.2091948986053467, 1.3546726703643799, 1.5001503229141235, 1.6456279754638672, 1.7911057472229004, 1.9365835189819336, 2.082061290740967, 2.227538824081421, 2.373016595840454, 2.5184943675994873, 2.6639719009399414, 2.8094496726989746, 2.954927444458008, 3.100405216217041, 3.245882987976074, 3.3913605213165283, 3.5368382930755615, 3.6823160648345947, 3.827793598175049, 3.973271369934082, 4.118749141693115, 4.264226913452148, 4.409704685211182, 4.555182456970215, 4.70065975189209, 4.846137523651123, 4.991615295410156, 5.1370930671691895, 5.282570838928223]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 11.0, 23.0, 19.0, 44.0, 64.0, 91.0, 154.0, 225.0, 367.0, 647.0, 1100.0, 1934.0, 3449.0, 6373.0, 11890.0, 22756.0, 44650.0, 88788.0, 164692.0, 236409.0, 209054.0, 124222.0, 63298.0, 32254.0, 16478.0, 8690.0, 4579.0, 2591.0, 1517.0, 896.0, 452.0, 318.0, 193.0, 128.0, 66.0, 43.0, 30.0, 18.0, 11.0, 9.0, 4.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.0, -4.85614013671875, -4.7122802734375, -4.56842041015625, -4.424560546875, -4.28070068359375, -4.1368408203125, -3.99298095703125, -3.84912109375, -3.70526123046875, -3.5614013671875, -3.41754150390625, -3.273681640625, -3.12982177734375, -2.9859619140625, -2.84210205078125, -2.6982421875, -2.55438232421875, -2.4105224609375, -2.26666259765625, -2.122802734375, -1.97894287109375, -1.8350830078125, -1.69122314453125, -1.54736328125, -1.40350341796875, -1.2596435546875, -1.11578369140625, -0.971923828125, -0.82806396484375, -0.6842041015625, -0.54034423828125, -0.396484375, -0.25262451171875, -0.1087646484375, 0.03509521484375, 0.178955078125, 0.32281494140625, 0.4666748046875, 0.61053466796875, 0.75439453125, 0.89825439453125, 1.0421142578125, 1.18597412109375, 1.329833984375, 1.47369384765625, 1.6175537109375, 1.76141357421875, 1.9052734375, 2.04913330078125, 2.1929931640625, 2.33685302734375, 2.480712890625, 2.62457275390625, 2.7684326171875, 2.91229248046875, 3.05615234375, 3.20001220703125, 3.3438720703125, 3.48773193359375, 3.631591796875, 3.77545166015625, 3.9193115234375, 4.06317138671875, 4.20703125]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 11.0, 7.0, 10.0, 9.0, 13.0, 16.0, 31.0, 34.0, 32.0, 39.0, 43.0, 51.0, 45.0, 53.0, 50.0, 45.0, 43.0, 62.0, 39.0, 45.0, 39.0, 40.0, 43.0, 22.0, 31.0, 35.0, 25.0, 16.0, 15.0, 11.0, 11.0, 9.0, 4.0, 5.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.884765625, -3.736968994140625, -3.58917236328125, -3.441375732421875, -3.2935791015625, -3.145782470703125, -2.99798583984375, -2.850189208984375, -2.702392578125, -2.554595947265625, -2.40679931640625, -2.259002685546875, -2.1112060546875, -1.963409423828125, -1.81561279296875, -1.667816162109375, -1.52001953125, -1.372222900390625, -1.22442626953125, -1.076629638671875, -0.9288330078125, -0.781036376953125, -0.63323974609375, -0.485443115234375, -0.337646484375, -0.189849853515625, -0.04205322265625, 0.105743408203125, 0.2535400390625, 0.401336669921875, 0.54913330078125, 0.696929931640625, 0.8447265625, 0.992523193359375, 1.14031982421875, 1.288116455078125, 1.4359130859375, 1.583709716796875, 1.73150634765625, 1.879302978515625, 2.027099609375, 2.174896240234375, 2.32269287109375, 2.470489501953125, 2.6182861328125, 2.766082763671875, 2.91387939453125, 3.061676025390625, 3.20947265625, 3.357269287109375, 3.50506591796875, 3.652862548828125, 3.8006591796875, 3.948455810546875, 4.09625244140625, 4.244049072265625, 4.391845703125, 4.539642333984375, 4.68743896484375, 4.835235595703125, 4.9830322265625, 5.130828857421875, 5.27862548828125, 5.426422119140625, 5.57421875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 7.0, 8.0, 13.0, 27.0, 35.0, 44.0, 83.0, 136.0, 197.0, 345.0, 514.0, 868.0, 1423.0, 2342.0, 3900.0, 6777.0, 11606.0, 20322.0, 35926.0, 62784.0, 106730.0, 162748.0, 194532.0, 168355.0, 112127.0, 66759.0, 38435.0, 21478.0, 12420.0, 7059.0, 4185.0, 2508.0, 1444.0, 923.0, 542.0, 371.0, 215.0, 139.0, 91.0, 49.0, 33.0, 22.0, 15.0, 12.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.666015625, -3.549835205078125, -3.43365478515625, -3.317474365234375, -3.2012939453125, -3.085113525390625, -2.96893310546875, -2.852752685546875, -2.736572265625, -2.620391845703125, -2.50421142578125, -2.388031005859375, -2.2718505859375, -2.155670166015625, -2.03948974609375, -1.923309326171875, -1.80712890625, -1.690948486328125, -1.57476806640625, -1.458587646484375, -1.3424072265625, -1.226226806640625, -1.11004638671875, -0.993865966796875, -0.877685546875, -0.761505126953125, -0.64532470703125, -0.529144287109375, -0.4129638671875, -0.296783447265625, -0.18060302734375, -0.064422607421875, 0.0517578125, 0.167938232421875, 0.28411865234375, 0.400299072265625, 0.5164794921875, 0.632659912109375, 0.74884033203125, 0.865020751953125, 0.981201171875, 1.097381591796875, 1.21356201171875, 1.329742431640625, 1.4459228515625, 1.562103271484375, 1.67828369140625, 1.794464111328125, 1.91064453125, 2.026824951171875, 2.14300537109375, 2.259185791015625, 2.3753662109375, 2.491546630859375, 2.60772705078125, 2.723907470703125, 2.840087890625, 2.956268310546875, 3.07244873046875, 3.188629150390625, 3.3048095703125, 3.420989990234375, 3.53717041015625, 3.653350830078125, 3.76953125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 9.0, 9.0, 4.0, 4.0, 5.0, 15.0, 13.0, 15.0, 26.0, 26.0, 25.0, 28.0, 25.0, 34.0, 38.0, 52.0, 32.0, 25.0, 44.0, 38.0, 48.0, 45.0, 42.0, 39.0, 37.0, 40.0, 40.0, 32.0, 30.0, 25.0, 27.0, 24.0, 21.0, 29.0, 17.0, 8.0, 9.0, 8.0, 5.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.34375, -2.268829345703125, -2.19390869140625, -2.118988037109375, -2.0440673828125, -1.969146728515625, -1.89422607421875, -1.819305419921875, -1.744384765625, -1.669464111328125, -1.59454345703125, -1.519622802734375, -1.4447021484375, -1.369781494140625, -1.29486083984375, -1.219940185546875, -1.14501953125, -1.070098876953125, -0.99517822265625, -0.920257568359375, -0.8453369140625, -0.770416259765625, -0.69549560546875, -0.620574951171875, -0.545654296875, -0.470733642578125, -0.39581298828125, -0.320892333984375, -0.2459716796875, -0.171051025390625, -0.09613037109375, -0.021209716796875, 0.0537109375, 0.128631591796875, 0.20355224609375, 0.278472900390625, 0.3533935546875, 0.428314208984375, 0.50323486328125, 0.578155517578125, 0.653076171875, 0.727996826171875, 0.80291748046875, 0.877838134765625, 0.9527587890625, 1.027679443359375, 1.10260009765625, 1.177520751953125, 1.25244140625, 1.327362060546875, 1.40228271484375, 1.477203369140625, 1.5521240234375, 1.627044677734375, 1.70196533203125, 1.776885986328125, 1.851806640625, 1.926727294921875, 2.00164794921875, 2.076568603515625, 2.1514892578125, 2.226409912109375, 2.30133056640625, 2.376251220703125, 2.451171875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 7.0, 3.0, 6.0, 18.0, 25.0, 34.0, 55.0, 57.0, 109.0, 149.0, 220.0, 300.0, 500.0, 855.0, 1327.0, 2199.0, 3909.0, 6940.0, 12626.0, 24118.0, 48695.0, 100593.0, 196734.0, 264902.0, 189341.0, 96739.0, 46712.0, 23073.0, 12148.0, 6662.0, 3733.0, 2228.0, 1326.0, 781.0, 459.0, 329.0, 203.0, 120.0, 93.0, 64.0, 46.0, 34.0, 28.0, 23.0, 9.0, 14.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.302734375, -1.259979248046875, -1.21722412109375, -1.174468994140625, -1.1317138671875, -1.088958740234375, -1.04620361328125, -1.003448486328125, -0.960693359375, -0.917938232421875, -0.87518310546875, -0.832427978515625, -0.7896728515625, -0.746917724609375, -0.70416259765625, -0.661407470703125, -0.61865234375, -0.575897216796875, -0.53314208984375, -0.490386962890625, -0.4476318359375, -0.404876708984375, -0.36212158203125, -0.319366455078125, -0.276611328125, -0.233856201171875, -0.19110107421875, -0.148345947265625, -0.1055908203125, -0.062835693359375, -0.02008056640625, 0.022674560546875, 0.0654296875, 0.108184814453125, 0.15093994140625, 0.193695068359375, 0.2364501953125, 0.279205322265625, 0.32196044921875, 0.364715576171875, 0.407470703125, 0.450225830078125, 0.49298095703125, 0.535736083984375, 0.5784912109375, 0.621246337890625, 0.66400146484375, 0.706756591796875, 0.74951171875, 0.792266845703125, 0.83502197265625, 0.877777099609375, 0.9205322265625, 0.963287353515625, 1.00604248046875, 1.048797607421875, 1.091552734375, 1.134307861328125, 1.17706298828125, 1.219818115234375, 1.2625732421875, 1.305328369140625, 1.34808349609375, 1.390838623046875, 1.43359375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 5.0, 8.0, 4.0, 4.0, 4.0, 12.0, 15.0, 20.0, 19.0, 28.0, 31.0, 38.0, 51.0, 53.0, 62.0, 61.0, 75.0, 65.0, 64.0, 56.0, 58.0, 56.0, 45.0, 34.0, 26.0, 22.0, 20.0, 17.0, 13.0, 13.0, 6.0, 8.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.706880569458008e-05, -7.452908903360367e-05, -7.198937237262726e-05, -6.944965571165085e-05, -6.690993905067444e-05, -6.437022238969803e-05, -6.183050572872162e-05, -5.929078906774521e-05, -5.67510724067688e-05, -5.421135574579239e-05, -5.167163908481598e-05, -4.913192242383957e-05, -4.659220576286316e-05, -4.405248910188675e-05, -4.151277244091034e-05, -3.897305577993393e-05, -3.643333911895752e-05, -3.389362245798111e-05, -3.13539057970047e-05, -2.881418913602829e-05, -2.627447247505188e-05, -2.373475581407547e-05, -2.119503915309906e-05, -1.865532249212265e-05, -1.611560583114624e-05, -1.357588917016983e-05, -1.103617250919342e-05, -8.49645584821701e-06, -5.956739187240601e-06, -3.4170225262641907e-06, -8.773058652877808e-07, 1.6624107956886292e-06, 4.202127456665039e-06, 6.741844117641449e-06, 9.281560778617859e-06, 1.1821277439594269e-05, 1.4360994100570679e-05, 1.690071076154709e-05, 1.94404274225235e-05, 2.198014408349991e-05, 2.451986074447632e-05, 2.7059577405452728e-05, 2.9599294066429138e-05, 3.213901072740555e-05, 3.467872738838196e-05, 3.721844404935837e-05, 3.975816071033478e-05, 4.229787737131119e-05, 4.48375940322876e-05, 4.737731069326401e-05, 4.991702735424042e-05, 5.245674401521683e-05, 5.499646067619324e-05, 5.753617733716965e-05, 6.007589399814606e-05, 6.261561065912247e-05, 6.515532732009888e-05, 6.769504398107529e-05, 7.02347606420517e-05, 7.27744773030281e-05, 7.531419396400452e-05, 7.785391062498093e-05, 8.039362728595734e-05, 8.293334394693375e-05, 8.547306060791016e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 5.0, 9.0, 11.0, 18.0, 26.0, 42.0, 63.0, 105.0, 145.0, 284.0, 409.0, 742.0, 1162.0, 2027.0, 3535.0, 6260.0, 11411.0, 21504.0, 40423.0, 78399.0, 144977.0, 226045.0, 219139.0, 136175.0, 73042.0, 37626.0, 19901.0, 10847.0, 5970.0, 3339.0, 2005.0, 1148.0, 673.0, 404.0, 249.0, 159.0, 84.0, 64.0, 57.0, 27.0, 18.0, 7.0, 12.0, 8.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1484375, -1.111328125, -1.07421875, -1.037109375, -1.0, -0.962890625, -0.92578125, -0.888671875, -0.8515625, -0.814453125, -0.77734375, -0.740234375, -0.703125, -0.666015625, -0.62890625, -0.591796875, -0.5546875, -0.517578125, -0.48046875, -0.443359375, -0.40625, -0.369140625, -0.33203125, -0.294921875, -0.2578125, -0.220703125, -0.18359375, -0.146484375, -0.109375, -0.072265625, -0.03515625, 0.001953125, 0.0390625, 0.076171875, 0.11328125, 0.150390625, 0.1875, 0.224609375, 0.26171875, 0.298828125, 0.3359375, 0.373046875, 0.41015625, 0.447265625, 0.484375, 0.521484375, 0.55859375, 0.595703125, 0.6328125, 0.669921875, 0.70703125, 0.744140625, 0.78125, 0.818359375, 0.85546875, 0.892578125, 0.9296875, 0.966796875, 1.00390625, 1.041015625, 1.078125, 1.115234375, 1.15234375, 1.189453125, 1.2265625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 2.0, 2.0, 8.0, 5.0, 7.0, 3.0, 4.0, 11.0, 21.0, 19.0, 24.0, 30.0, 37.0, 43.0, 50.0, 75.0, 80.0, 91.0, 83.0, 81.0, 73.0, 61.0, 47.0, 27.0, 21.0, 18.0, 17.0, 8.0, 12.0, 8.0, 10.0, 5.0, 1.0, 2.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.60107421875, -0.5833358764648438, -0.5655975341796875, -0.5478591918945312, -0.530120849609375, -0.5123825073242188, -0.4946441650390625, -0.47690582275390625, -0.45916748046875, -0.44142913818359375, -0.4236907958984375, -0.40595245361328125, -0.388214111328125, -0.37047576904296875, -0.3527374267578125, -0.33499908447265625, -0.3172607421875, -0.29952239990234375, -0.2817840576171875, -0.26404571533203125, -0.246307373046875, -0.22856903076171875, -0.2108306884765625, -0.19309234619140625, -0.17535400390625, -0.15761566162109375, -0.1398773193359375, -0.12213897705078125, -0.104400634765625, -0.08666229248046875, -0.0689239501953125, -0.05118560791015625, -0.033447265625, -0.01570892333984375, 0.0020294189453125, 0.01976776123046875, 0.037506103515625, 0.05524444580078125, 0.0729827880859375, 0.09072113037109375, 0.10845947265625, 0.12619781494140625, 0.1439361572265625, 0.16167449951171875, 0.179412841796875, 0.19715118408203125, 0.2148895263671875, 0.23262786865234375, 0.2503662109375, 0.26810455322265625, 0.2858428955078125, 0.30358123779296875, 0.321319580078125, 0.33905792236328125, 0.3567962646484375, 0.37453460693359375, 0.39227294921875, 0.41001129150390625, 0.4277496337890625, 0.44548797607421875, 0.463226318359375, 0.48096466064453125, 0.4987030029296875, 0.5164413452148438, 0.5341796875]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 3.0, 5.0, 7.0, 14.0, 12.0, 14.0, 22.0, 24.0, 36.0, 41.0, 53.0, 62.0, 62.0, 79.0, 79.0, 70.0, 69.0, 56.0, 53.0, 45.0, 34.0, 38.0, 17.0, 24.0, 17.0, 15.0, 13.0, 7.0, 8.0, 2.0, 7.0, 3.0, 2.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.137364387512207, -2.995353937149048, -2.8533434867858887, -2.7113330364227295, -2.5693225860595703, -2.427312135696411, -2.285301685333252, -2.1432912349700928, -2.0012807846069336, -1.8592703342437744, -1.7172598838806152, -1.575249433517456, -1.4332389831542969, -1.2912285327911377, -1.1492180824279785, -1.0072076320648193, -0.8651971817016602, -0.723186731338501, -0.5811762809753418, -0.4391658306121826, -0.29715538024902344, -0.15514492988586426, -0.013134479522705078, 0.1288759708404541, 0.2708864212036133, 0.41289687156677246, 0.5549073219299316, 0.6969177722930908, 0.83892822265625, 0.9809386730194092, 1.1229491233825684, 1.2649595737457275, 1.406970500946045, 1.548980951309204, 1.6909914016723633, 1.8330018520355225, 1.9750123023986816, 2.117022752761841, 2.259033203125, 2.401043653488159, 2.5430541038513184, 2.6850645542144775, 2.8270750045776367, 2.969085454940796, 3.111095905303955, 3.2531063556671143, 3.3951168060302734, 3.5371272563934326, 3.679137706756592, 3.821148157119751, 3.96315860748291, 4.105169296264648, 4.2471795082092285, 4.389189720153809, 4.531200408935547, 4.673211097717285, 4.815221309661865, 4.957231521606445, 5.099242210388184, 5.241252899169922, 5.383263111114502, 5.525273323059082, 5.66728401184082, 5.809294700622559, 5.951304912567139]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 10.0, 4.0, 12.0, 10.0, 9.0, 15.0, 14.0, 26.0, 24.0, 31.0, 37.0, 34.0, 33.0, 40.0, 34.0, 53.0, 30.0, 44.0, 34.0, 56.0, 46.0, 40.0, 50.0, 57.0, 33.0, 24.0, 22.0, 25.0, 21.0, 29.0, 24.0, 12.0, 10.0, 12.0, 9.0, 10.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.7395386695861816, -3.6085987091064453, -3.477658748626709, -3.3467185497283936, -3.2157785892486572, -3.084838628768921, -2.9538984298706055, -2.822958469390869, -2.692018508911133, -2.5610785484313965, -2.43013858795166, -2.2991983890533447, -2.1682584285736084, -2.037318468093872, -1.9063783884048462, -1.7754383087158203, -1.644498348236084, -1.5135583877563477, -1.3826183080673218, -1.251678228378296, -1.1207382678985596, -0.9897982478141785, -0.8588582277297974, -0.7279182076454163, -0.5969781875610352, -0.46603816747665405, -0.33509814739227295, -0.20415812730789185, -0.07321810722351074, 0.05772191286087036, 0.18866193294525146, 0.31960195302963257, 0.45054149627685547, 0.5814815163612366, 0.7124215364456177, 0.8433615565299988, 0.9743015766143799, 1.1052415370941162, 1.236181616783142, 1.367121696472168, 1.4980616569519043, 1.6290016174316406, 1.7599416971206665, 1.8908817768096924, 2.0218217372894287, 2.152761697769165, 2.2837018966674805, 2.414641857147217, 2.545581817626953, 2.6765217781066895, 2.807461738586426, 2.938401937484741, 3.0693418979644775, 3.200281858444214, 3.3312220573425293, 3.4621620178222656, 3.593101978302002, 3.7240419387817383, 3.8549818992614746, 3.98592209815979, 4.1168622970581055, 4.247802257537842, 4.378742218017578, 4.5096821784973145, 4.640622138977051]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 8.0, 9.0, 13.0, 19.0, 26.0, 47.0, 63.0, 96.0, 120.0, 160.0, 288.0, 411.0, 652.0, 994.0, 1569.0, 2412.0, 3927.0, 6589.0, 11121.0, 20024.0, 37654.0, 75757.0, 163596.0, 383974.0, 883771.0, 1257264.0, 752318.0, 313336.0, 136285.0, 64485.0, 33188.0, 18014.0, 10183.0, 6022.0, 3615.0, 2162.0, 1356.0, 911.0, 556.0, 440.0, 270.0, 173.0, 142.0, 79.0, 45.0, 47.0, 30.0, 22.0, 16.0, 8.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0], "bins": [-4.63671875, -4.49359130859375, -4.3504638671875, -4.20733642578125, -4.064208984375, -3.92108154296875, -3.7779541015625, -3.63482666015625, -3.49169921875, -3.34857177734375, -3.2054443359375, -3.06231689453125, -2.919189453125, -2.77606201171875, -2.6329345703125, -2.48980712890625, -2.3466796875, -2.20355224609375, -2.0604248046875, -1.91729736328125, -1.774169921875, -1.63104248046875, -1.4879150390625, -1.34478759765625, -1.20166015625, -1.05853271484375, -0.9154052734375, -0.77227783203125, -0.629150390625, -0.48602294921875, -0.3428955078125, -0.19976806640625, -0.056640625, 0.08648681640625, 0.2296142578125, 0.37274169921875, 0.515869140625, 0.65899658203125, 0.8021240234375, 0.94525146484375, 1.08837890625, 1.23150634765625, 1.3746337890625, 1.51776123046875, 1.660888671875, 1.80401611328125, 1.9471435546875, 2.09027099609375, 2.2333984375, 2.37652587890625, 2.5196533203125, 2.66278076171875, 2.805908203125, 2.94903564453125, 3.0921630859375, 3.23529052734375, 3.37841796875, 3.52154541015625, 3.6646728515625, 3.80780029296875, 3.950927734375, 4.09405517578125, 4.2371826171875, 4.38031005859375, 4.5234375]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 8.0, 5.0, 8.0, 5.0, 10.0, 8.0, 12.0, 18.0, 23.0, 16.0, 22.0, 29.0, 39.0, 33.0, 34.0, 33.0, 44.0, 38.0, 39.0, 38.0, 39.0, 55.0, 40.0, 53.0, 54.0, 36.0, 35.0, 25.0, 29.0, 30.0, 26.0, 12.0, 20.0, 15.0, 13.0, 14.0, 6.0, 12.0, 5.0, 9.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.76171875, -2.676849365234375, -2.59197998046875, -2.507110595703125, -2.4222412109375, -2.337371826171875, -2.25250244140625, -2.167633056640625, -2.082763671875, -1.997894287109375, -1.91302490234375, -1.828155517578125, -1.7432861328125, -1.658416748046875, -1.57354736328125, -1.488677978515625, -1.40380859375, -1.318939208984375, -1.23406982421875, -1.149200439453125, -1.0643310546875, -0.979461669921875, -0.89459228515625, -0.809722900390625, -0.724853515625, -0.639984130859375, -0.55511474609375, -0.470245361328125, -0.3853759765625, -0.300506591796875, -0.21563720703125, -0.130767822265625, -0.0458984375, 0.038970947265625, 0.12384033203125, 0.208709716796875, 0.2935791015625, 0.378448486328125, 0.46331787109375, 0.548187255859375, 0.633056640625, 0.717926025390625, 0.80279541015625, 0.887664794921875, 0.9725341796875, 1.057403564453125, 1.14227294921875, 1.227142333984375, 1.31201171875, 1.396881103515625, 1.48175048828125, 1.566619873046875, 1.6514892578125, 1.736358642578125, 1.82122802734375, 1.906097412109375, 1.990966796875, 2.075836181640625, 2.16070556640625, 2.245574951171875, 2.3304443359375, 2.415313720703125, 2.50018310546875, 2.585052490234375, 2.669921875]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 7.0, 6.0, 10.0, 9.0, 13.0, 32.0, 56.0, 67.0, 133.0, 231.0, 312.0, 490.0, 852.0, 1439.0, 2380.0, 4195.0, 7511.0, 13322.0, 25312.0, 49090.0, 99678.0, 209317.0, 446244.0, 857130.0, 1070373.0, 718355.0, 354988.0, 166809.0, 79712.0, 40002.0, 20797.0, 10995.0, 6005.0, 3478.0, 1940.0, 1191.0, 679.0, 449.0, 224.0, 152.0, 108.0, 80.0, 35.0, 33.0, 14.0, 18.0, 9.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.20703125, -4.07281494140625, -3.9385986328125, -3.80438232421875, -3.670166015625, -3.53594970703125, -3.4017333984375, -3.26751708984375, -3.13330078125, -2.99908447265625, -2.8648681640625, -2.73065185546875, -2.596435546875, -2.46221923828125, -2.3280029296875, -2.19378662109375, -2.0595703125, -1.92535400390625, -1.7911376953125, -1.65692138671875, -1.522705078125, -1.38848876953125, -1.2542724609375, -1.12005615234375, -0.98583984375, -0.85162353515625, -0.7174072265625, -0.58319091796875, -0.448974609375, -0.31475830078125, -0.1805419921875, -0.04632568359375, 0.087890625, 0.22210693359375, 0.3563232421875, 0.49053955078125, 0.624755859375, 0.75897216796875, 0.8931884765625, 1.02740478515625, 1.16162109375, 1.29583740234375, 1.4300537109375, 1.56427001953125, 1.698486328125, 1.83270263671875, 1.9669189453125, 2.10113525390625, 2.2353515625, 2.36956787109375, 2.5037841796875, 2.63800048828125, 2.772216796875, 2.90643310546875, 3.0406494140625, 3.17486572265625, 3.30908203125, 3.44329833984375, 3.5775146484375, 3.71173095703125, 3.845947265625, 3.98016357421875, 4.1143798828125, 4.24859619140625, 4.3828125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 1.0, 10.0, 10.0, 18.0, 10.0, 18.0, 31.0, 30.0, 36.0, 55.0, 61.0, 81.0, 70.0, 106.0, 118.0, 159.0, 157.0, 200.0, 194.0, 230.0, 233.0, 264.0, 236.0, 227.0, 236.0, 186.0, 187.0, 128.0, 131.0, 110.0, 90.0, 69.0, 72.0, 48.0, 43.0, 34.0, 37.0, 33.0, 26.0, 16.0, 9.0, 12.0, 11.0, 8.0, 9.0, 6.0, 2.0, 3.0, 0.0, 3.0, 5.0, 1.0, 1.0, 2.0], "bins": [-1.271484375, -1.231964111328125, -1.19244384765625, -1.152923583984375, -1.1134033203125, -1.073883056640625, -1.03436279296875, -0.994842529296875, -0.955322265625, -0.915802001953125, -0.87628173828125, -0.836761474609375, -0.7972412109375, -0.757720947265625, -0.71820068359375, -0.678680419921875, -0.63916015625, -0.599639892578125, -0.56011962890625, -0.520599365234375, -0.4810791015625, -0.441558837890625, -0.40203857421875, -0.362518310546875, -0.322998046875, -0.283477783203125, -0.24395751953125, -0.204437255859375, -0.1649169921875, -0.125396728515625, -0.08587646484375, -0.046356201171875, -0.0068359375, 0.032684326171875, 0.07220458984375, 0.111724853515625, 0.1512451171875, 0.190765380859375, 0.23028564453125, 0.269805908203125, 0.309326171875, 0.348846435546875, 0.38836669921875, 0.427886962890625, 0.4674072265625, 0.506927490234375, 0.54644775390625, 0.585968017578125, 0.62548828125, 0.665008544921875, 0.70452880859375, 0.744049072265625, 0.7835693359375, 0.823089599609375, 0.86260986328125, 0.902130126953125, 0.941650390625, 0.981170654296875, 1.02069091796875, 1.060211181640625, 1.0997314453125, 1.139251708984375, 1.17877197265625, 1.218292236328125, 1.2578125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 5.0, 3.0, 3.0, 6.0, 2.0, 6.0, 3.0, 16.0, 10.0, 17.0, 21.0, 28.0, 37.0, 38.0, 36.0, 55.0, 62.0, 81.0, 81.0, 76.0, 69.0, 71.0, 49.0, 45.0, 19.0, 29.0, 34.0, 20.0, 16.0, 19.0, 13.0, 9.0, 11.0, 3.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1793346405029297, -3.0423638820648193, -2.905393123626709, -2.7684223651885986, -2.6314516067504883, -2.494481086730957, -2.3575103282928467, -2.2205395698547363, -2.083568811416626, -1.9465980529785156, -1.8096272945404053, -1.6726566553115845, -1.5356858968734741, -1.3987151384353638, -1.261744499206543, -1.1247737407684326, -0.9878029823303223, -0.8508322238922119, -0.7138615250587463, -0.5768908262252808, -0.4399200677871704, -0.30294930934906006, -0.16597861051559448, -0.029007911682128906, 0.10796284675598145, 0.2449335753917694, 0.3819043040275574, 0.518875002861023, 0.6558457612991333, 0.7928165197372437, 0.9297872185707092, 1.0667579174041748, 1.203728199005127, 1.3406989574432373, 1.4776697158813477, 1.6146403551101685, 1.7516111135482788, 1.8885818719863892, 2.02555251121521, 2.1625232696533203, 2.2994940280914307, 2.436464786529541, 2.5734355449676514, 2.7104063034057617, 2.847376823425293, 2.9843478202819824, 3.1213183403015137, 3.258289098739624, 3.3952598571777344, 3.5322306156158447, 3.669201374053955, 3.8061721324920654, 3.943142890930176, 4.080113410949707, 4.2170844078063965, 4.354054927825928, 4.491025924682617, 4.627996444702148, 4.764967441558838, 4.901937961578369, 5.038908958435059, 5.17587947845459, 5.312850475311279, 5.4498209953308105, 5.586791515350342]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 3.0, 5.0, 3.0, 7.0, 9.0, 7.0, 9.0, 8.0, 15.0, 13.0, 16.0, 27.0, 23.0, 29.0, 26.0, 40.0, 33.0, 38.0, 40.0, 41.0, 40.0, 38.0, 38.0, 37.0, 36.0, 33.0, 43.0, 34.0, 47.0, 34.0, 23.0, 26.0, 15.0, 37.0, 16.0, 18.0, 13.0, 15.0, 8.0, 9.0, 11.0, 4.0, 8.0, 4.0, 3.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.26567006111145, -3.1519546508789062, -3.0382392406463623, -2.9245238304138184, -2.8108084201812744, -2.6970930099487305, -2.5833775997161865, -2.4696621894836426, -2.3559467792510986, -2.2422313690185547, -2.1285159587860107, -2.014800548553467, -1.9010851383209229, -1.787369728088379, -1.673654317855835, -1.559938907623291, -1.446223497390747, -1.3325080871582031, -1.2187926769256592, -1.1050772666931152, -0.9913618564605713, -0.8776464462280273, -0.7639310359954834, -0.6502156257629395, -0.5365002155303955, -0.42278480529785156, -0.3090693950653076, -0.19535398483276367, -0.08163857460021973, 0.03207683563232422, 0.14579224586486816, 0.2595076560974121, 0.37322282791137695, 0.4869382381439209, 0.6006536483764648, 0.7143690586090088, 0.8280844688415527, 0.9417998790740967, 1.0555152893066406, 1.1692306995391846, 1.2829461097717285, 1.3966615200042725, 1.5103769302368164, 1.6240923404693604, 1.7378077507019043, 1.8515231609344482, 1.9652385711669922, 2.078953981399536, 2.19266939163208, 2.306384801864624, 2.420100212097168, 2.533815622329712, 2.647531032562256, 2.7612464427948, 2.8749618530273438, 2.9886772632598877, 3.1023926734924316, 3.2161080837249756, 3.3298234939575195, 3.4435389041900635, 3.5572543144226074, 3.6709697246551514, 3.7846851348876953, 3.8984005451202393, 4.012115955352783]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 8.0, 15.0, 15.0, 29.0, 66.0, 63.0, 97.0, 149.0, 179.0, 258.0, 390.0, 542.0, 682.0, 1002.0, 1460.0, 1984.0, 2979.0, 4337.0, 6361.0, 9820.0, 14846.0, 23887.0, 39851.0, 69736.0, 131600.0, 244743.0, 220193.0, 113728.0, 61028.0, 35662.0, 21377.0, 13484.0, 8850.0, 6004.0, 3872.0, 2800.0, 1871.0, 1311.0, 938.0, 646.0, 492.0, 347.0, 249.0, 169.0, 150.0, 99.0, 62.0, 29.0, 31.0, 25.0, 15.0, 9.0, 6.0, 7.0, 1.0, 0.0, 2.0], "bins": [-1.0654296875, -1.0330352783203125, -1.000640869140625, -0.9682464599609375, -0.93585205078125, -0.9034576416015625, -0.871063232421875, -0.8386688232421875, -0.8062744140625, -0.7738800048828125, -0.741485595703125, -0.7090911865234375, -0.67669677734375, -0.6443023681640625, -0.611907958984375, -0.5795135498046875, -0.547119140625, -0.5147247314453125, -0.482330322265625, -0.4499359130859375, -0.41754150390625, -0.3851470947265625, -0.352752685546875, -0.3203582763671875, -0.2879638671875, -0.2555694580078125, -0.223175048828125, -0.1907806396484375, -0.15838623046875, -0.1259918212890625, -0.093597412109375, -0.0612030029296875, -0.02880859375, 0.0035858154296875, 0.035980224609375, 0.0683746337890625, 0.10076904296875, 0.1331634521484375, 0.165557861328125, 0.1979522705078125, 0.2303466796875, 0.2627410888671875, 0.295135498046875, 0.3275299072265625, 0.35992431640625, 0.3923187255859375, 0.424713134765625, 0.4571075439453125, 0.489501953125, 0.5218963623046875, 0.554290771484375, 0.5866851806640625, 0.61907958984375, 0.6514739990234375, 0.683868408203125, 0.7162628173828125, 0.7486572265625, 0.7810516357421875, 0.813446044921875, 0.8458404541015625, 0.87823486328125, 0.9106292724609375, 0.943023681640625, 0.9754180908203125, 1.0078125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 5.0, 9.0, 7.0, 6.0, 9.0, 11.0, 9.0, 21.0, 17.0, 15.0, 12.0, 24.0, 29.0, 28.0, 37.0, 48.0, 46.0, 35.0, 38.0, 44.0, 39.0, 44.0, 43.0, 42.0, 38.0, 27.0, 31.0, 43.0, 25.0, 23.0, 25.0, 22.0, 16.0, 27.0, 11.0, 18.0, 13.0, 9.0, 11.0, 6.0, 5.0, 9.0, 5.0, 6.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.63671875, -3.52056884765625, -3.4044189453125, -3.28826904296875, -3.172119140625, -3.05596923828125, -2.9398193359375, -2.82366943359375, -2.70751953125, -2.59136962890625, -2.4752197265625, -2.35906982421875, -2.242919921875, -2.12677001953125, -2.0106201171875, -1.89447021484375, -1.7783203125, -1.66217041015625, -1.5460205078125, -1.42987060546875, -1.313720703125, -1.19757080078125, -1.0814208984375, -0.96527099609375, -0.84912109375, -0.73297119140625, -0.6168212890625, -0.50067138671875, -0.384521484375, -0.26837158203125, -0.1522216796875, -0.03607177734375, 0.080078125, 0.19622802734375, 0.3123779296875, 0.42852783203125, 0.544677734375, 0.66082763671875, 0.7769775390625, 0.89312744140625, 1.00927734375, 1.12542724609375, 1.2415771484375, 1.35772705078125, 1.473876953125, 1.59002685546875, 1.7061767578125, 1.82232666015625, 1.9384765625, 2.05462646484375, 2.1707763671875, 2.28692626953125, 2.403076171875, 2.51922607421875, 2.6353759765625, 2.75152587890625, 2.86767578125, 2.98382568359375, 3.0999755859375, 3.21612548828125, 3.332275390625, 3.44842529296875, 3.5645751953125, 3.68072509765625, 3.796875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 1.0, 5.0, 6.0, 10.0, 18.0, 20.0, 19.0, 35.0, 36.0, 39.0, 68.0, 89.0, 117.0, 161.0, 207.0, 342.0, 469.0, 723.0, 1207.0, 2143.0, 4155.0, 10306.0, 31595.0, 914589.0, 53763.0, 15562.0, 5971.0, 2714.0, 1444.0, 901.0, 516.0, 377.0, 237.0, 174.0, 137.0, 111.0, 69.0, 46.0, 35.0, 32.0, 25.0, 18.0, 20.0, 10.0, 11.0, 6.0, 3.0, 6.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.35546875, -3.24615478515625, -3.1368408203125, -3.02752685546875, -2.918212890625, -2.80889892578125, -2.6995849609375, -2.59027099609375, -2.48095703125, -2.37164306640625, -2.2623291015625, -2.15301513671875, -2.043701171875, -1.93438720703125, -1.8250732421875, -1.71575927734375, -1.6064453125, -1.49713134765625, -1.3878173828125, -1.27850341796875, -1.169189453125, -1.05987548828125, -0.9505615234375, -0.84124755859375, -0.73193359375, -0.62261962890625, -0.5133056640625, -0.40399169921875, -0.294677734375, -0.18536376953125, -0.0760498046875, 0.03326416015625, 0.142578125, 0.25189208984375, 0.3612060546875, 0.47052001953125, 0.579833984375, 0.68914794921875, 0.7984619140625, 0.90777587890625, 1.01708984375, 1.12640380859375, 1.2357177734375, 1.34503173828125, 1.454345703125, 1.56365966796875, 1.6729736328125, 1.78228759765625, 1.8916015625, 2.00091552734375, 2.1102294921875, 2.21954345703125, 2.328857421875, 2.43817138671875, 2.5474853515625, 2.65679931640625, 2.76611328125, 2.87542724609375, 2.9847412109375, 3.09405517578125, 3.203369140625, 3.31268310546875, 3.4219970703125, 3.53131103515625, 3.640625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 7.0, 3.0, 6.0, 9.0, 9.0, 13.0, 14.0, 17.0, 18.0, 22.0, 21.0, 27.0, 25.0, 33.0, 37.0, 42.0, 42.0, 47.0, 42.0, 39.0, 41.0, 42.0, 35.0, 35.0, 32.0, 46.0, 30.0, 25.0, 28.0, 31.0, 25.0, 25.0, 30.0, 11.0, 16.0, 14.0, 10.0, 10.0, 13.0, 1.0, 4.0, 8.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.185546875, -2.114349365234375, -2.04315185546875, -1.971954345703125, -1.9007568359375, -1.829559326171875, -1.75836181640625, -1.687164306640625, -1.615966796875, -1.544769287109375, -1.47357177734375, -1.402374267578125, -1.3311767578125, -1.259979248046875, -1.18878173828125, -1.117584228515625, -1.04638671875, -0.975189208984375, -0.90399169921875, -0.832794189453125, -0.7615966796875, -0.690399169921875, -0.61920166015625, -0.548004150390625, -0.476806640625, -0.405609130859375, -0.33441162109375, -0.263214111328125, -0.1920166015625, -0.120819091796875, -0.04962158203125, 0.021575927734375, 0.0927734375, 0.163970947265625, 0.23516845703125, 0.306365966796875, 0.3775634765625, 0.448760986328125, 0.51995849609375, 0.591156005859375, 0.662353515625, 0.733551025390625, 0.80474853515625, 0.875946044921875, 0.9471435546875, 1.018341064453125, 1.08953857421875, 1.160736083984375, 1.23193359375, 1.303131103515625, 1.37432861328125, 1.445526123046875, 1.5167236328125, 1.587921142578125, 1.65911865234375, 1.730316162109375, 1.801513671875, 1.872711181640625, 1.94390869140625, 2.015106201171875, 2.0863037109375, 2.157501220703125, 2.22869873046875, 2.299896240234375, 2.37109375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 12.0, 9.0, 23.0, 14.0, 15.0, 47.0, 44.0, 70.0, 102.0, 143.0, 193.0, 316.0, 509.0, 808.0, 1471.0, 2807.0, 6269.0, 17350.0, 94041.0, 891157.0, 19312.0, 6934.0, 2962.0, 1529.0, 867.0, 528.0, 307.0, 216.0, 147.0, 91.0, 58.0, 51.0, 43.0, 30.0, 23.0, 8.0, 7.0, 8.0, 10.0, 6.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.264892578125, -0.2566261291503906, -0.24835968017578125, -0.24009323120117188, -0.2318267822265625, -0.22356033325195312, -0.21529388427734375, -0.20702743530273438, -0.198760986328125, -0.19049453735351562, -0.18222808837890625, -0.17396163940429688, -0.1656951904296875, -0.15742874145507812, -0.14916229248046875, -0.14089584350585938, -0.13262939453125, -0.12436294555664062, -0.11609649658203125, -0.10783004760742188, -0.0995635986328125, -0.09129714965820312, -0.08303070068359375, -0.07476425170898438, -0.066497802734375, -0.058231353759765625, -0.04996490478515625, -0.041698455810546875, -0.0334320068359375, -0.025165557861328125, -0.01689910888671875, -0.008632659912109375, -0.0003662109375, 0.007900238037109375, 0.01616668701171875, 0.024433135986328125, 0.0326995849609375, 0.040966033935546875, 0.04923248291015625, 0.057498931884765625, 0.065765380859375, 0.07403182983398438, 0.08229827880859375, 0.09056472778320312, 0.0988311767578125, 0.10709762573242188, 0.11536407470703125, 0.12363052368164062, 0.13189697265625, 0.14016342163085938, 0.14842987060546875, 0.15669631958007812, 0.1649627685546875, 0.17322921752929688, 0.18149566650390625, 0.18976211547851562, 0.198028564453125, 0.20629501342773438, 0.21456146240234375, 0.22282791137695312, 0.2310943603515625, 0.23936080932617188, 0.24762725830078125, 0.2558937072753906, 0.26416015625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 7.0, 3.0, 7.0, 14.0, 11.0, 10.0, 9.0, 10.0, 19.0, 20.0, 33.0, 16.0, 34.0, 39.0, 53.0, 28.0, 41.0, 48.0, 44.0, 48.0, 47.0, 43.0, 40.0, 46.0, 39.0, 39.0, 29.0, 29.0, 37.0, 27.0, 15.0, 21.0, 11.0, 15.0, 8.0, 18.0, 12.0, 5.0, 9.0, 4.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.3974647521972656e-05, -3.284495323896408e-05, -3.1715258955955505e-05, -3.058556467294693e-05, -2.9455870389938354e-05, -2.832617610692978e-05, -2.7196481823921204e-05, -2.6066787540912628e-05, -2.4937093257904053e-05, -2.3807398974895477e-05, -2.2677704691886902e-05, -2.1548010408878326e-05, -2.041831612586975e-05, -1.9288621842861176e-05, -1.81589275598526e-05, -1.7029233276844025e-05, -1.589953899383545e-05, -1.4769844710826874e-05, -1.3640150427818298e-05, -1.2510456144809723e-05, -1.1380761861801147e-05, -1.0251067578792572e-05, -9.121373295783997e-06, -7.991679012775421e-06, -6.861984729766846e-06, -5.73229044675827e-06, -4.602596163749695e-06, -3.4729018807411194e-06, -2.343207597732544e-06, -1.2135133147239685e-06, -8.381903171539307e-08, 1.0458752512931824e-06, 2.175569534301758e-06, 3.3052638173103333e-06, 4.434958100318909e-06, 5.564652383327484e-06, 6.6943466663360596e-06, 7.824040949344635e-06, 8.95373523235321e-06, 1.0083429515361786e-05, 1.1213123798370361e-05, 1.2342818081378937e-05, 1.3472512364387512e-05, 1.4602206647396088e-05, 1.5731900930404663e-05, 1.686159521341324e-05, 1.7991289496421814e-05, 1.912098377943039e-05, 2.0250678062438965e-05, 2.138037234544754e-05, 2.2510066628456116e-05, 2.363976091146469e-05, 2.4769455194473267e-05, 2.5899149477481842e-05, 2.7028843760490417e-05, 2.8158538043498993e-05, 2.928823232650757e-05, 3.0417926609516144e-05, 3.154762089252472e-05, 3.2677315175533295e-05, 3.380700945854187e-05, 3.4936703741550446e-05, 3.606639802455902e-05, 3.7196092307567596e-05, 3.832578659057617e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 11.0, 12.0, 18.0, 27.0, 33.0, 46.0, 97.0, 122.0, 146.0, 264.0, 364.0, 576.0, 843.0, 1377.0, 2115.0, 3544.0, 6399.0, 11232.0, 21618.0, 45467.0, 112876.0, 332897.0, 313210.0, 105301.0, 42941.0, 20407.0, 10898.0, 6188.0, 3531.0, 2163.0, 1327.0, 870.0, 523.0, 347.0, 239.0, 161.0, 123.0, 76.0, 58.0, 41.0, 23.0, 12.0, 14.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08917236328125, -0.08609390258789062, -0.08301544189453125, -0.07993698120117188, -0.0768585205078125, -0.07378005981445312, -0.07070159912109375, -0.06762313842773438, -0.064544677734375, -0.061466217041015625, -0.05838775634765625, -0.055309295654296875, -0.0522308349609375, -0.049152374267578125, -0.04607391357421875, -0.042995452880859375, -0.0399169921875, -0.036838531494140625, -0.03376007080078125, -0.030681610107421875, -0.0276031494140625, -0.024524688720703125, -0.02144622802734375, -0.018367767333984375, -0.015289306640625, -0.012210845947265625, -0.00913238525390625, -0.006053924560546875, -0.0029754638671875, 0.000102996826171875, 0.00318145751953125, 0.006259918212890625, 0.00933837890625, 0.012416839599609375, 0.01549530029296875, 0.018573760986328125, 0.0216522216796875, 0.024730682373046875, 0.02780914306640625, 0.030887603759765625, 0.033966064453125, 0.037044525146484375, 0.04012298583984375, 0.043201446533203125, 0.0462799072265625, 0.049358367919921875, 0.05243682861328125, 0.055515289306640625, 0.05859375, 0.061672210693359375, 0.06475067138671875, 0.06782913208007812, 0.0709075927734375, 0.07398605346679688, 0.07706451416015625, 0.08014297485351562, 0.083221435546875, 0.08629989624023438, 0.08937835693359375, 0.09245681762695312, 0.0955352783203125, 0.09861373901367188, 0.10169219970703125, 0.10477066040039062, 0.10784912109375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 9.0, 8.0, 11.0, 10.0, 13.0, 20.0, 27.0, 20.0, 33.0, 45.0, 62.0, 65.0, 77.0, 90.0, 109.0, 92.0, 81.0, 59.0, 30.0, 28.0, 24.0, 22.0, 14.0, 16.0, 10.0, 5.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0307769775390625, -0.029919147491455078, -0.029061317443847656, -0.028203487396240234, -0.027345657348632812, -0.02648782730102539, -0.02562999725341797, -0.024772167205810547, -0.023914337158203125, -0.023056507110595703, -0.02219867706298828, -0.02134084701538086, -0.020483016967773438, -0.019625186920166016, -0.018767356872558594, -0.017909526824951172, -0.01705169677734375, -0.016193866729736328, -0.015336036682128906, -0.014478206634521484, -0.013620376586914062, -0.01276254653930664, -0.011904716491699219, -0.011046886444091797, -0.010189056396484375, -0.009331226348876953, -0.008473396301269531, -0.007615566253662109, -0.0067577362060546875, -0.005899906158447266, -0.005042076110839844, -0.004184246063232422, -0.003326416015625, -0.002468585968017578, -0.0016107559204101562, -0.0007529258728027344, 0.0001049041748046875, 0.0009627342224121094, 0.0018205642700195312, 0.002678394317626953, 0.003536224365234375, 0.004394054412841797, 0.005251884460449219, 0.006109714508056641, 0.0069675445556640625, 0.007825374603271484, 0.008683204650878906, 0.009541034698486328, 0.01039886474609375, 0.011256694793701172, 0.012114524841308594, 0.012972354888916016, 0.013830184936523438, 0.01468801498413086, 0.015545845031738281, 0.016403675079345703, 0.017261505126953125, 0.018119335174560547, 0.01897716522216797, 0.01983499526977539, 0.020692825317382812, 0.021550655364990234, 0.022408485412597656, 0.023266315460205078, 0.0241241455078125]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 4.0, 4.0, 3.0, 8.0, 12.0, 16.0, 13.0, 27.0, 22.0, 31.0, 51.0, 26.0, 59.0, 56.0, 74.0, 86.0, 67.0, 72.0, 76.0, 54.0, 33.0, 25.0, 27.0, 32.0, 27.0, 17.0, 11.0, 17.0, 11.0, 11.0, 7.0, 4.0, 1.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2039647102355957, -3.071798086166382, -2.939631462097168, -2.807464838027954, -2.6752982139587402, -2.5431313514709473, -2.4109647274017334, -2.2787981033325195, -2.1466314792633057, -2.014464855194092, -1.882298231124878, -1.7501314878463745, -1.6179648637771606, -1.4857982397079468, -1.3536314964294434, -1.2214648723602295, -1.0892982482910156, -0.9571316242218018, -0.8249649405479431, -0.6927982568740845, -0.5606316328048706, -0.42846500873565674, -0.2962983250617981, -0.16413164138793945, -0.031965017318725586, 0.10020163655281067, 0.23236829042434692, 0.3645349442958832, 0.49670159816741943, 0.6288682222366333, 0.7610349059104919, 0.8932015895843506, 1.0253686904907227, 1.1575353145599365, 1.2897019386291504, 1.4218686819076538, 1.5540353059768677, 1.6862019300460815, 1.818368673324585, 1.9505352973937988, 2.0827019214630127, 2.2148685455322266, 2.3470351696014404, 2.4792017936706543, 2.6113686561584473, 2.743535041809082, 2.875701904296875, 3.007868528366089, 3.1400351524353027, 3.2722017765045166, 3.4043684005737305, 3.5365350246429443, 3.668701648712158, 3.800868511199951, 3.933035135269165, 4.065201759338379, 4.197368621826172, 4.329535484313965, 4.4617018699646, 4.593868732452393, 4.726035118103027, 4.85820198059082, 4.990368366241455, 5.122535228729248, 5.254701614379883]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 5.0, 2.0, 6.0, 7.0, 9.0, 5.0, 11.0, 8.0, 15.0, 12.0, 17.0, 25.0, 24.0, 27.0, 31.0, 37.0, 34.0, 38.0, 41.0, 39.0, 41.0, 38.0, 39.0, 37.0, 37.0, 32.0, 42.0, 37.0, 44.0, 34.0, 23.0, 28.0, 17.0, 33.0, 17.0, 18.0, 12.0, 15.0, 9.0, 9.0, 10.0, 6.0, 7.0, 3.0, 4.0, 3.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.273930788040161, -3.1599223613739014, -3.0459139347076416, -2.9319052696228027, -2.817896842956543, -2.703888416290283, -2.5898799896240234, -2.4758715629577637, -2.361863136291504, -2.247854709625244, -2.1338462829589844, -2.0198378562927246, -1.9058291912078857, -1.791820764541626, -1.6778123378753662, -1.5638039112091064, -1.4497952461242676, -1.3357868194580078, -1.2217782735824585, -1.1077698469161987, -0.9937613606452942, -0.8797528743743896, -0.7657444477081299, -0.6517359614372253, -0.5377274751663208, -0.42371898889541626, -0.3097105324268341, -0.19570207595825195, -0.08169358968734741, 0.03231489658355713, 0.1463233232498169, 0.26033180952072144, 0.3743400573730469, 0.4883485436439514, 0.602357029914856, 0.7163654565811157, 0.8303739428520203, 0.9443824291229248, 1.0583908557891846, 1.1723992824554443, 1.2864078283309937, 1.4004162549972534, 1.5144248008728027, 1.6284332275390625, 1.7424416542053223, 1.8564502000808716, 1.9704586267471313, 2.0844671726226807, 2.1984755992889404, 2.3124840259552, 2.42649245262146, 2.540501117706299, 2.6545095443725586, 2.7685179710388184, 2.882526397705078, 2.996534824371338, 3.1105432510375977, 3.2245516777038574, 3.338560104370117, 3.452568531036377, 3.566577196121216, 3.6805856227874756, 3.7945940494537354, 3.908602476119995, 4.022611141204834]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 1.0, 11.0, 9.0, 21.0, 27.0, 32.0, 51.0, 72.0, 90.0, 158.0, 247.0, 345.0, 491.0, 713.0, 1110.0, 1722.0, 2595.0, 4191.0, 6667.0, 11021.0, 18649.0, 32075.0, 56375.0, 98241.0, 157520.0, 200196.0, 176346.0, 116321.0, 67845.0, 38526.0, 22184.0, 13001.0, 7866.0, 4877.0, 3092.0, 1943.0, 1293.0, 837.0, 566.0, 405.0, 243.0, 184.0, 103.0, 98.0, 59.0, 41.0, 29.0, 24.0, 22.0, 11.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.248046875, -3.134735107421875, -3.02142333984375, -2.908111572265625, -2.7947998046875, -2.681488037109375, -2.56817626953125, -2.454864501953125, -2.341552734375, -2.228240966796875, -2.11492919921875, -2.001617431640625, -1.8883056640625, -1.774993896484375, -1.66168212890625, -1.548370361328125, -1.43505859375, -1.321746826171875, -1.20843505859375, -1.095123291015625, -0.9818115234375, -0.868499755859375, -0.75518798828125, -0.641876220703125, -0.528564453125, -0.415252685546875, -0.30194091796875, -0.188629150390625, -0.0753173828125, 0.037994384765625, 0.15130615234375, 0.264617919921875, 0.3779296875, 0.491241455078125, 0.60455322265625, 0.717864990234375, 0.8311767578125, 0.944488525390625, 1.05780029296875, 1.171112060546875, 1.284423828125, 1.397735595703125, 1.51104736328125, 1.624359130859375, 1.7376708984375, 1.850982666015625, 1.96429443359375, 2.077606201171875, 2.19091796875, 2.304229736328125, 2.41754150390625, 2.530853271484375, 2.6441650390625, 2.757476806640625, 2.87078857421875, 2.984100341796875, 3.097412109375, 3.210723876953125, 3.32403564453125, 3.437347412109375, 3.5506591796875, 3.663970947265625, 3.77728271484375, 3.890594482421875, 4.00390625]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 9.0, 5.0, 5.0, 9.0, 8.0, 14.0, 12.0, 21.0, 29.0, 20.0, 25.0, 32.0, 25.0, 38.0, 44.0, 46.0, 56.0, 42.0, 38.0, 45.0, 40.0, 40.0, 37.0, 41.0, 35.0, 35.0, 28.0, 25.0, 35.0, 27.0, 18.0, 21.0, 16.0, 6.0, 10.0, 10.0, 8.0, 7.0, 5.0, 10.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.431640625, -3.311065673828125, -3.19049072265625, -3.069915771484375, -2.9493408203125, -2.828765869140625, -2.70819091796875, -2.587615966796875, -2.467041015625, -2.346466064453125, -2.22589111328125, -2.105316162109375, -1.9847412109375, -1.864166259765625, -1.74359130859375, -1.623016357421875, -1.50244140625, -1.381866455078125, -1.26129150390625, -1.140716552734375, -1.0201416015625, -0.899566650390625, -0.77899169921875, -0.658416748046875, -0.537841796875, -0.417266845703125, -0.29669189453125, -0.176116943359375, -0.0555419921875, 0.065032958984375, 0.18560791015625, 0.306182861328125, 0.4267578125, 0.547332763671875, 0.66790771484375, 0.788482666015625, 0.9090576171875, 1.029632568359375, 1.15020751953125, 1.270782470703125, 1.391357421875, 1.511932373046875, 1.63250732421875, 1.753082275390625, 1.8736572265625, 1.994232177734375, 2.11480712890625, 2.235382080078125, 2.35595703125, 2.476531982421875, 2.59710693359375, 2.717681884765625, 2.8382568359375, 2.958831787109375, 3.07940673828125, 3.199981689453125, 3.320556640625, 3.441131591796875, 3.56170654296875, 3.682281494140625, 3.8028564453125, 3.923431396484375, 4.04400634765625, 4.164581298828125, 4.28515625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 8.0, 11.0, 16.0, 25.0, 24.0, 45.0, 62.0, 95.0, 148.0, 215.0, 307.0, 502.0, 724.0, 1131.0, 1731.0, 2675.0, 4133.0, 6532.0, 10447.0, 17025.0, 26990.0, 44536.0, 71601.0, 110516.0, 152763.0, 171754.0, 146814.0, 103666.0, 65802.0, 40881.0, 25156.0, 15345.0, 9761.0, 6071.0, 3899.0, 2469.0, 1581.0, 1113.0, 648.0, 417.0, 296.0, 183.0, 142.0, 107.0, 72.0, 46.0, 23.0, 15.0, 12.0, 8.0, 5.0, 9.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.939453125, -2.84588623046875, -2.7523193359375, -2.65875244140625, -2.565185546875, -2.47161865234375, -2.3780517578125, -2.28448486328125, -2.19091796875, -2.09735107421875, -2.0037841796875, -1.91021728515625, -1.816650390625, -1.72308349609375, -1.6295166015625, -1.53594970703125, -1.4423828125, -1.34881591796875, -1.2552490234375, -1.16168212890625, -1.068115234375, -0.97454833984375, -0.8809814453125, -0.78741455078125, -0.69384765625, -0.60028076171875, -0.5067138671875, -0.41314697265625, -0.319580078125, -0.22601318359375, -0.1324462890625, -0.03887939453125, 0.0546875, 0.14825439453125, 0.2418212890625, 0.33538818359375, 0.428955078125, 0.52252197265625, 0.6160888671875, 0.70965576171875, 0.80322265625, 0.89678955078125, 0.9903564453125, 1.08392333984375, 1.177490234375, 1.27105712890625, 1.3646240234375, 1.45819091796875, 1.5517578125, 1.64532470703125, 1.7388916015625, 1.83245849609375, 1.926025390625, 2.01959228515625, 2.1131591796875, 2.20672607421875, 2.30029296875, 2.39385986328125, 2.4874267578125, 2.58099365234375, 2.674560546875, 2.76812744140625, 2.8616943359375, 2.95526123046875, 3.048828125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 0.0, 2.0, 5.0, 9.0, 4.0, 10.0, 5.0, 6.0, 8.0, 10.0, 20.0, 14.0, 19.0, 17.0, 22.0, 24.0, 28.0, 30.0, 25.0, 39.0, 37.0, 35.0, 24.0, 50.0, 45.0, 37.0, 46.0, 33.0, 36.0, 33.0, 41.0, 34.0, 23.0, 34.0, 27.0, 33.0, 16.0, 20.0, 13.0, 14.0, 15.0, 15.0, 18.0, 4.0, 7.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8095703125, -1.7480621337890625, -1.686553955078125, -1.6250457763671875, -1.56353759765625, -1.5020294189453125, -1.440521240234375, -1.3790130615234375, -1.3175048828125, -1.2559967041015625, -1.194488525390625, -1.1329803466796875, -1.07147216796875, -1.0099639892578125, -0.948455810546875, -0.8869476318359375, -0.825439453125, -0.7639312744140625, -0.702423095703125, -0.6409149169921875, -0.57940673828125, -0.5178985595703125, -0.456390380859375, -0.3948822021484375, -0.3333740234375, -0.2718658447265625, -0.210357666015625, -0.1488494873046875, -0.08734130859375, -0.0258331298828125, 0.035675048828125, 0.0971832275390625, 0.15869140625, 0.2201995849609375, 0.281707763671875, 0.3432159423828125, 0.40472412109375, 0.4662322998046875, 0.527740478515625, 0.5892486572265625, 0.6507568359375, 0.7122650146484375, 0.773773193359375, 0.8352813720703125, 0.89678955078125, 0.9582977294921875, 1.019805908203125, 1.0813140869140625, 1.142822265625, 1.2043304443359375, 1.265838623046875, 1.3273468017578125, 1.38885498046875, 1.4503631591796875, 1.511871337890625, 1.5733795166015625, 1.6348876953125, 1.6963958740234375, 1.757904052734375, 1.8194122314453125, 1.88092041015625, 1.9424285888671875, 2.003936767578125, 2.0654449462890625, 2.126953125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 8.0, 7.0, 24.0, 19.0, 62.0, 98.0, 124.0, 196.0, 345.0, 514.0, 891.0, 1361.0, 2269.0, 3729.0, 5877.0, 10442.0, 17589.0, 31214.0, 54780.0, 94790.0, 154685.0, 201668.0, 181551.0, 120388.0, 70277.0, 39828.0, 22710.0, 13264.0, 7886.0, 4610.0, 2722.0, 1781.0, 1079.0, 664.0, 410.0, 257.0, 149.0, 102.0, 52.0, 38.0, 20.0, 19.0, 21.0, 10.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8740234375, -0.843597412109375, -0.81317138671875, -0.782745361328125, -0.7523193359375, -0.721893310546875, -0.69146728515625, -0.661041259765625, -0.630615234375, -0.600189208984375, -0.56976318359375, -0.539337158203125, -0.5089111328125, -0.478485107421875, -0.44805908203125, -0.417633056640625, -0.38720703125, -0.356781005859375, -0.32635498046875, -0.295928955078125, -0.2655029296875, -0.235076904296875, -0.20465087890625, -0.174224853515625, -0.143798828125, -0.113372802734375, -0.08294677734375, -0.052520751953125, -0.0220947265625, 0.008331298828125, 0.03875732421875, 0.069183349609375, 0.099609375, 0.130035400390625, 0.16046142578125, 0.190887451171875, 0.2213134765625, 0.251739501953125, 0.28216552734375, 0.312591552734375, 0.343017578125, 0.373443603515625, 0.40386962890625, 0.434295654296875, 0.4647216796875, 0.495147705078125, 0.52557373046875, 0.555999755859375, 0.58642578125, 0.616851806640625, 0.64727783203125, 0.677703857421875, 0.7081298828125, 0.738555908203125, 0.76898193359375, 0.799407958984375, 0.829833984375, 0.860260009765625, 0.89068603515625, 0.921112060546875, 0.9515380859375, 0.981964111328125, 1.01239013671875, 1.042816162109375, 1.0732421875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 9.0, 6.0, 8.0, 11.0, 15.0, 21.0, 8.0, 17.0, 14.0, 31.0, 25.0, 40.0, 46.0, 39.0, 31.0, 50.0, 46.0, 56.0, 50.0, 56.0, 49.0, 51.0, 53.0, 31.0, 34.0, 32.0, 23.0, 32.0, 19.0, 18.0, 16.0, 14.0, 9.0, 12.0, 4.0, 5.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.073713302612305e-05, -5.9011392295360565e-05, -5.7285651564598083e-05, -5.55599108338356e-05, -5.383417010307312e-05, -5.210842937231064e-05, -5.038268864154816e-05, -4.8656947910785675e-05, -4.693120718002319e-05, -4.520546644926071e-05, -4.347972571849823e-05, -4.175398498773575e-05, -4.0028244256973267e-05, -3.8302503526210785e-05, -3.65767627954483e-05, -3.485102206468582e-05, -3.312528133392334e-05, -3.139954060316086e-05, -2.9673799872398376e-05, -2.7948059141635895e-05, -2.6222318410873413e-05, -2.449657768011093e-05, -2.277083694934845e-05, -2.1045096218585968e-05, -1.9319355487823486e-05, -1.7593614757061005e-05, -1.5867874026298523e-05, -1.4142133295536041e-05, -1.241639256477356e-05, -1.0690651834011078e-05, -8.964911103248596e-06, -7.2391703724861145e-06, -5.513429641723633e-06, -3.787688910961151e-06, -2.0619481801986694e-06, -3.3620744943618774e-07, 1.389533281326294e-06, 3.1152740120887756e-06, 4.841014742851257e-06, 6.566755473613739e-06, 8.29249620437622e-06, 1.0018236935138702e-05, 1.1743977665901184e-05, 1.3469718396663666e-05, 1.5195459127426147e-05, 1.692119985818863e-05, 1.864694058895111e-05, 2.0372681319713593e-05, 2.2098422050476074e-05, 2.3824162781238556e-05, 2.5549903512001038e-05, 2.727564424276352e-05, 2.9001384973526e-05, 3.072712570428848e-05, 3.2452866435050964e-05, 3.4178607165813446e-05, 3.590434789657593e-05, 3.763008862733841e-05, 3.935582935810089e-05, 4.108157008886337e-05, 4.2807310819625854e-05, 4.4533051550388336e-05, 4.625879228115082e-05, 4.79845330119133e-05, 4.971027374267578e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 10.0, 14.0, 27.0, 29.0, 44.0, 58.0, 114.0, 156.0, 284.0, 420.0, 751.0, 1204.0, 2071.0, 3498.0, 5874.0, 10491.0, 18868.0, 34698.0, 64569.0, 115715.0, 184275.0, 216703.0, 166696.0, 99486.0, 54685.0, 29630.0, 16421.0, 9028.0, 5189.0, 3039.0, 1720.0, 1099.0, 623.0, 428.0, 250.0, 147.0, 82.0, 53.0, 41.0, 24.0, 18.0, 11.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0439453125, -1.0106658935546875, -0.977386474609375, -0.9441070556640625, -0.91082763671875, -0.8775482177734375, -0.844268798828125, -0.8109893798828125, -0.7777099609375, -0.7444305419921875, -0.711151123046875, -0.6778717041015625, -0.64459228515625, -0.6113128662109375, -0.578033447265625, -0.5447540283203125, -0.511474609375, -0.4781951904296875, -0.444915771484375, -0.4116363525390625, -0.37835693359375, -0.3450775146484375, -0.311798095703125, -0.2785186767578125, -0.2452392578125, -0.2119598388671875, -0.178680419921875, -0.1454010009765625, -0.11212158203125, -0.0788421630859375, -0.045562744140625, -0.0122833251953125, 0.02099609375, 0.0542755126953125, 0.087554931640625, 0.1208343505859375, 0.15411376953125, 0.1873931884765625, 0.220672607421875, 0.2539520263671875, 0.2872314453125, 0.3205108642578125, 0.353790283203125, 0.3870697021484375, 0.42034912109375, 0.4536285400390625, 0.486907958984375, 0.5201873779296875, 0.553466796875, 0.5867462158203125, 0.620025634765625, 0.6533050537109375, 0.68658447265625, 0.7198638916015625, 0.753143310546875, 0.7864227294921875, 0.8197021484375, 0.8529815673828125, 0.886260986328125, 0.9195404052734375, 0.95281982421875, 0.9860992431640625, 1.019378662109375, 1.0526580810546875, 1.0859375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 6.0, 7.0, 5.0, 14.0, 6.0, 12.0, 16.0, 21.0, 15.0, 21.0, 11.0, 23.0, 28.0, 28.0, 28.0, 48.0, 40.0, 48.0, 57.0, 47.0, 55.0, 49.0, 41.0, 39.0, 52.0, 47.0, 34.0, 26.0, 25.0, 23.0, 20.0, 9.0, 20.0, 13.0, 9.0, 7.0, 7.0, 5.0, 8.0, 8.0, 8.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.29833984375, -0.28885650634765625, -0.2793731689453125, -0.26988983154296875, -0.260406494140625, -0.25092315673828125, -0.2414398193359375, -0.23195648193359375, -0.22247314453125, -0.21298980712890625, -0.2035064697265625, -0.19402313232421875, -0.184539794921875, -0.17505645751953125, -0.1655731201171875, -0.15608978271484375, -0.1466064453125, -0.13712310791015625, -0.1276397705078125, -0.11815643310546875, -0.108673095703125, -0.09918975830078125, -0.0897064208984375, -0.08022308349609375, -0.07073974609375, -0.06125640869140625, -0.0517730712890625, -0.04228973388671875, -0.032806396484375, -0.02332305908203125, -0.0138397216796875, -0.00435638427734375, 0.005126953125, 0.01461029052734375, 0.0240936279296875, 0.03357696533203125, 0.043060302734375, 0.05254364013671875, 0.0620269775390625, 0.07151031494140625, 0.08099365234375, 0.09047698974609375, 0.0999603271484375, 0.10944366455078125, 0.118927001953125, 0.12841033935546875, 0.1378936767578125, 0.14737701416015625, 0.1568603515625, 0.16634368896484375, 0.1758270263671875, 0.18531036376953125, 0.194793701171875, 0.20427703857421875, 0.2137603759765625, 0.22324371337890625, 0.23272705078125, 0.24221038818359375, 0.2516937255859375, 0.26117706298828125, 0.270660400390625, 0.28014373779296875, 0.2896270751953125, 0.29911041259765625, 0.30859375]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 9.0, 7.0, 12.0, 15.0, 24.0, 25.0, 40.0, 34.0, 43.0, 52.0, 60.0, 64.0, 59.0, 73.0, 65.0, 74.0, 60.0, 47.0, 34.0, 32.0, 32.0, 26.0, 21.0, 20.0, 16.0, 6.0, 12.0, 9.0, 4.0, 1.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.809433698654175, -3.6809611320495605, -3.5524885654449463, -3.424015998840332, -3.2955434322357178, -3.1670708656311035, -3.0385985374450684, -2.910125732421875, -2.78165340423584, -2.6531808376312256, -2.5247082710266113, -2.396235704421997, -2.267763137817383, -2.1392905712127686, -2.0108180046081543, -1.8823455572128296, -1.7538728713989258, -1.6254003047943115, -1.4969277381896973, -1.368455171585083, -1.2399826049804688, -1.1115100383758545, -0.9830375909805298, -0.8545650243759155, -0.7260924577713013, -0.597619891166687, -0.46914735436439514, -0.34067481756210327, -0.212202250957489, -0.08372968435287476, 0.04474282264709473, 0.17321538925170898, 0.30168771743774414, 0.4301602840423584, 0.5586328506469727, 0.6871053576469421, 0.8155779242515564, 0.9440504908561707, 1.0725229978561401, 1.2009955644607544, 1.3294681310653687, 1.457940697669983, 1.5864132642745972, 1.7148857116699219, 1.8433582782745361, 1.9718308448791504, 2.1003034114837646, 2.228775978088379, 2.357248544692993, 2.4857211112976074, 2.6141936779022217, 2.742666244506836, 2.87113881111145, 2.9996113777160645, 3.1280837059020996, 3.256556510925293, 3.385028839111328, 3.5135014057159424, 3.6419739723205566, 3.770446538925171, 3.898919105529785, 4.02739143371582, 4.155864238739014, 4.284336566925049, 4.412809371948242]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 13.0, 6.0, 8.0, 9.0, 7.0, 13.0, 16.0, 16.0, 19.0, 17.0, 16.0, 33.0, 41.0, 35.0, 33.0, 49.0, 46.0, 45.0, 43.0, 42.0, 38.0, 42.0, 44.0, 32.0, 47.0, 37.0, 28.0, 28.0, 25.0, 19.0, 27.0, 26.0, 15.0, 12.0, 7.0, 9.0, 11.0, 8.0, 9.0, 12.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.215472936630249, -3.0964808464050293, -2.9774887561798096, -2.85849666595459, -2.73950457572937, -2.6205124855041504, -2.5015206336975098, -2.382528305053711, -2.2635364532470703, -2.1445443630218506, -2.025552272796631, -1.9065601825714111, -1.7875680923461914, -1.6685760021209717, -1.5495840311050415, -1.4305919408798218, -1.3115997314453125, -1.1926076412200928, -1.073615550994873, -0.9546235203742981, -0.8356314301490784, -0.7166393399238586, -0.5976473093032837, -0.47865521907806396, -0.35966312885284424, -0.2406710535287857, -0.12167897820472717, -0.002686917781829834, 0.11630517244338989, 0.23529726266860962, 0.35428929328918457, 0.4732813835144043, 0.5922732353210449, 0.7112653255462646, 0.8302574157714844, 0.9492494463920593, 1.0682415962219238, 1.1872336864471436, 1.3062256574630737, 1.4252177476882935, 1.5442098379135132, 1.663201928138733, 1.7821940183639526, 1.9011859893798828, 2.0201780796051025, 2.1391701698303223, 2.258162260055542, 2.3771543502807617, 2.4961464405059814, 2.615138530731201, 2.734130620956421, 2.8531227111816406, 2.9721148014068604, 3.09110689163208, 3.2100987434387207, 3.3290910720825195, 3.44808292388916, 3.56707501411438, 3.6860671043395996, 3.8050591945648193, 3.924051284790039, 4.04304313659668, 4.1620354652404785, 4.281027317047119, 4.400019645690918]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [6.0, 2.0, 2.0, 4.0, 7.0, 11.0, 23.0, 23.0, 33.0, 56.0, 81.0, 109.0, 174.0, 227.0, 385.0, 513.0, 798.0, 1278.0, 1881.0, 2914.0, 4544.0, 7108.0, 11989.0, 20427.0, 37089.0, 70599.0, 144992.0, 320320.0, 713516.0, 1160673.0, 891250.0, 416525.0, 185878.0, 89589.0, 45823.0, 25475.0, 14841.0, 8999.0, 5542.0, 3530.0, 2334.0, 1518.0, 1038.0, 657.0, 453.0, 335.0, 201.0, 155.0, 115.0, 80.0, 53.0, 34.0, 25.0, 15.0, 18.0, 15.0, 5.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 3.0], "bins": [-3.912109375, -3.780303955078125, -3.64849853515625, -3.516693115234375, -3.3848876953125, -3.253082275390625, -3.12127685546875, -2.989471435546875, -2.857666015625, -2.725860595703125, -2.59405517578125, -2.462249755859375, -2.3304443359375, -2.198638916015625, -2.06683349609375, -1.935028076171875, -1.80322265625, -1.671417236328125, -1.53961181640625, -1.407806396484375, -1.2760009765625, -1.144195556640625, -1.01239013671875, -0.880584716796875, -0.748779296875, -0.616973876953125, -0.48516845703125, -0.353363037109375, -0.2215576171875, -0.089752197265625, 0.04205322265625, 0.173858642578125, 0.3056640625, 0.437469482421875, 0.56927490234375, 0.701080322265625, 0.8328857421875, 0.964691162109375, 1.09649658203125, 1.228302001953125, 1.360107421875, 1.491912841796875, 1.62371826171875, 1.755523681640625, 1.8873291015625, 2.019134521484375, 2.15093994140625, 2.282745361328125, 2.41455078125, 2.546356201171875, 2.67816162109375, 2.809967041015625, 2.9417724609375, 3.073577880859375, 3.20538330078125, 3.337188720703125, 3.468994140625, 3.600799560546875, 3.73260498046875, 3.864410400390625, 3.9962158203125, 4.128021240234375, 4.25982666015625, 4.391632080078125, 4.5234375]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 3.0, 6.0, 8.0, 5.0, 9.0, 8.0, 11.0, 16.0, 22.0, 12.0, 16.0, 19.0, 25.0, 32.0, 36.0, 38.0, 57.0, 43.0, 48.0, 48.0, 39.0, 41.0, 51.0, 41.0, 47.0, 41.0, 33.0, 27.0, 25.0, 29.0, 27.0, 24.0, 19.0, 20.0, 11.0, 10.0, 10.0, 8.0, 10.0, 5.0, 2.0, 4.0, 5.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.59765625, -2.51446533203125, -2.4312744140625, -2.34808349609375, -2.264892578125, -2.18170166015625, -2.0985107421875, -2.01531982421875, -1.93212890625, -1.84893798828125, -1.7657470703125, -1.68255615234375, -1.599365234375, -1.51617431640625, -1.4329833984375, -1.34979248046875, -1.2666015625, -1.18341064453125, -1.1002197265625, -1.01702880859375, -0.933837890625, -0.85064697265625, -0.7674560546875, -0.68426513671875, -0.60107421875, -0.51788330078125, -0.4346923828125, -0.35150146484375, -0.268310546875, -0.18511962890625, -0.1019287109375, -0.01873779296875, 0.064453125, 0.14764404296875, 0.2308349609375, 0.31402587890625, 0.397216796875, 0.48040771484375, 0.5635986328125, 0.64678955078125, 0.72998046875, 0.81317138671875, 0.8963623046875, 0.97955322265625, 1.062744140625, 1.14593505859375, 1.2291259765625, 1.31231689453125, 1.3955078125, 1.47869873046875, 1.5618896484375, 1.64508056640625, 1.728271484375, 1.81146240234375, 1.8946533203125, 1.97784423828125, 2.06103515625, 2.14422607421875, 2.2274169921875, 2.31060791015625, 2.393798828125, 2.47698974609375, 2.5601806640625, 2.64337158203125, 2.7265625]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 8.0, 9.0, 18.0, 24.0, 44.0, 69.0, 103.0, 147.0, 224.0, 388.0, 598.0, 974.0, 1548.0, 2549.0, 4324.0, 7447.0, 12894.0, 23277.0, 43894.0, 84899.0, 167711.0, 341824.0, 659716.0, 992087.0, 861342.0, 488852.0, 244020.0, 119948.0, 61260.0, 32569.0, 17473.0, 9771.0, 5633.0, 3363.0, 1981.0, 1193.0, 789.0, 491.0, 286.0, 200.0, 113.0, 66.0, 49.0, 38.0, 20.0, 10.0, 12.0, 11.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.828125, -3.70367431640625, -3.5792236328125, -3.45477294921875, -3.330322265625, -3.20587158203125, -3.0814208984375, -2.95697021484375, -2.83251953125, -2.70806884765625, -2.5836181640625, -2.45916748046875, -2.334716796875, -2.21026611328125, -2.0858154296875, -1.96136474609375, -1.8369140625, -1.71246337890625, -1.5880126953125, -1.46356201171875, -1.339111328125, -1.21466064453125, -1.0902099609375, -0.96575927734375, -0.84130859375, -0.71685791015625, -0.5924072265625, -0.46795654296875, -0.343505859375, -0.21905517578125, -0.0946044921875, 0.02984619140625, 0.154296875, 0.27874755859375, 0.4031982421875, 0.52764892578125, 0.652099609375, 0.77655029296875, 0.9010009765625, 1.02545166015625, 1.14990234375, 1.27435302734375, 1.3988037109375, 1.52325439453125, 1.647705078125, 1.77215576171875, 1.8966064453125, 2.02105712890625, 2.1455078125, 2.26995849609375, 2.3944091796875, 2.51885986328125, 2.643310546875, 2.76776123046875, 2.8922119140625, 3.01666259765625, 3.14111328125, 3.26556396484375, 3.3900146484375, 3.51446533203125, 3.638916015625, 3.76336669921875, 3.8878173828125, 4.01226806640625, 4.13671875]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 8.0, 6.0, 10.0, 8.0, 17.0, 19.0, 25.0, 25.0, 32.0, 26.0, 56.0, 65.0, 66.0, 112.0, 120.0, 143.0, 177.0, 204.0, 207.0, 234.0, 243.0, 291.0, 245.0, 252.0, 247.0, 209.0, 188.0, 138.0, 134.0, 118.0, 85.0, 73.0, 67.0, 50.0, 36.0, 30.0, 18.0, 22.0, 11.0, 18.0, 12.0, 11.0, 5.0, 6.0, 2.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.376953125, -1.3339996337890625, -1.291046142578125, -1.2480926513671875, -1.20513916015625, -1.1621856689453125, -1.119232177734375, -1.0762786865234375, -1.0333251953125, -0.9903717041015625, -0.947418212890625, -0.9044647216796875, -0.86151123046875, -0.8185577392578125, -0.775604248046875, -0.7326507568359375, -0.689697265625, -0.6467437744140625, -0.603790283203125, -0.5608367919921875, -0.51788330078125, -0.4749298095703125, -0.431976318359375, -0.3890228271484375, -0.3460693359375, -0.3031158447265625, -0.260162353515625, -0.2172088623046875, -0.17425537109375, -0.1313018798828125, -0.088348388671875, -0.0453948974609375, -0.00244140625, 0.0405120849609375, 0.083465576171875, 0.1264190673828125, 0.16937255859375, 0.2123260498046875, 0.255279541015625, 0.2982330322265625, 0.3411865234375, 0.3841400146484375, 0.427093505859375, 0.4700469970703125, 0.51300048828125, 0.5559539794921875, 0.598907470703125, 0.6418609619140625, 0.684814453125, 0.7277679443359375, 0.770721435546875, 0.8136749267578125, 0.85662841796875, 0.8995819091796875, 0.942535400390625, 0.9854888916015625, 1.0284423828125, 1.0713958740234375, 1.114349365234375, 1.1573028564453125, 1.20025634765625, 1.2432098388671875, 1.286163330078125, 1.3291168212890625, 1.3720703125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 7.0, 6.0, 15.0, 11.0, 11.0, 13.0, 13.0, 28.0, 20.0, 30.0, 34.0, 42.0, 48.0, 51.0, 68.0, 65.0, 57.0, 77.0, 61.0, 73.0, 43.0, 41.0, 41.0, 24.0, 22.0, 15.0, 15.0, 18.0, 11.0, 15.0, 10.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9282546043395996, -3.803725481033325, -3.679196357727051, -3.5546674728393555, -3.430138349533081, -3.3056092262268066, -3.1810801029205322, -3.056550979614258, -2.9320220947265625, -2.807492971420288, -2.6829638481140137, -2.5584349632263184, -2.433905839920044, -2.3093767166137695, -2.184847593307495, -2.0603184700012207, -1.9357893466949463, -1.8112602233886719, -1.686731219291687, -1.5622020959854126, -1.4376730918884277, -1.3131439685821533, -1.188614845275879, -1.0640857219696045, -0.9395567178726196, -0.81502765417099, -0.6904985904693604, -0.5659694671630859, -0.4414404034614563, -0.31691133975982666, -0.19238221645355225, -0.06785315275192261, 0.05667591094970703, 0.18120498955249786, 0.3057340681552887, 0.4302631616592407, 0.5547922253608704, 0.6793212890625, 0.8038504123687744, 0.928379476070404, 1.0529085397720337, 1.177437663078308, 1.301966667175293, 1.4264957904815674, 1.5510249137878418, 1.6755539178848267, 1.800083041191101, 1.924612045288086, 2.0491411685943604, 2.1736702919006348, 2.298199415206909, 2.4227285385131836, 2.547257423400879, 2.6717865467071533, 2.7963156700134277, 2.920844793319702, 3.0453739166259766, 3.169903039932251, 3.2944321632385254, 3.4189610481262207, 3.543490171432495, 3.6680192947387695, 3.792548418045044, 3.9170775413513184, 4.041606426239014]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 1.0, 2.0, 5.0, 4.0, 9.0, 7.0, 12.0, 12.0, 10.0, 19.0, 21.0, 17.0, 30.0, 35.0, 31.0, 45.0, 47.0, 42.0, 34.0, 47.0, 50.0, 47.0, 39.0, 54.0, 35.0, 43.0, 33.0, 34.0, 39.0, 30.0, 26.0, 29.0, 16.0, 19.0, 16.0, 15.0, 11.0, 6.0, 6.0, 5.0, 6.0, 1.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.831113815307617, -3.70617938041687, -3.581244707107544, -3.456310272216797, -3.33137583732605, -3.2064414024353027, -3.0815067291259766, -2.9565722942352295, -2.8316378593444824, -2.7067034244537354, -2.581768751144409, -2.456834316253662, -2.331899881362915, -2.206965446472168, -2.082030773162842, -1.9570963382720947, -1.832161784172058, -1.7072272300720215, -1.5822927951812744, -1.4573582410812378, -1.3324238061904907, -1.207489252090454, -1.082554817199707, -0.9576202630996704, -0.8326857686042786, -0.7077512741088867, -0.5828167796134949, -0.45788225531578064, -0.3329477608203888, -0.20801323652267456, -0.08307874202728271, 0.04185575246810913, 0.16679024696350098, 0.2917247414588928, 0.41665923595428467, 0.5415937900543213, 0.6665282249450684, 0.791462779045105, 0.9163972735404968, 1.0413317680358887, 1.1662662029266357, 1.2912007570266724, 1.4161351919174194, 1.541069746017456, 1.6660041809082031, 1.7909387350082397, 1.9158732891082764, 2.0408077239990234, 2.1657423973083496, 2.2906768321990967, 2.415611505508423, 2.54054594039917, 2.665480375289917, 2.790414810180664, 2.9153494834899902, 3.0402839183807373, 3.1652183532714844, 3.2901527881622314, 3.4150874614715576, 3.5400218963623047, 3.6649563312530518, 3.789890766143799, 3.914825439453125, 4.039759635925293, 4.164694309234619]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 3.0, 7.0, 12.0, 18.0, 22.0, 35.0, 61.0, 81.0, 112.0, 200.0, 302.0, 508.0, 771.0, 1371.0, 2184.0, 4042.0, 7181.0, 13424.0, 25936.0, 53862.0, 121419.0, 277392.0, 292498.0, 130367.0, 57599.0, 27586.0, 13930.0, 7530.0, 4110.0, 2368.0, 1376.0, 800.0, 545.0, 322.0, 208.0, 123.0, 77.0, 61.0, 44.0, 17.0, 13.0, 13.0, 9.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.40625, -1.3609466552734375, -1.315643310546875, -1.2703399658203125, -1.22503662109375, -1.1797332763671875, -1.134429931640625, -1.0891265869140625, -1.0438232421875, -0.9985198974609375, -0.953216552734375, -0.9079132080078125, -0.86260986328125, -0.8173065185546875, -0.772003173828125, -0.7266998291015625, -0.681396484375, -0.6360931396484375, -0.590789794921875, -0.5454864501953125, -0.50018310546875, -0.4548797607421875, -0.409576416015625, -0.3642730712890625, -0.3189697265625, -0.2736663818359375, -0.228363037109375, -0.1830596923828125, -0.13775634765625, -0.0924530029296875, -0.047149658203125, -0.0018463134765625, 0.04345703125, 0.0887603759765625, 0.134063720703125, 0.1793670654296875, 0.22467041015625, 0.2699737548828125, 0.315277099609375, 0.3605804443359375, 0.4058837890625, 0.4511871337890625, 0.496490478515625, 0.5417938232421875, 0.58709716796875, 0.6324005126953125, 0.677703857421875, 0.7230072021484375, 0.768310546875, 0.8136138916015625, 0.858917236328125, 0.9042205810546875, 0.94952392578125, 0.9948272705078125, 1.040130615234375, 1.0854339599609375, 1.1307373046875, 1.1760406494140625, 1.221343994140625, 1.2666473388671875, 1.31195068359375, 1.3572540283203125, 1.402557373046875, 1.4478607177734375, 1.4931640625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 3.0, 11.0, 6.0, 8.0, 9.0, 20.0, 13.0, 23.0, 24.0, 33.0, 32.0, 44.0, 41.0, 39.0, 56.0, 45.0, 47.0, 52.0, 47.0, 44.0, 46.0, 41.0, 51.0, 44.0, 30.0, 28.0, 29.0, 30.0, 26.0, 10.0, 18.0, 13.0, 5.0, 7.0, 4.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.2337646484375, -4.096435546875, -3.9591064453125, -3.82177734375, -3.6844482421875, -3.547119140625, -3.4097900390625, -3.2724609375, -3.1351318359375, -2.997802734375, -2.8604736328125, -2.72314453125, -2.5858154296875, -2.448486328125, -2.3111572265625, -2.173828125, -2.0364990234375, -1.899169921875, -1.7618408203125, -1.62451171875, -1.4871826171875, -1.349853515625, -1.2125244140625, -1.0751953125, -0.9378662109375, -0.800537109375, -0.6632080078125, -0.52587890625, -0.3885498046875, -0.251220703125, -0.1138916015625, 0.0234375, 0.1607666015625, 0.298095703125, 0.4354248046875, 0.57275390625, 0.7100830078125, 0.847412109375, 0.9847412109375, 1.1220703125, 1.2593994140625, 1.396728515625, 1.5340576171875, 1.67138671875, 1.8087158203125, 1.946044921875, 2.0833740234375, 2.220703125, 2.3580322265625, 2.495361328125, 2.6326904296875, 2.77001953125, 2.9073486328125, 3.044677734375, 3.1820068359375, 3.3193359375, 3.4566650390625, 3.593994140625, 3.7313232421875, 3.86865234375, 4.0059814453125, 4.143310546875, 4.2806396484375, 4.41796875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 11.0, 7.0, 6.0, 7.0, 7.0, 14.0, 16.0, 20.0, 33.0, 46.0, 66.0, 90.0, 109.0, 138.0, 182.0, 287.0, 428.0, 583.0, 927.0, 1607.0, 3183.0, 7354.0, 20937.0, 103711.0, 871030.0, 22005.0, 7734.0, 3310.0, 1702.0, 969.0, 625.0, 398.0, 286.0, 177.0, 121.0, 99.0, 93.0, 74.0, 37.0, 33.0, 18.0, 13.0, 12.0, 17.0, 8.0, 11.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-3.736328125, -3.6231689453125, -3.510009765625, -3.3968505859375, -3.28369140625, -3.1705322265625, -3.057373046875, -2.9442138671875, -2.8310546875, -2.7178955078125, -2.604736328125, -2.4915771484375, -2.37841796875, -2.2652587890625, -2.152099609375, -2.0389404296875, -1.92578125, -1.8126220703125, -1.699462890625, -1.5863037109375, -1.47314453125, -1.3599853515625, -1.246826171875, -1.1336669921875, -1.0205078125, -0.9073486328125, -0.794189453125, -0.6810302734375, -0.56787109375, -0.4547119140625, -0.341552734375, -0.2283935546875, -0.115234375, -0.0020751953125, 0.111083984375, 0.2242431640625, 0.33740234375, 0.4505615234375, 0.563720703125, 0.6768798828125, 0.7900390625, 0.9031982421875, 1.016357421875, 1.1295166015625, 1.24267578125, 1.3558349609375, 1.468994140625, 1.5821533203125, 1.6953125, 1.8084716796875, 1.921630859375, 2.0347900390625, 2.14794921875, 2.2611083984375, 2.374267578125, 2.4874267578125, 2.6005859375, 2.7137451171875, 2.826904296875, 2.9400634765625, 3.05322265625, 3.1663818359375, 3.279541015625, 3.3927001953125, 3.505859375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 7.0, 2.0, 5.0, 4.0, 1.0, 9.0, 11.0, 5.0, 9.0, 5.0, 14.0, 20.0, 14.0, 19.0, 19.0, 18.0, 17.0, 23.0, 27.0, 34.0, 28.0, 30.0, 27.0, 35.0, 34.0, 28.0, 45.0, 34.0, 34.0, 27.0, 26.0, 27.0, 33.0, 39.0, 20.0, 31.0, 32.0, 24.0, 30.0, 20.0, 22.0, 21.0, 17.0, 16.0, 11.0, 8.0, 13.0, 11.0, 6.0, 6.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.9404296875, -1.8780364990234375, -1.815643310546875, -1.7532501220703125, -1.69085693359375, -1.6284637451171875, -1.566070556640625, -1.5036773681640625, -1.4412841796875, -1.3788909912109375, -1.316497802734375, -1.2541046142578125, -1.19171142578125, -1.1293182373046875, -1.066925048828125, -1.0045318603515625, -0.942138671875, -0.8797454833984375, -0.817352294921875, -0.7549591064453125, -0.69256591796875, -0.6301727294921875, -0.567779541015625, -0.5053863525390625, -0.4429931640625, -0.3805999755859375, -0.318206787109375, -0.2558135986328125, -0.19342041015625, -0.1310272216796875, -0.068634033203125, -0.0062408447265625, 0.05615234375, 0.1185455322265625, 0.180938720703125, 0.2433319091796875, 0.30572509765625, 0.3681182861328125, 0.430511474609375, 0.4929046630859375, 0.5552978515625, 0.6176910400390625, 0.680084228515625, 0.7424774169921875, 0.80487060546875, 0.8672637939453125, 0.929656982421875, 0.9920501708984375, 1.054443359375, 1.1168365478515625, 1.179229736328125, 1.2416229248046875, 1.30401611328125, 1.3664093017578125, 1.428802490234375, 1.4911956787109375, 1.5535888671875, 1.6159820556640625, 1.678375244140625, 1.7407684326171875, 1.80316162109375, 1.8655548095703125, 1.927947998046875, 1.9903411865234375, 2.052734375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 7.0, 8.0, 19.0, 19.0, 23.0, 26.0, 46.0, 55.0, 72.0, 118.0, 113.0, 194.0, 274.0, 354.0, 514.0, 703.0, 1065.0, 1613.0, 2404.0, 4099.0, 7404.0, 15673.0, 44828.0, 905199.0, 33897.0, 12963.0, 6450.0, 3556.0, 2189.0, 1397.0, 910.0, 591.0, 470.0, 336.0, 250.0, 193.0, 127.0, 110.0, 65.0, 68.0, 46.0, 24.0, 26.0, 21.0, 9.0, 6.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1817626953125, -0.17615127563476562, -0.17053985595703125, -0.16492843627929688, -0.1593170166015625, -0.15370559692382812, -0.14809417724609375, -0.14248275756835938, -0.136871337890625, -0.13125991821289062, -0.12564849853515625, -0.12003707885742188, -0.1144256591796875, -0.10881423950195312, -0.10320281982421875, -0.09759140014648438, -0.09197998046875, -0.08636856079101562, -0.08075714111328125, -0.07514572143554688, -0.0695343017578125, -0.06392288208007812, -0.05831146240234375, -0.052700042724609375, -0.047088623046875, -0.041477203369140625, -0.03586578369140625, -0.030254364013671875, -0.0246429443359375, -0.019031524658203125, -0.01342010498046875, -0.007808685302734375, -0.002197265625, 0.003414154052734375, 0.00902557373046875, 0.014636993408203125, 0.0202484130859375, 0.025859832763671875, 0.03147125244140625, 0.037082672119140625, 0.042694091796875, 0.048305511474609375, 0.05391693115234375, 0.059528350830078125, 0.0651397705078125, 0.07075119018554688, 0.07636260986328125, 0.08197402954101562, 0.08758544921875, 0.09319686889648438, 0.09880828857421875, 0.10441970825195312, 0.1100311279296875, 0.11564254760742188, 0.12125396728515625, 0.12686538696289062, 0.132476806640625, 0.13808822631835938, 0.14369964599609375, 0.14931106567382812, 0.1549224853515625, 0.16053390502929688, 0.16614532470703125, 0.17175674438476562, 0.1773681640625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 8.0, 14.0, 9.0, 9.0, 17.0, 15.0, 19.0, 24.0, 24.0, 27.0, 40.0, 52.0, 44.0, 37.0, 61.0, 61.0, 68.0, 55.0, 55.0, 47.0, 60.0, 43.0, 36.0, 29.0, 20.0, 16.0, 20.0, 13.0, 13.0, 7.0, 10.0, 6.0, 9.0, 4.0, 5.0, 8.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.030632019042969e-05, -4.870537668466568e-05, -4.710443317890167e-05, -4.5503489673137665e-05, -4.390254616737366e-05, -4.230160266160965e-05, -4.070065915584564e-05, -3.9099715650081635e-05, -3.749877214431763e-05, -3.589782863855362e-05, -3.429688513278961e-05, -3.2695941627025604e-05, -3.10949981212616e-05, -2.949405461549759e-05, -2.789311110973358e-05, -2.6292167603969574e-05, -2.4691224098205566e-05, -2.309028059244156e-05, -2.148933708667755e-05, -1.9888393580913544e-05, -1.8287450075149536e-05, -1.668650656938553e-05, -1.5085563063621521e-05, -1.3484619557857513e-05, -1.1883676052093506e-05, -1.0282732546329498e-05, -8.68178904056549e-06, -7.080845534801483e-06, -5.479902029037476e-06, -3.878958523273468e-06, -2.2780150175094604e-06, -6.770715117454529e-07, 9.238719940185547e-07, 2.5248154997825623e-06, 4.12575900554657e-06, 5.726702511310577e-06, 7.327646017074585e-06, 8.928589522838593e-06, 1.05295330286026e-05, 1.2130476534366608e-05, 1.3731420040130615e-05, 1.5332363545894623e-05, 1.693330705165863e-05, 1.8534250557422638e-05, 2.0135194063186646e-05, 2.1736137568950653e-05, 2.333708107471466e-05, 2.4938024580478668e-05, 2.6538968086242676e-05, 2.8139911592006683e-05, 2.974085509777069e-05, 3.13417986035347e-05, 3.2942742109298706e-05, 3.4543685615062714e-05, 3.614462912082672e-05, 3.774557262659073e-05, 3.9346516132354736e-05, 4.0947459638118744e-05, 4.254840314388275e-05, 4.414934664964676e-05, 4.5750290155410767e-05, 4.7351233661174774e-05, 4.895217716693878e-05, 5.055312067270279e-05, 5.21540641784668e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 7.0, 10.0, 13.0, 30.0, 33.0, 58.0, 69.0, 111.0, 169.0, 217.0, 315.0, 500.0, 710.0, 1066.0, 1602.0, 2428.0, 3872.0, 6009.0, 9564.0, 15320.0, 25445.0, 43860.0, 82074.0, 178833.0, 314325.0, 172712.0, 80200.0, 42718.0, 24758.0, 15122.0, 9463.0, 5976.0, 3815.0, 2422.0, 1553.0, 1034.0, 718.0, 459.0, 269.0, 225.0, 142.0, 112.0, 60.0, 49.0, 37.0, 18.0, 14.0, 17.0, 2.0, 4.0, 8.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.07568359375, -0.07327938079833984, -0.07087516784667969, -0.06847095489501953, -0.06606674194335938, -0.06366252899169922, -0.06125831604003906, -0.058854103088378906, -0.05644989013671875, -0.054045677185058594, -0.05164146423339844, -0.04923725128173828, -0.046833038330078125, -0.04442882537841797, -0.04202461242675781, -0.039620399475097656, -0.0372161865234375, -0.034811973571777344, -0.03240776062011719, -0.03000354766845703, -0.027599334716796875, -0.02519512176513672, -0.022790908813476562, -0.020386695861816406, -0.01798248291015625, -0.015578269958496094, -0.013174057006835938, -0.010769844055175781, -0.008365631103515625, -0.005961418151855469, -0.0035572052001953125, -0.0011529922485351562, 0.001251220703125, 0.0036554336547851562, 0.0060596466064453125, 0.008463859558105469, 0.010868072509765625, 0.013272285461425781, 0.015676498413085938, 0.018080711364746094, 0.02048492431640625, 0.022889137268066406, 0.025293350219726562, 0.02769756317138672, 0.030101776123046875, 0.03250598907470703, 0.03491020202636719, 0.037314414978027344, 0.0397186279296875, 0.042122840881347656, 0.04452705383300781, 0.04693126678466797, 0.049335479736328125, 0.05173969268798828, 0.05414390563964844, 0.056548118591308594, 0.05895233154296875, 0.061356544494628906, 0.06376075744628906, 0.06616497039794922, 0.06856918334960938, 0.07097339630126953, 0.07337760925292969, 0.07578182220458984, 0.07818603515625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 7.0, 8.0, 4.0, 11.0, 7.0, 8.0, 16.0, 9.0, 16.0, 12.0, 23.0, 23.0, 39.0, 44.0, 64.0, 113.0, 121.0, 123.0, 83.0, 50.0, 39.0, 35.0, 24.0, 22.0, 13.0, 16.0, 11.0, 14.0, 5.0, 6.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.036102294921875, -0.03516793251037598, -0.03423357009887695, -0.03329920768737793, -0.032364845275878906, -0.03143048286437988, -0.03049612045288086, -0.029561758041381836, -0.028627395629882812, -0.02769303321838379, -0.026758670806884766, -0.025824308395385742, -0.02488994598388672, -0.023955583572387695, -0.023021221160888672, -0.02208685874938965, -0.021152496337890625, -0.0202181339263916, -0.019283771514892578, -0.018349409103393555, -0.01741504669189453, -0.016480684280395508, -0.015546321868896484, -0.014611959457397461, -0.013677597045898438, -0.012743234634399414, -0.01180887222290039, -0.010874509811401367, -0.009940147399902344, -0.00900578498840332, -0.008071422576904297, -0.0071370601654052734, -0.00620269775390625, -0.0052683353424072266, -0.004333972930908203, -0.0033996105194091797, -0.0024652481079101562, -0.0015308856964111328, -0.0005965232849121094, 0.00033783912658691406, 0.0012722015380859375, 0.002206563949584961, 0.0031409263610839844, 0.004075288772583008, 0.005009651184082031, 0.005944013595581055, 0.006878376007080078, 0.007812738418579102, 0.008747100830078125, 0.009681463241577148, 0.010615825653076172, 0.011550188064575195, 0.012484550476074219, 0.013418912887573242, 0.014353275299072266, 0.015287637710571289, 0.016222000122070312, 0.017156362533569336, 0.01809072494506836, 0.019025087356567383, 0.019959449768066406, 0.02089381217956543, 0.021828174591064453, 0.022762537002563477, 0.0236968994140625]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 7.0, 7.0, 13.0, 11.0, 15.0, 11.0, 15.0, 30.0, 23.0, 28.0, 43.0, 41.0, 51.0, 51.0, 63.0, 63.0, 63.0, 70.0, 67.0, 57.0, 50.0, 31.0, 39.0, 25.0, 23.0, 15.0, 19.0, 13.0, 14.0, 13.0, 10.0, 2.0, 1.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.9366846084594727, -3.8147196769714355, -3.6927547454833984, -3.5707898139953613, -3.448824882507324, -3.326859951019287, -3.204894781112671, -3.082929849624634, -2.9609649181365967, -2.8389999866485596, -2.7170350551605225, -2.5950701236724854, -2.473104953765869, -2.351140022277832, -2.229175090789795, -2.107210159301758, -1.9852452278137207, -1.8632802963256836, -1.7413153648376465, -1.6193503141403198, -1.4973853826522827, -1.3754204511642456, -1.253455400466919, -1.1314904689788818, -1.0095255374908447, -0.8875606060028076, -0.7655956149101257, -0.6436306238174438, -0.5216656923294067, -0.39970076084136963, -0.27773576974868774, -0.15577077865600586, -0.03380560874938965, 0.08815935254096985, 0.21012431383132935, 0.33208927512168884, 0.45405423641204834, 0.5760191679000854, 0.6979841589927673, 0.8199491500854492, 0.9419140815734863, 1.0638790130615234, 1.1858439445495605, 1.3078089952468872, 1.4297739267349243, 1.5517388582229614, 1.673703908920288, 1.7956688404083252, 1.9176337718963623, 2.0395987033843994, 2.1615636348724365, 2.2835285663604736, 2.40549373626709, 2.527458667755127, 2.649423599243164, 2.771388530731201, 2.8933534622192383, 3.0153183937072754, 3.1372833251953125, 3.2592482566833496, 3.3812131881713867, 3.503178119659424, 3.62514328956604, 3.747108221054077, 3.8690731525421143]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 1.0, 3.0, 4.0, 4.0, 10.0, 6.0, 12.0, 12.0, 12.0, 17.0, 21.0, 19.0, 29.0, 35.0, 33.0, 43.0, 48.0, 41.0, 34.0, 48.0, 53.0, 42.0, 40.0, 55.0, 34.0, 42.0, 36.0, 32.0, 37.0, 31.0, 30.0, 25.0, 16.0, 20.0, 15.0, 15.0, 10.0, 7.0, 6.0, 5.0, 5.0, 2.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8114423751831055, -3.686762809753418, -3.5620832443237305, -3.437403678894043, -3.3127238750457764, -3.188044309616089, -3.0633647441864014, -2.938685178756714, -2.8140056133270264, -2.689326047897339, -2.5646464824676514, -2.4399666786193848, -2.3152871131896973, -2.1906075477600098, -2.0659279823303223, -1.9412484169006348, -1.8165687322616577, -1.6918891668319702, -1.5672094821929932, -1.4425299167633057, -1.3178503513336182, -1.1931707859039307, -1.0684911012649536, -0.9438115358352661, -0.8191319108009338, -0.6944522857666016, -0.5697727203369141, -0.4450930953025818, -0.3204135000705719, -0.195733904838562, -0.07105427980422974, 0.053625285625457764, 0.17830491065979004, 0.3029845058917999, 0.4276641011238098, 0.5523437261581421, 0.6770232915878296, 0.8017029166221619, 0.9263825416564941, 1.0510621070861816, 1.1757416725158691, 1.3004212379455566, 1.4251009225845337, 1.5497804880142212, 1.6744600534439087, 1.7991397380828857, 1.9238193035125732, 2.0484988689422607, 2.1731786727905273, 2.297858238220215, 2.4225378036499023, 2.54721736907959, 2.6718971729278564, 2.796576738357544, 2.9212563037872314, 3.045935869216919, 3.1706154346466064, 3.295295000076294, 3.4199745655059814, 3.544654369354248, 3.6693339347839355, 3.794013500213623, 3.9186930656433105, 4.043372631072998, 4.1680521965026855]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 7.0, 1.0, 5.0, 8.0, 12.0, 13.0, 29.0, 36.0, 52.0, 91.0, 133.0, 169.0, 239.0, 358.0, 523.0, 742.0, 1173.0, 1594.0, 2339.0, 3526.0, 5311.0, 7895.0, 11896.0, 18108.0, 27693.0, 42177.0, 63877.0, 93024.0, 124812.0, 144800.0, 140586.0, 113202.0, 81730.0, 55161.0, 36247.0, 23887.0, 15629.0, 10336.0, 6877.0, 4543.0, 3085.0, 2100.0, 1424.0, 976.0, 658.0, 455.0, 323.0, 233.0, 166.0, 118.0, 53.0, 57.0, 31.0, 14.0, 20.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-2.609375, -2.527374267578125, -2.44537353515625, -2.363372802734375, -2.2813720703125, -2.199371337890625, -2.11737060546875, -2.035369873046875, -1.953369140625, -1.871368408203125, -1.78936767578125, -1.707366943359375, -1.6253662109375, -1.543365478515625, -1.46136474609375, -1.379364013671875, -1.29736328125, -1.215362548828125, -1.13336181640625, -1.051361083984375, -0.9693603515625, -0.887359619140625, -0.80535888671875, -0.723358154296875, -0.641357421875, -0.559356689453125, -0.47735595703125, -0.395355224609375, -0.3133544921875, -0.231353759765625, -0.14935302734375, -0.067352294921875, 0.0146484375, 0.096649169921875, 0.17864990234375, 0.260650634765625, 0.3426513671875, 0.424652099609375, 0.50665283203125, 0.588653564453125, 0.670654296875, 0.752655029296875, 0.83465576171875, 0.916656494140625, 0.9986572265625, 1.080657958984375, 1.16265869140625, 1.244659423828125, 1.32666015625, 1.408660888671875, 1.49066162109375, 1.572662353515625, 1.6546630859375, 1.736663818359375, 1.81866455078125, 1.900665283203125, 1.982666015625, 2.064666748046875, 2.14666748046875, 2.228668212890625, 2.3106689453125, 2.392669677734375, 2.47467041015625, 2.556671142578125, 2.638671875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 5.0, 7.0, 7.0, 12.0, 11.0, 13.0, 18.0, 16.0, 21.0, 22.0, 35.0, 39.0, 32.0, 33.0, 51.0, 44.0, 49.0, 33.0, 46.0, 44.0, 42.0, 37.0, 35.0, 38.0, 29.0, 35.0, 38.0, 30.0, 29.0, 31.0, 20.0, 14.0, 13.0, 13.0, 12.0, 13.0, 7.0, 2.0, 4.0, 4.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.470703125, -3.351898193359375, -3.23309326171875, -3.114288330078125, -2.9954833984375, -2.876678466796875, -2.75787353515625, -2.639068603515625, -2.520263671875, -2.401458740234375, -2.28265380859375, -2.163848876953125, -2.0450439453125, -1.926239013671875, -1.80743408203125, -1.688629150390625, -1.56982421875, -1.451019287109375, -1.33221435546875, -1.213409423828125, -1.0946044921875, -0.975799560546875, -0.85699462890625, -0.738189697265625, -0.619384765625, -0.500579833984375, -0.38177490234375, -0.262969970703125, -0.1441650390625, -0.025360107421875, 0.09344482421875, 0.212249755859375, 0.3310546875, 0.449859619140625, 0.56866455078125, 0.687469482421875, 0.8062744140625, 0.925079345703125, 1.04388427734375, 1.162689208984375, 1.281494140625, 1.400299072265625, 1.51910400390625, 1.637908935546875, 1.7567138671875, 1.875518798828125, 1.99432373046875, 2.113128662109375, 2.23193359375, 2.350738525390625, 2.46954345703125, 2.588348388671875, 2.7071533203125, 2.825958251953125, 2.94476318359375, 3.063568115234375, 3.182373046875, 3.301177978515625, 3.41998291015625, 3.538787841796875, 3.6575927734375, 3.776397705078125, 3.89520263671875, 4.014007568359375, 4.1328125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 11.0, 10.0, 14.0, 25.0, 35.0, 45.0, 73.0, 128.0, 198.0, 311.0, 475.0, 770.0, 1178.0, 1969.0, 3100.0, 4883.0, 8040.0, 13114.0, 21530.0, 35584.0, 58155.0, 91558.0, 133814.0, 166401.0, 162160.0, 125006.0, 83946.0, 52929.0, 32405.0, 19613.0, 12006.0, 7086.0, 4481.0, 2820.0, 1704.0, 1100.0, 639.0, 437.0, 296.0, 190.0, 98.0, 70.0, 51.0, 36.0, 17.0, 19.0, 14.0, 2.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.794921875, -2.701446533203125, -2.60797119140625, -2.514495849609375, -2.4210205078125, -2.327545166015625, -2.23406982421875, -2.140594482421875, -2.047119140625, -1.953643798828125, -1.86016845703125, -1.766693115234375, -1.6732177734375, -1.579742431640625, -1.48626708984375, -1.392791748046875, -1.29931640625, -1.205841064453125, -1.11236572265625, -1.018890380859375, -0.9254150390625, -0.831939697265625, -0.73846435546875, -0.644989013671875, -0.551513671875, -0.458038330078125, -0.36456298828125, -0.271087646484375, -0.1776123046875, -0.084136962890625, 0.00933837890625, 0.102813720703125, 0.1962890625, 0.289764404296875, 0.38323974609375, 0.476715087890625, 0.5701904296875, 0.663665771484375, 0.75714111328125, 0.850616455078125, 0.944091796875, 1.037567138671875, 1.13104248046875, 1.224517822265625, 1.3179931640625, 1.411468505859375, 1.50494384765625, 1.598419189453125, 1.69189453125, 1.785369873046875, 1.87884521484375, 1.972320556640625, 2.0657958984375, 2.159271240234375, 2.25274658203125, 2.346221923828125, 2.439697265625, 2.533172607421875, 2.62664794921875, 2.720123291015625, 2.8135986328125, 2.907073974609375, 3.00054931640625, 3.094024658203125, 3.1875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 8.0, 10.0, 5.0, 8.0, 10.0, 4.0, 15.0, 35.0, 24.0, 21.0, 31.0, 28.0, 28.0, 33.0, 52.0, 43.0, 48.0, 42.0, 41.0, 39.0, 34.0, 38.0, 43.0, 37.0, 39.0, 37.0, 40.0, 31.0, 25.0, 21.0, 14.0, 17.0, 22.0, 14.0, 9.0, 9.0, 4.0, 14.0, 4.0, 2.0, 6.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0], "bins": [-2.255859375, -2.192718505859375, -2.12957763671875, -2.066436767578125, -2.0032958984375, -1.940155029296875, -1.87701416015625, -1.813873291015625, -1.750732421875, -1.687591552734375, -1.62445068359375, -1.561309814453125, -1.4981689453125, -1.435028076171875, -1.37188720703125, -1.308746337890625, -1.24560546875, -1.182464599609375, -1.11932373046875, -1.056182861328125, -0.9930419921875, -0.929901123046875, -0.86676025390625, -0.803619384765625, -0.740478515625, -0.677337646484375, -0.61419677734375, -0.551055908203125, -0.4879150390625, -0.424774169921875, -0.36163330078125, -0.298492431640625, -0.2353515625, -0.172210693359375, -0.10906982421875, -0.045928955078125, 0.0172119140625, 0.080352783203125, 0.14349365234375, 0.206634521484375, 0.269775390625, 0.332916259765625, 0.39605712890625, 0.459197998046875, 0.5223388671875, 0.585479736328125, 0.64862060546875, 0.711761474609375, 0.77490234375, 0.838043212890625, 0.90118408203125, 0.964324951171875, 1.0274658203125, 1.090606689453125, 1.15374755859375, 1.216888427734375, 1.280029296875, 1.343170166015625, 1.40631103515625, 1.469451904296875, 1.5325927734375, 1.595733642578125, 1.65887451171875, 1.722015380859375, 1.78515625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 8.0, 11.0, 15.0, 37.0, 53.0, 81.0, 93.0, 149.0, 295.0, 417.0, 628.0, 1002.0, 1482.0, 2439.0, 3987.0, 6205.0, 10291.0, 16960.0, 27792.0, 46394.0, 75322.0, 118014.0, 162619.0, 177102.0, 144575.0, 96988.0, 60764.0, 36869.0, 22406.0, 13567.0, 8321.0, 5186.0, 3095.0, 1909.0, 1313.0, 752.0, 506.0, 309.0, 207.0, 138.0, 86.0, 67.0, 32.0, 38.0, 16.0, 7.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.91748046875, -0.8881454467773438, -0.8588104248046875, -0.8294754028320312, -0.800140380859375, -0.7708053588867188, -0.7414703369140625, -0.7121353149414062, -0.68280029296875, -0.6534652709960938, -0.6241302490234375, -0.5947952270507812, -0.565460205078125, -0.5361251831054688, -0.5067901611328125, -0.47745513916015625, -0.4481201171875, -0.41878509521484375, -0.3894500732421875, -0.36011505126953125, -0.330780029296875, -0.30144500732421875, -0.2721099853515625, -0.24277496337890625, -0.21343994140625, -0.18410491943359375, -0.1547698974609375, -0.12543487548828125, -0.096099853515625, -0.06676483154296875, -0.0374298095703125, -0.00809478759765625, 0.021240234375, 0.05057525634765625, 0.0799102783203125, 0.10924530029296875, 0.138580322265625, 0.16791534423828125, 0.1972503662109375, 0.22658538818359375, 0.25592041015625, 0.28525543212890625, 0.3145904541015625, 0.34392547607421875, 0.373260498046875, 0.40259552001953125, 0.4319305419921875, 0.46126556396484375, 0.4906005859375, 0.5199356079101562, 0.5492706298828125, 0.5786056518554688, 0.607940673828125, 0.6372756958007812, 0.6666107177734375, 0.6959457397460938, 0.72528076171875, 0.7546157836914062, 0.7839508056640625, 0.8132858276367188, 0.842620849609375, 0.8719558715820312, 0.9012908935546875, 0.9306259155273438, 0.9599609375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 7.0, 6.0, 1.0, 5.0, 6.0, 13.0, 8.0, 13.0, 13.0, 30.0, 18.0, 21.0, 33.0, 30.0, 38.0, 42.0, 32.0, 44.0, 39.0, 34.0, 44.0, 49.0, 45.0, 42.0, 45.0, 54.0, 36.0, 36.0, 31.0, 28.0, 31.0, 22.0, 21.0, 12.0, 12.0, 8.0, 4.0, 10.0, 5.0, 4.0, 5.0, 2.0, 2.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.27501106262207e-05, -5.096849054098129e-05, -4.918687045574188e-05, -4.740525037050247e-05, -4.562363028526306e-05, -4.384201020002365e-05, -4.206039011478424e-05, -4.027877002954483e-05, -3.849714994430542e-05, -3.671552985906601e-05, -3.49339097738266e-05, -3.315228968858719e-05, -3.137066960334778e-05, -2.9589049518108368e-05, -2.7807429432868958e-05, -2.6025809347629547e-05, -2.4244189262390137e-05, -2.2462569177150726e-05, -2.0680949091911316e-05, -1.8899329006671906e-05, -1.7117708921432495e-05, -1.5336088836193085e-05, -1.3554468750953674e-05, -1.1772848665714264e-05, -9.991228580474854e-06, -8.209608495235443e-06, -6.427988409996033e-06, -4.646368324756622e-06, -2.864748239517212e-06, -1.0831281542778015e-06, 6.984919309616089e-07, 2.4801120162010193e-06, 4.26173210144043e-06, 6.04335218667984e-06, 7.82497227191925e-06, 9.606592357158661e-06, 1.1388212442398071e-05, 1.3169832527637482e-05, 1.4951452612876892e-05, 1.6733072698116302e-05, 1.8514692783355713e-05, 2.0296312868595123e-05, 2.2077932953834534e-05, 2.3859553039073944e-05, 2.5641173124313354e-05, 2.7422793209552765e-05, 2.9204413294792175e-05, 3.0986033380031586e-05, 3.2767653465270996e-05, 3.4549273550510406e-05, 3.633089363574982e-05, 3.811251372098923e-05, 3.989413380622864e-05, 4.167575389146805e-05, 4.345737397670746e-05, 4.523899406194687e-05, 4.702061414718628e-05, 4.880223423242569e-05, 5.05838543176651e-05, 5.236547440290451e-05, 5.414709448814392e-05, 5.592871457338333e-05, 5.771033465862274e-05, 5.949195474386215e-05, 6.127357482910156e-05]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 8.0, 16.0, 22.0, 37.0, 65.0, 86.0, 148.0, 235.0, 361.0, 539.0, 837.0, 1362.0, 2094.0, 3411.0, 5445.0, 9001.0, 14618.0, 23608.0, 39076.0, 63153.0, 99479.0, 144954.0, 175162.0, 158454.0, 114482.0, 73450.0, 45810.0, 27828.0, 16888.0, 10459.0, 6482.0, 4103.0, 2578.0, 1573.0, 955.0, 611.0, 396.0, 294.0, 187.0, 98.0, 75.0, 40.0, 30.0, 25.0, 10.0, 3.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.93603515625, -0.907379150390625, -0.87872314453125, -0.850067138671875, -0.8214111328125, -0.792755126953125, -0.76409912109375, -0.735443115234375, -0.706787109375, -0.678131103515625, -0.64947509765625, -0.620819091796875, -0.5921630859375, -0.563507080078125, -0.53485107421875, -0.506195068359375, -0.4775390625, -0.448883056640625, -0.42022705078125, -0.391571044921875, -0.3629150390625, -0.334259033203125, -0.30560302734375, -0.276947021484375, -0.248291015625, -0.219635009765625, -0.19097900390625, -0.162322998046875, -0.1336669921875, -0.105010986328125, -0.07635498046875, -0.047698974609375, -0.01904296875, 0.009613037109375, 0.03826904296875, 0.066925048828125, 0.0955810546875, 0.124237060546875, 0.15289306640625, 0.181549072265625, 0.210205078125, 0.238861083984375, 0.26751708984375, 0.296173095703125, 0.3248291015625, 0.353485107421875, 0.38214111328125, 0.410797119140625, 0.439453125, 0.468109130859375, 0.49676513671875, 0.525421142578125, 0.5540771484375, 0.582733154296875, 0.61138916015625, 0.640045166015625, 0.668701171875, 0.697357177734375, 0.72601318359375, 0.754669189453125, 0.7833251953125, 0.811981201171875, 0.84063720703125, 0.869293212890625, 0.89794921875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 8.0, 10.0, 13.0, 6.0, 22.0, 12.0, 15.0, 27.0, 29.0, 45.0, 45.0, 36.0, 59.0, 53.0, 65.0, 64.0, 70.0, 60.0, 62.0, 49.0, 42.0, 42.0, 20.0, 28.0, 25.0, 18.0, 20.0, 12.0, 12.0, 14.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.362060546875, -0.3492012023925781, -0.33634185791015625, -0.3234825134277344, -0.3106231689453125, -0.2977638244628906, -0.28490447998046875, -0.2720451354980469, -0.259185791015625, -0.24632644653320312, -0.23346710205078125, -0.22060775756835938, -0.2077484130859375, -0.19488906860351562, -0.18202972412109375, -0.16917037963867188, -0.15631103515625, -0.14345169067382812, -0.13059234619140625, -0.11773300170898438, -0.1048736572265625, -0.09201431274414062, -0.07915496826171875, -0.06629562377929688, -0.053436279296875, -0.040576934814453125, -0.02771759033203125, -0.014858245849609375, -0.0019989013671875, 0.010860443115234375, 0.02371978759765625, 0.036579132080078125, 0.0494384765625, 0.062297821044921875, 0.07515716552734375, 0.08801651000976562, 0.1008758544921875, 0.11373519897460938, 0.12659454345703125, 0.13945388793945312, 0.152313232421875, 0.16517257690429688, 0.17803192138671875, 0.19089126586914062, 0.2037506103515625, 0.21660995483398438, 0.22946929931640625, 0.24232864379882812, 0.25518798828125, 0.2680473327636719, 0.28090667724609375, 0.2937660217285156, 0.3066253662109375, 0.3194847106933594, 0.33234405517578125, 0.3452033996582031, 0.358062744140625, 0.3709220886230469, 0.38378143310546875, 0.3966407775878906, 0.4095001220703125, 0.4223594665527344, 0.43521881103515625, 0.4480781555175781, 0.4609375]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 10.0, 8.0, 4.0, 13.0, 17.0, 9.0, 15.0, 15.0, 27.0, 35.0, 39.0, 34.0, 52.0, 59.0, 54.0, 70.0, 62.0, 65.0, 73.0, 64.0, 50.0, 47.0, 28.0, 28.0, 22.0, 22.0, 18.0, 15.0, 13.0, 8.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-4.200759410858154, -4.075186252593994, -3.949612855911255, -3.8240396976470947, -3.6984665393829346, -3.5728931427001953, -3.447319984436035, -3.321746826171875, -3.196173667907715, -3.0706005096435547, -2.9450271129608154, -2.8194539546966553, -2.693880796432495, -2.568307399749756, -2.4427342414855957, -2.3171610832214355, -2.1915876865386963, -2.066014528274536, -1.9404412508010864, -1.8148679733276367, -1.6892948150634766, -1.5637215375900269, -1.4381482601165771, -1.312575101852417, -1.1870018243789673, -1.0614285469055176, -0.9358553886413574, -0.8102821111679077, -0.6847088932991028, -0.5591356754302979, -0.43356239795684814, -0.3079891800880432, -0.18241572380065918, -0.056842491030693054, 0.06873074173927307, 0.1943039894104004, 0.3198772072792053, 0.44545042514801025, 0.57102370262146, 0.6965969204902649, 0.8221701383590698, 0.9477433562278748, 1.0733165740966797, 1.1988898515701294, 1.324463129043579, 1.4500362873077393, 1.575609564781189, 1.7011828422546387, 1.8267560005187988, 1.9523292779922485, 2.0779025554656982, 2.2034757137298584, 2.3290488719940186, 2.454622268676758, 2.580195426940918, 2.705768585205078, 2.8313417434692383, 2.9569149017333984, 3.0824882984161377, 3.208061456680298, 3.333634614944458, 3.4592080116271973, 3.5847811698913574, 3.7103543281555176, 3.835927724838257]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 2.0, 5.0, 7.0, 6.0, 13.0, 13.0, 13.0, 12.0, 21.0, 25.0, 20.0, 24.0, 30.0, 31.0, 38.0, 42.0, 48.0, 37.0, 55.0, 34.0, 33.0, 51.0, 44.0, 31.0, 49.0, 30.0, 39.0, 27.0, 34.0, 28.0, 25.0, 24.0, 18.0, 19.0, 12.0, 12.0, 13.0, 11.0, 5.0, 5.0, 5.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.68568754196167, -3.5652732849121094, -3.444859027862549, -3.3244447708129883, -3.2040305137634277, -3.083616256713867, -2.9632019996643066, -2.842787742614746, -2.7223734855651855, -2.601959228515625, -2.4815449714660645, -2.361130714416504, -2.2407164573669434, -2.120302200317383, -1.9998878240585327, -1.8794735670089722, -1.759059190750122, -1.6386449337005615, -1.518230676651001, -1.3978164196014404, -1.2774021625518799, -1.1569879055023193, -1.0365735292434692, -0.9161592721939087, -0.7957450151443481, -0.6753307580947876, -0.554916501045227, -0.43450218439102173, -0.3140879273414612, -0.19367367029190063, -0.07325935363769531, 0.047154903411865234, 0.16756916046142578, 0.28798341751098633, 0.40839770436286926, 0.5288119912147522, 0.6492262482643127, 0.7696405053138733, 0.8900548219680786, 1.0104690790176392, 1.1308833360671997, 1.2512975931167603, 1.3717118501663208, 1.492126226425171, 1.6125404834747314, 1.732954740524292, 1.8533689975738525, 1.973783254623413, 2.0941975116729736, 2.214611768722534, 2.3350260257720947, 2.4554402828216553, 2.575854539871216, 2.6962687969207764, 2.816683292388916, 2.9370975494384766, 3.057511806488037, 3.1779260635375977, 3.298340320587158, 3.4187545776367188, 3.5391688346862793, 3.65958309173584, 3.7799973487854004, 3.900411605834961, 4.0208258628845215]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 4.0, 6.0, 9.0, 11.0, 19.0, 17.0, 47.0, 53.0, 79.0, 106.0, 148.0, 182.0, 252.0, 372.0, 514.0, 788.0, 1101.0, 1628.0, 2441.0, 3699.0, 5923.0, 9559.0, 15928.0, 28473.0, 53160.0, 106006.0, 226653.0, 506757.0, 992243.0, 1084439.0, 603567.0, 274050.0, 128536.0, 64876.0, 34173.0, 19149.0, 10974.0, 6782.0, 3976.0, 2581.0, 1672.0, 1082.0, 723.0, 491.0, 336.0, 244.0, 152.0, 97.0, 74.0, 53.0, 34.0, 20.0, 13.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.1171875, -3.989013671875, -3.86083984375, -3.732666015625, -3.6044921875, -3.476318359375, -3.34814453125, -3.219970703125, -3.091796875, -2.963623046875, -2.83544921875, -2.707275390625, -2.5791015625, -2.450927734375, -2.32275390625, -2.194580078125, -2.06640625, -1.938232421875, -1.81005859375, -1.681884765625, -1.5537109375, -1.425537109375, -1.29736328125, -1.169189453125, -1.041015625, -0.912841796875, -0.78466796875, -0.656494140625, -0.5283203125, -0.400146484375, -0.27197265625, -0.143798828125, -0.015625, 0.112548828125, 0.24072265625, 0.368896484375, 0.4970703125, 0.625244140625, 0.75341796875, 0.881591796875, 1.009765625, 1.137939453125, 1.26611328125, 1.394287109375, 1.5224609375, 1.650634765625, 1.77880859375, 1.906982421875, 2.03515625, 2.163330078125, 2.29150390625, 2.419677734375, 2.5478515625, 2.676025390625, 2.80419921875, 2.932373046875, 3.060546875, 3.188720703125, 3.31689453125, 3.445068359375, 3.5732421875, 3.701416015625, 3.82958984375, 3.957763671875, 4.0859375]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 5.0, 11.0, 10.0, 9.0, 17.0, 17.0, 21.0, 17.0, 30.0, 34.0, 34.0, 26.0, 29.0, 41.0, 34.0, 39.0, 51.0, 47.0, 41.0, 42.0, 36.0, 35.0, 44.0, 36.0, 30.0, 36.0, 30.0, 27.0, 28.0, 16.0, 18.0, 21.0, 17.0, 9.0, 11.0, 10.0, 2.0, 3.0, 8.0, 5.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.59765625, -2.517364501953125, -2.43707275390625, -2.356781005859375, -2.2764892578125, -2.196197509765625, -2.11590576171875, -2.035614013671875, -1.955322265625, -1.875030517578125, -1.79473876953125, -1.714447021484375, -1.6341552734375, -1.553863525390625, -1.47357177734375, -1.393280029296875, -1.31298828125, -1.232696533203125, -1.15240478515625, -1.072113037109375, -0.9918212890625, -0.911529541015625, -0.83123779296875, -0.750946044921875, -0.670654296875, -0.590362548828125, -0.51007080078125, -0.429779052734375, -0.3494873046875, -0.269195556640625, -0.18890380859375, -0.108612060546875, -0.0283203125, 0.051971435546875, 0.13226318359375, 0.212554931640625, 0.2928466796875, 0.373138427734375, 0.45343017578125, 0.533721923828125, 0.614013671875, 0.694305419921875, 0.77459716796875, 0.854888916015625, 0.9351806640625, 1.015472412109375, 1.09576416015625, 1.176055908203125, 1.25634765625, 1.336639404296875, 1.41693115234375, 1.497222900390625, 1.5775146484375, 1.657806396484375, 1.73809814453125, 1.818389892578125, 1.898681640625, 1.978973388671875, 2.05926513671875, 2.139556884765625, 2.2198486328125, 2.300140380859375, 2.38043212890625, 2.460723876953125, 2.541015625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 6.0, 9.0, 17.0, 22.0, 27.0, 51.0, 73.0, 105.0, 186.0, 268.0, 402.0, 620.0, 985.0, 1518.0, 2361.0, 3910.0, 6331.0, 10541.0, 17805.0, 31719.0, 57767.0, 108097.0, 209266.0, 404819.0, 717628.0, 944365.0, 754414.0, 434868.0, 226467.0, 117204.0, 61465.0, 33576.0, 18678.0, 11134.0, 6709.0, 4004.0, 2514.0, 1526.0, 996.0, 647.0, 402.0, 259.0, 175.0, 120.0, 68.0, 47.0, 49.0, 27.0, 21.0, 6.0, 9.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 3.0], "bins": [-3.669921875, -3.553619384765625, -3.43731689453125, -3.321014404296875, -3.2047119140625, -3.088409423828125, -2.97210693359375, -2.855804443359375, -2.739501953125, -2.623199462890625, -2.50689697265625, -2.390594482421875, -2.2742919921875, -2.157989501953125, -2.04168701171875, -1.925384521484375, -1.80908203125, -1.692779541015625, -1.57647705078125, -1.460174560546875, -1.3438720703125, -1.227569580078125, -1.11126708984375, -0.994964599609375, -0.878662109375, -0.762359619140625, -0.64605712890625, -0.529754638671875, -0.4134521484375, -0.297149658203125, -0.18084716796875, -0.064544677734375, 0.0517578125, 0.168060302734375, 0.28436279296875, 0.400665283203125, 0.5169677734375, 0.633270263671875, 0.74957275390625, 0.865875244140625, 0.982177734375, 1.098480224609375, 1.21478271484375, 1.331085205078125, 1.4473876953125, 1.563690185546875, 1.67999267578125, 1.796295166015625, 1.91259765625, 2.028900146484375, 2.14520263671875, 2.261505126953125, 2.3778076171875, 2.494110107421875, 2.61041259765625, 2.726715087890625, 2.843017578125, 2.959320068359375, 3.07562255859375, 3.191925048828125, 3.3082275390625, 3.424530029296875, 3.54083251953125, 3.657135009765625, 3.7734375]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 16.0, 10.0, 8.0, 9.0, 23.0, 25.0, 34.0, 47.0, 70.0, 83.0, 102.0, 122.0, 140.0, 186.0, 202.0, 269.0, 268.0, 301.0, 297.0, 304.0, 277.0, 255.0, 213.0, 180.0, 141.0, 109.0, 95.0, 69.0, 47.0, 41.0, 23.0, 27.0, 24.0, 18.0, 12.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3046875, -1.255645751953125, -1.20660400390625, -1.157562255859375, -1.1085205078125, -1.059478759765625, -1.01043701171875, -0.961395263671875, -0.912353515625, -0.863311767578125, -0.81427001953125, -0.765228271484375, -0.7161865234375, -0.667144775390625, -0.61810302734375, -0.569061279296875, -0.52001953125, -0.470977783203125, -0.42193603515625, -0.372894287109375, -0.3238525390625, -0.274810791015625, -0.22576904296875, -0.176727294921875, -0.127685546875, -0.078643798828125, -0.02960205078125, 0.019439697265625, 0.0684814453125, 0.117523193359375, 0.16656494140625, 0.215606689453125, 0.2646484375, 0.313690185546875, 0.36273193359375, 0.411773681640625, 0.4608154296875, 0.509857177734375, 0.55889892578125, 0.607940673828125, 0.656982421875, 0.706024169921875, 0.75506591796875, 0.804107666015625, 0.8531494140625, 0.902191162109375, 0.95123291015625, 1.000274658203125, 1.04931640625, 1.098358154296875, 1.14739990234375, 1.196441650390625, 1.2454833984375, 1.294525146484375, 1.34356689453125, 1.392608642578125, 1.441650390625, 1.490692138671875, 1.53973388671875, 1.588775634765625, 1.6378173828125, 1.686859130859375, 1.73590087890625, 1.784942626953125, 1.833984375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 4.0, 4.0, 3.0, 15.0, 11.0, 15.0, 17.0, 27.0, 31.0, 32.0, 46.0, 44.0, 53.0, 71.0, 78.0, 78.0, 74.0, 60.0, 65.0, 46.0, 43.0, 38.0, 21.0, 30.0, 17.0, 17.0, 13.0, 7.0, 6.0, 12.0, 3.0, 4.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.6329586505889893, -3.5007519721984863, -3.3685455322265625, -3.2363388538360596, -3.1041321754455566, -2.971925735473633, -2.83971905708313, -2.707512378692627, -2.575305938720703, -2.4430992603302, -2.3108928203582764, -2.1786861419677734, -2.0464797019958496, -1.9142730236053467, -1.7820663452148438, -1.6498597860336304, -1.517653226852417, -1.3854466676712036, -1.2532401084899902, -1.1210334300994873, -0.9888268709182739, -0.8566203117370605, -0.7244136929512024, -0.5922070741653442, -0.46000051498413086, -0.3277939260005951, -0.19558733701705933, -0.06338074803352356, 0.06882584095001221, 0.20103240013122559, 0.33323901891708374, 0.4654456377029419, 0.5976519584655762, 0.7298585176467896, 0.8620651364326477, 0.9942717552185059, 1.1264783143997192, 1.2586848735809326, 1.3908915519714355, 1.523098111152649, 1.6553046703338623, 1.7875112295150757, 1.919717788696289, 2.051924467086792, 2.184131145477295, 2.3163375854492188, 2.4485442638397217, 2.5807509422302246, 2.7129573822021484, 2.8451640605926514, 2.977370500564575, 3.109577178955078, 3.241783618927002, 3.373990297317505, 3.506196975708008, 3.6384034156799316, 3.7706100940704346, 3.9028167724609375, 4.035023212432861, 4.167229652404785, 4.299436569213867, 4.431643009185791, 4.563849449157715, 4.696056365966797, 4.828262805938721]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 7.0, 10.0, 11.0, 15.0, 10.0, 22.0, 15.0, 22.0, 39.0, 35.0, 34.0, 49.0, 42.0, 45.0, 46.0, 35.0, 45.0, 57.0, 42.0, 55.0, 44.0, 43.0, 35.0, 34.0, 38.0, 29.0, 30.0, 13.0, 20.0, 14.0, 14.0, 11.0, 10.0, 5.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.198182106018066, -4.0661492347717285, -3.9341166019439697, -3.802083969116211, -3.670051097869873, -3.5380184650421143, -3.4059858322143555, -3.2739529609680176, -3.141920328140259, -3.0098876953125, -2.877854824066162, -2.7458221912384033, -2.6137895584106445, -2.4817566871643066, -2.349724054336548, -2.217691421508789, -2.085658550262451, -1.9536257982254028, -1.8215930461883545, -1.6895604133605957, -1.5575276613235474, -1.425494909286499, -1.2934622764587402, -1.161429524421692, -1.0293967723846436, -0.8973640203475952, -0.7653313279151917, -0.6332986354827881, -0.5012658834457397, -0.3692331314086914, -0.23720043897628784, -0.10516774654388428, 0.026865482330322266, 0.15889820456504822, 0.29093092679977417, 0.4229636490345001, 0.5549963712692261, 0.6870291233062744, 0.819061815738678, 0.9510945081710815, 1.0831272602081299, 1.2151600122451782, 1.3471927642822266, 1.4792253971099854, 1.6112581491470337, 1.743290901184082, 1.8753235340118408, 2.0073561668395996, 2.1393890380859375, 2.2714216709136963, 2.403454542160034, 2.535487174987793, 2.667520046234131, 2.7995526790618896, 2.9315853118896484, 3.0636181831359863, 3.195650815963745, 3.327683448791504, 3.459716320037842, 3.5917489528656006, 3.7237815856933594, 3.8558144569396973, 3.987847089767456, 4.119879722595215, 4.251912593841553]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 9.0, 11.0, 19.0, 21.0, 25.0, 49.0, 93.0, 113.0, 189.0, 264.0, 481.0, 716.0, 1315.0, 2062.0, 3653.0, 6023.0, 10488.0, 19427.0, 36711.0, 75394.0, 182837.0, 359913.0, 188353.0, 77348.0, 37131.0, 19537.0, 11038.0, 6268.0, 3600.0, 2138.0, 1294.0, 758.0, 477.0, 288.0, 148.0, 113.0, 81.0, 60.0, 38.0, 28.0, 16.0, 6.0, 13.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4296875, -1.3843231201171875, -1.338958740234375, -1.2935943603515625, -1.24822998046875, -1.2028656005859375, -1.157501220703125, -1.1121368408203125, -1.0667724609375, -1.0214080810546875, -0.976043701171875, -0.9306793212890625, -0.88531494140625, -0.8399505615234375, -0.794586181640625, -0.7492218017578125, -0.703857421875, -0.6584930419921875, -0.613128662109375, -0.5677642822265625, -0.52239990234375, -0.4770355224609375, -0.431671142578125, -0.3863067626953125, -0.3409423828125, -0.2955780029296875, -0.250213623046875, -0.2048492431640625, -0.15948486328125, -0.1141204833984375, -0.068756103515625, -0.0233917236328125, 0.02197265625, 0.0673370361328125, 0.112701416015625, 0.1580657958984375, 0.20343017578125, 0.2487945556640625, 0.294158935546875, 0.3395233154296875, 0.3848876953125, 0.4302520751953125, 0.475616455078125, 0.5209808349609375, 0.56634521484375, 0.6117095947265625, 0.657073974609375, 0.7024383544921875, 0.747802734375, 0.7931671142578125, 0.838531494140625, 0.8838958740234375, 0.92926025390625, 0.9746246337890625, 1.019989013671875, 1.0653533935546875, 1.1107177734375, 1.1560821533203125, 1.201446533203125, 1.2468109130859375, 1.29217529296875, 1.3375396728515625, 1.382904052734375, 1.4282684326171875, 1.4736328125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 5.0, 4.0, 10.0, 8.0, 9.0, 20.0, 16.0, 14.0, 18.0, 23.0, 24.0, 37.0, 34.0, 55.0, 49.0, 40.0, 50.0, 49.0, 42.0, 42.0, 49.0, 45.0, 40.0, 42.0, 31.0, 39.0, 30.0, 30.0, 23.0, 28.0, 22.0, 18.0, 9.0, 8.0, 11.0, 7.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.08984375, -3.9580078125, -3.826171875, -3.6943359375, -3.5625, -3.4306640625, -3.298828125, -3.1669921875, -3.03515625, -2.9033203125, -2.771484375, -2.6396484375, -2.5078125, -2.3759765625, -2.244140625, -2.1123046875, -1.98046875, -1.8486328125, -1.716796875, -1.5849609375, -1.453125, -1.3212890625, -1.189453125, -1.0576171875, -0.92578125, -0.7939453125, -0.662109375, -0.5302734375, -0.3984375, -0.2666015625, -0.134765625, -0.0029296875, 0.12890625, 0.2607421875, 0.392578125, 0.5244140625, 0.65625, 0.7880859375, 0.919921875, 1.0517578125, 1.18359375, 1.3154296875, 1.447265625, 1.5791015625, 1.7109375, 1.8427734375, 1.974609375, 2.1064453125, 2.23828125, 2.3701171875, 2.501953125, 2.6337890625, 2.765625, 2.8974609375, 3.029296875, 3.1611328125, 3.29296875, 3.4248046875, 3.556640625, 3.6884765625, 3.8203125, 3.9521484375, 4.083984375, 4.2158203125, 4.34765625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 5.0, 9.0, 6.0, 4.0, 10.0, 16.0, 16.0, 23.0, 32.0, 34.0, 51.0, 55.0, 96.0, 109.0, 144.0, 204.0, 285.0, 393.0, 620.0, 951.0, 1555.0, 2819.0, 6120.0, 15416.0, 51171.0, 914179.0, 32509.0, 10952.0, 4573.0, 2258.0, 1282.0, 732.0, 539.0, 365.0, 253.0, 185.0, 155.0, 94.0, 71.0, 53.0, 62.0, 27.0, 25.0, 30.0, 16.0, 19.0, 9.0, 3.0, 3.0, 7.0, 2.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-3.34765625, -3.240814208984375, -3.13397216796875, -3.027130126953125, -2.9202880859375, -2.813446044921875, -2.70660400390625, -2.599761962890625, -2.492919921875, -2.386077880859375, -2.27923583984375, -2.172393798828125, -2.0655517578125, -1.958709716796875, -1.85186767578125, -1.745025634765625, -1.63818359375, -1.531341552734375, -1.42449951171875, -1.317657470703125, -1.2108154296875, -1.103973388671875, -0.99713134765625, -0.890289306640625, -0.783447265625, -0.676605224609375, -0.56976318359375, -0.462921142578125, -0.3560791015625, -0.249237060546875, -0.14239501953125, -0.035552978515625, 0.0712890625, 0.178131103515625, 0.28497314453125, 0.391815185546875, 0.4986572265625, 0.605499267578125, 0.71234130859375, 0.819183349609375, 0.926025390625, 1.032867431640625, 1.13970947265625, 1.246551513671875, 1.3533935546875, 1.460235595703125, 1.56707763671875, 1.673919677734375, 1.78076171875, 1.887603759765625, 1.99444580078125, 2.101287841796875, 2.2081298828125, 2.314971923828125, 2.42181396484375, 2.528656005859375, 2.635498046875, 2.742340087890625, 2.84918212890625, 2.956024169921875, 3.0628662109375, 3.169708251953125, 3.27655029296875, 3.383392333984375, 3.490234375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 8.0, 5.0, 9.0, 7.0, 11.0, 22.0, 13.0, 16.0, 24.0, 22.0, 28.0, 25.0, 32.0, 40.0, 39.0, 47.0, 38.0, 40.0, 36.0, 46.0, 51.0, 39.0, 52.0, 41.0, 47.0, 35.0, 27.0, 35.0, 28.0, 18.0, 17.0, 19.0, 10.0, 14.0, 17.0, 9.0, 7.0, 11.0, 3.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.85546875, -2.777618408203125, -2.69976806640625, -2.621917724609375, -2.5440673828125, -2.466217041015625, -2.38836669921875, -2.310516357421875, -2.232666015625, -2.154815673828125, -2.07696533203125, -1.999114990234375, -1.9212646484375, -1.843414306640625, -1.76556396484375, -1.687713623046875, -1.60986328125, -1.532012939453125, -1.45416259765625, -1.376312255859375, -1.2984619140625, -1.220611572265625, -1.14276123046875, -1.064910888671875, -0.987060546875, -0.909210205078125, -0.83135986328125, -0.753509521484375, -0.6756591796875, -0.597808837890625, -0.51995849609375, -0.442108154296875, -0.3642578125, -0.286407470703125, -0.20855712890625, -0.130706787109375, -0.0528564453125, 0.024993896484375, 0.10284423828125, 0.180694580078125, 0.258544921875, 0.336395263671875, 0.41424560546875, 0.492095947265625, 0.5699462890625, 0.647796630859375, 0.72564697265625, 0.803497314453125, 0.88134765625, 0.959197998046875, 1.03704833984375, 1.114898681640625, 1.1927490234375, 1.270599365234375, 1.34844970703125, 1.426300048828125, 1.504150390625, 1.582000732421875, 1.65985107421875, 1.737701416015625, 1.8155517578125, 1.893402099609375, 1.97125244140625, 2.049102783203125, 2.126953125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 6.0, 2.0, 8.0, 10.0, 9.0, 8.0, 16.0, 27.0, 24.0, 34.0, 48.0, 80.0, 107.0, 133.0, 199.0, 297.0, 459.0, 757.0, 1414.0, 2561.0, 5400.0, 14289.0, 60554.0, 922603.0, 23615.0, 8041.0, 3442.0, 1731.0, 933.0, 566.0, 361.0, 239.0, 160.0, 128.0, 89.0, 58.0, 40.0, 28.0, 14.0, 19.0, 9.0, 11.0, 12.0, 9.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.2467041015625, -0.2392749786376953, -0.23184585571289062, -0.22441673278808594, -0.21698760986328125, -0.20955848693847656, -0.20212936401367188, -0.1947002410888672, -0.1872711181640625, -0.1798419952392578, -0.17241287231445312, -0.16498374938964844, -0.15755462646484375, -0.15012550354003906, -0.14269638061523438, -0.1352672576904297, -0.127838134765625, -0.12040901184082031, -0.11297988891601562, -0.10555076599121094, -0.09812164306640625, -0.09069252014160156, -0.08326339721679688, -0.07583427429199219, -0.0684051513671875, -0.06097602844238281, -0.053546905517578125, -0.04611778259277344, -0.03868865966796875, -0.03125953674316406, -0.023830413818359375, -0.016401290893554688, -0.00897216796875, -0.0015430450439453125, 0.005886077880859375, 0.013315200805664062, 0.02074432373046875, 0.028173446655273438, 0.035602569580078125, 0.04303169250488281, 0.0504608154296875, 0.05788993835449219, 0.06531906127929688, 0.07274818420410156, 0.08017730712890625, 0.08760643005371094, 0.09503555297851562, 0.10246467590332031, 0.109893798828125, 0.11732292175292969, 0.12475204467773438, 0.13218116760253906, 0.13961029052734375, 0.14703941345214844, 0.15446853637695312, 0.1618976593017578, 0.1693267822265625, 0.1767559051513672, 0.18418502807617188, 0.19161415100097656, 0.19904327392578125, 0.20647239685058594, 0.21390151977539062, 0.2213306427001953, 0.228759765625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 6.0, 8.0, 6.0, 2.0, 8.0, 13.0, 16.0, 11.0, 24.0, 24.0, 24.0, 55.0, 44.0, 47.0, 53.0, 52.0, 50.0, 61.0, 64.0, 58.0, 61.0, 60.0, 45.0, 45.0, 39.0, 29.0, 26.0, 19.0, 19.0, 8.0, 10.0, 8.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4955482482910156e-05, -5.3402967751026154e-05, -5.185045301914215e-05, -5.029793828725815e-05, -4.8745423555374146e-05, -4.719290882349014e-05, -4.564039409160614e-05, -4.408787935972214e-05, -4.2535364627838135e-05, -4.098284989595413e-05, -3.943033516407013e-05, -3.787782043218613e-05, -3.6325305700302124e-05, -3.477279096841812e-05, -3.322027623653412e-05, -3.1667761504650116e-05, -3.0115246772766113e-05, -2.856273204088211e-05, -2.7010217308998108e-05, -2.5457702577114105e-05, -2.3905187845230103e-05, -2.23526731133461e-05, -2.0800158381462097e-05, -1.9247643649578094e-05, -1.7695128917694092e-05, -1.614261418581009e-05, -1.4590099453926086e-05, -1.3037584722042084e-05, -1.1485069990158081e-05, -9.932555258274078e-06, -8.380040526390076e-06, -6.827525794506073e-06, -5.27501106262207e-06, -3.7224963307380676e-06, -2.169981598854065e-06, -6.174668669700623e-07, 9.350478649139404e-07, 2.487562596797943e-06, 4.040077328681946e-06, 5.5925920605659485e-06, 7.145106792449951e-06, 8.697621524333954e-06, 1.0250136256217957e-05, 1.180265098810196e-05, 1.3355165719985962e-05, 1.4907680451869965e-05, 1.6460195183753967e-05, 1.801270991563797e-05, 1.9565224647521973e-05, 2.1117739379405975e-05, 2.2670254111289978e-05, 2.422276884317398e-05, 2.5775283575057983e-05, 2.7327798306941986e-05, 2.888031303882599e-05, 3.043282777070999e-05, 3.1985342502593994e-05, 3.3537857234478e-05, 3.5090371966362e-05, 3.6642886698246e-05, 3.8195401430130005e-05, 3.974791616201401e-05, 4.130043089389801e-05, 4.285294562578201e-05, 4.4405460357666016e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 17.0, 15.0, 22.0, 54.0, 69.0, 105.0, 171.0, 203.0, 339.0, 514.0, 804.0, 1157.0, 1694.0, 2557.0, 3951.0, 6086.0, 9963.0, 16797.0, 30300.0, 62658.0, 154467.0, 376499.0, 210909.0, 80511.0, 36858.0, 20073.0, 11600.0, 7047.0, 4388.0, 3076.0, 1855.0, 1204.0, 808.0, 597.0, 378.0, 265.0, 179.0, 118.0, 62.0, 52.0, 45.0, 30.0, 17.0, 11.0, 7.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.09222412109375, -0.08939933776855469, -0.08657455444335938, -0.08374977111816406, -0.08092498779296875, -0.07810020446777344, -0.07527542114257812, -0.07245063781738281, -0.0696258544921875, -0.06680107116699219, -0.06397628784179688, -0.06115150451660156, -0.05832672119140625, -0.05550193786621094, -0.052677154541015625, -0.04985237121582031, -0.047027587890625, -0.04420280456542969, -0.041378021240234375, -0.03855323791503906, -0.03572845458984375, -0.03290367126464844, -0.030078887939453125, -0.027254104614257812, -0.0244293212890625, -0.021604537963867188, -0.018779754638671875, -0.015954971313476562, -0.01313018798828125, -0.010305404663085938, -0.007480621337890625, -0.0046558380126953125, -0.0018310546875, 0.0009937286376953125, 0.003818511962890625, 0.0066432952880859375, 0.00946807861328125, 0.012292861938476562, 0.015117645263671875, 0.017942428588867188, 0.0207672119140625, 0.023591995239257812, 0.026416778564453125, 0.029241561889648438, 0.03206634521484375, 0.03489112854003906, 0.037715911865234375, 0.04054069519042969, 0.043365478515625, 0.04619026184082031, 0.049015045166015625, 0.05183982849121094, 0.05466461181640625, 0.05748939514160156, 0.060314178466796875, 0.06313896179199219, 0.0659637451171875, 0.06878852844238281, 0.07161331176757812, 0.07443809509277344, 0.07726287841796875, 0.08008766174316406, 0.08291244506835938, 0.08573722839355469, 0.08856201171875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 3.0, 8.0, 6.0, 8.0, 16.0, 15.0, 25.0, 35.0, 29.0, 38.0, 69.0, 79.0, 123.0, 125.0, 90.0, 77.0, 59.0, 37.0, 24.0, 23.0, 18.0, 14.0, 8.0, 8.0, 4.0, 8.0, 11.0, 5.0, 2.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0284423828125, -0.027662038803100586, -0.026881694793701172, -0.026101350784301758, -0.025321006774902344, -0.02454066276550293, -0.023760318756103516, -0.0229799747467041, -0.022199630737304688, -0.021419286727905273, -0.02063894271850586, -0.019858598709106445, -0.01907825469970703, -0.018297910690307617, -0.017517566680908203, -0.01673722267150879, -0.015956878662109375, -0.015176534652709961, -0.014396190643310547, -0.013615846633911133, -0.012835502624511719, -0.012055158615112305, -0.01127481460571289, -0.010494470596313477, -0.009714126586914062, -0.008933782577514648, -0.008153438568115234, -0.00737309455871582, -0.006592750549316406, -0.005812406539916992, -0.005032062530517578, -0.004251718521118164, -0.00347137451171875, -0.002691030502319336, -0.0019106864929199219, -0.0011303424835205078, -0.00034999847412109375, 0.0004303455352783203, 0.0012106895446777344, 0.0019910335540771484, 0.0027713775634765625, 0.0035517215728759766, 0.004332065582275391, 0.005112409591674805, 0.005892753601074219, 0.006673097610473633, 0.007453441619873047, 0.008233785629272461, 0.009014129638671875, 0.009794473648071289, 0.010574817657470703, 0.011355161666870117, 0.012135505676269531, 0.012915849685668945, 0.01369619369506836, 0.014476537704467773, 0.015256881713867188, 0.0160372257232666, 0.016817569732666016, 0.01759791374206543, 0.018378257751464844, 0.019158601760864258, 0.019938945770263672, 0.020719289779663086, 0.0214996337890625]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 4.0, 4.0, 2.0, 11.0, 11.0, 12.0, 11.0, 24.0, 28.0, 36.0, 34.0, 44.0, 43.0, 65.0, 72.0, 86.0, 71.0, 63.0, 64.0, 50.0, 50.0, 53.0, 25.0, 21.0, 27.0, 20.0, 17.0, 7.0, 4.0, 12.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.549168586730957, -3.4183619022369385, -3.287554979324341, -3.1567482948303223, -3.0259413719177246, -2.895134687423706, -2.7643280029296875, -2.63352108001709, -2.5027143955230713, -2.3719077110290527, -2.241100788116455, -2.1102941036224365, -1.9794872999191284, -1.8486804962158203, -1.7178738117218018, -1.5870670080184937, -1.4562602043151855, -1.3254534006118774, -1.1946465969085693, -1.0638399124145508, -0.9330331087112427, -0.8022263050079346, -0.6714195609092712, -0.5406128168106079, -0.4098060131072998, -0.2789992392063141, -0.14819246530532837, -0.01738569140434265, 0.11342108249664307, 0.24422788619995117, 0.3750346302986145, 0.5058413743972778, 0.6366481781005859, 0.767454981803894, 0.8982617259025574, 1.0290684700012207, 1.1598752737045288, 1.290682077407837, 1.4214887619018555, 1.5522955656051636, 1.6831023693084717, 1.8139091730117798, 1.944715976715088, 2.0755226612091064, 2.206329345703125, 2.3371362686157227, 2.467942953109741, 2.5987496376037598, 2.7295565605163574, 2.860363245010376, 2.9911701679229736, 3.121976852416992, 3.25278377532959, 3.3835904598236084, 3.514397144317627, 3.6452040672302246, 3.776010751724243, 3.9068174362182617, 4.037624359130859, 4.168431282043457, 4.2992377281188965, 4.430044651031494, 4.560851573944092, 4.691658020019531, 4.822464942932129]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 7.0, 5.0, 10.0, 11.0, 15.0, 10.0, 23.0, 13.0, 25.0, 38.0, 34.0, 37.0, 51.0, 40.0, 45.0, 44.0, 36.0, 46.0, 58.0, 40.0, 57.0, 40.0, 43.0, 38.0, 31.0, 41.0, 28.0, 28.0, 13.0, 21.0, 13.0, 16.0, 9.0, 10.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.18418025970459, -4.053008556365967, -3.9218368530273438, -3.7906653881073, -3.6594936847686768, -3.5283219814300537, -3.3971505165100098, -3.2659788131713867, -3.1348071098327637, -3.0036354064941406, -2.8724637031555176, -2.7412922382354736, -2.6101205348968506, -2.4789488315582275, -2.3477773666381836, -2.2166056632995605, -2.0854339599609375, -1.9542622566223145, -1.823090672492981, -1.6919190883636475, -1.5607473850250244, -1.4295756816864014, -1.2984040975570679, -1.1672325134277344, -1.0360608100891113, -0.9048891663551331, -0.7737175226211548, -0.6425458788871765, -0.5113742351531982, -0.38020259141921997, -0.2490309476852417, -0.11785930395126343, 0.01331186294555664, 0.1444835066795349, 0.2756551504135132, 0.40682679414749146, 0.5379984378814697, 0.669170081615448, 0.8003417253494263, 0.9315133690834045, 1.0626850128173828, 1.1938567161560059, 1.3250283002853394, 1.4561998844146729, 1.587371587753296, 1.718543291091919, 1.8497148752212524, 1.980886459350586, 2.112058162689209, 2.243229866027832, 2.374401569366455, 2.505573034286499, 2.636744737625122, 2.767916440963745, 2.899087905883789, 3.030259609222412, 3.161431312561035, 3.292603015899658, 3.4237747192382812, 3.554946184158325, 3.6861178874969482, 3.8172895908355713, 3.9484610557556152, 4.079632759094238, 4.210804462432861]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 13.0, 19.0, 23.0, 45.0, 54.0, 93.0, 133.0, 219.0, 327.0, 493.0, 736.0, 1214.0, 1845.0, 3058.0, 5051.0, 8420.0, 14348.0, 25895.0, 46615.0, 83509.0, 139966.0, 195884.0, 195146.0, 137504.0, 81593.0, 45362.0, 25267.0, 14240.0, 8229.0, 4999.0, 3028.0, 1847.0, 1186.0, 801.0, 490.0, 310.0, 175.0, 135.0, 97.0, 75.0, 35.0, 25.0, 18.0, 13.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.470703125, -3.3621826171875, -3.253662109375, -3.1451416015625, -3.03662109375, -2.9281005859375, -2.819580078125, -2.7110595703125, -2.6025390625, -2.4940185546875, -2.385498046875, -2.2769775390625, -2.16845703125, -2.0599365234375, -1.951416015625, -1.8428955078125, -1.734375, -1.6258544921875, -1.517333984375, -1.4088134765625, -1.30029296875, -1.1917724609375, -1.083251953125, -0.9747314453125, -0.8662109375, -0.7576904296875, -0.649169921875, -0.5406494140625, -0.43212890625, -0.3236083984375, -0.215087890625, -0.1065673828125, 0.001953125, 0.1104736328125, 0.218994140625, 0.3275146484375, 0.43603515625, 0.5445556640625, 0.653076171875, 0.7615966796875, 0.8701171875, 0.9786376953125, 1.087158203125, 1.1956787109375, 1.30419921875, 1.4127197265625, 1.521240234375, 1.6297607421875, 1.73828125, 1.8468017578125, 1.955322265625, 2.0638427734375, 2.17236328125, 2.2808837890625, 2.389404296875, 2.4979248046875, 2.6064453125, 2.7149658203125, 2.823486328125, 2.9320068359375, 3.04052734375, 3.1490478515625, 3.257568359375, 3.3660888671875, 3.474609375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 6.0, 7.0, 12.0, 17.0, 18.0, 18.0, 20.0, 26.0, 27.0, 40.0, 40.0, 46.0, 65.0, 43.0, 59.0, 49.0, 41.0, 65.0, 53.0, 44.0, 43.0, 48.0, 41.0, 41.0, 21.0, 23.0, 18.0, 12.0, 19.0, 15.0, 7.0, 4.0, 6.0, 4.0, 1.0, 3.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.43359375, -4.28668212890625, -4.1397705078125, -3.99285888671875, -3.845947265625, -3.69903564453125, -3.5521240234375, -3.40521240234375, -3.25830078125, -3.11138916015625, -2.9644775390625, -2.81756591796875, -2.670654296875, -2.52374267578125, -2.3768310546875, -2.22991943359375, -2.0830078125, -1.93609619140625, -1.7891845703125, -1.64227294921875, -1.495361328125, -1.34844970703125, -1.2015380859375, -1.05462646484375, -0.90771484375, -0.76080322265625, -0.6138916015625, -0.46697998046875, -0.320068359375, -0.17315673828125, -0.0262451171875, 0.12066650390625, 0.267578125, 0.41448974609375, 0.5614013671875, 0.70831298828125, 0.855224609375, 1.00213623046875, 1.1490478515625, 1.29595947265625, 1.44287109375, 1.58978271484375, 1.7366943359375, 1.88360595703125, 2.030517578125, 2.17742919921875, 2.3243408203125, 2.47125244140625, 2.6181640625, 2.76507568359375, 2.9119873046875, 3.05889892578125, 3.205810546875, 3.35272216796875, 3.4996337890625, 3.64654541015625, 3.79345703125, 3.94036865234375, 4.0872802734375, 4.23419189453125, 4.381103515625, 4.52801513671875, 4.6749267578125, 4.82183837890625, 4.96875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 6.0, 13.0, 21.0, 22.0, 36.0, 45.0, 79.0, 117.0, 163.0, 244.0, 382.0, 525.0, 924.0, 1307.0, 1959.0, 3105.0, 4888.0, 7565.0, 12023.0, 19177.0, 31103.0, 50224.0, 79964.0, 119022.0, 156363.0, 164668.0, 136179.0, 95232.0, 60940.0, 38218.0, 23481.0, 14738.0, 9183.0, 5922.0, 3822.0, 2287.0, 1502.0, 1013.0, 699.0, 478.0, 325.0, 206.0, 133.0, 78.0, 63.0, 43.0, 27.0, 16.0, 11.0, 6.0, 3.0, 5.0, 4.0, 0.0, 1.0, 2.0, 2.0], "bins": [-2.705078125, -2.62109375, -2.537109375, -2.453125, -2.369140625, -2.28515625, -2.201171875, -2.1171875, -2.033203125, -1.94921875, -1.865234375, -1.78125, -1.697265625, -1.61328125, -1.529296875, -1.4453125, -1.361328125, -1.27734375, -1.193359375, -1.109375, -1.025390625, -0.94140625, -0.857421875, -0.7734375, -0.689453125, -0.60546875, -0.521484375, -0.4375, -0.353515625, -0.26953125, -0.185546875, -0.1015625, -0.017578125, 0.06640625, 0.150390625, 0.234375, 0.318359375, 0.40234375, 0.486328125, 0.5703125, 0.654296875, 0.73828125, 0.822265625, 0.90625, 0.990234375, 1.07421875, 1.158203125, 1.2421875, 1.326171875, 1.41015625, 1.494140625, 1.578125, 1.662109375, 1.74609375, 1.830078125, 1.9140625, 1.998046875, 2.08203125, 2.166015625, 2.25, 2.333984375, 2.41796875, 2.501953125, 2.5859375, 2.669921875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 4.0, 6.0, 5.0, 5.0, 7.0, 5.0, 11.0, 18.0, 9.0, 20.0, 23.0, 20.0, 14.0, 26.0, 24.0, 29.0, 30.0, 31.0, 35.0, 43.0, 40.0, 44.0, 35.0, 39.0, 51.0, 41.0, 35.0, 43.0, 29.0, 33.0, 38.0, 20.0, 32.0, 22.0, 20.0, 26.0, 16.0, 18.0, 16.0, 9.0, 9.0, 4.0, 4.0, 3.0, 4.0, 2.0, 5.0, 0.0, 5.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.111328125, -2.049560546875, -1.98779296875, -1.926025390625, -1.8642578125, -1.802490234375, -1.74072265625, -1.678955078125, -1.6171875, -1.555419921875, -1.49365234375, -1.431884765625, -1.3701171875, -1.308349609375, -1.24658203125, -1.184814453125, -1.123046875, -1.061279296875, -0.99951171875, -0.937744140625, -0.8759765625, -0.814208984375, -0.75244140625, -0.690673828125, -0.62890625, -0.567138671875, -0.50537109375, -0.443603515625, -0.3818359375, -0.320068359375, -0.25830078125, -0.196533203125, -0.134765625, -0.072998046875, -0.01123046875, 0.050537109375, 0.1123046875, 0.174072265625, 0.23583984375, 0.297607421875, 0.359375, 0.421142578125, 0.48291015625, 0.544677734375, 0.6064453125, 0.668212890625, 0.72998046875, 0.791748046875, 0.853515625, 0.915283203125, 0.97705078125, 1.038818359375, 1.1005859375, 1.162353515625, 1.22412109375, 1.285888671875, 1.34765625, 1.409423828125, 1.47119140625, 1.532958984375, 1.5947265625, 1.656494140625, 1.71826171875, 1.780029296875, 1.841796875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 9.0, 12.0, 17.0, 26.0, 40.0, 71.0, 81.0, 123.0, 157.0, 305.0, 452.0, 682.0, 1224.0, 1946.0, 3122.0, 5376.0, 9378.0, 16478.0, 28922.0, 50621.0, 86513.0, 136573.0, 182109.0, 182378.0, 136732.0, 85814.0, 50502.0, 29197.0, 16482.0, 9421.0, 5526.0, 3268.0, 1884.0, 1152.0, 732.0, 460.0, 261.0, 175.0, 118.0, 77.0, 46.0, 36.0, 20.0, 16.0, 10.0, 4.0, 3.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88037109375, -0.8500137329101562, -0.8196563720703125, -0.7892990112304688, -0.758941650390625, -0.7285842895507812, -0.6982269287109375, -0.6678695678710938, -0.63751220703125, -0.6071548461914062, -0.5767974853515625, -0.5464401245117188, -0.516082763671875, -0.48572540283203125, -0.4553680419921875, -0.42501068115234375, -0.3946533203125, -0.36429595947265625, -0.3339385986328125, -0.30358123779296875, -0.273223876953125, -0.24286651611328125, -0.2125091552734375, -0.18215179443359375, -0.15179443359375, -0.12143707275390625, -0.0910797119140625, -0.06072235107421875, -0.030364990234375, -7.62939453125e-06, 0.0303497314453125, 0.06070709228515625, 0.091064453125, 0.12142181396484375, 0.1517791748046875, 0.18213653564453125, 0.212493896484375, 0.24285125732421875, 0.2732086181640625, 0.30356597900390625, 0.33392333984375, 0.36428070068359375, 0.3946380615234375, 0.42499542236328125, 0.455352783203125, 0.48571014404296875, 0.5160675048828125, 0.5464248657226562, 0.5767822265625, 0.6071395874023438, 0.6374969482421875, 0.6678543090820312, 0.698211669921875, 0.7285690307617188, 0.7589263916015625, 0.7892837524414062, 0.81964111328125, 0.8499984741210938, 0.8803558349609375, 0.9107131958007812, 0.941070556640625, 0.9714279174804688, 1.0017852783203125, 1.0321426391601562, 1.0625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 9.0, 6.0, 10.0, 9.0, 16.0, 24.0, 21.0, 26.0, 28.0, 30.0, 38.0, 31.0, 44.0, 51.0, 47.0, 65.0, 56.0, 59.0, 60.0, 50.0, 39.0, 38.0, 43.0, 32.0, 26.0, 25.0, 9.0, 21.0, 13.0, 12.0, 11.0, 6.0, 6.0, 1.0, 4.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.42538070678711e-05, -6.224215030670166e-05, -6.0230493545532227e-05, -5.821883678436279e-05, -5.620718002319336e-05, -5.4195523262023926e-05, -5.218386650085449e-05, -5.017220973968506e-05, -4.8160552978515625e-05, -4.614889621734619e-05, -4.413723945617676e-05, -4.2125582695007324e-05, -4.011392593383789e-05, -3.810226917266846e-05, -3.6090612411499023e-05, -3.407895565032959e-05, -3.2067298889160156e-05, -3.0055642127990723e-05, -2.804398536682129e-05, -2.6032328605651855e-05, -2.4020671844482422e-05, -2.2009015083312988e-05, -1.9997358322143555e-05, -1.798570156097412e-05, -1.5974044799804688e-05, -1.3962388038635254e-05, -1.195073127746582e-05, -9.939074516296387e-06, -7.927417755126953e-06, -5.9157609939575195e-06, -3.904104232788086e-06, -1.8924474716186523e-06, 1.1920928955078125e-07, 2.130866050720215e-06, 4.1425228118896484e-06, 6.154179573059082e-06, 8.165836334228516e-06, 1.017749309539795e-05, 1.2189149856567383e-05, 1.4200806617736816e-05, 1.621246337890625e-05, 1.8224120140075684e-05, 2.0235776901245117e-05, 2.224743366241455e-05, 2.4259090423583984e-05, 2.6270747184753418e-05, 2.828240394592285e-05, 3.0294060707092285e-05, 3.230571746826172e-05, 3.431737422943115e-05, 3.6329030990600586e-05, 3.834068775177002e-05, 4.035234451293945e-05, 4.236400127410889e-05, 4.437565803527832e-05, 4.6387314796447754e-05, 4.839897155761719e-05, 5.041062831878662e-05, 5.2422285079956055e-05, 5.443394184112549e-05, 5.644559860229492e-05, 5.8457255363464355e-05, 6.046891212463379e-05, 6.248056888580322e-05, 6.449222564697266e-05]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 7.0, 13.0, 12.0, 19.0, 36.0, 45.0, 60.0, 120.0, 180.0, 251.0, 421.0, 813.0, 1370.0, 2627.0, 4753.0, 9108.0, 17383.0, 32493.0, 62153.0, 113688.0, 186185.0, 222786.0, 173389.0, 102860.0, 55369.0, 29206.0, 15303.0, 8134.0, 4269.0, 2365.0, 1231.0, 759.0, 423.0, 263.0, 153.0, 105.0, 66.0, 31.0, 35.0, 20.0, 14.0, 10.0, 6.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0849609375, -1.049285888671875, -1.01361083984375, -0.977935791015625, -0.9422607421875, -0.906585693359375, -0.87091064453125, -0.835235595703125, -0.799560546875, -0.763885498046875, -0.72821044921875, -0.692535400390625, -0.6568603515625, -0.621185302734375, -0.58551025390625, -0.549835205078125, -0.51416015625, -0.478485107421875, -0.44281005859375, -0.407135009765625, -0.3714599609375, -0.335784912109375, -0.30010986328125, -0.264434814453125, -0.228759765625, -0.193084716796875, -0.15740966796875, -0.121734619140625, -0.0860595703125, -0.050384521484375, -0.01470947265625, 0.020965576171875, 0.056640625, 0.092315673828125, 0.12799072265625, 0.163665771484375, 0.1993408203125, 0.235015869140625, 0.27069091796875, 0.306365966796875, 0.342041015625, 0.377716064453125, 0.41339111328125, 0.449066162109375, 0.4847412109375, 0.520416259765625, 0.55609130859375, 0.591766357421875, 0.62744140625, 0.663116455078125, 0.69879150390625, 0.734466552734375, 0.7701416015625, 0.805816650390625, 0.84149169921875, 0.877166748046875, 0.912841796875, 0.948516845703125, 0.98419189453125, 1.019866943359375, 1.0555419921875, 1.091217041015625, 1.12689208984375, 1.162567138671875, 1.1982421875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 8.0, 6.0, 7.0, 7.0, 17.0, 16.0, 22.0, 28.0, 26.0, 27.0, 48.0, 55.0, 50.0, 64.0, 63.0, 62.0, 66.0, 84.0, 56.0, 48.0, 41.0, 46.0, 29.0, 23.0, 23.0, 23.0, 17.0, 12.0, 3.0, 8.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.406982421875, -0.39514923095703125, -0.3833160400390625, -0.37148284912109375, -0.359649658203125, -0.34781646728515625, -0.3359832763671875, -0.32415008544921875, -0.31231689453125, -0.30048370361328125, -0.2886505126953125, -0.27681732177734375, -0.264984130859375, -0.25315093994140625, -0.2413177490234375, -0.22948455810546875, -0.2176513671875, -0.20581817626953125, -0.1939849853515625, -0.18215179443359375, -0.170318603515625, -0.15848541259765625, -0.1466522216796875, -0.13481903076171875, -0.12298583984375, -0.11115264892578125, -0.0993194580078125, -0.08748626708984375, -0.075653076171875, -0.06381988525390625, -0.0519866943359375, -0.04015350341796875, -0.0283203125, -0.01648712158203125, -0.0046539306640625, 0.00717926025390625, 0.019012451171875, 0.03084564208984375, 0.0426788330078125, 0.05451202392578125, 0.06634521484375, 0.07817840576171875, 0.0900115966796875, 0.10184478759765625, 0.113677978515625, 0.12551116943359375, 0.1373443603515625, 0.14917755126953125, 0.1610107421875, 0.17284393310546875, 0.1846771240234375, 0.19651031494140625, 0.208343505859375, 0.22017669677734375, 0.2320098876953125, 0.24384307861328125, 0.25567626953125, 0.26750946044921875, 0.2793426513671875, 0.29117584228515625, 0.303009033203125, 0.31484222412109375, 0.3266754150390625, 0.33850860595703125, 0.350341796875]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 8.0, 5.0, 3.0, 5.0, 6.0, 8.0, 15.0, 13.0, 16.0, 33.0, 32.0, 35.0, 50.0, 60.0, 66.0, 81.0, 80.0, 70.0, 67.0, 77.0, 61.0, 47.0, 41.0, 21.0, 22.0, 18.0, 20.0, 14.0, 3.0, 7.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.549464464187622, -3.405575752258301, -3.2616870403289795, -3.117798328399658, -2.973909616470337, -2.8300209045410156, -2.6861319541931152, -2.542243480682373, -2.3983545303344727, -2.2544658184051514, -2.11057710647583, -1.9666883945465088, -1.8227996826171875, -1.6789109706878662, -1.5350221395492554, -1.391133427619934, -1.2472448348999023, -1.103356122970581, -0.9594674110412598, -0.8155786395072937, -0.6716899275779724, -0.5278012156486511, -0.38391244411468506, -0.24002373218536377, -0.09613502025604248, 0.04775370657444, 0.19164243340492249, 0.33553117513656616, 0.47941988706588745, 0.6233085989952087, 0.7671973705291748, 0.9110860824584961, 1.0549745559692383, 1.1988632678985596, 1.3427519798278809, 1.4866406917572021, 1.6305294036865234, 1.7744181156158447, 1.9183069467544556, 2.0621957778930664, 2.2060842514038086, 2.34997296333313, 2.493861675262451, 2.6377503871917725, 2.7816390991210938, 2.925527811050415, 3.0694165229797363, 3.2133054733276367, 3.357194185256958, 3.5010828971862793, 3.6449716091156006, 3.788860321044922, 3.932749032974243, 4.0766377449035645, 4.220526695251465, 4.364415168762207, 4.508304119110107, 4.652193069458008, 4.79608154296875, 4.93997049331665, 5.083858966827393, 5.227747917175293, 5.371636390686035, 5.5155253410339355, 5.659413814544678]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 7.0, 5.0, 6.0, 6.0, 4.0, 8.0, 9.0, 19.0, 15.0, 17.0, 28.0, 20.0, 27.0, 30.0, 37.0, 31.0, 47.0, 41.0, 36.0, 38.0, 51.0, 44.0, 38.0, 42.0, 48.0, 46.0, 44.0, 45.0, 30.0, 34.0, 21.0, 30.0, 16.0, 16.0, 7.0, 12.0, 15.0, 8.0, 10.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.010634422302246, -3.8863394260406494, -3.7620444297790527, -3.637749195098877, -3.5134541988372803, -3.3891592025756836, -3.264864206314087, -3.1405692100524902, -3.0162739753723145, -2.8919789791107178, -2.767683982849121, -2.6433887481689453, -2.5190937519073486, -2.394798755645752, -2.2705037593841553, -2.1462087631225586, -2.021913766860962, -1.8976187705993652, -1.773323655128479, -1.6490286588668823, -1.524733543395996, -1.4004385471343994, -1.2761435508728027, -1.151848554611206, -1.0275534391403198, -0.9032583832740784, -0.7789633274078369, -0.6546683311462402, -0.5303732752799988, -0.4060782194137573, -0.28178322315216064, -0.1574881672859192, -0.033193349838256836, 0.09110169112682343, 0.2153967320919037, 0.33969175815582275, 0.4639868140220642, 0.5882818698883057, 0.7125768661499023, 0.8368719220161438, 0.9611669778823853, 1.085461974143982, 1.2097570896148682, 1.3340520858764648, 1.4583470821380615, 1.5826421976089478, 1.7069371938705444, 1.8312323093414307, 1.9555273056030273, 2.079822301864624, 2.2041172981262207, 2.3284125328063965, 2.452707529067993, 2.57700252532959, 2.7012975215911865, 2.825592517852783, 2.949887752532959, 3.0741827487945557, 3.1984777450561523, 3.322772979736328, 3.447067975997925, 3.5713629722595215, 3.695657968521118, 3.819952964782715, 3.9442479610443115]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 12.0, 8.0, 16.0, 19.0, 33.0, 42.0, 61.0, 59.0, 101.0, 145.0, 213.0, 276.0, 408.0, 627.0, 902.0, 1283.0, 2104.0, 3149.0, 5151.0, 8632.0, 14709.0, 27155.0, 51395.0, 105327.0, 234546.0, 555345.0, 1110823.0, 1088141.0, 540841.0, 227824.0, 102630.0, 50181.0, 25767.0, 14295.0, 8233.0, 5033.0, 3097.0, 1856.0, 1261.0, 796.0, 566.0, 375.0, 278.0, 174.0, 102.0, 87.0, 65.0, 42.0, 42.0, 18.0, 12.0, 17.0, 6.0, 5.0, 2.0, 3.0], "bins": [-4.890625, -4.75079345703125, -4.6109619140625, -4.47113037109375, -4.331298828125, -4.19146728515625, -4.0516357421875, -3.91180419921875, -3.77197265625, -3.63214111328125, -3.4923095703125, -3.35247802734375, -3.212646484375, -3.07281494140625, -2.9329833984375, -2.79315185546875, -2.6533203125, -2.51348876953125, -2.3736572265625, -2.23382568359375, -2.093994140625, -1.95416259765625, -1.8143310546875, -1.67449951171875, -1.53466796875, -1.39483642578125, -1.2550048828125, -1.11517333984375, -0.975341796875, -0.83551025390625, -0.6956787109375, -0.55584716796875, -0.416015625, -0.27618408203125, -0.1363525390625, 0.00347900390625, 0.143310546875, 0.28314208984375, 0.4229736328125, 0.56280517578125, 0.70263671875, 0.84246826171875, 0.9822998046875, 1.12213134765625, 1.261962890625, 1.40179443359375, 1.5416259765625, 1.68145751953125, 1.8212890625, 1.96112060546875, 2.1009521484375, 2.24078369140625, 2.380615234375, 2.52044677734375, 2.6602783203125, 2.80010986328125, 2.93994140625, 3.07977294921875, 3.2196044921875, 3.35943603515625, 3.499267578125, 3.63909912109375, 3.7789306640625, 3.91876220703125, 4.05859375]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 2.0, 3.0, 7.0, 5.0, 15.0, 15.0, 12.0, 22.0, 20.0, 26.0, 23.0, 28.0, 35.0, 29.0, 37.0, 37.0, 48.0, 48.0, 44.0, 36.0, 48.0, 39.0, 51.0, 38.0, 48.0, 44.0, 34.0, 34.0, 28.0, 18.0, 24.0, 17.0, 10.0, 14.0, 9.0, 8.0, 8.0, 10.0, 7.0, 5.0, 4.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.814453125, -2.72857666015625, -2.6427001953125, -2.55682373046875, -2.470947265625, -2.38507080078125, -2.2991943359375, -2.21331787109375, -2.12744140625, -2.04156494140625, -1.9556884765625, -1.86981201171875, -1.783935546875, -1.69805908203125, -1.6121826171875, -1.52630615234375, -1.4404296875, -1.35455322265625, -1.2686767578125, -1.18280029296875, -1.096923828125, -1.01104736328125, -0.9251708984375, -0.83929443359375, -0.75341796875, -0.66754150390625, -0.5816650390625, -0.49578857421875, -0.409912109375, -0.32403564453125, -0.2381591796875, -0.15228271484375, -0.06640625, 0.01947021484375, 0.1053466796875, 0.19122314453125, 0.277099609375, 0.36297607421875, 0.4488525390625, 0.53472900390625, 0.62060546875, 0.70648193359375, 0.7923583984375, 0.87823486328125, 0.964111328125, 1.04998779296875, 1.1358642578125, 1.22174072265625, 1.3076171875, 1.39349365234375, 1.4793701171875, 1.56524658203125, 1.651123046875, 1.73699951171875, 1.8228759765625, 1.90875244140625, 1.99462890625, 2.08050537109375, 2.1663818359375, 2.25225830078125, 2.338134765625, 2.42401123046875, 2.5098876953125, 2.59576416015625, 2.681640625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 5.0, 8.0, 14.0, 14.0, 25.0, 44.0, 77.0, 116.0, 170.0, 253.0, 374.0, 522.0, 735.0, 1204.0, 1803.0, 2790.0, 4366.0, 6845.0, 11129.0, 18246.0, 30847.0, 53346.0, 94891.0, 172427.0, 311507.0, 539657.0, 797328.0, 816077.0, 572157.0, 332518.0, 183269.0, 101072.0, 56928.0, 32716.0, 19134.0, 11524.0, 7191.0, 4558.0, 2888.0, 1764.0, 1296.0, 823.0, 532.0, 368.0, 219.0, 161.0, 123.0, 74.0, 59.0, 31.0, 23.0, 9.0, 14.0, 12.0, 4.0, 1.0, 0.0, 3.0, 3.0, 2.0], "bins": [-3.365234375, -3.256866455078125, -3.14849853515625, -3.040130615234375, -2.9317626953125, -2.823394775390625, -2.71502685546875, -2.606658935546875, -2.498291015625, -2.389923095703125, -2.28155517578125, -2.173187255859375, -2.0648193359375, -1.956451416015625, -1.84808349609375, -1.739715576171875, -1.63134765625, -1.522979736328125, -1.41461181640625, -1.306243896484375, -1.1978759765625, -1.089508056640625, -0.98114013671875, -0.872772216796875, -0.764404296875, -0.656036376953125, -0.54766845703125, -0.439300537109375, -0.3309326171875, -0.222564697265625, -0.11419677734375, -0.005828857421875, 0.1025390625, 0.210906982421875, 0.31927490234375, 0.427642822265625, 0.5360107421875, 0.644378662109375, 0.75274658203125, 0.861114501953125, 0.969482421875, 1.077850341796875, 1.18621826171875, 1.294586181640625, 1.4029541015625, 1.511322021484375, 1.61968994140625, 1.728057861328125, 1.83642578125, 1.944793701171875, 2.05316162109375, 2.161529541015625, 2.2698974609375, 2.378265380859375, 2.48663330078125, 2.595001220703125, 2.703369140625, 2.811737060546875, 2.92010498046875, 3.028472900390625, 3.1368408203125, 3.245208740234375, 3.35357666015625, 3.461944580078125, 3.5703125]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 4.0, 1.0, 6.0, 5.0, 11.0, 18.0, 13.0, 12.0, 28.0, 30.0, 25.0, 50.0, 67.0, 61.0, 96.0, 95.0, 102.0, 142.0, 162.0, 192.0, 192.0, 243.0, 258.0, 260.0, 244.0, 218.0, 243.0, 218.0, 180.0, 162.0, 113.0, 115.0, 96.0, 91.0, 64.0, 43.0, 35.0, 47.0, 27.0, 20.0, 18.0, 16.0, 10.0, 12.0, 12.0, 7.0, 6.0, 2.0, 2.0, 2.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.146484375, -1.104339599609375, -1.06219482421875, -1.020050048828125, -0.9779052734375, -0.935760498046875, -0.89361572265625, -0.851470947265625, -0.809326171875, -0.767181396484375, -0.72503662109375, -0.682891845703125, -0.6407470703125, -0.598602294921875, -0.55645751953125, -0.514312744140625, -0.47216796875, -0.430023193359375, -0.38787841796875, -0.345733642578125, -0.3035888671875, -0.261444091796875, -0.21929931640625, -0.177154541015625, -0.135009765625, -0.092864990234375, -0.05072021484375, -0.008575439453125, 0.0335693359375, 0.075714111328125, 0.11785888671875, 0.160003662109375, 0.2021484375, 0.244293212890625, 0.28643798828125, 0.328582763671875, 0.3707275390625, 0.412872314453125, 0.45501708984375, 0.497161865234375, 0.539306640625, 0.581451416015625, 0.62359619140625, 0.665740966796875, 0.7078857421875, 0.750030517578125, 0.79217529296875, 0.834320068359375, 0.87646484375, 0.918609619140625, 0.96075439453125, 1.002899169921875, 1.0450439453125, 1.087188720703125, 1.12933349609375, 1.171478271484375, 1.213623046875, 1.255767822265625, 1.29791259765625, 1.340057373046875, 1.3822021484375, 1.424346923828125, 1.46649169921875, 1.508636474609375, 1.55078125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 3.0, 9.0, 14.0, 10.0, 13.0, 20.0, 20.0, 29.0, 38.0, 47.0, 60.0, 46.0, 61.0, 67.0, 68.0, 71.0, 69.0, 68.0, 48.0, 42.0, 38.0, 25.0, 25.0, 14.0, 18.0, 26.0, 12.0, 5.0, 6.0, 4.0, 4.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.060038089752197, -3.918400764465332, -3.776763439178467, -3.6351258754730225, -3.4934885501861572, -3.351851224899292, -3.2102136611938477, -3.0685763359069824, -2.926939010620117, -2.785301685333252, -2.6436643600463867, -2.5020267963409424, -2.360389471054077, -2.218752145767212, -2.0771145820617676, -1.9354772567749023, -1.793839931488037, -1.6522026062011719, -1.510565161705017, -1.3689277172088623, -1.227290391921997, -1.0856530666351318, -0.944015622138977, -0.802378237247467, -0.660740852355957, -0.519103467464447, -0.377466082572937, -0.235828697681427, -0.09419131278991699, 0.04744607210159302, 0.18908345699310303, 0.33072084188461304, 0.47235822677612305, 0.6139956116676331, 0.7556329965591431, 0.8972703814506531, 1.038907766342163, 1.1805450916290283, 1.322182536125183, 1.463819980621338, 1.6054573059082031, 1.7470946311950684, 1.8887320756912231, 2.030369520187378, 2.172006845474243, 2.3136441707611084, 2.4552817344665527, 2.596919059753418, 2.738556385040283, 2.8801937103271484, 3.0218310356140137, 3.163468599319458, 3.3051059246063232, 3.4467432498931885, 3.588380813598633, 3.730018138885498, 3.8716554641723633, 4.0132927894592285, 4.154930114746094, 4.296567440032959, 4.438204765319824, 4.579842567443848, 4.721479892730713, 4.863117218017578, 5.004754543304443]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 15.0, 6.0, 5.0, 10.0, 10.0, 10.0, 11.0, 16.0, 19.0, 26.0, 27.0, 19.0, 30.0, 28.0, 36.0, 37.0, 37.0, 45.0, 49.0, 31.0, 46.0, 39.0, 35.0, 46.0, 37.0, 30.0, 37.0, 36.0, 29.0, 29.0, 27.0, 18.0, 24.0, 16.0, 12.0, 13.0, 10.0, 4.0, 10.0, 3.0, 12.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.8531975746154785, -3.738088369369507, -3.622979164123535, -3.5078699588775635, -3.392760753631592, -3.277651786804199, -3.1625425815582275, -3.047433376312256, -2.932324171066284, -2.8172149658203125, -2.702105760574341, -2.586996555328369, -2.4718875885009766, -2.356778144836426, -2.241669178009033, -2.1265599727630615, -2.01145076751709, -1.8963415622711182, -1.7812323570251465, -1.6661232709884644, -1.5510140657424927, -1.435904860496521, -1.3207957744598389, -1.2056865692138672, -1.0905773639678955, -0.9754681587219238, -0.8603590130805969, -0.74524986743927, -0.6301406621932983, -0.5150314569473267, -0.39992231130599976, -0.28481316566467285, -0.16970372200012207, -0.05459454655647278, 0.060514628887176514, 0.1756238043308258, 0.2907329797744751, 0.4058421850204468, 0.5209513306617737, 0.6360604763031006, 0.7511696815490723, 0.866278886795044, 0.9813880324363708, 1.0964971780776978, 1.2116063833236694, 1.3267155885696411, 1.4418246746063232, 1.556933879852295, 1.6720430850982666, 1.7871522903442383, 1.90226149559021, 2.0173707008361816, 2.132479667663574, 2.247589111328125, 2.3626980781555176, 2.4778072834014893, 2.592916488647461, 2.7080256938934326, 2.8231348991394043, 2.938244104385376, 3.0533533096313477, 3.1684622764587402, 3.283571481704712, 3.3986806869506836, 3.5137898921966553]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 4.0, 8.0, 11.0, 13.0, 23.0, 38.0, 44.0, 66.0, 76.0, 114.0, 135.0, 202.0, 323.0, 431.0, 623.0, 896.0, 1317.0, 1937.0, 2883.0, 4495.0, 6931.0, 11051.0, 17724.0, 30224.0, 52383.0, 99673.0, 200821.0, 273094.0, 155915.0, 78326.0, 42274.0, 24735.0, 15000.0, 9150.0, 5758.0, 3839.0, 2469.0, 1657.0, 1175.0, 819.0, 528.0, 386.0, 293.0, 188.0, 132.0, 106.0, 69.0, 46.0, 47.0, 37.0, 20.0, 21.0, 10.0, 9.0, 4.0, 3.0, 8.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.08203125, -1.0463409423828125, -1.010650634765625, -0.9749603271484375, -0.93927001953125, -0.9035797119140625, -0.867889404296875, -0.8321990966796875, -0.7965087890625, -0.7608184814453125, -0.725128173828125, -0.6894378662109375, -0.65374755859375, -0.6180572509765625, -0.582366943359375, -0.5466766357421875, -0.510986328125, -0.4752960205078125, -0.439605712890625, -0.4039154052734375, -0.36822509765625, -0.3325347900390625, -0.296844482421875, -0.2611541748046875, -0.2254638671875, -0.1897735595703125, -0.154083251953125, -0.1183929443359375, -0.08270263671875, -0.0470123291015625, -0.011322021484375, 0.0243682861328125, 0.06005859375, 0.0957489013671875, 0.131439208984375, 0.1671295166015625, 0.20281982421875, 0.2385101318359375, 0.274200439453125, 0.3098907470703125, 0.3455810546875, 0.3812713623046875, 0.416961669921875, 0.4526519775390625, 0.48834228515625, 0.5240325927734375, 0.559722900390625, 0.5954132080078125, 0.631103515625, 0.6667938232421875, 0.702484130859375, 0.7381744384765625, 0.77386474609375, 0.8095550537109375, 0.845245361328125, 0.8809356689453125, 0.9166259765625, 0.9523162841796875, 0.988006591796875, 1.0236968994140625, 1.05938720703125, 1.0950775146484375, 1.130767822265625, 1.1664581298828125, 1.2021484375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 5.0, 10.0, 7.0, 10.0, 8.0, 14.0, 16.0, 21.0, 13.0, 18.0, 26.0, 30.0, 23.0, 30.0, 32.0, 45.0, 41.0, 31.0, 44.0, 40.0, 52.0, 49.0, 37.0, 40.0, 39.0, 29.0, 45.0, 27.0, 22.0, 26.0, 22.0, 24.0, 24.0, 16.0, 13.0, 9.0, 12.0, 12.0, 4.0, 9.0, 5.0, 1.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.73828125, -3.619354248046875, -3.50042724609375, -3.381500244140625, -3.2625732421875, -3.143646240234375, -3.02471923828125, -2.905792236328125, -2.786865234375, -2.667938232421875, -2.54901123046875, -2.430084228515625, -2.3111572265625, -2.192230224609375, -2.07330322265625, -1.954376220703125, -1.83544921875, -1.716522216796875, -1.59759521484375, -1.478668212890625, -1.3597412109375, -1.240814208984375, -1.12188720703125, -1.002960205078125, -0.884033203125, -0.765106201171875, -0.64617919921875, -0.527252197265625, -0.4083251953125, -0.289398193359375, -0.17047119140625, -0.051544189453125, 0.0673828125, 0.186309814453125, 0.30523681640625, 0.424163818359375, 0.5430908203125, 0.662017822265625, 0.78094482421875, 0.899871826171875, 1.018798828125, 1.137725830078125, 1.25665283203125, 1.375579833984375, 1.4945068359375, 1.613433837890625, 1.73236083984375, 1.851287841796875, 1.97021484375, 2.089141845703125, 2.20806884765625, 2.326995849609375, 2.4459228515625, 2.564849853515625, 2.68377685546875, 2.802703857421875, 2.921630859375, 3.040557861328125, 3.15948486328125, 3.278411865234375, 3.3973388671875, 3.516265869140625, 3.63519287109375, 3.754119873046875, 3.873046875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 20.0, 15.0, 12.0, 19.0, 23.0, 32.0, 35.0, 46.0, 64.0, 95.0, 120.0, 166.0, 249.0, 336.0, 511.0, 776.0, 1165.0, 2248.0, 4513.0, 11131.0, 34583.0, 919140.0, 47313.0, 13884.0, 5381.0, 2538.0, 1435.0, 811.0, 578.0, 315.0, 250.0, 172.0, 136.0, 91.0, 82.0, 61.0, 31.0, 37.0, 31.0, 14.0, 29.0, 13.0, 17.0, 4.0, 7.0, 8.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.8515625, -3.73345947265625, -3.6153564453125, -3.49725341796875, -3.379150390625, -3.26104736328125, -3.1429443359375, -3.02484130859375, -2.90673828125, -2.78863525390625, -2.6705322265625, -2.55242919921875, -2.434326171875, -2.31622314453125, -2.1981201171875, -2.08001708984375, -1.9619140625, -1.84381103515625, -1.7257080078125, -1.60760498046875, -1.489501953125, -1.37139892578125, -1.2532958984375, -1.13519287109375, -1.01708984375, -0.89898681640625, -0.7808837890625, -0.66278076171875, -0.544677734375, -0.42657470703125, -0.3084716796875, -0.19036865234375, -0.072265625, 0.04583740234375, 0.1639404296875, 0.28204345703125, 0.400146484375, 0.51824951171875, 0.6363525390625, 0.75445556640625, 0.87255859375, 0.99066162109375, 1.1087646484375, 1.22686767578125, 1.344970703125, 1.46307373046875, 1.5811767578125, 1.69927978515625, 1.8173828125, 1.93548583984375, 2.0535888671875, 2.17169189453125, 2.289794921875, 2.40789794921875, 2.5260009765625, 2.64410400390625, 2.76220703125, 2.88031005859375, 2.9984130859375, 3.11651611328125, 3.234619140625, 3.35272216796875, 3.4708251953125, 3.58892822265625, 3.70703125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 11.0, 7.0, 6.0, 6.0, 13.0, 8.0, 18.0, 21.0, 17.0, 19.0, 18.0, 28.0, 37.0, 34.0, 42.0, 30.0, 28.0, 50.0, 38.0, 34.0, 38.0, 47.0, 34.0, 43.0, 37.0, 34.0, 45.0, 23.0, 34.0, 37.0, 20.0, 26.0, 24.0, 25.0, 13.0, 14.0, 8.0, 7.0, 9.0, 5.0, 7.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.46484375, -2.38580322265625, -2.3067626953125, -2.22772216796875, -2.148681640625, -2.06964111328125, -1.9906005859375, -1.91156005859375, -1.83251953125, -1.75347900390625, -1.6744384765625, -1.59539794921875, -1.516357421875, -1.43731689453125, -1.3582763671875, -1.27923583984375, -1.2001953125, -1.12115478515625, -1.0421142578125, -0.96307373046875, -0.884033203125, -0.80499267578125, -0.7259521484375, -0.64691162109375, -0.56787109375, -0.48883056640625, -0.4097900390625, -0.33074951171875, -0.251708984375, -0.17266845703125, -0.0936279296875, -0.01458740234375, 0.064453125, 0.14349365234375, 0.2225341796875, 0.30157470703125, 0.380615234375, 0.45965576171875, 0.5386962890625, 0.61773681640625, 0.69677734375, 0.77581787109375, 0.8548583984375, 0.93389892578125, 1.012939453125, 1.09197998046875, 1.1710205078125, 1.25006103515625, 1.3291015625, 1.40814208984375, 1.4871826171875, 1.56622314453125, 1.645263671875, 1.72430419921875, 1.8033447265625, 1.88238525390625, 1.96142578125, 2.04046630859375, 2.1195068359375, 2.19854736328125, 2.277587890625, 2.35662841796875, 2.4356689453125, 2.51470947265625, 2.59375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 4.0, 7.0, 6.0, 11.0, 12.0, 27.0, 24.0, 36.0, 45.0, 57.0, 84.0, 120.0, 158.0, 258.0, 345.0, 632.0, 937.0, 1767.0, 3522.0, 7632.0, 22529.0, 920313.0, 63755.0, 14360.0, 5456.0, 2705.0, 1376.0, 807.0, 491.0, 323.0, 217.0, 130.0, 102.0, 72.0, 66.0, 43.0, 29.0, 18.0, 16.0, 15.0, 9.0, 8.0, 10.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.2384033203125, -0.2311382293701172, -0.22387313842773438, -0.21660804748535156, -0.20934295654296875, -0.20207786560058594, -0.19481277465820312, -0.1875476837158203, -0.1802825927734375, -0.1730175018310547, -0.16575241088867188, -0.15848731994628906, -0.15122222900390625, -0.14395713806152344, -0.13669204711914062, -0.1294269561767578, -0.122161865234375, -0.11489677429199219, -0.10763168334960938, -0.10036659240722656, -0.09310150146484375, -0.08583641052246094, -0.07857131958007812, -0.07130622863769531, -0.0640411376953125, -0.05677604675292969, -0.049510955810546875, -0.04224586486816406, -0.03498077392578125, -0.027715682983398438, -0.020450592041015625, -0.013185501098632812, -0.00592041015625, 0.0013446807861328125, 0.008609771728515625, 0.015874862670898438, 0.02313995361328125, 0.030405044555664062, 0.037670135498046875, 0.04493522644042969, 0.0522003173828125, 0.05946540832519531, 0.06673049926757812, 0.07399559020996094, 0.08126068115234375, 0.08852577209472656, 0.09579086303710938, 0.10305595397949219, 0.110321044921875, 0.11758613586425781, 0.12485122680664062, 0.13211631774902344, 0.13938140869140625, 0.14664649963378906, 0.15391159057617188, 0.1611766815185547, 0.1684417724609375, 0.1757068634033203, 0.18297195434570312, 0.19023704528808594, 0.19750213623046875, 0.20476722717285156, 0.21203231811523438, 0.2192974090576172, 0.2265625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 2.0, 3.0, 4.0, 3.0, 8.0, 2.0, 13.0, 13.0, 13.0, 15.0, 23.0, 36.0, 30.0, 36.0, 50.0, 56.0, 62.0, 56.0, 61.0, 69.0, 62.0, 66.0, 52.0, 32.0, 48.0, 34.0, 28.0, 27.0, 17.0, 22.0, 14.0, 9.0, 13.0, 9.0, 7.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9591064453125e-05, -4.809629172086716e-05, -4.6601518988609314e-05, -4.510674625635147e-05, -4.361197352409363e-05, -4.2117200791835785e-05, -4.062242805957794e-05, -3.91276553273201e-05, -3.7632882595062256e-05, -3.613810986280441e-05, -3.464333713054657e-05, -3.314856439828873e-05, -3.1653791666030884e-05, -3.015901893377304e-05, -2.8664246201515198e-05, -2.7169473469257355e-05, -2.5674700736999512e-05, -2.417992800474167e-05, -2.2685155272483826e-05, -2.1190382540225983e-05, -1.969560980796814e-05, -1.8200837075710297e-05, -1.6706064343452454e-05, -1.521129161119461e-05, -1.3716518878936768e-05, -1.2221746146678925e-05, -1.0726973414421082e-05, -9.232200682163239e-06, -7.737427949905396e-06, -6.2426552176475525e-06, -4.7478824853897095e-06, -3.2531097531318665e-06, -1.7583370208740234e-06, -2.635642886161804e-07, 1.2312084436416626e-06, 2.7259811758995056e-06, 4.220753908157349e-06, 5.715526640415192e-06, 7.210299372673035e-06, 8.705072104930878e-06, 1.019984483718872e-05, 1.1694617569446564e-05, 1.3189390301704407e-05, 1.468416303396225e-05, 1.6178935766220093e-05, 1.7673708498477936e-05, 1.916848123073578e-05, 2.0663253962993622e-05, 2.2158026695251465e-05, 2.3652799427509308e-05, 2.514757215976715e-05, 2.6642344892024994e-05, 2.8137117624282837e-05, 2.963189035654068e-05, 3.112666308879852e-05, 3.2621435821056366e-05, 3.411620855331421e-05, 3.561098128557205e-05, 3.7105754017829895e-05, 3.860052675008774e-05, 4.009529948234558e-05, 4.1590072214603424e-05, 4.308484494686127e-05, 4.457961767911911e-05, 4.607439041137695e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 2.0, 5.0, 7.0, 15.0, 18.0, 25.0, 44.0, 71.0, 103.0, 148.0, 225.0, 377.0, 570.0, 1062.0, 1751.0, 3035.0, 5740.0, 10761.0, 22244.0, 51410.0, 141097.0, 412282.0, 250858.0, 80974.0, 33185.0, 15283.0, 7603.0, 4047.0, 2244.0, 1290.0, 794.0, 449.0, 288.0, 181.0, 115.0, 83.0, 56.0, 42.0, 21.0, 18.0, 12.0, 10.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10809326171875, -0.10468769073486328, -0.10128211975097656, -0.09787654876708984, -0.09447097778320312, -0.0910654067993164, -0.08765983581542969, -0.08425426483154297, -0.08084869384765625, -0.07744312286376953, -0.07403755187988281, -0.0706319808959961, -0.06722640991210938, -0.06382083892822266, -0.06041526794433594, -0.05700969696044922, -0.0536041259765625, -0.05019855499267578, -0.04679298400878906, -0.043387413024902344, -0.039981842041015625, -0.036576271057128906, -0.03317070007324219, -0.02976512908935547, -0.02635955810546875, -0.02295398712158203, -0.019548416137695312, -0.016142845153808594, -0.012737274169921875, -0.009331703186035156, -0.0059261322021484375, -0.0025205612182617188, 0.000885009765625, 0.004290580749511719, 0.0076961517333984375, 0.011101722717285156, 0.014507293701171875, 0.017912864685058594, 0.021318435668945312, 0.02472400665283203, 0.02812957763671875, 0.03153514862060547, 0.03494071960449219, 0.038346290588378906, 0.041751861572265625, 0.045157432556152344, 0.04856300354003906, 0.05196857452392578, 0.0553741455078125, 0.05877971649169922, 0.06218528747558594, 0.06559085845947266, 0.06899642944335938, 0.0724020004272461, 0.07580757141113281, 0.07921314239501953, 0.08261871337890625, 0.08602428436279297, 0.08942985534667969, 0.0928354263305664, 0.09624099731445312, 0.09964656829833984, 0.10305213928222656, 0.10645771026611328, 0.10986328125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 4.0, 7.0, 7.0, 9.0, 12.0, 18.0, 21.0, 35.0, 46.0, 51.0, 106.0, 115.0, 159.0, 131.0, 74.0, 50.0, 38.0, 22.0, 17.0, 13.0, 9.0, 9.0, 8.0, 3.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0292816162109375, -0.028347253799438477, -0.027412891387939453, -0.02647852897644043, -0.025544166564941406, -0.024609804153442383, -0.02367544174194336, -0.022741079330444336, -0.021806716918945312, -0.02087235450744629, -0.019937992095947266, -0.019003629684448242, -0.01806926727294922, -0.017134904861450195, -0.016200542449951172, -0.015266180038452148, -0.014331817626953125, -0.013397455215454102, -0.012463092803955078, -0.011528730392456055, -0.010594367980957031, -0.009660005569458008, -0.008725643157958984, -0.007791280746459961, -0.0068569183349609375, -0.005922555923461914, -0.004988193511962891, -0.004053831100463867, -0.0031194686889648438, -0.0021851062774658203, -0.0012507438659667969, -0.00031638145446777344, 0.00061798095703125, 0.0015523433685302734, 0.002486705780029297, 0.0034210681915283203, 0.004355430603027344, 0.005289793014526367, 0.006224155426025391, 0.007158517837524414, 0.008092880249023438, 0.009027242660522461, 0.009961605072021484, 0.010895967483520508, 0.011830329895019531, 0.012764692306518555, 0.013699054718017578, 0.014633417129516602, 0.015567779541015625, 0.01650214195251465, 0.017436504364013672, 0.018370866775512695, 0.01930522918701172, 0.020239591598510742, 0.021173954010009766, 0.02210831642150879, 0.023042678833007812, 0.023977041244506836, 0.02491140365600586, 0.025845766067504883, 0.026780128479003906, 0.02771449089050293, 0.028648853302001953, 0.029583215713500977, 0.030517578125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 3.0, 1.0, 10.0, 12.0, 10.0, 18.0, 13.0, 21.0, 34.0, 37.0, 43.0, 58.0, 61.0, 66.0, 66.0, 57.0, 78.0, 78.0, 67.0, 43.0, 50.0, 28.0, 26.0, 22.0, 14.0, 22.0, 23.0, 8.0, 6.0, 4.0, 3.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.154514789581299, -4.008862495422363, -3.8632097244262695, -3.717557191848755, -3.5719046592712402, -3.4262523651123047, -3.28059983253479, -3.1349472999572754, -2.9892947673797607, -2.843642234802246, -2.6979897022247314, -2.552337169647217, -2.4066848754882812, -2.2610321044921875, -2.115379810333252, -1.9697272777557373, -1.8240747451782227, -1.678422212600708, -1.5327696800231934, -1.3871172666549683, -1.2414647340774536, -1.095812201499939, -0.9501597285270691, -0.8045072555541992, -0.6588547229766846, -0.5132021903991699, -0.36754971742630005, -0.2218972146511078, -0.07624471187591553, 0.06940782070159912, 0.215060293674469, 0.36071276664733887, 0.5063648223876953, 0.65201735496521, 0.7976698279380798, 0.9433223009109497, 1.0889748334884644, 1.234627366065979, 1.380279779434204, 1.5259323120117188, 1.6715848445892334, 1.817237377166748, 1.9628899097442627, 2.1085424423217773, 2.254194736480713, 2.3998475074768066, 2.545499801635742, 2.691152334213257, 2.8368048667907715, 2.982457399368286, 3.128109931945801, 3.2737624645233154, 3.41941499710083, 3.5650672912597656, 3.7107198238372803, 3.856372356414795, 4.0020246505737305, 4.147676944732666, 4.29332971572876, 4.438982009887695, 4.584634780883789, 4.730287075042725, 4.875939846038818, 5.021592140197754, 5.167244911193848]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 15.0, 6.0, 5.0, 10.0, 10.0, 10.0, 11.0, 15.0, 20.0, 27.0, 24.0, 20.0, 30.0, 28.0, 35.0, 41.0, 34.0, 47.0, 48.0, 32.0, 42.0, 43.0, 34.0, 47.0, 36.0, 31.0, 37.0, 37.0, 28.0, 30.0, 27.0, 16.0, 24.0, 16.0, 13.0, 13.0, 9.0, 4.0, 11.0, 2.0, 12.0, 1.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.8279619216918945, -3.713350534439087, -3.5987391471862793, -3.4841277599334717, -3.369516372680664, -3.2549049854278564, -3.140293598175049, -3.025682210922241, -2.9110708236694336, -2.796459436416626, -2.6818480491638184, -2.5672366619110107, -2.452625274658203, -2.3380138874053955, -2.223402500152588, -2.1087911128997803, -1.9941797256469727, -1.879568338394165, -1.7649569511413574, -1.6503455638885498, -1.5357341766357422, -1.4211227893829346, -1.306511402130127, -1.1919000148773193, -1.0772886276245117, -0.9626772403717041, -0.8480658531188965, -0.7334544658660889, -0.6188430786132812, -0.5042316913604736, -0.389620304107666, -0.2750089168548584, -0.16039776802062988, -0.045786380767822266, 0.06882500648498535, 0.18343639373779297, 0.2980477809906006, 0.4126591682434082, 0.5272705554962158, 0.6418819427490234, 0.756493330001831, 0.8711047172546387, 0.9857161045074463, 1.100327491760254, 1.2149388790130615, 1.3295502662658691, 1.4441616535186768, 1.5587730407714844, 1.673384428024292, 1.7879958152770996, 1.9026072025299072, 2.017218589782715, 2.1318299770355225, 2.24644136428833, 2.3610527515411377, 2.4756641387939453, 2.590275526046753, 2.7048869132995605, 2.819498300552368, 2.934109687805176, 3.0487210750579834, 3.163332462310791, 3.2779438495635986, 3.3925552368164062, 3.507166624069214]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 4.0, 4.0, 4.0, 5.0, 7.0, 8.0, 7.0, 12.0, 21.0, 23.0, 49.0, 63.0, 93.0, 145.0, 181.0, 291.0, 400.0, 535.0, 805.0, 1193.0, 1769.0, 2605.0, 3928.0, 5958.0, 8917.0, 14072.0, 22203.0, 35789.0, 57601.0, 91009.0, 133486.0, 166539.0, 159513.0, 122050.0, 80603.0, 50961.0, 31619.0, 19545.0, 12495.0, 8043.0, 5148.0, 3558.0, 2299.0, 1566.0, 1049.0, 699.0, 478.0, 389.0, 221.0, 189.0, 122.0, 99.0, 60.0, 35.0, 29.0, 19.0, 17.0, 14.0, 8.0, 6.0, 4.0, 5.0, 3.0], "bins": [-3.083984375, -2.990142822265625, -2.89630126953125, -2.802459716796875, -2.7086181640625, -2.614776611328125, -2.52093505859375, -2.427093505859375, -2.333251953125, -2.239410400390625, -2.14556884765625, -2.051727294921875, -1.9578857421875, -1.864044189453125, -1.77020263671875, -1.676361083984375, -1.58251953125, -1.488677978515625, -1.39483642578125, -1.300994873046875, -1.2071533203125, -1.113311767578125, -1.01947021484375, -0.925628662109375, -0.831787109375, -0.737945556640625, -0.64410400390625, -0.550262451171875, -0.4564208984375, -0.362579345703125, -0.26873779296875, -0.174896240234375, -0.0810546875, 0.012786865234375, 0.10662841796875, 0.200469970703125, 0.2943115234375, 0.388153076171875, 0.48199462890625, 0.575836181640625, 0.669677734375, 0.763519287109375, 0.85736083984375, 0.951202392578125, 1.0450439453125, 1.138885498046875, 1.23272705078125, 1.326568603515625, 1.42041015625, 1.514251708984375, 1.60809326171875, 1.701934814453125, 1.7957763671875, 1.889617919921875, 1.98345947265625, 2.077301025390625, 2.171142578125, 2.264984130859375, 2.35882568359375, 2.452667236328125, 2.5465087890625, 2.640350341796875, 2.73419189453125, 2.828033447265625, 2.921875]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 4.0, 10.0, 7.0, 6.0, 9.0, 13.0, 13.0, 5.0, 14.0, 15.0, 18.0, 21.0, 29.0, 34.0, 36.0, 40.0, 41.0, 43.0, 44.0, 35.0, 54.0, 47.0, 45.0, 43.0, 33.0, 31.0, 34.0, 48.0, 28.0, 29.0, 31.0, 26.0, 18.0, 16.0, 9.0, 13.0, 11.0, 12.0, 10.0, 6.0, 6.0, 6.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.89453125, -3.773651123046875, -3.65277099609375, -3.531890869140625, -3.4110107421875, -3.290130615234375, -3.16925048828125, -3.048370361328125, -2.927490234375, -2.806610107421875, -2.68572998046875, -2.564849853515625, -2.4439697265625, -2.323089599609375, -2.20220947265625, -2.081329345703125, -1.96044921875, -1.839569091796875, -1.71868896484375, -1.597808837890625, -1.4769287109375, -1.356048583984375, -1.23516845703125, -1.114288330078125, -0.993408203125, -0.872528076171875, -0.75164794921875, -0.630767822265625, -0.5098876953125, -0.389007568359375, -0.26812744140625, -0.147247314453125, -0.0263671875, 0.094512939453125, 0.21539306640625, 0.336273193359375, 0.4571533203125, 0.578033447265625, 0.69891357421875, 0.819793701171875, 0.940673828125, 1.061553955078125, 1.18243408203125, 1.303314208984375, 1.4241943359375, 1.545074462890625, 1.66595458984375, 1.786834716796875, 1.90771484375, 2.028594970703125, 2.14947509765625, 2.270355224609375, 2.3912353515625, 2.512115478515625, 2.63299560546875, 2.753875732421875, 2.874755859375, 2.995635986328125, 3.11651611328125, 3.237396240234375, 3.3582763671875, 3.479156494140625, 3.60003662109375, 3.720916748046875, 3.841796875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 8.0, 6.0, 3.0, 16.0, 20.0, 26.0, 43.0, 50.0, 96.0, 139.0, 191.0, 269.0, 498.0, 750.0, 1069.0, 1558.0, 2468.0, 4048.0, 6160.0, 10191.0, 16361.0, 26519.0, 43202.0, 69716.0, 106770.0, 147894.0, 167914.0, 148979.0, 108547.0, 70230.0, 43621.0, 26820.0, 16498.0, 10215.0, 6256.0, 4029.0, 2554.0, 1634.0, 1090.0, 730.0, 429.0, 314.0, 208.0, 144.0, 94.0, 69.0, 28.0, 27.0, 25.0, 12.0, 10.0, 7.0, 4.0, 1.0, 2.0, 0.0, 3.0, 3.0], "bins": [-3.0390625, -2.945587158203125, -2.85211181640625, -2.758636474609375, -2.6651611328125, -2.571685791015625, -2.47821044921875, -2.384735107421875, -2.291259765625, -2.197784423828125, -2.10430908203125, -2.010833740234375, -1.9173583984375, -1.823883056640625, -1.73040771484375, -1.636932373046875, -1.54345703125, -1.449981689453125, -1.35650634765625, -1.263031005859375, -1.1695556640625, -1.076080322265625, -0.98260498046875, -0.889129638671875, -0.795654296875, -0.702178955078125, -0.60870361328125, -0.515228271484375, -0.4217529296875, -0.328277587890625, -0.23480224609375, -0.141326904296875, -0.0478515625, 0.045623779296875, 0.13909912109375, 0.232574462890625, 0.3260498046875, 0.419525146484375, 0.51300048828125, 0.606475830078125, 0.699951171875, 0.793426513671875, 0.88690185546875, 0.980377197265625, 1.0738525390625, 1.167327880859375, 1.26080322265625, 1.354278564453125, 1.44775390625, 1.541229248046875, 1.63470458984375, 1.728179931640625, 1.8216552734375, 1.915130615234375, 2.00860595703125, 2.102081298828125, 2.195556640625, 2.289031982421875, 2.38250732421875, 2.475982666015625, 2.5694580078125, 2.662933349609375, 2.75640869140625, 2.849884033203125, 2.943359375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 8.0, 2.0, 4.0, 5.0, 5.0, 9.0, 15.0, 10.0, 15.0, 17.0, 15.0, 20.0, 21.0, 32.0, 17.0, 33.0, 38.0, 30.0, 22.0, 23.0, 35.0, 49.0, 30.0, 33.0, 41.0, 47.0, 30.0, 42.0, 38.0, 35.0, 31.0, 34.0, 23.0, 24.0, 26.0, 17.0, 21.0, 19.0, 18.0, 13.0, 7.0, 10.0, 11.0, 11.0, 6.0, 4.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.9306640625, -1.8682708740234375, -1.805877685546875, -1.7434844970703125, -1.68109130859375, -1.6186981201171875, -1.556304931640625, -1.4939117431640625, -1.4315185546875, -1.3691253662109375, -1.306732177734375, -1.2443389892578125, -1.18194580078125, -1.1195526123046875, -1.057159423828125, -0.9947662353515625, -0.932373046875, -0.8699798583984375, -0.807586669921875, -0.7451934814453125, -0.68280029296875, -0.6204071044921875, -0.558013916015625, -0.4956207275390625, -0.4332275390625, -0.3708343505859375, -0.308441162109375, -0.2460479736328125, -0.18365478515625, -0.1212615966796875, -0.058868408203125, 0.0035247802734375, 0.06591796875, 0.1283111572265625, 0.190704345703125, 0.2530975341796875, 0.31549072265625, 0.3778839111328125, 0.440277099609375, 0.5026702880859375, 0.5650634765625, 0.6274566650390625, 0.689849853515625, 0.7522430419921875, 0.81463623046875, 0.8770294189453125, 0.939422607421875, 1.0018157958984375, 1.064208984375, 1.1266021728515625, 1.188995361328125, 1.2513885498046875, 1.31378173828125, 1.3761749267578125, 1.438568115234375, 1.5009613037109375, 1.5633544921875, 1.6257476806640625, 1.688140869140625, 1.7505340576171875, 1.81292724609375, 1.8753204345703125, 1.937713623046875, 2.0001068115234375, 2.0625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 10.0, 13.0, 24.0, 36.0, 45.0, 85.0, 162.0, 183.0, 272.0, 485.0, 796.0, 1240.0, 2067.0, 3457.0, 5683.0, 9559.0, 16222.0, 27387.0, 46203.0, 77204.0, 121615.0, 167830.0, 180967.0, 145035.0, 96330.0, 59194.0, 35127.0, 20775.0, 12055.0, 7359.0, 4250.0, 2665.0, 1562.0, 1013.0, 617.0, 363.0, 239.0, 160.0, 87.0, 62.0, 46.0, 21.0, 17.0, 13.0, 13.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.044921875, -1.0134811401367188, -0.9820404052734375, -0.9505996704101562, -0.919158935546875, -0.8877182006835938, -0.8562774658203125, -0.8248367309570312, -0.79339599609375, -0.7619552612304688, -0.7305145263671875, -0.6990737915039062, -0.667633056640625, -0.6361923217773438, -0.6047515869140625, -0.5733108520507812, -0.5418701171875, -0.5104293823242188, -0.4789886474609375, -0.44754791259765625, -0.416107177734375, -0.38466644287109375, -0.3532257080078125, -0.32178497314453125, -0.29034423828125, -0.25890350341796875, -0.2274627685546875, -0.19602203369140625, -0.164581298828125, -0.13314056396484375, -0.1016998291015625, -0.07025909423828125, -0.038818359375, -0.00737762451171875, 0.0240631103515625, 0.05550384521484375, 0.086944580078125, 0.11838531494140625, 0.1498260498046875, 0.18126678466796875, 0.21270751953125, 0.24414825439453125, 0.2755889892578125, 0.30702972412109375, 0.338470458984375, 0.36991119384765625, 0.4013519287109375, 0.43279266357421875, 0.4642333984375, 0.49567413330078125, 0.5271148681640625, 0.5585556030273438, 0.589996337890625, 0.6214370727539062, 0.6528778076171875, 0.6843185424804688, 0.71575927734375, 0.7472000122070312, 0.7786407470703125, 0.8100814819335938, 0.841522216796875, 0.8729629516601562, 0.9044036865234375, 0.9358444213867188, 0.96728515625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 3.0, 11.0, 11.0, 7.0, 14.0, 20.0, 26.0, 35.0, 47.0, 39.0, 52.0, 62.0, 50.0, 59.0, 60.0, 63.0, 61.0, 49.0, 57.0, 50.0, 41.0, 42.0, 26.0, 24.0, 21.0, 11.0, 14.0, 7.0, 5.0, 2.0, 8.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-9.5367431640625e-05, -9.27858054637909e-05, -9.020417928695679e-05, -8.762255311012268e-05, -8.504092693328857e-05, -8.245930075645447e-05, -7.987767457962036e-05, -7.729604840278625e-05, -7.471442222595215e-05, -7.213279604911804e-05, -6.955116987228394e-05, -6.696954369544983e-05, -6.438791751861572e-05, -6.180629134178162e-05, -5.922466516494751e-05, -5.66430389881134e-05, -5.40614128112793e-05, -5.147978663444519e-05, -4.8898160457611084e-05, -4.631653428077698e-05, -4.373490810394287e-05, -4.1153281927108765e-05, -3.857165575027466e-05, -3.599002957344055e-05, -3.3408403396606445e-05, -3.082677721977234e-05, -2.8245151042938232e-05, -2.5663524866104126e-05, -2.308189868927002e-05, -2.0500272512435913e-05, -1.7918646335601807e-05, -1.53370201587677e-05, -1.2755393981933594e-05, -1.0173767805099487e-05, -7.592141628265381e-06, -5.010515451431274e-06, -2.428889274597168e-06, 1.5273690223693848e-07, 2.734363079071045e-06, 5.315989255905151e-06, 7.897615432739258e-06, 1.0479241609573364e-05, 1.306086778640747e-05, 1.5642493963241577e-05, 1.8224120140075684e-05, 2.080574631690979e-05, 2.3387372493743896e-05, 2.5968998670578003e-05, 2.855062484741211e-05, 3.1132251024246216e-05, 3.371387720108032e-05, 3.629550337791443e-05, 3.8877129554748535e-05, 4.145875573158264e-05, 4.404038190841675e-05, 4.6622008085250854e-05, 4.920363426208496e-05, 5.178526043891907e-05, 5.4366886615753174e-05, 5.694851279258728e-05, 5.953013896942139e-05, 6.211176514625549e-05, 6.46933913230896e-05, 6.72750174999237e-05, 6.985664367675781e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 10.0, 14.0, 13.0, 27.0, 33.0, 44.0, 71.0, 90.0, 171.0, 259.0, 344.0, 545.0, 833.0, 1189.0, 1924.0, 2851.0, 4567.0, 7095.0, 11194.0, 18149.0, 29432.0, 47725.0, 76803.0, 116393.0, 154544.0, 167019.0, 140532.0, 98602.0, 63322.0, 39219.0, 24211.0, 15040.0, 9401.0, 5921.0, 3868.0, 2413.0, 1595.0, 997.0, 642.0, 467.0, 347.0, 174.0, 155.0, 105.0, 61.0, 47.0, 31.0, 17.0, 17.0, 11.0, 9.0, 6.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.94091796875, -0.91265869140625, -0.8843994140625, -0.85614013671875, -0.827880859375, -0.79962158203125, -0.7713623046875, -0.74310302734375, -0.71484375, -0.68658447265625, -0.6583251953125, -0.63006591796875, -0.601806640625, -0.57354736328125, -0.5452880859375, -0.51702880859375, -0.48876953125, -0.46051025390625, -0.4322509765625, -0.40399169921875, -0.375732421875, -0.34747314453125, -0.3192138671875, -0.29095458984375, -0.2626953125, -0.23443603515625, -0.2061767578125, -0.17791748046875, -0.149658203125, -0.12139892578125, -0.0931396484375, -0.06488037109375, -0.03662109375, -0.00836181640625, 0.0198974609375, 0.04815673828125, 0.076416015625, 0.10467529296875, 0.1329345703125, 0.16119384765625, 0.189453125, 0.21771240234375, 0.2459716796875, 0.27423095703125, 0.302490234375, 0.33074951171875, 0.3590087890625, 0.38726806640625, 0.41552734375, 0.44378662109375, 0.4720458984375, 0.50030517578125, 0.528564453125, 0.55682373046875, 0.5850830078125, 0.61334228515625, 0.6416015625, 0.66986083984375, 0.6981201171875, 0.72637939453125, 0.754638671875, 0.78289794921875, 0.8111572265625, 0.83941650390625, 0.86767578125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 4.0, 4.0, 4.0, 7.0, 8.0, 10.0, 11.0, 12.0, 18.0, 26.0, 27.0, 25.0, 47.0, 45.0, 56.0, 63.0, 68.0, 81.0, 63.0, 69.0, 54.0, 60.0, 48.0, 51.0, 29.0, 19.0, 18.0, 22.0, 14.0, 12.0, 4.0, 6.0, 1.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36865234375, -0.3553276062011719, -0.34200286865234375, -0.3286781311035156, -0.3153533935546875, -0.3020286560058594, -0.28870391845703125, -0.2753791809082031, -0.262054443359375, -0.24872970581054688, -0.23540496826171875, -0.22208023071289062, -0.2087554931640625, -0.19543075561523438, -0.18210601806640625, -0.16878128051757812, -0.15545654296875, -0.14213180541992188, -0.12880706787109375, -0.11548233032226562, -0.1021575927734375, -0.08883285522460938, -0.07550811767578125, -0.062183380126953125, -0.048858642578125, -0.035533905029296875, -0.02220916748046875, -0.008884429931640625, 0.0044403076171875, 0.017765045166015625, 0.03108978271484375, 0.044414520263671875, 0.0577392578125, 0.07106399536132812, 0.08438873291015625, 0.09771347045898438, 0.1110382080078125, 0.12436294555664062, 0.13768768310546875, 0.15101242065429688, 0.164337158203125, 0.17766189575195312, 0.19098663330078125, 0.20431137084960938, 0.2176361083984375, 0.23096084594726562, 0.24428558349609375, 0.2576103210449219, 0.27093505859375, 0.2842597961425781, 0.29758453369140625, 0.3109092712402344, 0.3242340087890625, 0.3375587463378906, 0.35088348388671875, 0.3642082214355469, 0.377532958984375, 0.3908576965332031, 0.40418243408203125, 0.4175071716308594, 0.4308319091796875, 0.4441566467285156, 0.45748138427734375, 0.4708061218261719, 0.484130859375]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 4.0, 10.0, 12.0, 8.0, 14.0, 15.0, 20.0, 19.0, 47.0, 46.0, 51.0, 57.0, 41.0, 56.0, 67.0, 71.0, 60.0, 57.0, 46.0, 52.0, 43.0, 33.0, 30.0, 21.0, 27.0, 19.0, 15.0, 9.0, 10.0, 8.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-4.385850429534912, -4.258136749267578, -4.130423545837402, -4.002709865570068, -3.8749961853027344, -3.7472827434539795, -3.6195693016052246, -3.4918556213378906, -3.3641419410705566, -3.2364284992218018, -3.1087148189544678, -2.981001377105713, -2.853287696838379, -2.725574254989624, -2.597860813140869, -2.470147132873535, -2.3424336910247803, -2.2147202491760254, -2.0870065689086914, -1.9592931270599365, -1.8315794467926025, -1.7038660049438477, -1.5761524438858032, -1.4484388828277588, -1.3207253217697144, -1.19301176071167, -1.0652981996536255, -0.9375846982002258, -0.8098711371421814, -0.682157576084137, -0.5544440746307373, -0.42673051357269287, -0.29901719093322754, -0.1713036447763443, -0.04359009861946106, 0.08412343263626099, 0.21183699369430542, 0.33955055475234985, 0.4672640562057495, 0.594977617263794, 0.7226911783218384, 0.8504047393798828, 0.9781183004379272, 1.1058318614959717, 1.2335453033447266, 1.3612589836120605, 1.4889724254608154, 1.6166859865188599, 1.7443995475769043, 1.8721131086349487, 1.9998266696929932, 2.127540111541748, 2.255253791809082, 2.382967233657837, 2.510680675506592, 2.638394355773926, 2.7661080360412598, 2.8938214778900146, 3.0215351581573486, 3.1492486000061035, 3.2769622802734375, 3.4046757221221924, 3.5323891639709473, 3.6601028442382812, 3.787816286087036]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 5.0, 3.0, 8.0, 7.0, 12.0, 16.0, 10.0, 23.0, 13.0, 14.0, 20.0, 28.0, 36.0, 30.0, 32.0, 40.0, 39.0, 39.0, 42.0, 41.0, 41.0, 49.0, 44.0, 40.0, 37.0, 33.0, 39.0, 30.0, 34.0, 25.0, 22.0, 27.0, 21.0, 15.0, 9.0, 16.0, 14.0, 10.0, 8.0, 10.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.041362762451172, -3.920968532562256, -3.80057430267334, -3.6801798343658447, -3.5597856044769287, -3.4393913745880127, -3.3189971446990967, -3.1986026763916016, -3.0782084465026855, -2.9578142166137695, -2.8374199867248535, -2.7170255184173584, -2.5966312885284424, -2.4762370586395264, -2.3558428287506104, -2.2354483604431152, -2.115054130554199, -1.9946599006652832, -1.8742655515670776, -1.7538713216781616, -1.633476972579956, -1.51308274269104, -1.392688512802124, -1.2722941637039185, -1.151900053024292, -1.031505823135376, -0.9111114740371704, -0.7907172441482544, -0.6703228950500488, -0.5499286651611328, -0.429534375667572, -0.30914008617401123, -0.18874573707580566, -0.06835145503282547, 0.052042827010154724, 0.17243710160255432, 0.2928313910961151, 0.4132256507873535, 0.5336199402809143, 0.6540142297744751, 0.7744085192680359, 0.8948028087615967, 1.0151970386505127, 1.1355913877487183, 1.2559856176376343, 1.3763799667358398, 1.4967741966247559, 1.6171684265136719, 1.7375627756118774, 1.8579570055007935, 1.978351354598999, 2.098745584487915, 2.219139814376831, 2.339534282684326, 2.459928512573242, 2.580322742462158, 2.700716972351074, 2.8211112022399902, 2.9415054321289062, 3.0618999004364014, 3.1822941303253174, 3.3026883602142334, 3.4230825901031494, 3.5434770584106445, 3.6638712882995605]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 3.0, 5.0, 4.0, 10.0, 12.0, 13.0, 18.0, 28.0, 34.0, 68.0, 87.0, 125.0, 162.0, 254.0, 341.0, 549.0, 808.0, 1206.0, 1819.0, 2903.0, 4987.0, 8314.0, 14575.0, 26782.0, 52457.0, 110635.0, 252347.0, 601038.0, 1151149.0, 1049264.0, 503841.0, 212741.0, 95549.0, 46205.0, 23690.0, 12995.0, 7355.0, 4272.0, 2669.0, 1713.0, 1040.0, 743.0, 439.0, 341.0, 226.0, 147.0, 106.0, 77.0, 52.0, 30.0, 21.0, 12.0, 12.0, 6.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-4.9453125, -4.79498291015625, -4.6446533203125, -4.49432373046875, -4.343994140625, -4.19366455078125, -4.0433349609375, -3.89300537109375, -3.74267578125, -3.59234619140625, -3.4420166015625, -3.29168701171875, -3.141357421875, -2.99102783203125, -2.8406982421875, -2.69036865234375, -2.5400390625, -2.38970947265625, -2.2393798828125, -2.08905029296875, -1.938720703125, -1.78839111328125, -1.6380615234375, -1.48773193359375, -1.33740234375, -1.18707275390625, -1.0367431640625, -0.88641357421875, -0.736083984375, -0.58575439453125, -0.4354248046875, -0.28509521484375, -0.134765625, 0.01556396484375, 0.1658935546875, 0.31622314453125, 0.466552734375, 0.61688232421875, 0.7672119140625, 0.91754150390625, 1.06787109375, 1.21820068359375, 1.3685302734375, 1.51885986328125, 1.669189453125, 1.81951904296875, 1.9698486328125, 2.12017822265625, 2.2705078125, 2.42083740234375, 2.5711669921875, 2.72149658203125, 2.871826171875, 3.02215576171875, 3.1724853515625, 3.32281494140625, 3.47314453125, 3.62347412109375, 3.7738037109375, 3.92413330078125, 4.074462890625, 4.22479248046875, 4.3751220703125, 4.52545166015625, 4.67578125]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 8.0, 8.0, 6.0, 4.0, 6.0, 7.0, 13.0, 19.0, 21.0, 13.0, 16.0, 27.0, 24.0, 26.0, 38.0, 33.0, 38.0, 42.0, 41.0, 50.0, 47.0, 42.0, 48.0, 39.0, 37.0, 44.0, 42.0, 36.0, 33.0, 27.0, 20.0, 25.0, 25.0, 13.0, 18.0, 17.0, 10.0, 9.0, 4.0, 10.0, 6.0, 4.0, 2.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 4.0], "bins": [-3.13671875, -3.048065185546875, -2.95941162109375, -2.870758056640625, -2.7821044921875, -2.693450927734375, -2.60479736328125, -2.516143798828125, -2.427490234375, -2.338836669921875, -2.25018310546875, -2.161529541015625, -2.0728759765625, -1.984222412109375, -1.89556884765625, -1.806915283203125, -1.71826171875, -1.629608154296875, -1.54095458984375, -1.452301025390625, -1.3636474609375, -1.274993896484375, -1.18634033203125, -1.097686767578125, -1.009033203125, -0.920379638671875, -0.83172607421875, -0.743072509765625, -0.6544189453125, -0.565765380859375, -0.47711181640625, -0.388458251953125, -0.2998046875, -0.211151123046875, -0.12249755859375, -0.033843994140625, 0.0548095703125, 0.143463134765625, 0.23211669921875, 0.320770263671875, 0.409423828125, 0.498077392578125, 0.58673095703125, 0.675384521484375, 0.7640380859375, 0.852691650390625, 0.94134521484375, 1.029998779296875, 1.11865234375, 1.207305908203125, 1.29595947265625, 1.384613037109375, 1.4732666015625, 1.561920166015625, 1.65057373046875, 1.739227294921875, 1.827880859375, 1.916534423828125, 2.00518798828125, 2.093841552734375, 2.1824951171875, 2.271148681640625, 2.35980224609375, 2.448455810546875, 2.537109375]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 13.0, 18.0, 18.0, 41.0, 44.0, 71.0, 119.0, 167.0, 253.0, 379.0, 663.0, 959.0, 1609.0, 2573.0, 4367.0, 7256.0, 12543.0, 22246.0, 41383.0, 79308.0, 157935.0, 315880.0, 607319.0, 927590.0, 885864.0, 547230.0, 282723.0, 140489.0, 70828.0, 36576.0, 20144.0, 11162.0, 6537.0, 3788.0, 2241.0, 1444.0, 926.0, 609.0, 374.0, 202.0, 130.0, 99.0, 49.0, 45.0, 24.0, 16.0, 9.0, 13.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.27734375, -4.143310546875, -4.00927734375, -3.875244140625, -3.7412109375, -3.607177734375, -3.47314453125, -3.339111328125, -3.205078125, -3.071044921875, -2.93701171875, -2.802978515625, -2.6689453125, -2.534912109375, -2.40087890625, -2.266845703125, -2.1328125, -1.998779296875, -1.86474609375, -1.730712890625, -1.5966796875, -1.462646484375, -1.32861328125, -1.194580078125, -1.060546875, -0.926513671875, -0.79248046875, -0.658447265625, -0.5244140625, -0.390380859375, -0.25634765625, -0.122314453125, 0.01171875, 0.145751953125, 0.27978515625, 0.413818359375, 0.5478515625, 0.681884765625, 0.81591796875, 0.949951171875, 1.083984375, 1.218017578125, 1.35205078125, 1.486083984375, 1.6201171875, 1.754150390625, 1.88818359375, 2.022216796875, 2.15625, 2.290283203125, 2.42431640625, 2.558349609375, 2.6923828125, 2.826416015625, 2.96044921875, 3.094482421875, 3.228515625, 3.362548828125, 3.49658203125, 3.630615234375, 3.7646484375, 3.898681640625, 4.03271484375, 4.166748046875, 4.30078125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 8.0, 11.0, 13.0, 21.0, 15.0, 30.0, 33.0, 57.0, 59.0, 70.0, 95.0, 130.0, 157.0, 187.0, 197.0, 257.0, 260.0, 286.0, 273.0, 298.0, 266.0, 257.0, 192.0, 166.0, 141.0, 97.0, 105.0, 64.0, 70.0, 54.0, 48.0, 33.0, 23.0, 27.0, 10.0, 10.0, 13.0, 8.0, 6.0, 6.0, 3.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5869140625, -1.535247802734375, -1.48358154296875, -1.431915283203125, -1.3802490234375, -1.328582763671875, -1.27691650390625, -1.225250244140625, -1.173583984375, -1.121917724609375, -1.07025146484375, -1.018585205078125, -0.9669189453125, -0.915252685546875, -0.86358642578125, -0.811920166015625, -0.76025390625, -0.708587646484375, -0.65692138671875, -0.605255126953125, -0.5535888671875, -0.501922607421875, -0.45025634765625, -0.398590087890625, -0.346923828125, -0.295257568359375, -0.24359130859375, -0.191925048828125, -0.1402587890625, -0.088592529296875, -0.03692626953125, 0.014739990234375, 0.06640625, 0.118072509765625, 0.16973876953125, 0.221405029296875, 0.2730712890625, 0.324737548828125, 0.37640380859375, 0.428070068359375, 0.479736328125, 0.531402587890625, 0.58306884765625, 0.634735107421875, 0.6864013671875, 0.738067626953125, 0.78973388671875, 0.841400146484375, 0.89306640625, 0.944732666015625, 0.99639892578125, 1.048065185546875, 1.0997314453125, 1.151397705078125, 1.20306396484375, 1.254730224609375, 1.306396484375, 1.358062744140625, 1.40972900390625, 1.461395263671875, 1.5130615234375, 1.564727783203125, 1.61639404296875, 1.668060302734375, 1.7197265625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 12.0, 14.0, 17.0, 7.0, 14.0, 17.0, 33.0, 54.0, 46.0, 46.0, 57.0, 66.0, 73.0, 69.0, 74.0, 76.0, 61.0, 45.0, 35.0, 28.0, 31.0, 20.0, 19.0, 18.0, 9.0, 12.0, 5.0, 4.0, 5.0, 8.0, 5.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.371648788452148, -4.223293304443359, -4.07493782043457, -3.9265825748443604, -3.7782273292541504, -3.6298718452453613, -3.4815163612365723, -3.333160877227783, -3.1848056316375732, -3.036450147628784, -2.888094902038574, -2.739739418029785, -2.591383934020996, -2.443028688430786, -2.294673204421997, -2.146317958831787, -1.997962474822998, -1.8496071100234985, -1.701251745223999, -1.55289626121521, -1.4045408964157104, -1.256185531616211, -1.1078300476074219, -0.9594746828079224, -0.8111193180084229, -0.6627639532089233, -0.514408528804779, -0.36605313420295715, -0.21769773960113525, -0.06934237480163574, 0.07901304960250854, 0.22736847400665283, 0.37572336196899414, 0.5240787267684937, 0.6724341511726379, 0.8207895755767822, 0.9691449403762817, 1.1175003051757812, 1.2658557891845703, 1.4142111539840698, 1.5625665187835693, 1.7109218835830688, 1.8592772483825684, 2.0076327323913574, 2.1559882164001465, 2.3043434619903564, 2.4526989459991455, 2.6010541915893555, 2.7494096755981445, 2.8977651596069336, 3.0461204051971436, 3.1944758892059326, 3.3428311347961426, 3.4911866188049316, 3.6395421028137207, 3.7878975868225098, 3.9362528324127197, 4.08460807800293, 4.232963562011719, 4.381319046020508, 4.529674530029297, 4.678030014038086, 4.826385021209717, 4.974740505218506, 5.123095989227295]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 7.0, 7.0, 15.0, 11.0, 8.0, 16.0, 25.0, 19.0, 23.0, 22.0, 25.0, 30.0, 27.0, 39.0, 33.0, 45.0, 43.0, 50.0, 42.0, 37.0, 39.0, 47.0, 47.0, 43.0, 43.0, 25.0, 27.0, 33.0, 26.0, 19.0, 26.0, 19.0, 12.0, 15.0, 8.0, 10.0, 10.0, 3.0, 5.0, 9.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.340449810028076, -4.209873676300049, -4.0792975425720215, -3.9487216472625732, -3.818145513534546, -3.6875693798065186, -3.5569934844970703, -3.426417350769043, -3.2958412170410156, -3.1652650833129883, -3.034688949584961, -2.9041130542755127, -2.7735369205474854, -2.642960786819458, -2.5123848915100098, -2.3818087577819824, -2.251232624053955, -2.1206564903259277, -1.99008047580719, -1.8595044612884521, -1.7289283275604248, -1.5983521938323975, -1.4677761793136597, -1.3372001647949219, -1.2066240310668945, -1.0760478973388672, -0.9454718828201294, -0.8148958086967468, -0.6843197345733643, -0.5537436604499817, -0.4231675863265991, -0.29259151220321655, -0.1620159149169922, -0.03143984079360962, 0.09913623332977295, 0.22971230745315552, 0.3602883815765381, 0.49086445569992065, 0.6214405298233032, 0.7520166039466858, 0.8825926780700684, 1.0131688117980957, 1.1437448263168335, 1.2743208408355713, 1.4048969745635986, 1.535473108291626, 1.6660491228103638, 1.7966251373291016, 1.927201271057129, 2.0577774047851562, 2.1883535385131836, 2.318929433822632, 2.449505567550659, 2.5800817012786865, 2.7106575965881348, 2.841233730316162, 2.9718098640441895, 3.102385997772217, 3.232962131500244, 3.3635380268096924, 3.4941141605377197, 3.624690294265747, 3.7552661895751953, 3.8858423233032227, 4.01641845703125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 12.0, 18.0, 19.0, 23.0, 37.0, 60.0, 101.0, 108.0, 148.0, 223.0, 317.0, 472.0, 721.0, 1138.0, 1636.0, 2447.0, 3750.0, 5536.0, 8670.0, 13771.0, 21427.0, 36314.0, 63781.0, 126459.0, 253750.0, 238125.0, 116919.0, 60492.0, 34166.0, 20780.0, 12992.0, 8178.0, 5302.0, 3426.0, 2322.0, 1583.0, 1091.0, 680.0, 494.0, 332.0, 244.0, 166.0, 87.0, 85.0, 48.0, 29.0, 26.0, 22.0, 9.0, 10.0, 3.0, 3.0, 7.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.1533203125, -1.117218017578125, -1.08111572265625, -1.045013427734375, -1.0089111328125, -0.972808837890625, -0.93670654296875, -0.900604248046875, -0.864501953125, -0.828399658203125, -0.79229736328125, -0.756195068359375, -0.7200927734375, -0.683990478515625, -0.64788818359375, -0.611785888671875, -0.57568359375, -0.539581298828125, -0.50347900390625, -0.467376708984375, -0.4312744140625, -0.395172119140625, -0.35906982421875, -0.322967529296875, -0.286865234375, -0.250762939453125, -0.21466064453125, -0.178558349609375, -0.1424560546875, -0.106353759765625, -0.07025146484375, -0.034149169921875, 0.001953125, 0.038055419921875, 0.07415771484375, 0.110260009765625, 0.1463623046875, 0.182464599609375, 0.21856689453125, 0.254669189453125, 0.290771484375, 0.326873779296875, 0.36297607421875, 0.399078369140625, 0.4351806640625, 0.471282958984375, 0.50738525390625, 0.543487548828125, 0.57958984375, 0.615692138671875, 0.65179443359375, 0.687896728515625, 0.7239990234375, 0.760101318359375, 0.79620361328125, 0.832305908203125, 0.868408203125, 0.904510498046875, 0.94061279296875, 0.976715087890625, 1.0128173828125, 1.048919677734375, 1.08502197265625, 1.121124267578125, 1.1572265625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 2.0, 2.0, 4.0, 7.0, 11.0, 15.0, 13.0, 14.0, 18.0, 17.0, 18.0, 30.0, 25.0, 25.0, 36.0, 43.0, 32.0, 34.0, 54.0, 56.0, 47.0, 51.0, 43.0, 41.0, 42.0, 32.0, 35.0, 40.0, 28.0, 23.0, 34.0, 18.0, 18.0, 22.0, 13.0, 18.0, 14.0, 4.0, 2.0, 3.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.3046875, -4.16461181640625, -4.0245361328125, -3.88446044921875, -3.744384765625, -3.60430908203125, -3.4642333984375, -3.32415771484375, -3.18408203125, -3.04400634765625, -2.9039306640625, -2.76385498046875, -2.623779296875, -2.48370361328125, -2.3436279296875, -2.20355224609375, -2.0634765625, -1.92340087890625, -1.7833251953125, -1.64324951171875, -1.503173828125, -1.36309814453125, -1.2230224609375, -1.08294677734375, -0.94287109375, -0.80279541015625, -0.6627197265625, -0.52264404296875, -0.382568359375, -0.24249267578125, -0.1024169921875, 0.03765869140625, 0.177734375, 0.31781005859375, 0.4578857421875, 0.59796142578125, 0.738037109375, 0.87811279296875, 1.0181884765625, 1.15826416015625, 1.29833984375, 1.43841552734375, 1.5784912109375, 1.71856689453125, 1.858642578125, 1.99871826171875, 2.1387939453125, 2.27886962890625, 2.4189453125, 2.55902099609375, 2.6990966796875, 2.83917236328125, 2.979248046875, 3.11932373046875, 3.2593994140625, 3.39947509765625, 3.53955078125, 3.67962646484375, 3.8197021484375, 3.95977783203125, 4.099853515625, 4.23992919921875, 4.3800048828125, 4.52008056640625, 4.66015625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 7.0, 12.0, 15.0, 20.0, 26.0, 40.0, 55.0, 61.0, 92.0, 114.0, 177.0, 242.0, 338.0, 491.0, 789.0, 1238.0, 2339.0, 4869.0, 12830.0, 41299.0, 921323.0, 39443.0, 12121.0, 4734.0, 2251.0, 1234.0, 740.0, 465.0, 324.0, 234.0, 169.0, 117.0, 82.0, 68.0, 53.0, 30.0, 33.0, 25.0, 14.0, 16.0, 9.0, 7.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-4.0078125, -3.884429931640625, -3.76104736328125, -3.637664794921875, -3.5142822265625, -3.390899658203125, -3.26751708984375, -3.144134521484375, -3.020751953125, -2.897369384765625, -2.77398681640625, -2.650604248046875, -2.5272216796875, -2.403839111328125, -2.28045654296875, -2.157073974609375, -2.03369140625, -1.910308837890625, -1.78692626953125, -1.663543701171875, -1.5401611328125, -1.416778564453125, -1.29339599609375, -1.170013427734375, -1.046630859375, -0.923248291015625, -0.79986572265625, -0.676483154296875, -0.5531005859375, -0.429718017578125, -0.30633544921875, -0.182952880859375, -0.0595703125, 0.063812255859375, 0.18719482421875, 0.310577392578125, 0.4339599609375, 0.557342529296875, 0.68072509765625, 0.804107666015625, 0.927490234375, 1.050872802734375, 1.17425537109375, 1.297637939453125, 1.4210205078125, 1.544403076171875, 1.66778564453125, 1.791168212890625, 1.91455078125, 2.037933349609375, 2.16131591796875, 2.284698486328125, 2.4080810546875, 2.531463623046875, 2.65484619140625, 2.778228759765625, 2.901611328125, 3.024993896484375, 3.14837646484375, 3.271759033203125, 3.3951416015625, 3.518524169921875, 3.64190673828125, 3.765289306640625, 3.888671875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 10.0, 9.0, 14.0, 10.0, 12.0, 15.0, 25.0, 22.0, 19.0, 28.0, 35.0, 23.0, 39.0, 31.0, 34.0, 32.0, 39.0, 27.0, 29.0, 41.0, 43.0, 48.0, 33.0, 38.0, 39.0, 33.0, 23.0, 31.0, 36.0, 27.0, 11.0, 24.0, 19.0, 16.0, 18.0, 9.0, 17.0, 12.0, 9.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.609375, -2.52978515625, -2.4501953125, -2.37060546875, -2.291015625, -2.21142578125, -2.1318359375, -2.05224609375, -1.97265625, -1.89306640625, -1.8134765625, -1.73388671875, -1.654296875, -1.57470703125, -1.4951171875, -1.41552734375, -1.3359375, -1.25634765625, -1.1767578125, -1.09716796875, -1.017578125, -0.93798828125, -0.8583984375, -0.77880859375, -0.69921875, -0.61962890625, -0.5400390625, -0.46044921875, -0.380859375, -0.30126953125, -0.2216796875, -0.14208984375, -0.0625, 0.01708984375, 0.0966796875, 0.17626953125, 0.255859375, 0.33544921875, 0.4150390625, 0.49462890625, 0.57421875, 0.65380859375, 0.7333984375, 0.81298828125, 0.892578125, 0.97216796875, 1.0517578125, 1.13134765625, 1.2109375, 1.29052734375, 1.3701171875, 1.44970703125, 1.529296875, 1.60888671875, 1.6884765625, 1.76806640625, 1.84765625, 1.92724609375, 2.0068359375, 2.08642578125, 2.166015625, 2.24560546875, 2.3251953125, 2.40478515625, 2.484375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 8.0, 8.0, 16.0, 17.0, 27.0, 35.0, 40.0, 73.0, 77.0, 134.0, 163.0, 256.0, 402.0, 673.0, 1037.0, 1804.0, 3702.0, 8582.0, 24060.0, 913774.0, 65105.0, 15601.0, 6099.0, 2844.0, 1522.0, 864.0, 527.0, 342.0, 209.0, 156.0, 103.0, 73.0, 58.0, 44.0, 28.0, 16.0, 10.0, 17.0, 18.0, 7.0, 4.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2099609375, -0.20356369018554688, -0.19716644287109375, -0.19076919555664062, -0.1843719482421875, -0.17797470092773438, -0.17157745361328125, -0.16518020629882812, -0.158782958984375, -0.15238571166992188, -0.14598846435546875, -0.13959121704101562, -0.1331939697265625, -0.12679672241210938, -0.12039947509765625, -0.11400222778320312, -0.10760498046875, -0.10120773315429688, -0.09481048583984375, -0.08841323852539062, -0.0820159912109375, -0.07561874389648438, -0.06922149658203125, -0.06282424926757812, -0.056427001953125, -0.050029754638671875, -0.04363250732421875, -0.037235260009765625, -0.0308380126953125, -0.024440765380859375, -0.01804351806640625, -0.011646270751953125, -0.0052490234375, 0.001148223876953125, 0.00754547119140625, 0.013942718505859375, 0.0203399658203125, 0.026737213134765625, 0.03313446044921875, 0.039531707763671875, 0.045928955078125, 0.052326202392578125, 0.05872344970703125, 0.06512069702148438, 0.0715179443359375, 0.07791519165039062, 0.08431243896484375, 0.09070968627929688, 0.09710693359375, 0.10350418090820312, 0.10990142822265625, 0.11629867553710938, 0.1226959228515625, 0.12909317016601562, 0.13549041748046875, 0.14188766479492188, 0.148284912109375, 0.15468215942382812, 0.16107940673828125, 0.16747665405273438, 0.1738739013671875, 0.18027114868164062, 0.18666839599609375, 0.19306564331054688, 0.199462890625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 8.0, 17.0, 10.0, 16.0, 20.0, 24.0, 34.0, 26.0, 52.0, 54.0, 59.0, 71.0, 57.0, 74.0, 64.0, 65.0, 59.0, 43.0, 44.0, 38.0, 29.0, 23.0, 21.0, 18.0, 17.0, 12.0, 7.0, 5.0, 3.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.704164505004883e-05, -5.5509619414806366e-05, -5.3977593779563904e-05, -5.244556814432144e-05, -5.091354250907898e-05, -4.938151687383652e-05, -4.7849491238594055e-05, -4.631746560335159e-05, -4.478543996810913e-05, -4.325341433286667e-05, -4.1721388697624207e-05, -4.0189363062381744e-05, -3.865733742713928e-05, -3.712531179189682e-05, -3.559328615665436e-05, -3.4061260521411896e-05, -3.2529234886169434e-05, -3.099720925092697e-05, -2.946518361568451e-05, -2.7933157980442047e-05, -2.6401132345199585e-05, -2.4869106709957123e-05, -2.333708107471466e-05, -2.18050554394722e-05, -2.0273029804229736e-05, -1.8741004168987274e-05, -1.7208978533744812e-05, -1.567695289850235e-05, -1.4144927263259888e-05, -1.2612901628017426e-05, -1.1080875992774963e-05, -9.548850357532501e-06, -8.016824722290039e-06, -6.484799087047577e-06, -4.952773451805115e-06, -3.4207478165626526e-06, -1.8887221813201904e-06, -3.5669654607772827e-07, 1.1753290891647339e-06, 2.707354724407196e-06, 4.239380359649658e-06, 5.77140599489212e-06, 7.3034316301345825e-06, 8.835457265377045e-06, 1.0367482900619507e-05, 1.1899508535861969e-05, 1.3431534171104431e-05, 1.4963559806346893e-05, 1.6495585441589355e-05, 1.8027611076831818e-05, 1.955963671207428e-05, 2.1091662347316742e-05, 2.2623687982559204e-05, 2.4155713617801666e-05, 2.568773925304413e-05, 2.721976488828659e-05, 2.8751790523529053e-05, 3.0283816158771515e-05, 3.181584179401398e-05, 3.334786742925644e-05, 3.48798930644989e-05, 3.6411918699741364e-05, 3.7943944334983826e-05, 3.947596997022629e-05, 4.100799560546875e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 9.0, 11.0, 15.0, 24.0, 50.0, 67.0, 89.0, 125.0, 192.0, 290.0, 425.0, 553.0, 792.0, 1147.0, 1724.0, 2328.0, 3484.0, 5339.0, 8234.0, 12629.0, 19879.0, 32796.0, 58672.0, 116887.0, 239660.0, 255840.0, 128007.0, 63479.0, 35303.0, 20997.0, 13281.0, 8427.0, 5722.0, 3798.0, 2547.0, 1812.0, 1157.0, 818.0, 610.0, 373.0, 309.0, 197.0, 127.0, 97.0, 85.0, 51.0, 30.0, 31.0, 16.0, 11.0, 5.0, 5.0, 7.0, 0.0, 1.0], "bins": [-0.06298828125, -0.06113910675048828, -0.05928993225097656, -0.057440757751464844, -0.055591583251953125, -0.053742408752441406, -0.05189323425292969, -0.05004405975341797, -0.04819488525390625, -0.04634571075439453, -0.04449653625488281, -0.042647361755371094, -0.040798187255859375, -0.038949012756347656, -0.03709983825683594, -0.03525066375732422, -0.0334014892578125, -0.03155231475830078, -0.029703140258789062, -0.027853965759277344, -0.026004791259765625, -0.024155616760253906, -0.022306442260742188, -0.02045726776123047, -0.01860809326171875, -0.01675891876220703, -0.014909744262695312, -0.013060569763183594, -0.011211395263671875, -0.009362220764160156, -0.0075130462646484375, -0.005663871765136719, -0.003814697265625, -0.0019655227661132812, -0.0001163482666015625, 0.0017328262329101562, 0.003582000732421875, 0.005431175231933594, 0.0072803497314453125, 0.009129524230957031, 0.01097869873046875, 0.012827873229980469, 0.014677047729492188, 0.016526222229003906, 0.018375396728515625, 0.020224571228027344, 0.022073745727539062, 0.02392292022705078, 0.0257720947265625, 0.02762126922607422, 0.029470443725585938, 0.031319618225097656, 0.033168792724609375, 0.035017967224121094, 0.03686714172363281, 0.03871631622314453, 0.04056549072265625, 0.04241466522216797, 0.04426383972167969, 0.046113014221191406, 0.047962188720703125, 0.049811363220214844, 0.05166053771972656, 0.05350971221923828, 0.05535888671875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 3.0, 7.0, 5.0, 5.0, 6.0, 4.0, 9.0, 10.0, 9.0, 9.0, 18.0, 18.0, 26.0, 34.0, 36.0, 53.0, 73.0, 86.0, 91.0, 84.0, 81.0, 63.0, 54.0, 45.0, 31.0, 17.0, 18.0, 15.0, 11.0, 10.0, 8.0, 11.0, 6.0, 6.0, 5.0, 4.0, 3.0, 5.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.022216796875, -0.021492958068847656, -0.020769119262695312, -0.02004528045654297, -0.019321441650390625, -0.01859760284423828, -0.017873764038085938, -0.017149925231933594, -0.01642608642578125, -0.015702247619628906, -0.014978408813476562, -0.014254570007324219, -0.013530731201171875, -0.012806892395019531, -0.012083053588867188, -0.011359214782714844, -0.0106353759765625, -0.009911537170410156, -0.009187698364257812, -0.008463859558105469, -0.007740020751953125, -0.007016181945800781, -0.0062923431396484375, -0.005568504333496094, -0.00484466552734375, -0.004120826721191406, -0.0033969879150390625, -0.0026731491088867188, -0.001949310302734375, -0.0012254714965820312, -0.0005016326904296875, 0.00022220611572265625, 0.000946044921875, 0.0016698837280273438, 0.0023937225341796875, 0.0031175613403320312, 0.003841400146484375, 0.004565238952636719, 0.0052890777587890625, 0.006012916564941406, 0.00673675537109375, 0.007460594177246094, 0.008184432983398438, 0.008908271789550781, 0.009632110595703125, 0.010355949401855469, 0.011079788208007812, 0.011803627014160156, 0.0125274658203125, 0.013251304626464844, 0.013975143432617188, 0.014698982238769531, 0.015422821044921875, 0.01614665985107422, 0.016870498657226562, 0.017594337463378906, 0.01831817626953125, 0.019042015075683594, 0.019765853881835938, 0.02048969268798828, 0.021213531494140625, 0.02193737030029297, 0.022661209106445312, 0.023385047912597656, 0.02410888671875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 13.0, 15.0, 15.0, 13.0, 12.0, 25.0, 45.0, 51.0, 48.0, 48.0, 60.0, 74.0, 71.0, 75.0, 78.0, 64.0, 48.0, 44.0, 33.0, 30.0, 20.0, 17.0, 19.0, 13.0, 11.0, 10.0, 4.0, 7.0, 6.0, 6.0, 3.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.427626609802246, -4.279125690460205, -4.130624771118164, -3.982124090194702, -3.833623170852661, -3.685122489929199, -3.536621570587158, -3.388120651245117, -3.239619731903076, -3.091118812561035, -2.9426181316375732, -2.7941172122955322, -2.645616292953491, -2.4971156120300293, -2.3486146926879883, -2.2001137733459473, -2.0516130924224854, -1.9031122922897339, -1.7546113729476929, -1.6061105728149414, -1.4576096534729004, -1.309108853340149, -1.1606080532073975, -1.0121071338653564, -0.863606333732605, -0.7151054739952087, -0.5666046142578125, -0.41810381412506104, -0.2696029543876648, -0.12110209465026855, 0.02739870548248291, 0.17589962482452393, 0.3244004249572754, 0.47290128469467163, 0.6214021444320679, 0.7699029445648193, 0.9184038043022156, 1.0669046640396118, 1.2154054641723633, 1.3639063835144043, 1.5124071836471558, 1.6609079837799072, 1.8094089031219482, 1.9579097032546997, 2.106410503387451, 2.254911422729492, 2.403412342071533, 2.551913261413574, 2.700413942337036, 2.848914861679077, 2.997415542602539, 3.14591646194458, 3.294417381286621, 3.442918300628662, 3.591418981552124, 3.739919900894165, 3.888420581817627, 4.036921501159668, 4.185422420501709, 4.33392333984375, 4.482423782348633, 4.630924701690674, 4.779425621032715, 4.927926540374756, 5.076427459716797]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 7.0, 8.0, 13.0, 12.0, 8.0, 17.0, 24.0, 20.0, 22.0, 23.0, 26.0, 29.0, 24.0, 39.0, 37.0, 43.0, 43.0, 50.0, 42.0, 37.0, 42.0, 46.0, 46.0, 40.0, 46.0, 26.0, 25.0, 35.0, 24.0, 19.0, 27.0, 18.0, 13.0, 15.0, 9.0, 9.0, 9.0, 3.0, 5.0, 9.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.309511184692383, -4.179261684417725, -4.049011707305908, -3.91876220703125, -3.7885124683380127, -3.6582627296447754, -3.528013229370117, -3.39776349067688, -3.2675137519836426, -3.1372640132904053, -3.007014513015747, -2.8767647743225098, -2.7465150356292725, -2.616265296936035, -2.486015796661377, -2.3557660579681396, -2.2255165576934814, -2.095266819000244, -1.9650171995162964, -1.8347675800323486, -1.7045178413391113, -1.5742682218551636, -1.4440186023712158, -1.3137688636779785, -1.1835192441940308, -1.053269624710083, -0.9230198860168457, -0.792770266532898, -0.6625205874443054, -0.5322709083557129, -0.40202128887176514, -0.2717716097831726, -0.14152193069458008, -0.011272266507148743, 0.11897739768028259, 0.24922704696655273, 0.37947672605514526, 0.5097264051437378, 0.6399760246276855, 0.7702257037162781, 0.9004753828048706, 1.0307250022888184, 1.1609747409820557, 1.2912243604660034, 1.4214739799499512, 1.5517237186431885, 1.6819733381271362, 1.812222957611084, 1.9424726963043213, 2.0727224349975586, 2.202971935272217, 2.333221673965454, 2.4634714126586914, 2.5937209129333496, 2.723970651626587, 2.854220390319824, 2.9844698905944824, 3.1147196292877197, 3.244969129562378, 3.3752188682556152, 3.5054686069488525, 3.63571834564209, 3.765967845916748, 3.8962175846099854, 4.026467323303223]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 10.0, 15.0, 14.0, 27.0, 38.0, 48.0, 77.0, 151.0, 183.0, 330.0, 494.0, 778.0, 1220.0, 1940.0, 3163.0, 5304.0, 8539.0, 14554.0, 25667.0, 44178.0, 77574.0, 131497.0, 185624.0, 193501.0, 144360.0, 88270.0, 50405.0, 29009.0, 16516.0, 9727.0, 5719.0, 3625.0, 2182.0, 1380.0, 883.0, 555.0, 351.0, 243.0, 143.0, 93.0, 63.0, 45.0, 20.0, 22.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.771484375, -3.6575927734375, -3.543701171875, -3.4298095703125, -3.31591796875, -3.2020263671875, -3.088134765625, -2.9742431640625, -2.8603515625, -2.7464599609375, -2.632568359375, -2.5186767578125, -2.40478515625, -2.2908935546875, -2.177001953125, -2.0631103515625, -1.94921875, -1.8353271484375, -1.721435546875, -1.6075439453125, -1.49365234375, -1.3797607421875, -1.265869140625, -1.1519775390625, -1.0380859375, -0.9241943359375, -0.810302734375, -0.6964111328125, -0.58251953125, -0.4686279296875, -0.354736328125, -0.2408447265625, -0.126953125, -0.0130615234375, 0.100830078125, 0.2147216796875, 0.32861328125, 0.4425048828125, 0.556396484375, 0.6702880859375, 0.7841796875, 0.8980712890625, 1.011962890625, 1.1258544921875, 1.23974609375, 1.3536376953125, 1.467529296875, 1.5814208984375, 1.6953125, 1.8092041015625, 1.923095703125, 2.0369873046875, 2.15087890625, 2.2647705078125, 2.378662109375, 2.4925537109375, 2.6064453125, 2.7203369140625, 2.834228515625, 2.9481201171875, 3.06201171875, 3.1759033203125, 3.289794921875, 3.4036865234375, 3.517578125]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 13.0, 10.0, 7.0, 10.0, 12.0, 24.0, 32.0, 25.0, 20.0, 27.0, 23.0, 26.0, 42.0, 42.0, 46.0, 36.0, 48.0, 51.0, 58.0, 28.0, 46.0, 54.0, 39.0, 41.0, 25.0, 22.0, 30.0, 36.0, 16.0, 20.0, 16.0, 13.0, 18.0, 12.0, 9.0, 7.0, 4.0, 6.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.8653564453125, -3.726806640625, -3.5882568359375, -3.44970703125, -3.3111572265625, -3.172607421875, -3.0340576171875, -2.8955078125, -2.7569580078125, -2.618408203125, -2.4798583984375, -2.34130859375, -2.2027587890625, -2.064208984375, -1.9256591796875, -1.787109375, -1.6485595703125, -1.510009765625, -1.3714599609375, -1.23291015625, -1.0943603515625, -0.955810546875, -0.8172607421875, -0.6787109375, -0.5401611328125, -0.401611328125, -0.2630615234375, -0.12451171875, 0.0140380859375, 0.152587890625, 0.2911376953125, 0.4296875, 0.5682373046875, 0.706787109375, 0.8453369140625, 0.98388671875, 1.1224365234375, 1.260986328125, 1.3995361328125, 1.5380859375, 1.6766357421875, 1.815185546875, 1.9537353515625, 2.09228515625, 2.2308349609375, 2.369384765625, 2.5079345703125, 2.646484375, 2.7850341796875, 2.923583984375, 3.0621337890625, 3.20068359375, 3.3392333984375, 3.477783203125, 3.6163330078125, 3.7548828125, 3.8934326171875, 4.031982421875, 4.1705322265625, 4.30908203125, 4.4476318359375, 4.586181640625, 4.7247314453125, 4.86328125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 3.0, 6.0, 6.0, 11.0, 14.0, 21.0, 38.0, 40.0, 59.0, 108.0, 131.0, 206.0, 329.0, 506.0, 721.0, 1073.0, 1656.0, 2481.0, 3601.0, 5510.0, 8473.0, 13192.0, 20788.0, 33314.0, 52681.0, 82398.0, 119952.0, 152673.0, 158275.0, 131344.0, 93029.0, 60453.0, 37934.0, 23932.0, 15024.0, 9854.0, 6351.0, 4112.0, 2787.0, 1751.0, 1257.0, 802.0, 540.0, 363.0, 256.0, 167.0, 120.0, 84.0, 55.0, 32.0, 17.0, 16.0, 9.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-2.7890625, -2.69952392578125, -2.6099853515625, -2.52044677734375, -2.430908203125, -2.34136962890625, -2.2518310546875, -2.16229248046875, -2.07275390625, -1.98321533203125, -1.8936767578125, -1.80413818359375, -1.714599609375, -1.62506103515625, -1.5355224609375, -1.44598388671875, -1.3564453125, -1.26690673828125, -1.1773681640625, -1.08782958984375, -0.998291015625, -0.90875244140625, -0.8192138671875, -0.72967529296875, -0.64013671875, -0.55059814453125, -0.4610595703125, -0.37152099609375, -0.281982421875, -0.19244384765625, -0.1029052734375, -0.01336669921875, 0.076171875, 0.16571044921875, 0.2552490234375, 0.34478759765625, 0.434326171875, 0.52386474609375, 0.6134033203125, 0.70294189453125, 0.79248046875, 0.88201904296875, 0.9715576171875, 1.06109619140625, 1.150634765625, 1.24017333984375, 1.3297119140625, 1.41925048828125, 1.5087890625, 1.59832763671875, 1.6878662109375, 1.77740478515625, 1.866943359375, 1.95648193359375, 2.0460205078125, 2.13555908203125, 2.22509765625, 2.31463623046875, 2.4041748046875, 2.49371337890625, 2.583251953125, 2.67279052734375, 2.7623291015625, 2.85186767578125, 2.94140625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 2.0, 6.0, 11.0, 7.0, 10.0, 16.0, 14.0, 17.0, 21.0, 23.0, 27.0, 18.0, 27.0, 29.0, 27.0, 33.0, 43.0, 27.0, 43.0, 43.0, 36.0, 42.0, 42.0, 53.0, 43.0, 35.0, 36.0, 33.0, 36.0, 15.0, 18.0, 19.0, 15.0, 20.0, 19.0, 13.0, 17.0, 7.0, 8.0, 10.0, 10.0, 2.0, 4.0, 6.0, 3.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.056640625, -1.98883056640625, -1.9210205078125, -1.85321044921875, -1.785400390625, -1.71759033203125, -1.6497802734375, -1.58197021484375, -1.51416015625, -1.44635009765625, -1.3785400390625, -1.31072998046875, -1.242919921875, -1.17510986328125, -1.1072998046875, -1.03948974609375, -0.9716796875, -0.90386962890625, -0.8360595703125, -0.76824951171875, -0.700439453125, -0.63262939453125, -0.5648193359375, -0.49700927734375, -0.42919921875, -0.36138916015625, -0.2935791015625, -0.22576904296875, -0.157958984375, -0.09014892578125, -0.0223388671875, 0.04547119140625, 0.11328125, 0.18109130859375, 0.2489013671875, 0.31671142578125, 0.384521484375, 0.45233154296875, 0.5201416015625, 0.58795166015625, 0.65576171875, 0.72357177734375, 0.7913818359375, 0.85919189453125, 0.927001953125, 0.99481201171875, 1.0626220703125, 1.13043212890625, 1.1982421875, 1.26605224609375, 1.3338623046875, 1.40167236328125, 1.469482421875, 1.53729248046875, 1.6051025390625, 1.67291259765625, 1.74072265625, 1.80853271484375, 1.8763427734375, 1.94415283203125, 2.011962890625, 2.07977294921875, 2.1475830078125, 2.21539306640625, 2.283203125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 1.0, 11.0, 9.0, 15.0, 19.0, 25.0, 37.0, 46.0, 83.0, 111.0, 169.0, 278.0, 445.0, 684.0, 1111.0, 1945.0, 3234.0, 5880.0, 10429.0, 18858.0, 34608.0, 62279.0, 108104.0, 166634.0, 200575.0, 171660.0, 113157.0, 66109.0, 36445.0, 19935.0, 10926.0, 6138.0, 3390.0, 2020.0, 1220.0, 709.0, 447.0, 274.0, 182.0, 98.0, 75.0, 62.0, 37.0, 24.0, 18.0, 8.0, 8.0, 10.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1162109375, -1.0808258056640625, -1.045440673828125, -1.0100555419921875, -0.97467041015625, -0.9392852783203125, -0.903900146484375, -0.8685150146484375, -0.8331298828125, -0.7977447509765625, -0.762359619140625, -0.7269744873046875, -0.69158935546875, -0.6562042236328125, -0.620819091796875, -0.5854339599609375, -0.550048828125, -0.5146636962890625, -0.479278564453125, -0.4438934326171875, -0.40850830078125, -0.3731231689453125, -0.337738037109375, -0.3023529052734375, -0.2669677734375, -0.2315826416015625, -0.196197509765625, -0.1608123779296875, -0.12542724609375, -0.0900421142578125, -0.054656982421875, -0.0192718505859375, 0.01611328125, 0.0514984130859375, 0.086883544921875, 0.1222686767578125, 0.15765380859375, 0.1930389404296875, 0.228424072265625, 0.2638092041015625, 0.2991943359375, 0.3345794677734375, 0.369964599609375, 0.4053497314453125, 0.44073486328125, 0.4761199951171875, 0.511505126953125, 0.5468902587890625, 0.582275390625, 0.6176605224609375, 0.653045654296875, 0.6884307861328125, 0.72381591796875, 0.7592010498046875, 0.794586181640625, 0.8299713134765625, 0.8653564453125, 0.9007415771484375, 0.936126708984375, 0.9715118408203125, 1.00689697265625, 1.0422821044921875, 1.077667236328125, 1.1130523681640625, 1.1484375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 10.0, 3.0, 11.0, 15.0, 9.0, 10.0, 13.0, 21.0, 19.0, 32.0, 36.0, 31.0, 54.0, 51.0, 57.0, 58.0, 63.0, 50.0, 63.0, 62.0, 59.0, 49.0, 40.0, 41.0, 16.0, 23.0, 24.0, 19.0, 18.0, 9.0, 8.0, 7.0, 4.0, 4.0, 5.0, 3.0, 5.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.994340896606445e-05, -8.737575262784958e-05, -8.48080962896347e-05, -8.224043995141983e-05, -7.967278361320496e-05, -7.710512727499008e-05, -7.453747093677521e-05, -7.196981459856033e-05, -6.940215826034546e-05, -6.683450192213058e-05, -6.426684558391571e-05, -6.169918924570084e-05, -5.913153290748596e-05, -5.656387656927109e-05, -5.399622023105621e-05, -5.142856389284134e-05, -4.8860907554626465e-05, -4.629325121641159e-05, -4.3725594878196716e-05, -4.115793853998184e-05, -3.859028220176697e-05, -3.6022625863552094e-05, -3.345496952533722e-05, -3.0887313187122345e-05, -2.831965684890747e-05, -2.5752000510692596e-05, -2.3184344172477722e-05, -2.0616687834262848e-05, -1.8049031496047974e-05, -1.54813751578331e-05, -1.2913718819618225e-05, -1.034606248140335e-05, -7.778406143188477e-06, -5.210749804973602e-06, -2.643093466758728e-06, -7.543712854385376e-08, 2.4922192096710205e-06, 5.059875547885895e-06, 7.627531886100769e-06, 1.0195188224315643e-05, 1.2762844562530518e-05, 1.5330500900745392e-05, 1.7898157238960266e-05, 2.046581357717514e-05, 2.3033469915390015e-05, 2.560112625360489e-05, 2.8168782591819763e-05, 3.073643893003464e-05, 3.330409526824951e-05, 3.5871751606464386e-05, 3.843940794467926e-05, 4.1007064282894135e-05, 4.357472062110901e-05, 4.614237695932388e-05, 4.871003329753876e-05, 5.127768963575363e-05, 5.3845345973968506e-05, 5.641300231218338e-05, 5.8980658650398254e-05, 6.154831498861313e-05, 6.4115971326828e-05, 6.668362766504288e-05, 6.925128400325775e-05, 7.181894034147263e-05, 7.43865966796875e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 14.0, 15.0, 17.0, 41.0, 48.0, 78.0, 115.0, 194.0, 320.0, 547.0, 923.0, 1686.0, 2858.0, 5007.0, 8844.0, 16352.0, 29952.0, 54669.0, 95448.0, 149309.0, 191156.0, 182059.0, 129897.0, 79474.0, 44862.0, 24543.0, 13418.0, 7226.0, 4082.0, 2218.0, 1272.0, 753.0, 475.0, 264.0, 153.0, 86.0, 62.0, 43.0, 26.0, 19.0, 11.0, 6.0, 10.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.162109375, -1.126708984375, -1.09130859375, -1.055908203125, -1.0205078125, -0.985107421875, -0.94970703125, -0.914306640625, -0.87890625, -0.843505859375, -0.80810546875, -0.772705078125, -0.7373046875, -0.701904296875, -0.66650390625, -0.631103515625, -0.595703125, -0.560302734375, -0.52490234375, -0.489501953125, -0.4541015625, -0.418701171875, -0.38330078125, -0.347900390625, -0.3125, -0.277099609375, -0.24169921875, -0.206298828125, -0.1708984375, -0.135498046875, -0.10009765625, -0.064697265625, -0.029296875, 0.006103515625, 0.04150390625, 0.076904296875, 0.1123046875, 0.147705078125, 0.18310546875, 0.218505859375, 0.25390625, 0.289306640625, 0.32470703125, 0.360107421875, 0.3955078125, 0.430908203125, 0.46630859375, 0.501708984375, 0.537109375, 0.572509765625, 0.60791015625, 0.643310546875, 0.6787109375, 0.714111328125, 0.74951171875, 0.784912109375, 0.8203125, 0.855712890625, 0.89111328125, 0.926513671875, 0.9619140625, 0.997314453125, 1.03271484375, 1.068115234375, 1.103515625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 12.0, 9.0, 9.0, 16.0, 20.0, 19.0, 32.0, 41.0, 35.0, 42.0, 62.0, 67.0, 66.0, 64.0, 78.0, 79.0, 46.0, 47.0, 47.0, 41.0, 40.0, 27.0, 24.0, 14.0, 13.0, 8.0, 12.0, 8.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.58642578125, -0.571807861328125, -0.55718994140625, -0.542572021484375, -0.5279541015625, -0.513336181640625, -0.49871826171875, -0.484100341796875, -0.469482421875, -0.454864501953125, -0.44024658203125, -0.425628662109375, -0.4110107421875, -0.396392822265625, -0.38177490234375, -0.367156982421875, -0.3525390625, -0.337921142578125, -0.32330322265625, -0.308685302734375, -0.2940673828125, -0.279449462890625, -0.26483154296875, -0.250213623046875, -0.235595703125, -0.220977783203125, -0.20635986328125, -0.191741943359375, -0.1771240234375, -0.162506103515625, -0.14788818359375, -0.133270263671875, -0.11865234375, -0.104034423828125, -0.08941650390625, -0.074798583984375, -0.0601806640625, -0.045562744140625, -0.03094482421875, -0.016326904296875, -0.001708984375, 0.012908935546875, 0.02752685546875, 0.042144775390625, 0.0567626953125, 0.071380615234375, 0.08599853515625, 0.100616455078125, 0.115234375, 0.129852294921875, 0.14447021484375, 0.159088134765625, 0.1737060546875, 0.188323974609375, 0.20294189453125, 0.217559814453125, 0.232177734375, 0.246795654296875, 0.26141357421875, 0.276031494140625, 0.2906494140625, 0.305267333984375, 0.31988525390625, 0.334503173828125, 0.34912109375]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 8.0, 6.0, 8.0, 9.0, 14.0, 23.0, 24.0, 18.0, 36.0, 37.0, 49.0, 61.0, 66.0, 65.0, 71.0, 83.0, 75.0, 70.0, 54.0, 34.0, 42.0, 31.0, 18.0, 25.0, 14.0, 8.0, 13.0, 8.0, 6.0, 9.0, 2.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.714995861053467, -4.561918258666992, -4.408840179443359, -4.255762100219727, -4.102684497833252, -3.9496066570281982, -3.7965288162231445, -3.643450975418091, -3.490373134613037, -3.3372952938079834, -3.1842174530029297, -3.031139612197876, -2.8780617713928223, -2.7249839305877686, -2.571906089782715, -2.418828248977661, -2.2657504081726074, -2.1126725673675537, -1.9595947265625, -1.8065168857574463, -1.6534390449523926, -1.5003612041473389, -1.3472833633422852, -1.1942055225372314, -1.0411276817321777, -0.888049840927124, -0.7349720001220703, -0.5818941593170166, -0.4288163185119629, -0.2757384777069092, -0.12266063690185547, 0.030417203903198242, 0.18349552154541016, 0.33657336235046387, 0.4896512031555176, 0.6427290439605713, 0.795806884765625, 0.9488847255706787, 1.1019625663757324, 1.2550404071807861, 1.4081182479858398, 1.5611960887908936, 1.7142739295959473, 1.867351770401001, 2.0204296112060547, 2.1735074520111084, 2.326585292816162, 2.479663133621216, 2.6327409744262695, 2.7858188152313232, 2.938896656036377, 3.0919744968414307, 3.2450523376464844, 3.398130178451538, 3.551208019256592, 3.7042858600616455, 3.857363700866699, 4.010441780090332, 4.163519382476807, 4.316596984863281, 4.469675064086914, 4.622753143310547, 4.7758307456970215, 4.928908348083496, 5.081986427307129]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 9.0, 10.0, 8.0, 8.0, 14.0, 20.0, 19.0, 22.0, 17.0, 19.0, 22.0, 38.0, 26.0, 35.0, 37.0, 40.0, 42.0, 50.0, 53.0, 39.0, 42.0, 52.0, 41.0, 41.0, 30.0, 24.0, 33.0, 33.0, 33.0, 21.0, 19.0, 7.0, 10.0, 15.0, 14.0, 8.0, 14.0, 8.0, 8.0, 3.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.30297327041626, -4.173262596130371, -4.043551445007324, -3.9138407707214355, -3.784130096435547, -3.654419422149658, -3.5247085094451904, -3.3949975967407227, -3.265286922454834, -3.1355762481689453, -3.0058653354644775, -2.8761544227600098, -2.746443748474121, -2.6167330741882324, -2.4870221614837646, -2.357311248779297, -2.227600574493408, -2.0978899002075195, -1.9681789875030518, -1.8384681940078735, -1.7087574005126953, -1.579046607017517, -1.4493358135223389, -1.3196250200271606, -1.1899142265319824, -1.0602034330368042, -0.930492639541626, -0.8007818460464478, -0.6710710525512695, -0.5413602590560913, -0.4116494655609131, -0.28193867206573486, -0.15222740173339844, -0.022516608238220215, 0.10719418525695801, 0.23690497875213623, 0.36661577224731445, 0.4963265657424927, 0.6260373592376709, 0.7557481527328491, 0.8854589462280273, 1.0151697397232056, 1.1448805332183838, 1.274591326713562, 1.4043021202087402, 1.5340129137039185, 1.6637237071990967, 1.793434500694275, 1.9231452941894531, 2.052855968475342, 2.1825668811798096, 2.3122777938842773, 2.441988468170166, 2.5716991424560547, 2.7014100551605225, 2.8311209678649902, 2.960831642150879, 3.0905423164367676, 3.2202532291412354, 3.349964141845703, 3.479674816131592, 3.6093854904174805, 3.7390964031219482, 3.868807315826416, 3.9985179901123047]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 14.0, 12.0, 25.0, 37.0, 68.0, 76.0, 114.0, 191.0, 276.0, 448.0, 692.0, 1036.0, 1637.0, 2518.0, 4025.0, 6494.0, 10661.0, 18377.0, 32781.0, 62336.0, 123115.0, 256209.0, 545473.0, 981280.0, 1011209.0, 584224.0, 274628.0, 130390.0, 65423.0, 33971.0, 18644.0, 10670.0, 6326.0, 3882.0, 2447.0, 1564.0, 995.0, 658.0, 473.0, 308.0, 177.0, 121.0, 94.0, 60.0, 42.0, 29.0, 18.0, 5.0, 9.0, 10.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.42578125, -4.283203125, -4.140625, -3.998046875, -3.85546875, -3.712890625, -3.5703125, -3.427734375, -3.28515625, -3.142578125, -3.0, -2.857421875, -2.71484375, -2.572265625, -2.4296875, -2.287109375, -2.14453125, -2.001953125, -1.859375, -1.716796875, -1.57421875, -1.431640625, -1.2890625, -1.146484375, -1.00390625, -0.861328125, -0.71875, -0.576171875, -0.43359375, -0.291015625, -0.1484375, -0.005859375, 0.13671875, 0.279296875, 0.421875, 0.564453125, 0.70703125, 0.849609375, 0.9921875, 1.134765625, 1.27734375, 1.419921875, 1.5625, 1.705078125, 1.84765625, 1.990234375, 2.1328125, 2.275390625, 2.41796875, 2.560546875, 2.703125, 2.845703125, 2.98828125, 3.130859375, 3.2734375, 3.416015625, 3.55859375, 3.701171875, 3.84375, 3.986328125, 4.12890625, 4.271484375, 4.4140625, 4.556640625, 4.69921875]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 7.0, 9.0, 7.0, 15.0, 13.0, 17.0, 17.0, 20.0, 25.0, 26.0, 28.0, 34.0, 28.0, 46.0, 48.0, 41.0, 44.0, 44.0, 46.0, 55.0, 41.0, 33.0, 48.0, 25.0, 27.0, 33.0, 33.0, 35.0, 31.0, 14.0, 18.0, 14.0, 19.0, 9.0, 8.0, 10.0, 4.0, 9.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.953125, -2.85675048828125, -2.7603759765625, -2.66400146484375, -2.567626953125, -2.47125244140625, -2.3748779296875, -2.27850341796875, -2.18212890625, -2.08575439453125, -1.9893798828125, -1.89300537109375, -1.796630859375, -1.70025634765625, -1.6038818359375, -1.50750732421875, -1.4111328125, -1.31475830078125, -1.2183837890625, -1.12200927734375, -1.025634765625, -0.92926025390625, -0.8328857421875, -0.73651123046875, -0.64013671875, -0.54376220703125, -0.4473876953125, -0.35101318359375, -0.254638671875, -0.15826416015625, -0.0618896484375, 0.03448486328125, 0.130859375, 0.22723388671875, 0.3236083984375, 0.41998291015625, 0.516357421875, 0.61273193359375, 0.7091064453125, 0.80548095703125, 0.90185546875, 0.99822998046875, 1.0946044921875, 1.19097900390625, 1.287353515625, 1.38372802734375, 1.4801025390625, 1.57647705078125, 1.6728515625, 1.76922607421875, 1.8656005859375, 1.96197509765625, 2.058349609375, 2.15472412109375, 2.2510986328125, 2.34747314453125, 2.44384765625, 2.54022216796875, 2.6365966796875, 2.73297119140625, 2.829345703125, 2.92572021484375, 3.0220947265625, 3.11846923828125, 3.21484375]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 2.0, 6.0, 14.0, 18.0, 20.0, 35.0, 66.0, 108.0, 170.0, 259.0, 374.0, 601.0, 1030.0, 1857.0, 3243.0, 5729.0, 10956.0, 21725.0, 44250.0, 94868.0, 207912.0, 446322.0, 842419.0, 1060869.0, 744612.0, 377163.0, 172881.0, 79691.0, 37703.0, 18316.0, 9367.0, 5011.0, 2683.0, 1567.0, 922.0, 518.0, 331.0, 226.0, 148.0, 99.0, 78.0, 35.0, 28.0, 22.0, 11.0, 4.0, 5.0, 6.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08203125, -4.92010498046875, -4.7581787109375, -4.59625244140625, -4.434326171875, -4.27239990234375, -4.1104736328125, -3.94854736328125, -3.78662109375, -3.62469482421875, -3.4627685546875, -3.30084228515625, -3.138916015625, -2.97698974609375, -2.8150634765625, -2.65313720703125, -2.4912109375, -2.32928466796875, -2.1673583984375, -2.00543212890625, -1.843505859375, -1.68157958984375, -1.5196533203125, -1.35772705078125, -1.19580078125, -1.03387451171875, -0.8719482421875, -0.71002197265625, -0.548095703125, -0.38616943359375, -0.2242431640625, -0.06231689453125, 0.099609375, 0.26153564453125, 0.4234619140625, 0.58538818359375, 0.747314453125, 0.90924072265625, 1.0711669921875, 1.23309326171875, 1.39501953125, 1.55694580078125, 1.7188720703125, 1.88079833984375, 2.042724609375, 2.20465087890625, 2.3665771484375, 2.52850341796875, 2.6904296875, 2.85235595703125, 3.0142822265625, 3.17620849609375, 3.338134765625, 3.50006103515625, 3.6619873046875, 3.82391357421875, 3.98583984375, 4.14776611328125, 4.3096923828125, 4.47161865234375, 4.633544921875, 4.79547119140625, 4.9573974609375, 5.11932373046875, 5.28125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 5.0, 5.0, 7.0, 11.0, 16.0, 22.0, 32.0, 42.0, 70.0, 66.0, 88.0, 95.0, 137.0, 144.0, 191.0, 241.0, 269.0, 249.0, 276.0, 270.0, 272.0, 279.0, 213.0, 199.0, 179.0, 122.0, 110.0, 95.0, 88.0, 59.0, 51.0, 33.0, 29.0, 18.0, 16.0, 15.0, 9.0, 7.0, 6.0, 6.0, 4.0, 6.0, 9.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4033203125, -1.3482513427734375, -1.293182373046875, -1.2381134033203125, -1.18304443359375, -1.1279754638671875, -1.072906494140625, -1.0178375244140625, -0.9627685546875, -0.9076995849609375, -0.852630615234375, -0.7975616455078125, -0.74249267578125, -0.6874237060546875, -0.632354736328125, -0.5772857666015625, -0.522216796875, -0.4671478271484375, -0.412078857421875, -0.3570098876953125, -0.30194091796875, -0.2468719482421875, -0.191802978515625, -0.1367340087890625, -0.0816650390625, -0.0265960693359375, 0.028472900390625, 0.0835418701171875, 0.13861083984375, 0.1936798095703125, 0.248748779296875, 0.3038177490234375, 0.35888671875, 0.4139556884765625, 0.469024658203125, 0.5240936279296875, 0.57916259765625, 0.6342315673828125, 0.689300537109375, 0.7443695068359375, 0.7994384765625, 0.8545074462890625, 0.909576416015625, 0.9646453857421875, 1.01971435546875, 1.0747833251953125, 1.129852294921875, 1.1849212646484375, 1.239990234375, 1.2950592041015625, 1.350128173828125, 1.4051971435546875, 1.46026611328125, 1.5153350830078125, 1.570404052734375, 1.6254730224609375, 1.6805419921875, 1.7356109619140625, 1.790679931640625, 1.8457489013671875, 1.90081787109375, 1.9558868408203125, 2.010955810546875, 2.0660247802734375, 2.12109375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 8.0, 0.0, 3.0, 9.0, 13.0, 8.0, 10.0, 17.0, 13.0, 17.0, 18.0, 35.0, 36.0, 47.0, 49.0, 70.0, 55.0, 64.0, 77.0, 63.0, 60.0, 70.0, 34.0, 41.0, 35.0, 28.0, 14.0, 16.0, 12.0, 11.0, 14.0, 15.0, 10.0, 10.0, 5.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.917079925537109, -4.765730857849121, -4.614381790161133, -4.4630327224731445, -4.311683654785156, -4.16033411026001, -4.0089850425720215, -3.857635974884033, -3.706286907196045, -3.5549378395080566, -3.4035887718200684, -3.252239465713501, -3.1008903980255127, -2.9495413303375244, -2.798192024230957, -2.6468429565429688, -2.4954938888549805, -2.344144821166992, -2.192795753479004, -2.0414464473724365, -1.8900973796844482, -1.73874831199646, -1.5873991250991821, -1.4360499382019043, -1.284700870513916, -1.1333518028259277, -0.9820026159286499, -0.8306534886360168, -0.6793043613433838, -0.5279552340507507, -0.3766061067581177, -0.22525691986083984, -0.07390832901000977, 0.07744079828262329, 0.22878992557525635, 0.3801390528678894, 0.5314881801605225, 0.6828373074531555, 0.8341864347457886, 0.9855356216430664, 1.1368846893310547, 1.288233757019043, 1.4395829439163208, 1.5909321308135986, 1.742281198501587, 1.8936302661895752, 2.0449795722961426, 2.196328639984131, 2.347677707672119, 2.4990267753601074, 2.6503758430480957, 2.801725149154663, 2.9530742168426514, 3.1044232845306396, 3.255772590637207, 3.4071216583251953, 3.5584707260131836, 3.709819793701172, 3.86116886138916, 4.012517929077148, 4.163866996765137, 4.315216541290283, 4.4665656089782715, 4.61791467666626, 4.769263744354248]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 0.0, 3.0, 3.0, 4.0, 13.0, 3.0, 9.0, 10.0, 24.0, 12.0, 16.0, 14.0, 30.0, 26.0, 17.0, 38.0, 28.0, 40.0, 44.0, 37.0, 51.0, 44.0, 35.0, 44.0, 60.0, 45.0, 36.0, 32.0, 41.0, 34.0, 30.0, 26.0, 13.0, 18.0, 26.0, 23.0, 21.0, 11.0, 8.0, 10.0, 4.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-5.268864631652832, -5.125741958618164, -4.982618808746338, -4.83949613571167, -4.696372985839844, -4.553250312805176, -4.41012716293335, -4.267004489898682, -4.1238813400268555, -3.9807584285736084, -3.8376355171203613, -3.6945126056671143, -3.551389694213867, -3.40826678276062, -3.265143871307373, -3.122021198272705, -2.978898286819458, -2.835775375366211, -2.692652463912964, -2.549529552459717, -2.4064066410064697, -2.2632837295532227, -2.1201610565185547, -1.977038025856018, -1.833915114402771, -1.690792202949524, -1.5476692914962769, -1.4045464992523193, -1.2614235877990723, -1.1183006763458252, -0.9751777648925781, -0.832054853439331, -0.6889317035675049, -0.5458087921142578, -0.40268591046333313, -0.25956302881240845, -0.11644011735916138, 0.026682794094085693, 0.169805645942688, 0.31292855739593506, 0.45605146884918213, 0.5991743803024292, 0.7422972917556763, 0.8854201436042786, 1.0285429954528809, 1.171665906906128, 1.314788818359375, 1.457911729812622, 1.6010346412658691, 1.7441575527191162, 1.8872804641723633, 2.0304033756256104, 2.1735262870788574, 2.3166491985321045, 2.4597721099853516, 2.6028947830200195, 2.7460179328918457, 2.8891408443450928, 3.03226375579834, 3.175386667251587, 3.318509578704834, 3.461632490158081, 3.604755401611328, 3.747878074645996, 3.891000986099243]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 7.0, 8.0, 12.0, 16.0, 30.0, 51.0, 54.0, 95.0, 214.0, 283.0, 433.0, 813.0, 1392.0, 2307.0, 4210.0, 7657.0, 14274.0, 27646.0, 55179.0, 129488.0, 332814.0, 271676.0, 102843.0, 46269.0, 23241.0, 12256.0, 6553.0, 3687.0, 2063.0, 1213.0, 670.0, 418.0, 232.0, 167.0, 123.0, 52.0, 36.0, 33.0, 15.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7314453125, -1.673492431640625, -1.61553955078125, -1.557586669921875, -1.4996337890625, -1.441680908203125, -1.38372802734375, -1.325775146484375, -1.267822265625, -1.209869384765625, -1.15191650390625, -1.093963623046875, -1.0360107421875, -0.978057861328125, -0.92010498046875, -0.862152099609375, -0.80419921875, -0.746246337890625, -0.68829345703125, -0.630340576171875, -0.5723876953125, -0.514434814453125, -0.45648193359375, -0.398529052734375, -0.340576171875, -0.282623291015625, -0.22467041015625, -0.166717529296875, -0.1087646484375, -0.050811767578125, 0.00714111328125, 0.065093994140625, 0.123046875, 0.180999755859375, 0.23895263671875, 0.296905517578125, 0.3548583984375, 0.412811279296875, 0.47076416015625, 0.528717041015625, 0.586669921875, 0.644622802734375, 0.70257568359375, 0.760528564453125, 0.8184814453125, 0.876434326171875, 0.93438720703125, 0.992340087890625, 1.05029296875, 1.108245849609375, 1.16619873046875, 1.224151611328125, 1.2821044921875, 1.340057373046875, 1.39801025390625, 1.455963134765625, 1.513916015625, 1.571868896484375, 1.62982177734375, 1.687774658203125, 1.7457275390625, 1.803680419921875, 1.86163330078125, 1.919586181640625, 1.9775390625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 8.0, 8.0, 5.0, 13.0, 6.0, 14.0, 15.0, 23.0, 29.0, 16.0, 34.0, 30.0, 26.0, 34.0, 40.0, 42.0, 49.0, 55.0, 45.0, 52.0, 60.0, 38.0, 48.0, 45.0, 33.0, 35.0, 30.0, 31.0, 24.0, 29.0, 9.0, 18.0, 12.0, 13.0, 10.0, 7.0, 5.0, 5.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-6.09765625, -5.9368896484375, -5.776123046875, -5.6153564453125, -5.45458984375, -5.2938232421875, -5.133056640625, -4.9722900390625, -4.8115234375, -4.6507568359375, -4.489990234375, -4.3292236328125, -4.16845703125, -4.0076904296875, -3.846923828125, -3.6861572265625, -3.525390625, -3.3646240234375, -3.203857421875, -3.0430908203125, -2.88232421875, -2.7215576171875, -2.560791015625, -2.4000244140625, -2.2392578125, -2.0784912109375, -1.917724609375, -1.7569580078125, -1.59619140625, -1.4354248046875, -1.274658203125, -1.1138916015625, -0.953125, -0.7923583984375, -0.631591796875, -0.4708251953125, -0.31005859375, -0.1492919921875, 0.011474609375, 0.1722412109375, 0.3330078125, 0.4937744140625, 0.654541015625, 0.8153076171875, 0.97607421875, 1.1368408203125, 1.297607421875, 1.4583740234375, 1.619140625, 1.7799072265625, 1.940673828125, 2.1014404296875, 2.26220703125, 2.4229736328125, 2.583740234375, 2.7445068359375, 2.9052734375, 3.0660400390625, 3.226806640625, 3.3875732421875, 3.54833984375, 3.7091064453125, 3.869873046875, 4.0306396484375, 4.19140625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 8.0, 3.0, 3.0, 6.0, 4.0, 13.0, 16.0, 16.0, 21.0, 37.0, 35.0, 69.0, 80.0, 107.0, 151.0, 205.0, 318.0, 432.0, 658.0, 1070.0, 1966.0, 4020.0, 10470.0, 33420.0, 926039.0, 45870.0, 12812.0, 4873.0, 2330.0, 1190.0, 701.0, 479.0, 322.0, 217.0, 172.0, 107.0, 70.0, 63.0, 41.0, 46.0, 24.0, 23.0, 18.0, 12.0, 6.0, 4.0, 2.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-4.51171875, -4.37335205078125, -4.2349853515625, -4.09661865234375, -3.958251953125, -3.81988525390625, -3.6815185546875, -3.54315185546875, -3.40478515625, -3.26641845703125, -3.1280517578125, -2.98968505859375, -2.851318359375, -2.71295166015625, -2.5745849609375, -2.43621826171875, -2.2978515625, -2.15948486328125, -2.0211181640625, -1.88275146484375, -1.744384765625, -1.60601806640625, -1.4676513671875, -1.32928466796875, -1.19091796875, -1.05255126953125, -0.9141845703125, -0.77581787109375, -0.637451171875, -0.49908447265625, -0.3607177734375, -0.22235107421875, -0.083984375, 0.05438232421875, 0.1927490234375, 0.33111572265625, 0.469482421875, 0.60784912109375, 0.7462158203125, 0.88458251953125, 1.02294921875, 1.16131591796875, 1.2996826171875, 1.43804931640625, 1.576416015625, 1.71478271484375, 1.8531494140625, 1.99151611328125, 2.1298828125, 2.26824951171875, 2.4066162109375, 2.54498291015625, 2.683349609375, 2.82171630859375, 2.9600830078125, 3.09844970703125, 3.23681640625, 3.37518310546875, 3.5135498046875, 3.65191650390625, 3.790283203125, 3.92864990234375, 4.0670166015625, 4.20538330078125, 4.34375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 3.0, 7.0, 5.0, 11.0, 10.0, 14.0, 22.0, 18.0, 28.0, 40.0, 29.0, 30.0, 35.0, 46.0, 43.0, 54.0, 60.0, 60.0, 46.0, 47.0, 47.0, 45.0, 45.0, 36.0, 36.0, 24.0, 22.0, 26.0, 19.0, 20.0, 20.0, 11.0, 9.0, 9.0, 7.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.287109375, -3.185028076171875, -3.08294677734375, -2.980865478515625, -2.8787841796875, -2.776702880859375, -2.67462158203125, -2.572540283203125, -2.470458984375, -2.368377685546875, -2.26629638671875, -2.164215087890625, -2.0621337890625, -1.960052490234375, -1.85797119140625, -1.755889892578125, -1.65380859375, -1.551727294921875, -1.44964599609375, -1.347564697265625, -1.2454833984375, -1.143402099609375, -1.04132080078125, -0.939239501953125, -0.837158203125, -0.735076904296875, -0.63299560546875, -0.530914306640625, -0.4288330078125, -0.326751708984375, -0.22467041015625, -0.122589111328125, -0.0205078125, 0.081573486328125, 0.18365478515625, 0.285736083984375, 0.3878173828125, 0.489898681640625, 0.59197998046875, 0.694061279296875, 0.796142578125, 0.898223876953125, 1.00030517578125, 1.102386474609375, 1.2044677734375, 1.306549072265625, 1.40863037109375, 1.510711669921875, 1.61279296875, 1.714874267578125, 1.81695556640625, 1.919036865234375, 2.0211181640625, 2.123199462890625, 2.22528076171875, 2.327362060546875, 2.429443359375, 2.531524658203125, 2.63360595703125, 2.735687255859375, 2.8377685546875, 2.939849853515625, 3.04193115234375, 3.144012451171875, 3.24609375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 10.0, 10.0, 11.0, 17.0, 17.0, 28.0, 27.0, 38.0, 53.0, 79.0, 106.0, 148.0, 197.0, 282.0, 454.0, 653.0, 1005.0, 1710.0, 3325.0, 7299.0, 22032.0, 917439.0, 67214.0, 14348.0, 5419.0, 2586.0, 1404.0, 832.0, 521.0, 346.0, 250.0, 170.0, 137.0, 82.0, 75.0, 72.0, 40.0, 38.0, 28.0, 14.0, 12.0, 10.0, 6.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.284423828125, -0.2748908996582031, -0.26535797119140625, -0.2558250427246094, -0.2462921142578125, -0.23675918579101562, -0.22722625732421875, -0.21769332885742188, -0.208160400390625, -0.19862747192382812, -0.18909454345703125, -0.17956161499023438, -0.1700286865234375, -0.16049575805664062, -0.15096282958984375, -0.14142990112304688, -0.13189697265625, -0.12236404418945312, -0.11283111572265625, -0.10329818725585938, -0.0937652587890625, -0.08423233032226562, -0.07469940185546875, -0.06516647338867188, -0.055633544921875, -0.046100616455078125, -0.03656768798828125, -0.027034759521484375, -0.0175018310546875, -0.007968902587890625, 0.00156402587890625, 0.011096954345703125, 0.0206298828125, 0.030162811279296875, 0.03969573974609375, 0.049228668212890625, 0.0587615966796875, 0.06829452514648438, 0.07782745361328125, 0.08736038208007812, 0.096893310546875, 0.10642623901367188, 0.11595916748046875, 0.12549209594726562, 0.1350250244140625, 0.14455795288085938, 0.15409088134765625, 0.16362380981445312, 0.17315673828125, 0.18268966674804688, 0.19222259521484375, 0.20175552368164062, 0.2112884521484375, 0.22082138061523438, 0.23035430908203125, 0.23988723754882812, 0.249420166015625, 0.2589530944824219, 0.26848602294921875, 0.2780189514160156, 0.2875518798828125, 0.2970848083496094, 0.30661773681640625, 0.3161506652832031, 0.32568359375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 0.0, 8.0, 8.0, 9.0, 8.0, 18.0, 15.0, 22.0, 19.0, 23.0, 43.0, 41.0, 35.0, 52.0, 51.0, 51.0, 54.0, 61.0, 57.0, 59.0, 47.0, 56.0, 39.0, 33.0, 33.0, 28.0, 28.0, 17.0, 15.0, 14.0, 16.0, 9.0, 6.0, 7.0, 2.0, 6.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.607439041137695e-05, -4.4704414904117584e-05, -4.3334439396858215e-05, -4.1964463889598846e-05, -4.059448838233948e-05, -3.922451287508011e-05, -3.785453736782074e-05, -3.648456186056137e-05, -3.5114586353302e-05, -3.374461084604263e-05, -3.2374635338783264e-05, -3.1004659831523895e-05, -2.9634684324264526e-05, -2.8264708817005157e-05, -2.689473330974579e-05, -2.552475780248642e-05, -2.415478229522705e-05, -2.2784806787967682e-05, -2.1414831280708313e-05, -2.0044855773448944e-05, -1.8674880266189575e-05, -1.7304904758930206e-05, -1.5934929251670837e-05, -1.4564953744411469e-05, -1.31949782371521e-05, -1.182500272989273e-05, -1.0455027222633362e-05, -9.085051715373993e-06, -7.715076208114624e-06, -6.345100700855255e-06, -4.975125193595886e-06, -3.6051496863365173e-06, -2.2351741790771484e-06, -8.651986718177795e-07, 5.047768354415894e-07, 1.8747523427009583e-06, 3.244727849960327e-06, 4.614703357219696e-06, 5.984678864479065e-06, 7.354654371738434e-06, 8.724629878997803e-06, 1.0094605386257172e-05, 1.146458089351654e-05, 1.283455640077591e-05, 1.4204531908035278e-05, 1.5574507415294647e-05, 1.6944482922554016e-05, 1.8314458429813385e-05, 1.9684433937072754e-05, 2.1054409444332123e-05, 2.2424384951591492e-05, 2.379436045885086e-05, 2.516433596611023e-05, 2.65343114733696e-05, 2.7904286980628967e-05, 2.9274262487888336e-05, 3.0644237995147705e-05, 3.2014213502407074e-05, 3.338418900966644e-05, 3.475416451692581e-05, 3.612414002418518e-05, 3.749411553144455e-05, 3.886409103870392e-05, 4.023406654596329e-05, 4.1604042053222656e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 11.0, 12.0, 23.0, 25.0, 31.0, 44.0, 69.0, 106.0, 147.0, 228.0, 352.0, 521.0, 800.0, 1240.0, 1871.0, 2987.0, 4967.0, 8258.0, 13874.0, 24626.0, 45102.0, 91216.0, 217396.0, 329187.0, 152648.0, 68762.0, 35123.0, 19450.0, 11510.0, 6645.0, 4196.0, 2503.0, 1574.0, 1030.0, 683.0, 437.0, 293.0, 205.0, 134.0, 82.0, 69.0, 28.0, 26.0, 22.0, 14.0, 13.0, 10.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1005859375, -0.09737300872802734, -0.09416007995605469, -0.09094715118408203, -0.08773422241210938, -0.08452129364013672, -0.08130836486816406, -0.0780954360961914, -0.07488250732421875, -0.0716695785522461, -0.06845664978027344, -0.06524372100830078, -0.062030792236328125, -0.05881786346435547, -0.05560493469238281, -0.052392005920410156, -0.0491790771484375, -0.045966148376464844, -0.04275321960449219, -0.03954029083251953, -0.036327362060546875, -0.03311443328857422, -0.029901504516601562, -0.026688575744628906, -0.02347564697265625, -0.020262718200683594, -0.017049789428710938, -0.013836860656738281, -0.010623931884765625, -0.007411003112792969, -0.0041980743408203125, -0.0009851455688476562, 0.002227783203125, 0.005440711975097656, 0.008653640747070312, 0.011866569519042969, 0.015079498291015625, 0.01829242706298828, 0.021505355834960938, 0.024718284606933594, 0.02793121337890625, 0.031144142150878906, 0.03435707092285156, 0.03756999969482422, 0.040782928466796875, 0.04399585723876953, 0.04720878601074219, 0.050421714782714844, 0.0536346435546875, 0.056847572326660156, 0.06006050109863281, 0.06327342987060547, 0.06648635864257812, 0.06969928741455078, 0.07291221618652344, 0.0761251449584961, 0.07933807373046875, 0.0825510025024414, 0.08576393127441406, 0.08897686004638672, 0.09218978881835938, 0.09540271759033203, 0.09861564636230469, 0.10182857513427734, 0.10504150390625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 3.0, 5.0, 10.0, 14.0, 12.0, 19.0, 24.0, 34.0, 37.0, 54.0, 94.0, 165.0, 170.0, 91.0, 73.0, 47.0, 31.0, 24.0, 17.0, 8.0, 11.0, 11.0, 9.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03790283203125, -0.036595821380615234, -0.03528881072998047, -0.0339818000793457, -0.03267478942871094, -0.03136777877807617, -0.030060768127441406, -0.02875375747680664, -0.027446746826171875, -0.02613973617553711, -0.024832725524902344, -0.023525714874267578, -0.022218704223632812, -0.020911693572998047, -0.01960468292236328, -0.018297672271728516, -0.01699066162109375, -0.015683650970458984, -0.014376640319824219, -0.013069629669189453, -0.011762619018554688, -0.010455608367919922, -0.009148597717285156, -0.00784158706665039, -0.006534576416015625, -0.005227565765380859, -0.003920555114746094, -0.002613544464111328, -0.0013065338134765625, 4.76837158203125e-07, 0.0013074874877929688, 0.0026144981384277344, 0.0039215087890625, 0.005228519439697266, 0.006535530090332031, 0.007842540740966797, 0.009149551391601562, 0.010456562042236328, 0.011763572692871094, 0.01307058334350586, 0.014377593994140625, 0.01568460464477539, 0.016991615295410156, 0.018298625946044922, 0.019605636596679688, 0.020912647247314453, 0.02221965789794922, 0.023526668548583984, 0.02483367919921875, 0.026140689849853516, 0.02744770050048828, 0.028754711151123047, 0.030061721801757812, 0.03136873245239258, 0.032675743103027344, 0.03398275375366211, 0.035289764404296875, 0.03659677505493164, 0.037903785705566406, 0.03921079635620117, 0.04051780700683594, 0.0418248176574707, 0.04313182830810547, 0.044438838958740234, 0.045745849609375]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 2.0, 9.0, 13.0, 8.0, 7.0, 20.0, 10.0, 15.0, 16.0, 33.0, 42.0, 39.0, 49.0, 51.0, 69.0, 60.0, 65.0, 71.0, 65.0, 62.0, 45.0, 35.0, 41.0, 33.0, 17.0, 19.0, 10.0, 20.0, 11.0, 15.0, 9.0, 8.0, 8.0, 5.0, 4.0, 1.0, 6.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.766502380371094, -4.616898059844971, -4.467293739318848, -4.317689418792725, -4.168085098266602, -4.01848030090332, -3.8688762187957764, -3.719271659851074, -3.569667339324951, -3.420063018798828, -3.270458698272705, -3.120854377746582, -2.97124981880188, -2.821645498275757, -2.672041177749634, -2.5224366188049316, -2.3728325366973877, -2.2232282161712646, -2.0736238956451416, -1.924019455909729, -1.7744150161743164, -1.6248106956481934, -1.4752063751220703, -1.3256019353866577, -1.1759976148605347, -1.0263932943344116, -0.876788854598999, -0.727184534072876, -0.5775801539421082, -0.42797577381134033, -0.2783714532852173, -0.1287670135498047, 0.02083730697631836, 0.170441672205925, 0.3200460374355316, 0.46965038776397705, 0.6192547678947449, 0.7688591480255127, 0.9184634685516357, 1.0680679082870483, 1.2176722288131714, 1.3672765493392944, 1.516880989074707, 1.66648530960083, 1.8160896301269531, 1.9656940698623657, 2.115298271179199, 2.2649028301239014, 2.4145071506500244, 2.5641114711761475, 2.7137157917022705, 2.8633203506469727, 3.0129246711730957, 3.1625289916992188, 3.312133312225342, 3.461737632751465, 3.611341953277588, 3.760946273803711, 3.910550594329834, 4.060154914855957, 4.20975923538208, 4.359363555908203, 4.508968353271484, 4.658572673797607, 4.8081769943237305]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 3.0, 4.0, 13.0, 4.0, 9.0, 10.0, 25.0, 12.0, 14.0, 16.0, 30.0, 25.0, 16.0, 42.0, 28.0, 39.0, 42.0, 39.0, 53.0, 41.0, 34.0, 44.0, 61.0, 46.0, 34.0, 36.0, 39.0, 32.0, 29.0, 27.0, 14.0, 20.0, 27.0, 18.0, 21.0, 11.0, 8.0, 11.0, 4.0, 4.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-5.213376522064209, -5.0708394050598145, -4.928301811218262, -4.785764694213867, -4.643227577209473, -4.500690460205078, -4.358152866363525, -4.215615749359131, -4.073078155517578, -3.9305408000946045, -3.78800368309021, -3.6454663276672363, -3.502929210662842, -3.360391855239868, -3.2178544998168945, -3.0753173828125, -2.9327802658081055, -2.790242910385132, -2.6477057933807373, -2.5051684379577637, -2.362631320953369, -2.2200939655303955, -2.077556610107422, -1.9350193738937378, -1.7924821376800537, -1.6499449014663696, -1.5074076652526855, -1.364870309829712, -1.2223330736160278, -1.0797958374023438, -0.9372585415840149, -0.794721245765686, -0.652184009552002, -0.5096467733383179, -0.367109477519989, -0.22457221150398254, -0.08203494548797607, 0.06050229072570801, 0.20303958654403687, 0.3455768823623657, 0.4881141185760498, 0.6306513547897339, 0.7731886506080627, 0.9157259464263916, 1.0582631826400757, 1.2008004188537598, 1.3433377742767334, 1.4858750104904175, 1.6284122467041016, 1.7709494829177856, 1.9134867191314697, 2.0560240745544434, 2.198561191558838, 2.3410985469818115, 2.483635902404785, 2.6261730194091797, 2.7687103748321533, 2.911247730255127, 3.0537848472595215, 3.196322202682495, 3.3388595581054688, 3.4813966751098633, 3.623934030532837, 3.7664713859558105, 3.909008502960205]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 21.0, 20.0, 22.0, 37.0, 62.0, 102.0, 128.0, 191.0, 324.0, 470.0, 659.0, 991.0, 1780.0, 2772.0, 4377.0, 7079.0, 11563.0, 19668.0, 33719.0, 58502.0, 100757.0, 159489.0, 199235.0, 171670.0, 113521.0, 66888.0, 38444.0, 22160.0, 12851.0, 7874.0, 4857.0, 3064.0, 1846.0, 1158.0, 810.0, 449.0, 332.0, 204.0, 163.0, 89.0, 65.0, 30.0, 28.0, 22.0, 18.0, 13.0, 9.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.66796875, -3.54815673828125, -3.4283447265625, -3.30853271484375, -3.188720703125, -3.06890869140625, -2.9490966796875, -2.82928466796875, -2.70947265625, -2.58966064453125, -2.4698486328125, -2.35003662109375, -2.230224609375, -2.11041259765625, -1.9906005859375, -1.87078857421875, -1.7509765625, -1.63116455078125, -1.5113525390625, -1.39154052734375, -1.271728515625, -1.15191650390625, -1.0321044921875, -0.91229248046875, -0.79248046875, -0.67266845703125, -0.5528564453125, -0.43304443359375, -0.313232421875, -0.19342041015625, -0.0736083984375, 0.04620361328125, 0.166015625, 0.28582763671875, 0.4056396484375, 0.52545166015625, 0.645263671875, 0.76507568359375, 0.8848876953125, 1.00469970703125, 1.12451171875, 1.24432373046875, 1.3641357421875, 1.48394775390625, 1.603759765625, 1.72357177734375, 1.8433837890625, 1.96319580078125, 2.0830078125, 2.20281982421875, 2.3226318359375, 2.44244384765625, 2.562255859375, 2.68206787109375, 2.8018798828125, 2.92169189453125, 3.04150390625, 3.16131591796875, 3.2811279296875, 3.40093994140625, 3.520751953125, 3.64056396484375, 3.7603759765625, 3.88018798828125, 4.0]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 4.0, 4.0, 6.0, 8.0, 10.0, 13.0, 25.0, 16.0, 20.0, 25.0, 22.0, 30.0, 26.0, 32.0, 47.0, 49.0, 48.0, 38.0, 58.0, 56.0, 50.0, 48.0, 49.0, 39.0, 43.0, 28.0, 25.0, 37.0, 19.0, 25.0, 24.0, 21.0, 8.0, 13.0, 13.0, 7.0, 2.0, 6.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-5.69921875, -5.5419921875, -5.384765625, -5.2275390625, -5.0703125, -4.9130859375, -4.755859375, -4.5986328125, -4.44140625, -4.2841796875, -4.126953125, -3.9697265625, -3.8125, -3.6552734375, -3.498046875, -3.3408203125, -3.18359375, -3.0263671875, -2.869140625, -2.7119140625, -2.5546875, -2.3974609375, -2.240234375, -2.0830078125, -1.92578125, -1.7685546875, -1.611328125, -1.4541015625, -1.296875, -1.1396484375, -0.982421875, -0.8251953125, -0.66796875, -0.5107421875, -0.353515625, -0.1962890625, -0.0390625, 0.1181640625, 0.275390625, 0.4326171875, 0.58984375, 0.7470703125, 0.904296875, 1.0615234375, 1.21875, 1.3759765625, 1.533203125, 1.6904296875, 1.84765625, 2.0048828125, 2.162109375, 2.3193359375, 2.4765625, 2.6337890625, 2.791015625, 2.9482421875, 3.10546875, 3.2626953125, 3.419921875, 3.5771484375, 3.734375, 3.8916015625, 4.048828125, 4.2060546875, 4.36328125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 6.0, 4.0, 5.0, 19.0, 19.0, 40.0, 58.0, 94.0, 137.0, 177.0, 303.0, 497.0, 829.0, 1216.0, 2024.0, 3187.0, 4901.0, 8231.0, 13978.0, 23452.0, 39802.0, 67532.0, 109564.0, 155299.0, 178136.0, 156738.0, 111707.0, 69090.0, 41060.0, 23972.0, 14334.0, 8398.0, 5222.0, 3167.0, 1947.0, 1242.0, 753.0, 524.0, 315.0, 210.0, 125.0, 83.0, 56.0, 45.0, 20.0, 16.0, 6.0, 12.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.265625, -3.15863037109375, -3.0516357421875, -2.94464111328125, -2.837646484375, -2.73065185546875, -2.6236572265625, -2.51666259765625, -2.40966796875, -2.30267333984375, -2.1956787109375, -2.08868408203125, -1.981689453125, -1.87469482421875, -1.7677001953125, -1.66070556640625, -1.5537109375, -1.44671630859375, -1.3397216796875, -1.23272705078125, -1.125732421875, -1.01873779296875, -0.9117431640625, -0.80474853515625, -0.69775390625, -0.59075927734375, -0.4837646484375, -0.37677001953125, -0.269775390625, -0.16278076171875, -0.0557861328125, 0.05120849609375, 0.158203125, 0.26519775390625, 0.3721923828125, 0.47918701171875, 0.586181640625, 0.69317626953125, 0.8001708984375, 0.90716552734375, 1.01416015625, 1.12115478515625, 1.2281494140625, 1.33514404296875, 1.442138671875, 1.54913330078125, 1.6561279296875, 1.76312255859375, 1.8701171875, 1.97711181640625, 2.0841064453125, 2.19110107421875, 2.298095703125, 2.40509033203125, 2.5120849609375, 2.61907958984375, 2.72607421875, 2.83306884765625, 2.9400634765625, 3.04705810546875, 3.154052734375, 3.26104736328125, 3.3680419921875, 3.47503662109375, 3.58203125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 0.0, 5.0, 8.0, 7.0, 10.0, 6.0, 9.0, 17.0, 16.0, 13.0, 17.0, 14.0, 30.0, 25.0, 25.0, 26.0, 31.0, 36.0, 41.0, 36.0, 26.0, 55.0, 41.0, 30.0, 52.0, 37.0, 28.0, 49.0, 45.0, 29.0, 33.0, 31.0, 27.0, 23.0, 21.0, 16.0, 17.0, 10.0, 13.0, 16.0, 9.0, 4.0, 3.0, 3.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-2.40625, -2.332183837890625, -2.25811767578125, -2.184051513671875, -2.1099853515625, -2.035919189453125, -1.96185302734375, -1.887786865234375, -1.813720703125, -1.739654541015625, -1.66558837890625, -1.591522216796875, -1.5174560546875, -1.443389892578125, -1.36932373046875, -1.295257568359375, -1.22119140625, -1.147125244140625, -1.07305908203125, -0.998992919921875, -0.9249267578125, -0.850860595703125, -0.77679443359375, -0.702728271484375, -0.628662109375, -0.554595947265625, -0.48052978515625, -0.406463623046875, -0.3323974609375, -0.258331298828125, -0.18426513671875, -0.110198974609375, -0.0361328125, 0.037933349609375, 0.11199951171875, 0.186065673828125, 0.2601318359375, 0.334197998046875, 0.40826416015625, 0.482330322265625, 0.556396484375, 0.630462646484375, 0.70452880859375, 0.778594970703125, 0.8526611328125, 0.926727294921875, 1.00079345703125, 1.074859619140625, 1.14892578125, 1.222991943359375, 1.29705810546875, 1.371124267578125, 1.4451904296875, 1.519256591796875, 1.59332275390625, 1.667388916015625, 1.741455078125, 1.815521240234375, 1.88958740234375, 1.963653564453125, 2.0377197265625, 2.111785888671875, 2.18585205078125, 2.259918212890625, 2.333984375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 4.0, 7.0, 10.0, 16.0, 22.0, 29.0, 52.0, 82.0, 125.0, 218.0, 333.0, 478.0, 788.0, 1253.0, 2050.0, 3480.0, 5813.0, 10085.0, 18292.0, 32403.0, 57477.0, 97807.0, 150027.0, 186587.0, 175124.0, 125795.0, 77319.0, 44314.0, 25011.0, 13998.0, 7857.0, 4546.0, 2717.0, 1695.0, 1014.0, 602.0, 383.0, 271.0, 155.0, 102.0, 82.0, 52.0, 23.0, 19.0, 21.0, 7.0, 7.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.267578125, -1.2311248779296875, -1.194671630859375, -1.1582183837890625, -1.12176513671875, -1.0853118896484375, -1.048858642578125, -1.0124053955078125, -0.9759521484375, -0.9394989013671875, -0.903045654296875, -0.8665924072265625, -0.83013916015625, -0.7936859130859375, -0.757232666015625, -0.7207794189453125, -0.684326171875, -0.6478729248046875, -0.611419677734375, -0.5749664306640625, -0.53851318359375, -0.5020599365234375, -0.465606689453125, -0.4291534423828125, -0.3927001953125, -0.3562469482421875, -0.319793701171875, -0.2833404541015625, -0.24688720703125, -0.2104339599609375, -0.173980712890625, -0.1375274658203125, -0.10107421875, -0.0646209716796875, -0.028167724609375, 0.0082855224609375, 0.04473876953125, 0.0811920166015625, 0.117645263671875, 0.1540985107421875, 0.1905517578125, 0.2270050048828125, 0.263458251953125, 0.2999114990234375, 0.33636474609375, 0.3728179931640625, 0.409271240234375, 0.4457244873046875, 0.482177734375, 0.5186309814453125, 0.555084228515625, 0.5915374755859375, 0.62799072265625, 0.6644439697265625, 0.700897216796875, 0.7373504638671875, 0.7738037109375, 0.8102569580078125, 0.846710205078125, 0.8831634521484375, 0.91961669921875, 0.9560699462890625, 0.992523193359375, 1.0289764404296875, 1.0654296875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 8.0, 8.0, 8.0, 19.0, 17.0, 22.0, 30.0, 34.0, 37.0, 48.0, 51.0, 63.0, 53.0, 72.0, 53.0, 61.0, 61.0, 69.0, 49.0, 38.0, 42.0, 24.0, 29.0, 20.0, 15.0, 12.0, 9.0, 10.0, 8.0, 4.0, 7.0, 4.0, 7.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.465217590332031e-05, -9.18358564376831e-05, -8.90195369720459e-05, -8.620321750640869e-05, -8.338689804077148e-05, -8.057057857513428e-05, -7.775425910949707e-05, -7.493793964385986e-05, -7.212162017822266e-05, -6.930530071258545e-05, -6.648898124694824e-05, -6.367266178131104e-05, -6.085634231567383e-05, -5.804002285003662e-05, -5.5223703384399414e-05, -5.240738391876221e-05, -4.9591064453125e-05, -4.677474498748779e-05, -4.3958425521850586e-05, -4.114210605621338e-05, -3.832578659057617e-05, -3.5509467124938965e-05, -3.269314765930176e-05, -2.987682819366455e-05, -2.7060508728027344e-05, -2.4244189262390137e-05, -2.142786979675293e-05, -1.8611550331115723e-05, -1.5795230865478516e-05, -1.2978911399841309e-05, -1.0162591934204102e-05, -7.3462724685668945e-06, -4.5299530029296875e-06, -1.7136335372924805e-06, 1.1026859283447266e-06, 3.919005393981934e-06, 6.735324859619141e-06, 9.551644325256348e-06, 1.2367963790893555e-05, 1.5184283256530762e-05, 1.800060272216797e-05, 2.0816922187805176e-05, 2.3633241653442383e-05, 2.644956111907959e-05, 2.9265880584716797e-05, 3.2082200050354004e-05, 3.489851951599121e-05, 3.771483898162842e-05, 4.0531158447265625e-05, 4.334747791290283e-05, 4.616379737854004e-05, 4.8980116844177246e-05, 5.179643630981445e-05, 5.461275577545166e-05, 5.742907524108887e-05, 6.0245394706726074e-05, 6.306171417236328e-05, 6.587803363800049e-05, 6.86943531036377e-05, 7.15106725692749e-05, 7.432699203491211e-05, 7.714331150054932e-05, 7.995963096618652e-05, 8.277595043182373e-05, 8.559226989746094e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 10.0, 8.0, 15.0, 25.0, 32.0, 45.0, 74.0, 112.0, 170.0, 299.0, 493.0, 835.0, 1407.0, 2450.0, 4466.0, 7827.0, 14314.0, 25979.0, 46913.0, 81442.0, 130165.0, 175743.0, 184496.0, 147551.0, 96351.0, 56324.0, 31603.0, 17225.0, 9459.0, 5410.0, 2986.0, 1731.0, 1006.0, 598.0, 348.0, 228.0, 166.0, 94.0, 59.0, 34.0, 31.0, 15.0, 11.0, 7.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0146484375, -0.9786224365234375, -0.942596435546875, -0.9065704345703125, -0.87054443359375, -0.8345184326171875, -0.798492431640625, -0.7624664306640625, -0.7264404296875, -0.6904144287109375, -0.654388427734375, -0.6183624267578125, -0.58233642578125, -0.5463104248046875, -0.510284423828125, -0.4742584228515625, -0.438232421875, -0.4022064208984375, -0.366180419921875, -0.3301544189453125, -0.29412841796875, -0.2581024169921875, -0.222076416015625, -0.1860504150390625, -0.1500244140625, -0.1139984130859375, -0.077972412109375, -0.0419464111328125, -0.00592041015625, 0.0301055908203125, 0.066131591796875, 0.1021575927734375, 0.13818359375, 0.1742095947265625, 0.210235595703125, 0.2462615966796875, 0.28228759765625, 0.3183135986328125, 0.354339599609375, 0.3903656005859375, 0.4263916015625, 0.4624176025390625, 0.498443603515625, 0.5344696044921875, 0.57049560546875, 0.6065216064453125, 0.642547607421875, 0.6785736083984375, 0.714599609375, 0.7506256103515625, 0.786651611328125, 0.8226776123046875, 0.85870361328125, 0.8947296142578125, 0.930755615234375, 0.9667816162109375, 1.0028076171875, 1.0388336181640625, 1.074859619140625, 1.1108856201171875, 1.14691162109375, 1.1829376220703125, 1.218963623046875, 1.2549896240234375, 1.291015625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 9.0, 11.0, 19.0, 11.0, 17.0, 21.0, 27.0, 38.0, 45.0, 36.0, 54.0, 58.0, 61.0, 61.0, 65.0, 66.0, 48.0, 69.0, 48.0, 50.0, 28.0, 41.0, 26.0, 22.0, 22.0, 10.0, 10.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.469482421875, -0.4534721374511719, -0.43746185302734375, -0.4214515686035156, -0.4054412841796875, -0.3894309997558594, -0.37342071533203125, -0.3574104309082031, -0.341400146484375, -0.3253898620605469, -0.30937957763671875, -0.2933692932128906, -0.2773590087890625, -0.2613487243652344, -0.24533843994140625, -0.22932815551757812, -0.21331787109375, -0.19730758666992188, -0.18129730224609375, -0.16528701782226562, -0.1492767333984375, -0.13326644897460938, -0.11725616455078125, -0.10124588012695312, -0.085235595703125, -0.06922531127929688, -0.05321502685546875, -0.037204742431640625, -0.0211944580078125, -0.005184173583984375, 0.01082611083984375, 0.026836395263671875, 0.0428466796875, 0.058856964111328125, 0.07486724853515625, 0.09087753295898438, 0.1068878173828125, 0.12289810180664062, 0.13890838623046875, 0.15491867065429688, 0.170928955078125, 0.18693923950195312, 0.20294952392578125, 0.21895980834960938, 0.2349700927734375, 0.2509803771972656, 0.26699066162109375, 0.2830009460449219, 0.29901123046875, 0.3150215148925781, 0.33103179931640625, 0.3470420837402344, 0.3630523681640625, 0.3790626525878906, 0.39507293701171875, 0.4110832214355469, 0.427093505859375, 0.4431037902832031, 0.45911407470703125, 0.4751243591308594, 0.4911346435546875, 0.5071449279785156, 0.5231552124023438, 0.5391654968261719, 0.55517578125]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 1.0, 7.0, 7.0, 9.0, 6.0, 11.0, 17.0, 21.0, 28.0, 36.0, 36.0, 44.0, 37.0, 48.0, 64.0, 61.0, 71.0, 65.0, 69.0, 57.0, 46.0, 37.0, 37.0, 31.0, 31.0, 18.0, 10.0, 16.0, 15.0, 10.0, 9.0, 5.0, 10.0, 7.0, 2.0, 5.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.449916839599609, -4.305710315704346, -4.161503791809082, -4.017297744750977, -3.873091220855713, -3.728884696960449, -3.5846784114837646, -3.44047212600708, -3.2962656021118164, -3.1520590782165527, -3.007852792739868, -2.8636465072631836, -2.71943998336792, -2.5752334594726562, -2.4310271739959717, -2.286820888519287, -2.1426143646240234, -1.9984079599380493, -1.8542015552520752, -1.709995150566101, -1.565788745880127, -1.4215823411941528, -1.2773759365081787, -1.1331695318222046, -0.9889631271362305, -0.8447567224502563, -0.7005503177642822, -0.5563439130783081, -0.412137508392334, -0.26793110370635986, -0.12372469902038574, 0.02048170566558838, 0.1646881103515625, 0.3088945150375366, 0.45310091972351074, 0.5973073244094849, 0.741513729095459, 0.8857201337814331, 1.0299265384674072, 1.1741329431533813, 1.3183393478393555, 1.4625457525253296, 1.6067521572113037, 1.7509585618972778, 1.895164966583252, 2.0393714904785156, 2.1835777759552, 2.3277840614318848, 2.4719905853271484, 2.616197109222412, 2.7604033946990967, 2.9046096801757812, 3.048816204071045, 3.1930227279663086, 3.337229013442993, 3.4814352989196777, 3.6256418228149414, 3.769848346710205, 3.9140546321868896, 4.058260917663574, 4.202467441558838, 4.346673965454102, 4.490880012512207, 4.635086536407471, 4.779293060302734]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 3.0, 5.0, 7.0, 13.0, 9.0, 7.0, 12.0, 13.0, 20.0, 24.0, 31.0, 27.0, 33.0, 26.0, 33.0, 37.0, 44.0, 34.0, 42.0, 29.0, 45.0, 50.0, 48.0, 46.0, 41.0, 38.0, 35.0, 30.0, 35.0, 25.0, 24.0, 17.0, 26.0, 17.0, 19.0, 9.0, 9.0, 7.0, 8.0, 6.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.887059211730957, -4.745384216308594, -4.603708744049072, -4.462033748626709, -4.320358753204346, -4.178683757781982, -4.037008285522461, -3.8953332901000977, -3.7536582946777344, -3.611983060836792, -3.4703080654144287, -3.3286328315734863, -3.186957836151123, -3.0452826023101807, -2.9036073684692383, -2.761932373046875, -2.6202571392059326, -2.4785819053649902, -2.336906909942627, -2.1952316761016846, -2.0535566806793213, -1.911881446838379, -1.770206332206726, -1.6285312175750732, -1.4868561029434204, -1.3451809883117676, -1.2035058736801147, -1.061830759048462, -0.9201555848121643, -0.7784804701805115, -0.6368052959442139, -0.49513018131256104, -0.3534550666809082, -0.21177993714809418, -0.07010480761528015, 0.07157033681869507, 0.2132454514503479, 0.35492056608200073, 0.49659574031829834, 0.6382708549499512, 0.779945969581604, 0.9216210842132568, 1.0632961988449097, 1.2049713134765625, 1.3466465473175049, 1.4883215427398682, 1.6299967765808105, 1.7716718912124634, 1.9133470058441162, 2.0550222396850586, 2.196697235107422, 2.3383724689483643, 2.4800474643707275, 2.62172269821167, 2.763397693634033, 2.9050729274749756, 3.046748161315918, 3.1884233951568604, 3.3300983905792236, 3.471773624420166, 3.6134486198425293, 3.7551238536834717, 3.896799087524414, 4.038474082946777, 4.180149078369141]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 0.0, 4.0, 6.0, 4.0, 10.0, 10.0, 21.0, 26.0, 26.0, 54.0, 66.0, 97.0, 152.0, 231.0, 354.0, 568.0, 867.0, 1488.0, 2344.0, 4089.0, 6861.0, 12038.0, 21853.0, 42894.0, 87807.0, 193935.0, 434619.0, 875776.0, 1110074.0, 737776.0, 351656.0, 157626.0, 73807.0, 36734.0, 18399.0, 9885.0, 5077.0, 3000.0, 1695.0, 961.0, 570.0, 314.0, 194.0, 127.0, 72.0, 39.0, 38.0, 21.0, 14.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.3046875, -5.135498046875, -4.96630859375, -4.797119140625, -4.6279296875, -4.458740234375, -4.28955078125, -4.120361328125, -3.951171875, -3.781982421875, -3.61279296875, -3.443603515625, -3.2744140625, -3.105224609375, -2.93603515625, -2.766845703125, -2.59765625, -2.428466796875, -2.25927734375, -2.090087890625, -1.9208984375, -1.751708984375, -1.58251953125, -1.413330078125, -1.244140625, -1.074951171875, -0.90576171875, -0.736572265625, -0.5673828125, -0.398193359375, -0.22900390625, -0.059814453125, 0.109375, 0.278564453125, 0.44775390625, 0.616943359375, 0.7861328125, 0.955322265625, 1.12451171875, 1.293701171875, 1.462890625, 1.632080078125, 1.80126953125, 1.970458984375, 2.1396484375, 2.308837890625, 2.47802734375, 2.647216796875, 2.81640625, 2.985595703125, 3.15478515625, 3.323974609375, 3.4931640625, 3.662353515625, 3.83154296875, 4.000732421875, 4.169921875, 4.339111328125, 4.50830078125, 4.677490234375, 4.8466796875, 5.015869140625, 5.18505859375, 5.354248046875, 5.5234375]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 6.0, 5.0, 5.0, 9.0, 6.0, 5.0, 12.0, 13.0, 15.0, 21.0, 36.0, 25.0, 30.0, 39.0, 38.0, 36.0, 38.0, 44.0, 44.0, 42.0, 52.0, 47.0, 50.0, 41.0, 45.0, 44.0, 29.0, 33.0, 25.0, 30.0, 29.0, 20.0, 17.0, 18.0, 11.0, 13.0, 8.0, 4.0, 7.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.646484375, -3.533203125, -3.419921875, -3.306640625, -3.193359375, -3.080078125, -2.966796875, -2.853515625, -2.740234375, -2.626953125, -2.513671875, -2.400390625, -2.287109375, -2.173828125, -2.060546875, -1.947265625, -1.833984375, -1.720703125, -1.607421875, -1.494140625, -1.380859375, -1.267578125, -1.154296875, -1.041015625, -0.927734375, -0.814453125, -0.701171875, -0.587890625, -0.474609375, -0.361328125, -0.248046875, -0.134765625, -0.021484375, 0.091796875, 0.205078125, 0.318359375, 0.431640625, 0.544921875, 0.658203125, 0.771484375, 0.884765625, 0.998046875, 1.111328125, 1.224609375, 1.337890625, 1.451171875, 1.564453125, 1.677734375, 1.791015625, 1.904296875, 2.017578125, 2.130859375, 2.244140625, 2.357421875, 2.470703125, 2.583984375, 2.697265625, 2.810546875, 2.923828125, 3.037109375, 3.150390625, 3.263671875, 3.376953125, 3.490234375, 3.603515625]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 3.0, 8.0, 17.0, 26.0, 36.0, 45.0, 89.0, 136.0, 197.0, 292.0, 477.0, 774.0, 1242.0, 2184.0, 3587.0, 6090.0, 10824.0, 20073.0, 37726.0, 73085.0, 143855.0, 279113.0, 512094.0, 798261.0, 878217.0, 648165.0, 372430.0, 194928.0, 99041.0, 50851.0, 26421.0, 14510.0, 8001.0, 4495.0, 2640.0, 1568.0, 1001.0, 620.0, 417.0, 240.0, 172.0, 105.0, 72.0, 50.0, 29.0, 30.0, 20.0, 9.0, 9.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.35546875, -4.201171875, -4.046875, -3.892578125, -3.73828125, -3.583984375, -3.4296875, -3.275390625, -3.12109375, -2.966796875, -2.8125, -2.658203125, -2.50390625, -2.349609375, -2.1953125, -2.041015625, -1.88671875, -1.732421875, -1.578125, -1.423828125, -1.26953125, -1.115234375, -0.9609375, -0.806640625, -0.65234375, -0.498046875, -0.34375, -0.189453125, -0.03515625, 0.119140625, 0.2734375, 0.427734375, 0.58203125, 0.736328125, 0.890625, 1.044921875, 1.19921875, 1.353515625, 1.5078125, 1.662109375, 1.81640625, 1.970703125, 2.125, 2.279296875, 2.43359375, 2.587890625, 2.7421875, 2.896484375, 3.05078125, 3.205078125, 3.359375, 3.513671875, 3.66796875, 3.822265625, 3.9765625, 4.130859375, 4.28515625, 4.439453125, 4.59375, 4.748046875, 4.90234375, 5.056640625, 5.2109375, 5.365234375, 5.51953125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 7.0, 16.0, 17.0, 11.0, 16.0, 30.0, 44.0, 62.0, 79.0, 101.0, 121.0, 146.0, 180.0, 244.0, 257.0, 299.0, 289.0, 316.0, 310.0, 253.0, 243.0, 208.0, 165.0, 152.0, 111.0, 78.0, 76.0, 49.0, 45.0, 37.0, 28.0, 13.0, 20.0, 11.0, 9.0, 6.0, 8.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8466796875, -1.7799224853515625, -1.713165283203125, -1.6464080810546875, -1.57965087890625, -1.5128936767578125, -1.446136474609375, -1.3793792724609375, -1.3126220703125, -1.2458648681640625, -1.179107666015625, -1.1123504638671875, -1.04559326171875, -0.9788360595703125, -0.912078857421875, -0.8453216552734375, -0.778564453125, -0.7118072509765625, -0.645050048828125, -0.5782928466796875, -0.51153564453125, -0.4447784423828125, -0.378021240234375, -0.3112640380859375, -0.2445068359375, -0.1777496337890625, -0.110992431640625, -0.0442352294921875, 0.02252197265625, 0.0892791748046875, 0.156036376953125, 0.2227935791015625, 0.28955078125, 0.3563079833984375, 0.423065185546875, 0.4898223876953125, 0.55657958984375, 0.6233367919921875, 0.690093994140625, 0.7568511962890625, 0.8236083984375, 0.8903656005859375, 0.957122802734375, 1.0238800048828125, 1.09063720703125, 1.1573944091796875, 1.224151611328125, 1.2909088134765625, 1.357666015625, 1.4244232177734375, 1.491180419921875, 1.5579376220703125, 1.62469482421875, 1.6914520263671875, 1.758209228515625, 1.8249664306640625, 1.8917236328125, 1.9584808349609375, 2.025238037109375, 2.0919952392578125, 2.15875244140625, 2.2255096435546875, 2.292266845703125, 2.3590240478515625, 2.42578125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 4.0, 4.0, 8.0, 8.0, 8.0, 14.0, 17.0, 22.0, 19.0, 29.0, 35.0, 50.0, 42.0, 58.0, 71.0, 72.0, 62.0, 59.0, 53.0, 70.0, 52.0, 36.0, 38.0, 23.0, 21.0, 20.0, 20.0, 11.0, 11.0, 10.0, 9.0, 12.0, 10.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.162611484527588, -4.995655536651611, -4.828700065612793, -4.661744117736816, -4.494788646697998, -4.3278326988220215, -4.160877227783203, -3.9939212799072266, -3.82696533203125, -3.6600096225738525, -3.493053913116455, -3.3260979652404785, -3.159142255783081, -2.9921865463256836, -2.825230836868286, -2.6582751274108887, -2.491319417953491, -2.3243637084960938, -2.1574079990386963, -1.9904521703720093, -1.8234963417053223, -1.6565406322479248, -1.4895849227905273, -1.3226290941238403, -1.1556733846664429, -0.9887176156044006, -0.8217618465423584, -0.6548061370849609, -0.4878503680229187, -0.32089459896087646, -0.153938889503479, 0.013016939163208008, 0.17997264862060547, 0.3469284176826477, 0.5138841867446899, 0.6808398962020874, 0.8477956652641296, 1.0147514343261719, 1.1817071437835693, 1.3486629724502563, 1.5156186819076538, 1.6825743913650513, 1.8495302200317383, 2.0164859294891357, 2.183441638946533, 2.3503975868225098, 2.517353057861328, 2.6843090057373047, 2.851264715194702, 3.0182204246520996, 3.185176134109497, 3.3521318435668945, 3.519087791442871, 3.6860435009002686, 3.852999210357666, 4.019955158233643, 4.186910629272461, 4.3538665771484375, 4.520822048187256, 4.687777996063232, 4.854733467102051, 5.021689414978027, 5.188645362854004, 5.355600833892822, 5.522556781768799]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 8.0, 6.0, 11.0, 6.0, 5.0, 11.0, 17.0, 14.0, 12.0, 19.0, 10.0, 25.0, 25.0, 27.0, 29.0, 29.0, 30.0, 28.0, 32.0, 29.0, 39.0, 36.0, 39.0, 36.0, 44.0, 51.0, 44.0, 34.0, 27.0, 23.0, 36.0, 29.0, 21.0, 31.0, 15.0, 14.0, 14.0, 14.0, 20.0, 13.0, 11.0, 9.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-4.60403299331665, -4.466729164123535, -4.32942533493042, -4.192121505737305, -4.0548176765441895, -3.917513608932495, -3.78020977973938, -3.6429059505462646, -3.5056018829345703, -3.368298053741455, -3.23099422454834, -3.0936903953552246, -2.9563863277435303, -2.819082498550415, -2.6817786693573, -2.5444748401641846, -2.4071710109710693, -2.269867181777954, -2.132563352584839, -1.995259404182434, -1.8579554557800293, -1.720651626586914, -1.5833477973937988, -1.4460439682006836, -1.3087400197982788, -1.1714361906051636, -1.0341322422027588, -0.8968284130096436, -0.7595245242118835, -0.6222206354141235, -0.4849168062210083, -0.3476129174232483, -0.21030902862548828, -0.07300515472888947, 0.06429871916770935, 0.20160257816314697, 0.338906466960907, 0.476210355758667, 0.6135141849517822, 0.7508180737495422, 0.8881219625473022, 1.0254257917404175, 1.1627297401428223, 1.3000335693359375, 1.4373373985290527, 1.5746413469314575, 1.7119451761245728, 1.8492491245269775, 1.9865529537200928, 2.123856782913208, 2.2611606121063232, 2.3984646797180176, 2.535768508911133, 2.673072338104248, 2.8103761672973633, 2.9476799964904785, 3.0849838256835938, 3.222287654876709, 3.359591484069824, 3.4968953132629395, 3.634199380874634, 3.771503210067749, 3.9088070392608643, 4.046111106872559, 4.183414936065674]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 5.0, 2.0, 5.0, 8.0, 10.0, 14.0, 23.0, 31.0, 46.0, 81.0, 111.0, 166.0, 225.0, 300.0, 419.0, 705.0, 956.0, 1434.0, 2034.0, 3021.0, 4364.0, 6426.0, 9844.0, 14352.0, 21912.0, 33848.0, 55762.0, 98684.0, 186380.0, 247507.0, 147732.0, 79682.0, 46228.0, 29007.0, 18712.0, 12350.0, 8231.0, 5677.0, 3839.0, 2642.0, 1762.0, 1265.0, 885.0, 569.0, 416.0, 276.0, 186.0, 149.0, 86.0, 72.0, 51.0, 28.0, 25.0, 7.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.28515625, -1.245391845703125, -1.20562744140625, -1.165863037109375, -1.1260986328125, -1.086334228515625, -1.04656982421875, -1.006805419921875, -0.967041015625, -0.927276611328125, -0.88751220703125, -0.847747802734375, -0.8079833984375, -0.768218994140625, -0.72845458984375, -0.688690185546875, -0.64892578125, -0.609161376953125, -0.56939697265625, -0.529632568359375, -0.4898681640625, -0.450103759765625, -0.41033935546875, -0.370574951171875, -0.330810546875, -0.291046142578125, -0.25128173828125, -0.211517333984375, -0.1717529296875, -0.131988525390625, -0.09222412109375, -0.052459716796875, -0.0126953125, 0.027069091796875, 0.06683349609375, 0.106597900390625, 0.1463623046875, 0.186126708984375, 0.22589111328125, 0.265655517578125, 0.305419921875, 0.345184326171875, 0.38494873046875, 0.424713134765625, 0.4644775390625, 0.504241943359375, 0.54400634765625, 0.583770751953125, 0.62353515625, 0.663299560546875, 0.70306396484375, 0.742828369140625, 0.7825927734375, 0.822357177734375, 0.86212158203125, 0.901885986328125, 0.941650390625, 0.981414794921875, 1.02117919921875, 1.060943603515625, 1.1007080078125, 1.140472412109375, 1.18023681640625, 1.220001220703125, 1.259765625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 2.0, 6.0, 9.0, 4.0, 6.0, 6.0, 12.0, 14.0, 17.0, 14.0, 20.0, 15.0, 23.0, 16.0, 32.0, 36.0, 32.0, 18.0, 39.0, 35.0, 35.0, 35.0, 38.0, 37.0, 32.0, 38.0, 50.0, 44.0, 32.0, 27.0, 32.0, 33.0, 29.0, 23.0, 24.0, 24.0, 14.0, 18.0, 20.0, 9.0, 8.0, 14.0, 11.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.76171875, -4.61895751953125, -4.4761962890625, -4.33343505859375, -4.190673828125, -4.04791259765625, -3.9051513671875, -3.76239013671875, -3.61962890625, -3.47686767578125, -3.3341064453125, -3.19134521484375, -3.048583984375, -2.90582275390625, -2.7630615234375, -2.62030029296875, -2.4775390625, -2.33477783203125, -2.1920166015625, -2.04925537109375, -1.906494140625, -1.76373291015625, -1.6209716796875, -1.47821044921875, -1.33544921875, -1.19268798828125, -1.0499267578125, -0.90716552734375, -0.764404296875, -0.62164306640625, -0.4788818359375, -0.33612060546875, -0.193359375, -0.05059814453125, 0.0921630859375, 0.23492431640625, 0.377685546875, 0.52044677734375, 0.6632080078125, 0.80596923828125, 0.94873046875, 1.09149169921875, 1.2342529296875, 1.37701416015625, 1.519775390625, 1.66253662109375, 1.8052978515625, 1.94805908203125, 2.0908203125, 2.23358154296875, 2.3763427734375, 2.51910400390625, 2.661865234375, 2.80462646484375, 2.9473876953125, 3.09014892578125, 3.23291015625, 3.37567138671875, 3.5184326171875, 3.66119384765625, 3.803955078125, 3.94671630859375, 4.0894775390625, 4.23223876953125, 4.375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 13.0, 13.0, 11.0, 29.0, 31.0, 28.0, 50.0, 94.0, 129.0, 173.0, 264.0, 468.0, 806.0, 1594.0, 3498.0, 10638.0, 51535.0, 941531.0, 25614.0, 6686.0, 2443.0, 1141.0, 647.0, 373.0, 219.0, 168.0, 133.0, 65.0, 34.0, 32.0, 30.0, 26.0, 10.0, 11.0, 9.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.5546875, -6.35784912109375, -6.1610107421875, -5.96417236328125, -5.767333984375, -5.57049560546875, -5.3736572265625, -5.17681884765625, -4.97998046875, -4.78314208984375, -4.5863037109375, -4.38946533203125, -4.192626953125, -3.99578857421875, -3.7989501953125, -3.60211181640625, -3.4052734375, -3.20843505859375, -3.0115966796875, -2.81475830078125, -2.617919921875, -2.42108154296875, -2.2242431640625, -2.02740478515625, -1.83056640625, -1.63372802734375, -1.4368896484375, -1.24005126953125, -1.043212890625, -0.84637451171875, -0.6495361328125, -0.45269775390625, -0.255859375, -0.05902099609375, 0.1378173828125, 0.33465576171875, 0.531494140625, 0.72833251953125, 0.9251708984375, 1.12200927734375, 1.31884765625, 1.51568603515625, 1.7125244140625, 1.90936279296875, 2.106201171875, 2.30303955078125, 2.4998779296875, 2.69671630859375, 2.8935546875, 3.09039306640625, 3.2872314453125, 3.48406982421875, 3.680908203125, 3.87774658203125, 4.0745849609375, 4.27142333984375, 4.46826171875, 4.66510009765625, 4.8619384765625, 5.05877685546875, 5.255615234375, 5.45245361328125, 5.6492919921875, 5.84613037109375, 6.04296875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 8.0, 16.0, 8.0, 14.0, 24.0, 21.0, 30.0, 26.0, 27.0, 37.0, 54.0, 44.0, 53.0, 57.0, 50.0, 62.0, 58.0, 52.0, 56.0, 41.0, 42.0, 34.0, 33.0, 19.0, 24.0, 17.0, 18.0, 18.0, 17.0, 7.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.68359375, -3.56591796875, -3.4482421875, -3.33056640625, -3.212890625, -3.09521484375, -2.9775390625, -2.85986328125, -2.7421875, -2.62451171875, -2.5068359375, -2.38916015625, -2.271484375, -2.15380859375, -2.0361328125, -1.91845703125, -1.80078125, -1.68310546875, -1.5654296875, -1.44775390625, -1.330078125, -1.21240234375, -1.0947265625, -0.97705078125, -0.859375, -0.74169921875, -0.6240234375, -0.50634765625, -0.388671875, -0.27099609375, -0.1533203125, -0.03564453125, 0.08203125, 0.19970703125, 0.3173828125, 0.43505859375, 0.552734375, 0.67041015625, 0.7880859375, 0.90576171875, 1.0234375, 1.14111328125, 1.2587890625, 1.37646484375, 1.494140625, 1.61181640625, 1.7294921875, 1.84716796875, 1.96484375, 2.08251953125, 2.2001953125, 2.31787109375, 2.435546875, 2.55322265625, 2.6708984375, 2.78857421875, 2.90625, 3.02392578125, 3.1416015625, 3.25927734375, 3.376953125, 3.49462890625, 3.6123046875, 3.72998046875, 3.84765625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 9.0, 7.0, 9.0, 16.0, 14.0, 21.0, 33.0, 40.0, 60.0, 67.0, 143.0, 171.0, 226.0, 356.0, 523.0, 836.0, 1312.0, 2284.0, 4345.0, 9446.0, 27718.0, 925225.0, 49322.0, 13328.0, 5642.0, 2831.0, 1647.0, 929.0, 622.0, 434.0, 256.0, 200.0, 129.0, 106.0, 61.0, 47.0, 37.0, 29.0, 22.0, 11.0, 8.0, 12.0, 3.0, 7.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.25830078125, -0.2501487731933594, -0.24199676513671875, -0.23384475708007812, -0.2256927490234375, -0.21754074096679688, -0.20938873291015625, -0.20123672485351562, -0.193084716796875, -0.18493270874023438, -0.17678070068359375, -0.16862869262695312, -0.1604766845703125, -0.15232467651367188, -0.14417266845703125, -0.13602066040039062, -0.12786865234375, -0.11971664428710938, -0.11156463623046875, -0.10341262817382812, -0.0952606201171875, -0.08710861206054688, -0.07895660400390625, -0.07080459594726562, -0.062652587890625, -0.054500579833984375, -0.04634857177734375, -0.038196563720703125, -0.0300445556640625, -0.021892547607421875, -0.01374053955078125, -0.005588531494140625, 0.0025634765625, 0.010715484619140625, 0.01886749267578125, 0.027019500732421875, 0.0351715087890625, 0.043323516845703125, 0.05147552490234375, 0.059627532958984375, 0.067779541015625, 0.07593154907226562, 0.08408355712890625, 0.09223556518554688, 0.1003875732421875, 0.10853958129882812, 0.11669158935546875, 0.12484359741210938, 0.13299560546875, 0.14114761352539062, 0.14929962158203125, 0.15745162963867188, 0.1656036376953125, 0.17375564575195312, 0.18190765380859375, 0.19005966186523438, 0.198211669921875, 0.20636367797851562, 0.21451568603515625, 0.22266769409179688, 0.2308197021484375, 0.23897171020507812, 0.24712371826171875, 0.2552757263183594, 0.263427734375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 6.0, 7.0, 8.0, 16.0, 22.0, 19.0, 15.0, 15.0, 29.0, 19.0, 32.0, 49.0, 51.0, 56.0, 48.0, 60.0, 65.0, 52.0, 43.0, 33.0, 57.0, 37.0, 41.0, 43.0, 40.0, 30.0, 14.0, 21.0, 16.0, 9.0, 7.0, 8.0, 4.0, 7.0, 5.0, 1.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.62396240234375e-05, -3.506802022457123e-05, -3.3896416425704956e-05, -3.2724812626838684e-05, -3.155320882797241e-05, -3.038160502910614e-05, -2.9210001230239868e-05, -2.8038397431373596e-05, -2.6866793632507324e-05, -2.5695189833641052e-05, -2.452358603477478e-05, -2.3351982235908508e-05, -2.2180378437042236e-05, -2.1008774638175964e-05, -1.9837170839309692e-05, -1.866556704044342e-05, -1.749396324157715e-05, -1.6322359442710876e-05, -1.5150755643844604e-05, -1.3979151844978333e-05, -1.280754804611206e-05, -1.1635944247245789e-05, -1.0464340448379517e-05, -9.292736649513245e-06, -8.121132850646973e-06, -6.949529051780701e-06, -5.777925252914429e-06, -4.606321454048157e-06, -3.4347176551818848e-06, -2.263113856315613e-06, -1.0915100574493408e-06, 8.009374141693115e-08, 1.2516975402832031e-06, 2.423301339149475e-06, 3.594905138015747e-06, 4.766508936882019e-06, 5.938112735748291e-06, 7.109716534614563e-06, 8.281320333480835e-06, 9.452924132347107e-06, 1.0624527931213379e-05, 1.1796131730079651e-05, 1.2967735528945923e-05, 1.4139339327812195e-05, 1.5310943126678467e-05, 1.648254692554474e-05, 1.765415072441101e-05, 1.8825754523277283e-05, 1.9997358322143555e-05, 2.1168962121009827e-05, 2.23405659198761e-05, 2.351216971874237e-05, 2.4683773517608643e-05, 2.5855377316474915e-05, 2.7026981115341187e-05, 2.819858491420746e-05, 2.937018871307373e-05, 3.054179251194e-05, 3.1713396310806274e-05, 3.2885000109672546e-05, 3.405660390853882e-05, 3.522820770740509e-05, 3.639981150627136e-05, 3.7571415305137634e-05, 3.8743019104003906e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 2.0, 7.0, 13.0, 16.0, 13.0, 30.0, 34.0, 51.0, 60.0, 102.0, 142.0, 213.0, 329.0, 452.0, 671.0, 1028.0, 1557.0, 2337.0, 3651.0, 5725.0, 9594.0, 16301.0, 29225.0, 56677.0, 122748.0, 298236.0, 269659.0, 110598.0, 52430.0, 26931.0, 15190.0, 8974.0, 5468.0, 3406.0, 2231.0, 1410.0, 1002.0, 686.0, 419.0, 293.0, 202.0, 151.0, 93.0, 64.0, 45.0, 29.0, 19.0, 8.0, 13.0, 11.0, 6.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09967041015625, -0.09634113311767578, -0.09301185607910156, -0.08968257904052734, -0.08635330200195312, -0.0830240249633789, -0.07969474792480469, -0.07636547088623047, -0.07303619384765625, -0.06970691680908203, -0.06637763977050781, -0.0630483627319336, -0.059719085693359375, -0.056389808654785156, -0.05306053161621094, -0.04973125457763672, -0.0464019775390625, -0.04307270050048828, -0.03974342346191406, -0.036414146423339844, -0.033084869384765625, -0.029755592346191406, -0.026426315307617188, -0.02309703826904297, -0.01976776123046875, -0.01643848419189453, -0.013109207153320312, -0.009779930114746094, -0.006450653076171875, -0.0031213760375976562, 0.0002079010009765625, 0.0035371780395507812, 0.006866455078125, 0.010195732116699219, 0.013525009155273438, 0.016854286193847656, 0.020183563232421875, 0.023512840270996094, 0.026842117309570312, 0.03017139434814453, 0.03350067138671875, 0.03682994842529297, 0.04015922546386719, 0.043488502502441406, 0.046817779541015625, 0.050147056579589844, 0.05347633361816406, 0.05680561065673828, 0.0601348876953125, 0.06346416473388672, 0.06679344177246094, 0.07012271881103516, 0.07345199584960938, 0.0767812728881836, 0.08011054992675781, 0.08343982696533203, 0.08676910400390625, 0.09009838104248047, 0.09342765808105469, 0.0967569351196289, 0.10008621215820312, 0.10341548919677734, 0.10674476623535156, 0.11007404327392578, 0.1134033203125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 9.0, 5.0, 10.0, 10.0, 12.0, 17.0, 15.0, 22.0, 26.0, 37.0, 35.0, 55.0, 96.0, 98.0, 117.0, 91.0, 73.0, 50.0, 41.0, 35.0, 39.0, 23.0, 16.0, 17.0, 13.0, 6.0, 8.0, 7.0, 5.0, 2.0, 6.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0275421142578125, -0.026600122451782227, -0.025658130645751953, -0.02471613883972168, -0.023774147033691406, -0.022832155227661133, -0.02189016342163086, -0.020948171615600586, -0.020006179809570312, -0.01906418800354004, -0.018122196197509766, -0.017180204391479492, -0.01623821258544922, -0.015296220779418945, -0.014354228973388672, -0.013412237167358398, -0.012470245361328125, -0.011528253555297852, -0.010586261749267578, -0.009644269943237305, -0.008702278137207031, -0.007760286331176758, -0.006818294525146484, -0.005876302719116211, -0.0049343109130859375, -0.003992319107055664, -0.0030503273010253906, -0.002108335494995117, -0.0011663436889648438, -0.0002243518829345703, 0.0007176399230957031, 0.0016596317291259766, 0.00260162353515625, 0.0035436153411865234, 0.004485607147216797, 0.00542759895324707, 0.006369590759277344, 0.007311582565307617, 0.00825357437133789, 0.009195566177368164, 0.010137557983398438, 0.011079549789428711, 0.012021541595458984, 0.012963533401489258, 0.013905525207519531, 0.014847517013549805, 0.015789508819580078, 0.01673150062561035, 0.017673492431640625, 0.0186154842376709, 0.019557476043701172, 0.020499467849731445, 0.02144145965576172, 0.022383451461791992, 0.023325443267822266, 0.02426743507385254, 0.025209426879882812, 0.026151418685913086, 0.02709341049194336, 0.028035402297973633, 0.028977394104003906, 0.02991938591003418, 0.030861377716064453, 0.03180336952209473, 0.032745361328125]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 2.0, 5.0, 6.0, 7.0, 13.0, 11.0, 15.0, 19.0, 22.0, 24.0, 31.0, 46.0, 48.0, 51.0, 68.0, 78.0, 60.0, 58.0, 56.0, 62.0, 61.0, 39.0, 39.0, 25.0, 23.0, 21.0, 18.0, 16.0, 12.0, 7.0, 11.0, 7.0, 12.0, 6.0, 5.0, 1.0, 7.0, 0.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.142985820770264, -4.977904796600342, -4.81282377243042, -4.647742748260498, -4.482661724090576, -4.317580699920654, -4.152499675750732, -3.9874186515808105, -3.8223376274108887, -3.657256603240967, -3.492175579071045, -3.327094554901123, -3.162013530731201, -2.9969325065612793, -2.8318514823913574, -2.6667704582214355, -2.5016891956329346, -2.3366081714630127, -2.171527147293091, -2.006446123123169, -1.841365098953247, -1.6762840747833252, -1.5112029314041138, -1.346121907234192, -1.18104088306427, -1.0159598588943481, -0.8508788347244263, -0.6857977509498596, -0.5207167267799377, -0.35563570261001587, -0.19055461883544922, -0.025473594665527344, 0.13960742950439453, 0.3046884536743164, 0.46976950764656067, 0.6348505616188049, 0.7999315857887268, 0.9650126099586487, 1.1300936937332153, 1.2951747179031372, 1.460255742073059, 1.625336766242981, 1.7904177904129028, 1.9554989337921143, 2.120579957962036, 2.285660982131958, 2.45074200630188, 2.6158230304718018, 2.7809040546417236, 2.9459850788116455, 3.1110661029815674, 3.2761471271514893, 3.441228151321411, 3.606309175491333, 3.771390438079834, 3.936471462249756, 4.101552486419678, 4.2666335105896, 4.4317145347595215, 4.596795558929443, 4.761876583099365, 4.926957607269287, 5.092038631439209, 5.257119655609131, 5.422200679779053]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 8.0, 7.0, 10.0, 6.0, 6.0, 10.0, 17.0, 14.0, 12.0, 19.0, 13.0, 22.0, 26.0, 26.0, 32.0, 27.0, 31.0, 26.0, 32.0, 29.0, 40.0, 35.0, 41.0, 37.0, 44.0, 49.0, 47.0, 33.0, 26.0, 23.0, 35.0, 32.0, 19.0, 30.0, 15.0, 15.0, 13.0, 16.0, 18.0, 14.0, 10.0, 9.0, 3.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-4.572356224060059, -4.435568809509277, -4.298780918121338, -4.161993503570557, -4.025205612182617, -3.888417959213257, -3.7516303062438965, -3.6148428916931152, -3.478055000305176, -3.3412673473358154, -3.204479694366455, -3.0676920413970947, -2.9309043884277344, -2.794116735458374, -2.6573290824890137, -2.5205416679382324, -2.383754014968872, -2.2469663619995117, -2.1101787090301514, -1.973391056060791, -1.8366034030914307, -1.6998157501220703, -1.5630282163619995, -1.4262405633926392, -1.2894529104232788, -1.1526652574539185, -1.015877604484558, -0.8790900111198425, -0.7423023581504822, -0.6055147051811218, -0.46872711181640625, -0.3319394588470459, -0.19515180587768555, -0.05836416780948639, 0.07842347025871277, 0.21521109342575073, 0.3519987463951111, 0.48878639936447144, 0.625573992729187, 0.7623616456985474, 0.8991492986679077, 1.035936951637268, 1.1727246046066284, 1.3095121383666992, 1.4462997913360596, 1.58308744430542, 1.7198750972747803, 1.8566627502441406, 1.993450403213501, 2.1302380561828613, 2.2670257091522217, 2.403813362121582, 2.5406010150909424, 2.6773886680603027, 2.814176082611084, 2.9509639739990234, 3.0877513885498047, 3.224539041519165, 3.3613266944885254, 3.4981143474578857, 3.634902000427246, 3.7716896533966064, 3.908477306365967, 4.045264720916748, 4.1820526123046875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 9.0, 9.0, 21.0, 18.0, 34.0, 31.0, 60.0, 108.0, 139.0, 165.0, 348.0, 494.0, 755.0, 1159.0, 1613.0, 2499.0, 3991.0, 6052.0, 9448.0, 15105.0, 24181.0, 39058.0, 62840.0, 96014.0, 135260.0, 160844.0, 153377.0, 118337.0, 80618.0, 51095.0, 31428.0, 19313.0, 11985.0, 7729.0, 4928.0, 3242.0, 2071.0, 1411.0, 903.0, 617.0, 403.0, 309.0, 173.0, 113.0, 80.0, 55.0, 35.0, 31.0, 27.0, 10.0, 8.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.279296875, -3.169158935546875, -3.05902099609375, -2.948883056640625, -2.8387451171875, -2.728607177734375, -2.61846923828125, -2.508331298828125, -2.398193359375, -2.288055419921875, -2.17791748046875, -2.067779541015625, -1.9576416015625, -1.847503662109375, -1.73736572265625, -1.627227783203125, -1.51708984375, -1.406951904296875, -1.29681396484375, -1.186676025390625, -1.0765380859375, -0.966400146484375, -0.85626220703125, -0.746124267578125, -0.635986328125, -0.525848388671875, -0.41571044921875, -0.305572509765625, -0.1954345703125, -0.085296630859375, 0.02484130859375, 0.134979248046875, 0.2451171875, 0.355255126953125, 0.46539306640625, 0.575531005859375, 0.6856689453125, 0.795806884765625, 0.90594482421875, 1.016082763671875, 1.126220703125, 1.236358642578125, 1.34649658203125, 1.456634521484375, 1.5667724609375, 1.676910400390625, 1.78704833984375, 1.897186279296875, 2.00732421875, 2.117462158203125, 2.22760009765625, 2.337738037109375, 2.4478759765625, 2.558013916015625, 2.66815185546875, 2.778289794921875, 2.888427734375, 2.998565673828125, 3.10870361328125, 3.218841552734375, 3.3289794921875, 3.439117431640625, 3.54925537109375, 3.659393310546875, 3.76953125]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 0.0, 6.0, 7.0, 8.0, 6.0, 6.0, 11.0, 19.0, 15.0, 17.0, 14.0, 16.0, 15.0, 24.0, 23.0, 25.0, 28.0, 30.0, 31.0, 45.0, 30.0, 37.0, 38.0, 45.0, 34.0, 42.0, 44.0, 51.0, 48.0, 24.0, 28.0, 28.0, 32.0, 26.0, 23.0, 20.0, 17.0, 12.0, 15.0, 10.0, 9.0, 7.0, 7.0, 7.0, 10.0, 2.0, 5.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.76171875, -4.61572265625, -4.4697265625, -4.32373046875, -4.177734375, -4.03173828125, -3.8857421875, -3.73974609375, -3.59375, -3.44775390625, -3.3017578125, -3.15576171875, -3.009765625, -2.86376953125, -2.7177734375, -2.57177734375, -2.42578125, -2.27978515625, -2.1337890625, -1.98779296875, -1.841796875, -1.69580078125, -1.5498046875, -1.40380859375, -1.2578125, -1.11181640625, -0.9658203125, -0.81982421875, -0.673828125, -0.52783203125, -0.3818359375, -0.23583984375, -0.08984375, 0.05615234375, 0.2021484375, 0.34814453125, 0.494140625, 0.64013671875, 0.7861328125, 0.93212890625, 1.078125, 1.22412109375, 1.3701171875, 1.51611328125, 1.662109375, 1.80810546875, 1.9541015625, 2.10009765625, 2.24609375, 2.39208984375, 2.5380859375, 2.68408203125, 2.830078125, 2.97607421875, 3.1220703125, 3.26806640625, 3.4140625, 3.56005859375, 3.7060546875, 3.85205078125, 3.998046875, 4.14404296875, 4.2900390625, 4.43603515625, 4.58203125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 10.0, 8.0, 19.0, 31.0, 33.0, 54.0, 80.0, 138.0, 218.0, 300.0, 482.0, 706.0, 1043.0, 1760.0, 2583.0, 3902.0, 6401.0, 9702.0, 15354.0, 24804.0, 40184.0, 63546.0, 97124.0, 134602.0, 157966.0, 150004.0, 117928.0, 80851.0, 51749.0, 32062.0, 20098.0, 12503.0, 7946.0, 5014.0, 3287.0, 2143.0, 1333.0, 855.0, 595.0, 412.0, 256.0, 153.0, 110.0, 72.0, 43.0, 32.0, 25.0, 14.0, 13.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.529296875, -3.421600341796875, -3.31390380859375, -3.206207275390625, -3.0985107421875, -2.990814208984375, -2.88311767578125, -2.775421142578125, -2.667724609375, -2.560028076171875, -2.45233154296875, -2.344635009765625, -2.2369384765625, -2.129241943359375, -2.02154541015625, -1.913848876953125, -1.80615234375, -1.698455810546875, -1.59075927734375, -1.483062744140625, -1.3753662109375, -1.267669677734375, -1.15997314453125, -1.052276611328125, -0.944580078125, -0.836883544921875, -0.72918701171875, -0.621490478515625, -0.5137939453125, -0.406097412109375, -0.29840087890625, -0.190704345703125, -0.0830078125, 0.024688720703125, 0.13238525390625, 0.240081787109375, 0.3477783203125, 0.455474853515625, 0.56317138671875, 0.670867919921875, 0.778564453125, 0.886260986328125, 0.99395751953125, 1.101654052734375, 1.2093505859375, 1.317047119140625, 1.42474365234375, 1.532440185546875, 1.64013671875, 1.747833251953125, 1.85552978515625, 1.963226318359375, 2.0709228515625, 2.178619384765625, 2.28631591796875, 2.394012451171875, 2.501708984375, 2.609405517578125, 2.71710205078125, 2.824798583984375, 2.9324951171875, 3.040191650390625, 3.14788818359375, 3.255584716796875, 3.36328125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 2.0, 6.0, 9.0, 10.0, 15.0, 21.0, 15.0, 20.0, 22.0, 16.0, 31.0, 31.0, 26.0, 38.0, 34.0, 36.0, 23.0, 46.0, 53.0, 41.0, 42.0, 36.0, 30.0, 41.0, 40.0, 34.0, 47.0, 20.0, 33.0, 19.0, 23.0, 12.0, 23.0, 19.0, 12.0, 17.0, 12.0, 9.0, 8.0, 2.0, 5.0, 6.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.48046875, -2.3916015625, -2.302734375, -2.2138671875, -2.125, -2.0361328125, -1.947265625, -1.8583984375, -1.76953125, -1.6806640625, -1.591796875, -1.5029296875, -1.4140625, -1.3251953125, -1.236328125, -1.1474609375, -1.05859375, -0.9697265625, -0.880859375, -0.7919921875, -0.703125, -0.6142578125, -0.525390625, -0.4365234375, -0.34765625, -0.2587890625, -0.169921875, -0.0810546875, 0.0078125, 0.0966796875, 0.185546875, 0.2744140625, 0.36328125, 0.4521484375, 0.541015625, 0.6298828125, 0.71875, 0.8076171875, 0.896484375, 0.9853515625, 1.07421875, 1.1630859375, 1.251953125, 1.3408203125, 1.4296875, 1.5185546875, 1.607421875, 1.6962890625, 1.78515625, 1.8740234375, 1.962890625, 2.0517578125, 2.140625, 2.2294921875, 2.318359375, 2.4072265625, 2.49609375, 2.5849609375, 2.673828125, 2.7626953125, 2.8515625, 2.9404296875, 3.029296875, 3.1181640625, 3.20703125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 7.0, 8.0, 10.0, 7.0, 15.0, 24.0, 38.0, 35.0, 76.0, 79.0, 131.0, 183.0, 276.0, 486.0, 696.0, 1078.0, 1695.0, 2792.0, 4424.0, 7178.0, 11927.0, 20080.0, 32972.0, 53105.0, 83279.0, 119726.0, 151490.0, 159175.0, 134929.0, 96880.0, 63834.0, 39704.0, 24281.0, 14752.0, 8839.0, 5289.0, 3294.0, 2032.0, 1302.0, 824.0, 501.0, 360.0, 233.0, 162.0, 93.0, 64.0, 69.0, 34.0, 29.0, 24.0, 16.0, 9.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0], "bins": [-1.1923828125, -1.156463623046875, -1.12054443359375, -1.084625244140625, -1.0487060546875, -1.012786865234375, -0.97686767578125, -0.940948486328125, -0.905029296875, -0.869110107421875, -0.83319091796875, -0.797271728515625, -0.7613525390625, -0.725433349609375, -0.68951416015625, -0.653594970703125, -0.61767578125, -0.581756591796875, -0.54583740234375, -0.509918212890625, -0.4739990234375, -0.438079833984375, -0.40216064453125, -0.366241455078125, -0.330322265625, -0.294403076171875, -0.25848388671875, -0.222564697265625, -0.1866455078125, -0.150726318359375, -0.11480712890625, -0.078887939453125, -0.04296875, -0.007049560546875, 0.02886962890625, 0.064788818359375, 0.1007080078125, 0.136627197265625, 0.17254638671875, 0.208465576171875, 0.244384765625, 0.280303955078125, 0.31622314453125, 0.352142333984375, 0.3880615234375, 0.423980712890625, 0.45989990234375, 0.495819091796875, 0.53173828125, 0.567657470703125, 0.60357666015625, 0.639495849609375, 0.6754150390625, 0.711334228515625, 0.74725341796875, 0.783172607421875, 0.819091796875, 0.855010986328125, 0.89093017578125, 0.926849365234375, 0.9627685546875, 0.998687744140625, 1.03460693359375, 1.070526123046875, 1.1064453125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 3.0, 6.0, 3.0, 14.0, 19.0, 12.0, 28.0, 18.0, 36.0, 35.0, 48.0, 47.0, 62.0, 83.0, 75.0, 62.0, 62.0, 63.0, 65.0, 58.0, 40.0, 37.0, 31.0, 20.0, 11.0, 16.0, 12.0, 12.0, 11.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00012803077697753906, -0.00012416578829288483, -0.00012030079960823059, -0.00011643581092357635, -0.00011257082223892212, -0.00010870583355426788, -0.00010484084486961365, -0.00010097585618495941, -9.711086750030518e-05, -9.324587881565094e-05, -8.93808901309967e-05, -8.551590144634247e-05, -8.165091276168823e-05, -7.7785924077034e-05, -7.392093539237976e-05, -7.005594670772552e-05, -6.619095802307129e-05, -6.232596933841705e-05, -5.846098065376282e-05, -5.459599196910858e-05, -5.0731003284454346e-05, -4.686601459980011e-05, -4.3001025915145874e-05, -3.913603723049164e-05, -3.52710485458374e-05, -3.1406059861183167e-05, -2.754107117652893e-05, -2.3676082491874695e-05, -1.981109380722046e-05, -1.5946105122566223e-05, -1.2081116437911987e-05, -8.216127753257751e-06, -4.351139068603516e-06, -4.861503839492798e-07, 3.378838300704956e-06, 7.243826985359192e-06, 1.1108815670013428e-05, 1.4973804354667664e-05, 1.88387930393219e-05, 2.2703781723976135e-05, 2.656877040863037e-05, 3.0433759093284607e-05, 3.429874777793884e-05, 3.816373646259308e-05, 4.2028725147247314e-05, 4.589371383190155e-05, 4.9758702516555786e-05, 5.362369120121002e-05, 5.748867988586426e-05, 6.13536685705185e-05, 6.521865725517273e-05, 6.908364593982697e-05, 7.29486346244812e-05, 7.681362330913544e-05, 8.067861199378967e-05, 8.454360067844391e-05, 8.840858936309814e-05, 9.227357804775238e-05, 9.613856673240662e-05, 0.00010000355541706085, 0.00010386854410171509, 0.00010773353278636932, 0.00011159852147102356, 0.0001154635101556778, 0.00011932849884033203]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 10.0, 2.0, 12.0, 21.0, 19.0, 40.0, 54.0, 79.0, 149.0, 219.0, 318.0, 461.0, 722.0, 1123.0, 1677.0, 2627.0, 3964.0, 6226.0, 10091.0, 16042.0, 24854.0, 38696.0, 58694.0, 84546.0, 114105.0, 135892.0, 139371.0, 122483.0, 94801.0, 66630.0, 44517.0, 28696.0, 18535.0, 11836.0, 7564.0, 4783.0, 3043.0, 2018.0, 1249.0, 825.0, 515.0, 377.0, 206.0, 172.0, 96.0, 62.0, 48.0, 38.0, 19.0, 13.0, 9.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.025390625, -0.9935150146484375, -0.961639404296875, -0.9297637939453125, -0.89788818359375, -0.8660125732421875, -0.834136962890625, -0.8022613525390625, -0.7703857421875, -0.7385101318359375, -0.706634521484375, -0.6747589111328125, -0.64288330078125, -0.6110076904296875, -0.579132080078125, -0.5472564697265625, -0.515380859375, -0.4835052490234375, -0.451629638671875, -0.4197540283203125, -0.38787841796875, -0.3560028076171875, -0.324127197265625, -0.2922515869140625, -0.2603759765625, -0.2285003662109375, -0.196624755859375, -0.1647491455078125, -0.13287353515625, -0.1009979248046875, -0.069122314453125, -0.0372467041015625, -0.00537109375, 0.0265045166015625, 0.058380126953125, 0.0902557373046875, 0.12213134765625, 0.1540069580078125, 0.185882568359375, 0.2177581787109375, 0.2496337890625, 0.2815093994140625, 0.313385009765625, 0.3452606201171875, 0.37713623046875, 0.4090118408203125, 0.440887451171875, 0.4727630615234375, 0.504638671875, 0.5365142822265625, 0.568389892578125, 0.6002655029296875, 0.63214111328125, 0.6640167236328125, 0.695892333984375, 0.7277679443359375, 0.7596435546875, 0.7915191650390625, 0.823394775390625, 0.8552703857421875, 0.88714599609375, 0.9190216064453125, 0.950897216796875, 0.9827728271484375, 1.0146484375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 3.0, 8.0, 6.0, 12.0, 17.0, 12.0, 13.0, 17.0, 31.0, 31.0, 40.0, 35.0, 33.0, 48.0, 53.0, 54.0, 72.0, 65.0, 49.0, 53.0, 63.0, 31.0, 43.0, 39.0, 36.0, 24.0, 20.0, 20.0, 14.0, 11.0, 8.0, 10.0, 9.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5185546875, -0.5031967163085938, -0.4878387451171875, -0.47248077392578125, -0.457122802734375, -0.44176483154296875, -0.4264068603515625, -0.41104888916015625, -0.39569091796875, -0.38033294677734375, -0.3649749755859375, -0.34961700439453125, -0.334259033203125, -0.31890106201171875, -0.3035430908203125, -0.28818511962890625, -0.2728271484375, -0.25746917724609375, -0.2421112060546875, -0.22675323486328125, -0.211395263671875, -0.19603729248046875, -0.1806793212890625, -0.16532135009765625, -0.14996337890625, -0.13460540771484375, -0.1192474365234375, -0.10388946533203125, -0.088531494140625, -0.07317352294921875, -0.0578155517578125, -0.04245758056640625, -0.027099609375, -0.01174163818359375, 0.0036163330078125, 0.01897430419921875, 0.034332275390625, 0.04969024658203125, 0.0650482177734375, 0.08040618896484375, 0.09576416015625, 0.11112213134765625, 0.1264801025390625, 0.14183807373046875, 0.157196044921875, 0.17255401611328125, 0.1879119873046875, 0.20326995849609375, 0.2186279296875, 0.23398590087890625, 0.2493438720703125, 0.26470184326171875, 0.280059814453125, 0.29541778564453125, 0.3107757568359375, 0.32613372802734375, 0.34149169921875, 0.35684967041015625, 0.3722076416015625, 0.38756561279296875, 0.402923583984375, 0.41828155517578125, 0.4336395263671875, 0.44899749755859375, 0.46435546875]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 6.0, 4.0, 4.0, 6.0, 7.0, 13.0, 10.0, 22.0, 18.0, 28.0, 38.0, 35.0, 38.0, 46.0, 46.0, 59.0, 72.0, 71.0, 62.0, 59.0, 64.0, 53.0, 34.0, 29.0, 30.0, 24.0, 18.0, 21.0, 13.0, 14.0, 8.0, 8.0, 7.0, 7.0, 3.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.762283802032471, -4.5966644287109375, -4.4310455322265625, -4.265426158905029, -4.099806785583496, -3.934187650680542, -3.768568515777588, -3.6029491424560547, -3.4373300075531006, -3.2717108726501465, -3.1060914993286133, -2.940472364425659, -2.774853229522705, -2.609233856201172, -2.4436147212982178, -2.2779955863952637, -2.1123762130737305, -1.9467569589614868, -1.7811377048492432, -1.615518569946289, -1.4498993158340454, -1.2842800617218018, -1.1186609268188477, -0.953041672706604, -0.7874224185943604, -0.6218031644821167, -0.4561839699745178, -0.29056474566459656, -0.12494552135467529, 0.04067373275756836, 0.20629292726516724, 0.3719121217727661, 0.537531852722168, 0.7031511068344116, 0.8687703013420105, 1.0343894958496094, 1.200008749961853, 1.3656280040740967, 1.5312471389770508, 1.6968663930892944, 1.862485647201538, 2.028104782104492, 2.1937241554260254, 2.3593432903289795, 2.5249624252319336, 2.690581798553467, 2.856200933456421, 3.021820068359375, 3.187439441680908, 3.3530585765838623, 3.5186779499053955, 3.6842970848083496, 3.849916458129883, 4.015535354614258, 4.181154727935791, 4.346774101257324, 4.512392997741699, 4.678012371063232, 4.843631267547607, 5.009250640869141, 5.174870014190674, 5.340489387512207, 5.506108283996582, 5.671727657318115, 5.837347030639648]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 7.0, 8.0, 13.0, 11.0, 4.0, 14.0, 10.0, 18.0, 25.0, 22.0, 27.0, 22.0, 23.0, 21.0, 26.0, 34.0, 35.0, 39.0, 39.0, 40.0, 40.0, 49.0, 41.0, 44.0, 44.0, 41.0, 33.0, 31.0, 40.0, 34.0, 30.0, 13.0, 8.0, 16.0, 17.0, 15.0, 15.0, 11.0, 9.0, 8.0, 4.0, 4.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.872340202331543, -4.723668098449707, -4.574996471405029, -4.426324367523193, -4.277652740478516, -4.12898063659668, -3.980308771133423, -3.831636905670166, -3.682965040206909, -3.5342931747436523, -3.3856213092803955, -3.2369494438171387, -3.0882773399353027, -2.939605712890625, -2.790933609008789, -2.6422617435455322, -2.4935898780822754, -2.3449180126190186, -2.1962461471557617, -2.047574281692505, -1.8989022970199585, -1.7502304315567017, -1.6015584468841553, -1.4528865814208984, -1.3042147159576416, -1.1555428504943848, -1.006870985031128, -0.8581990003585815, -0.7095271348953247, -0.5608552694320679, -0.41218334436416626, -0.26351141929626465, -0.11483907699584961, 0.033832818269729614, 0.18250471353530884, 0.33117660880088806, 0.4798485040664673, 0.6285203695297241, 0.7771922945976257, 0.9258642196655273, 1.0745360851287842, 1.223207950592041, 1.3718798160552979, 1.5205518007278442, 1.669223666191101, 1.817895531654358, 1.9665675163269043, 2.115239381790161, 2.263911247253418, 2.412583112716675, 2.5612549781799316, 2.7099268436431885, 2.8585987091064453, 3.0072708129882812, 3.155942678451538, 3.304614543914795, 3.4532864093780518, 3.6019582748413086, 3.7506301403045654, 3.8993020057678223, 4.047974109649658, 4.196645736694336, 4.345317840576172, 4.493989944458008, 4.6426615715026855]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 3.0, 6.0, 12.0, 17.0, 17.0, 31.0, 56.0, 72.0, 96.0, 154.0, 239.0, 355.0, 546.0, 873.0, 1364.0, 2105.0, 3569.0, 6051.0, 10676.0, 19610.0, 37462.0, 74557.0, 154833.0, 326635.0, 646956.0, 977332.0, 894169.0, 524996.0, 259691.0, 124226.0, 60417.0, 30575.0, 16138.0, 8639.0, 4811.0, 2820.0, 1545.0, 989.0, 599.0, 395.0, 230.0, 151.0, 97.0, 52.0, 42.0, 27.0, 18.0, 13.0, 18.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.171875, -4.9925537109375, -4.813232421875, -4.6339111328125, -4.45458984375, -4.2752685546875, -4.095947265625, -3.9166259765625, -3.7373046875, -3.5579833984375, -3.378662109375, -3.1993408203125, -3.02001953125, -2.8406982421875, -2.661376953125, -2.4820556640625, -2.302734375, -2.1234130859375, -1.944091796875, -1.7647705078125, -1.58544921875, -1.4061279296875, -1.226806640625, -1.0474853515625, -0.8681640625, -0.6888427734375, -0.509521484375, -0.3302001953125, -0.15087890625, 0.0284423828125, 0.207763671875, 0.3870849609375, 0.56640625, 0.7457275390625, 0.925048828125, 1.1043701171875, 1.28369140625, 1.4630126953125, 1.642333984375, 1.8216552734375, 2.0009765625, 2.1802978515625, 2.359619140625, 2.5389404296875, 2.71826171875, 2.8975830078125, 3.076904296875, 3.2562255859375, 3.435546875, 3.6148681640625, 3.794189453125, 3.9735107421875, 4.15283203125, 4.3321533203125, 4.511474609375, 4.6907958984375, 4.8701171875, 5.0494384765625, 5.228759765625, 5.4080810546875, 5.58740234375, 5.7667236328125, 5.946044921875, 6.1253662109375, 6.3046875]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 4.0, 0.0, 4.0, 5.0, 7.0, 9.0, 9.0, 10.0, 16.0, 10.0, 17.0, 11.0, 26.0, 26.0, 29.0, 23.0, 26.0, 35.0, 36.0, 42.0, 35.0, 50.0, 36.0, 47.0, 44.0, 47.0, 46.0, 40.0, 41.0, 51.0, 36.0, 29.0, 22.0, 18.0, 18.0, 13.0, 15.0, 12.0, 19.0, 11.0, 10.0, 2.0, 7.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.14453125, -4.020751953125, -3.89697265625, -3.773193359375, -3.6494140625, -3.525634765625, -3.40185546875, -3.278076171875, -3.154296875, -3.030517578125, -2.90673828125, -2.782958984375, -2.6591796875, -2.535400390625, -2.41162109375, -2.287841796875, -2.1640625, -2.040283203125, -1.91650390625, -1.792724609375, -1.6689453125, -1.545166015625, -1.42138671875, -1.297607421875, -1.173828125, -1.050048828125, -0.92626953125, -0.802490234375, -0.6787109375, -0.554931640625, -0.43115234375, -0.307373046875, -0.18359375, -0.059814453125, 0.06396484375, 0.187744140625, 0.3115234375, 0.435302734375, 0.55908203125, 0.682861328125, 0.806640625, 0.930419921875, 1.05419921875, 1.177978515625, 1.3017578125, 1.425537109375, 1.54931640625, 1.673095703125, 1.796875, 1.920654296875, 2.04443359375, 2.168212890625, 2.2919921875, 2.415771484375, 2.53955078125, 2.663330078125, 2.787109375, 2.910888671875, 3.03466796875, 3.158447265625, 3.2822265625, 3.406005859375, 3.52978515625, 3.653564453125, 3.77734375]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 6.0, 6.0, 9.0, 9.0, 21.0, 41.0, 69.0, 95.0, 165.0, 250.0, 381.0, 723.0, 1127.0, 2076.0, 3664.0, 6769.0, 12848.0, 25283.0, 51653.0, 105788.0, 216566.0, 424919.0, 723908.0, 914866.0, 765454.0, 463975.0, 240316.0, 117330.0, 56919.0, 28010.0, 14079.0, 7402.0, 4025.0, 2263.0, 1298.0, 728.0, 468.0, 284.0, 174.0, 106.0, 84.0, 43.0, 31.0, 25.0, 10.0, 11.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.05078125, -5.859130859375, -5.66748046875, -5.475830078125, -5.2841796875, -5.092529296875, -4.90087890625, -4.709228515625, -4.517578125, -4.325927734375, -4.13427734375, -3.942626953125, -3.7509765625, -3.559326171875, -3.36767578125, -3.176025390625, -2.984375, -2.792724609375, -2.60107421875, -2.409423828125, -2.2177734375, -2.026123046875, -1.83447265625, -1.642822265625, -1.451171875, -1.259521484375, -1.06787109375, -0.876220703125, -0.6845703125, -0.492919921875, -0.30126953125, -0.109619140625, 0.08203125, 0.273681640625, 0.46533203125, 0.656982421875, 0.8486328125, 1.040283203125, 1.23193359375, 1.423583984375, 1.615234375, 1.806884765625, 1.99853515625, 2.190185546875, 2.3818359375, 2.573486328125, 2.76513671875, 2.956787109375, 3.1484375, 3.340087890625, 3.53173828125, 3.723388671875, 3.9150390625, 4.106689453125, 4.29833984375, 4.489990234375, 4.681640625, 4.873291015625, 5.06494140625, 5.256591796875, 5.4482421875, 5.639892578125, 5.83154296875, 6.023193359375, 6.21484375]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 7.0, 12.0, 6.0, 26.0, 27.0, 19.0, 50.0, 47.0, 60.0, 92.0, 90.0, 112.0, 144.0, 173.0, 179.0, 222.0, 245.0, 266.0, 246.0, 266.0, 228.0, 220.0, 221.0, 194.0, 173.0, 139.0, 123.0, 108.0, 80.0, 60.0, 42.0, 35.0, 34.0, 20.0, 25.0, 19.0, 13.0, 10.0, 14.0, 4.0, 8.0, 1.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7255859375, -1.6573333740234375, -1.589080810546875, -1.5208282470703125, -1.45257568359375, -1.3843231201171875, -1.316070556640625, -1.2478179931640625, -1.1795654296875, -1.1113128662109375, -1.043060302734375, -0.9748077392578125, -0.90655517578125, -0.8383026123046875, -0.770050048828125, -0.7017974853515625, -0.633544921875, -0.5652923583984375, -0.497039794921875, -0.4287872314453125, -0.36053466796875, -0.2922821044921875, -0.224029541015625, -0.1557769775390625, -0.0875244140625, -0.0192718505859375, 0.048980712890625, 0.1172332763671875, 0.18548583984375, 0.2537384033203125, 0.321990966796875, 0.3902435302734375, 0.45849609375, 0.5267486572265625, 0.595001220703125, 0.6632537841796875, 0.73150634765625, 0.7997589111328125, 0.868011474609375, 0.9362640380859375, 1.0045166015625, 1.0727691650390625, 1.141021728515625, 1.2092742919921875, 1.27752685546875, 1.3457794189453125, 1.414031982421875, 1.4822845458984375, 1.550537109375, 1.6187896728515625, 1.687042236328125, 1.7552947998046875, 1.82354736328125, 1.8917999267578125, 1.960052490234375, 2.0283050537109375, 2.0965576171875, 2.1648101806640625, 2.233062744140625, 2.3013153076171875, 2.36956787109375, 2.4378204345703125, 2.506072998046875, 2.5743255615234375, 2.642578125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 6.0, 10.0, 5.0, 11.0, 13.0, 18.0, 15.0, 26.0, 21.0, 27.0, 40.0, 39.0, 43.0, 45.0, 45.0, 60.0, 65.0, 47.0, 49.0, 63.0, 42.0, 47.0, 33.0, 33.0, 24.0, 27.0, 31.0, 23.0, 12.0, 12.0, 10.0, 11.0, 3.0, 7.0, 5.0, 7.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.226681709289551, -5.05424690246582, -4.881811618804932, -4.709376811981201, -4.5369415283203125, -4.364506721496582, -4.192071914672852, -4.019637107849121, -3.8472018241882324, -3.674766778945923, -3.5023317337036133, -3.329896926879883, -3.1574618816375732, -2.9850268363952637, -2.812592029571533, -2.6401569843292236, -2.467721939086914, -2.2952868938446045, -2.122851848602295, -1.9504170417785645, -1.7779819965362549, -1.6055469512939453, -1.4331120252609253, -1.2606770992279053, -1.0882420539855957, -0.9158070683479309, -0.7433720827102661, -0.5709370970726013, -0.3985021114349365, -0.22606712579727173, -0.053632140159606934, 0.11880278587341309, 0.29123783111572266, 0.46367281675338745, 0.6361078023910522, 0.808542788028717, 0.9809777736663818, 1.1534128189086914, 1.3258477449417114, 1.4982826709747314, 1.670717716217041, 1.8431527614593506, 2.01558780670166, 2.1880226135253906, 2.3604576587677, 2.5328927040100098, 2.7053275108337402, 2.87776255607605, 3.0501976013183594, 3.222632646560669, 3.3950676918029785, 3.567502498626709, 3.7399375438690186, 3.912372589111328, 4.084807395935059, 4.257242202758789, 4.429677486419678, 4.602112293243408, 4.774547576904297, 4.946982383728027, 5.119417190551758, 5.2918524742126465, 5.464287281036377, 5.636722564697266, 5.809157371520996]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 3.0, 10.0, 9.0, 6.0, 9.0, 11.0, 13.0, 19.0, 26.0, 21.0, 24.0, 34.0, 31.0, 30.0, 34.0, 40.0, 49.0, 42.0, 60.0, 39.0, 37.0, 49.0, 37.0, 43.0, 40.0, 34.0, 35.0, 36.0, 36.0, 17.0, 21.0, 18.0, 15.0, 13.0, 12.0, 12.0, 11.0, 7.0, 4.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.471259593963623, -6.283953666687012, -6.0966477394104, -5.909341812133789, -5.7220354080200195, -5.534729480743408, -5.347423553466797, -5.1601176261901855, -4.972811698913574, -4.785505771636963, -4.598199844360352, -4.41089391708374, -4.223587989807129, -4.036281585693359, -3.848975658416748, -3.6616697311401367, -3.4743638038635254, -3.287057876586914, -3.0997519493103027, -2.9124457836151123, -2.725139856338501, -2.5378339290618896, -2.350527763366699, -2.163221836090088, -1.9759159088134766, -1.7886099815368652, -1.6013039350509644, -1.4139978885650635, -1.2266919612884521, -1.0393860340118408, -0.8520799875259399, -0.6647739410400391, -0.47746849060058594, -0.29016250371932983, -0.10285651683807373, 0.08444947004318237, 0.2717554569244385, 0.4590614438056946, 0.6463674306869507, 0.8336734771728516, 1.020979404449463, 1.2082853317260742, 1.395591378211975, 1.582897424697876, 1.7702033519744873, 1.9575092792510986, 2.144815444946289, 2.3321213722229004, 2.5194272994995117, 2.706733226776123, 2.8940391540527344, 3.081345319747925, 3.268651247024536, 3.4559571743011475, 3.643263339996338, 3.830569267272949, 4.0178751945495605, 4.205181121826172, 4.392487049102783, 4.5797929763793945, 4.767099380493164, 4.954405307769775, 5.141711235046387, 5.329017162322998, 5.516323089599609]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 14.0, 11.0, 39.0, 52.0, 69.0, 102.0, 150.0, 247.0, 327.0, 529.0, 813.0, 1189.0, 1779.0, 2712.0, 4280.0, 6799.0, 10790.0, 18054.0, 30635.0, 56594.0, 113509.0, 231167.0, 268780.0, 139345.0, 68573.0, 36719.0, 20993.0, 12514.0, 7565.0, 4980.0, 3055.0, 2111.0, 1328.0, 910.0, 545.0, 433.0, 265.0, 194.0, 121.0, 90.0, 48.0, 35.0, 30.0, 16.0, 14.0, 3.0, 4.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.7236328125, -1.671630859375, -1.61962890625, -1.567626953125, -1.515625, -1.463623046875, -1.41162109375, -1.359619140625, -1.3076171875, -1.255615234375, -1.20361328125, -1.151611328125, -1.099609375, -1.047607421875, -0.99560546875, -0.943603515625, -0.8916015625, -0.839599609375, -0.78759765625, -0.735595703125, -0.68359375, -0.631591796875, -0.57958984375, -0.527587890625, -0.4755859375, -0.423583984375, -0.37158203125, -0.319580078125, -0.267578125, -0.215576171875, -0.16357421875, -0.111572265625, -0.0595703125, -0.007568359375, 0.04443359375, 0.096435546875, 0.1484375, 0.200439453125, 0.25244140625, 0.304443359375, 0.3564453125, 0.408447265625, 0.46044921875, 0.512451171875, 0.564453125, 0.616455078125, 0.66845703125, 0.720458984375, 0.7724609375, 0.824462890625, 0.87646484375, 0.928466796875, 0.98046875, 1.032470703125, 1.08447265625, 1.136474609375, 1.1884765625, 1.240478515625, 1.29248046875, 1.344482421875, 1.396484375, 1.448486328125, 1.50048828125, 1.552490234375, 1.6044921875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 8.0, 2.0, 1.0, 9.0, 8.0, 11.0, 11.0, 15.0, 24.0, 14.0, 19.0, 19.0, 24.0, 27.0, 38.0, 36.0, 33.0, 44.0, 47.0, 44.0, 53.0, 47.0, 54.0, 43.0, 41.0, 34.0, 42.0, 38.0, 41.0, 21.0, 27.0, 23.0, 26.0, 18.0, 9.0, 19.0, 10.0, 7.0, 8.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.30859375, -7.1116943359375, -6.914794921875, -6.7178955078125, -6.52099609375, -6.3240966796875, -6.127197265625, -5.9302978515625, -5.7333984375, -5.5364990234375, -5.339599609375, -5.1427001953125, -4.94580078125, -4.7489013671875, -4.552001953125, -4.3551025390625, -4.158203125, -3.9613037109375, -3.764404296875, -3.5675048828125, -3.37060546875, -3.1737060546875, -2.976806640625, -2.7799072265625, -2.5830078125, -2.3861083984375, -2.189208984375, -1.9923095703125, -1.79541015625, -1.5985107421875, -1.401611328125, -1.2047119140625, -1.0078125, -0.8109130859375, -0.614013671875, -0.4171142578125, -0.22021484375, -0.0233154296875, 0.173583984375, 0.3704833984375, 0.5673828125, 0.7642822265625, 0.961181640625, 1.1580810546875, 1.35498046875, 1.5518798828125, 1.748779296875, 1.9456787109375, 2.142578125, 2.3394775390625, 2.536376953125, 2.7332763671875, 2.93017578125, 3.1270751953125, 3.323974609375, 3.5208740234375, 3.7177734375, 3.9146728515625, 4.111572265625, 4.3084716796875, 4.50537109375, 4.7022705078125, 4.899169921875, 5.0960693359375, 5.29296875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 11.0, 8.0, 8.0, 6.0, 12.0, 10.0, 13.0, 21.0, 22.0, 36.0, 46.0, 62.0, 76.0, 85.0, 125.0, 162.0, 177.0, 247.0, 374.0, 543.0, 779.0, 1104.0, 1920.0, 3564.0, 7424.0, 17553.0, 50925.0, 901673.0, 34700.0, 13074.0, 5807.0, 2840.0, 1650.0, 1017.0, 638.0, 459.0, 352.0, 225.0, 164.0, 153.0, 107.0, 84.0, 68.0, 42.0, 42.0, 30.0, 23.0, 31.0, 13.0, 12.0, 8.0, 7.0, 9.0, 9.0, 3.0, 4.0, 3.0, 5.0], "bins": [-4.41796875, -4.28546142578125, -4.1529541015625, -4.02044677734375, -3.887939453125, -3.75543212890625, -3.6229248046875, -3.49041748046875, -3.35791015625, -3.22540283203125, -3.0928955078125, -2.96038818359375, -2.827880859375, -2.69537353515625, -2.5628662109375, -2.43035888671875, -2.2978515625, -2.16534423828125, -2.0328369140625, -1.90032958984375, -1.767822265625, -1.63531494140625, -1.5028076171875, -1.37030029296875, -1.23779296875, -1.10528564453125, -0.9727783203125, -0.84027099609375, -0.707763671875, -0.57525634765625, -0.4427490234375, -0.31024169921875, -0.177734375, -0.04522705078125, 0.0872802734375, 0.21978759765625, 0.352294921875, 0.48480224609375, 0.6173095703125, 0.74981689453125, 0.88232421875, 1.01483154296875, 1.1473388671875, 1.27984619140625, 1.412353515625, 1.54486083984375, 1.6773681640625, 1.80987548828125, 1.9423828125, 2.07489013671875, 2.2073974609375, 2.33990478515625, 2.472412109375, 2.60491943359375, 2.7374267578125, 2.86993408203125, 3.00244140625, 3.13494873046875, 3.2674560546875, 3.39996337890625, 3.532470703125, 3.66497802734375, 3.7974853515625, 3.92999267578125, 4.0625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 9.0, 6.0, 9.0, 7.0, 8.0, 10.0, 16.0, 21.0, 28.0, 25.0, 25.0, 32.0, 26.0, 33.0, 37.0, 39.0, 32.0, 40.0, 47.0, 46.0, 39.0, 34.0, 48.0, 31.0, 45.0, 40.0, 27.0, 28.0, 30.0, 28.0, 16.0, 16.0, 27.0, 13.0, 14.0, 13.0, 8.0, 3.0, 8.0, 5.0, 6.0, 8.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-3.7265625, -3.614501953125, -3.50244140625, -3.390380859375, -3.2783203125, -3.166259765625, -3.05419921875, -2.942138671875, -2.830078125, -2.718017578125, -2.60595703125, -2.493896484375, -2.3818359375, -2.269775390625, -2.15771484375, -2.045654296875, -1.93359375, -1.821533203125, -1.70947265625, -1.597412109375, -1.4853515625, -1.373291015625, -1.26123046875, -1.149169921875, -1.037109375, -0.925048828125, -0.81298828125, -0.700927734375, -0.5888671875, -0.476806640625, -0.36474609375, -0.252685546875, -0.140625, -0.028564453125, 0.08349609375, 0.195556640625, 0.3076171875, 0.419677734375, 0.53173828125, 0.643798828125, 0.755859375, 0.867919921875, 0.97998046875, 1.092041015625, 1.2041015625, 1.316162109375, 1.42822265625, 1.540283203125, 1.65234375, 1.764404296875, 1.87646484375, 1.988525390625, 2.1005859375, 2.212646484375, 2.32470703125, 2.436767578125, 2.548828125, 2.660888671875, 2.77294921875, 2.885009765625, 2.9970703125, 3.109130859375, 3.22119140625, 3.333251953125, 3.4453125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 12.0, 14.0, 12.0, 24.0, 40.0, 44.0, 93.0, 108.0, 179.0, 300.0, 521.0, 1043.0, 2040.0, 5032.0, 15738.0, 899022.0, 100939.0, 14487.0, 4650.0, 1947.0, 937.0, 540.0, 310.0, 172.0, 112.0, 64.0, 51.0, 37.0, 24.0, 20.0, 12.0, 5.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40625, -0.39269256591796875, -0.3791351318359375, -0.36557769775390625, -0.352020263671875, -0.33846282958984375, -0.3249053955078125, -0.31134796142578125, -0.29779052734375, -0.28423309326171875, -0.2706756591796875, -0.25711822509765625, -0.243560791015625, -0.23000335693359375, -0.2164459228515625, -0.20288848876953125, -0.1893310546875, -0.17577362060546875, -0.1622161865234375, -0.14865875244140625, -0.135101318359375, -0.12154388427734375, -0.1079864501953125, -0.09442901611328125, -0.08087158203125, -0.06731414794921875, -0.0537567138671875, -0.04019927978515625, -0.026641845703125, -0.01308441162109375, 0.0004730224609375, 0.01403045654296875, 0.027587890625, 0.04114532470703125, 0.0547027587890625, 0.06826019287109375, 0.081817626953125, 0.09537506103515625, 0.1089324951171875, 0.12248992919921875, 0.13604736328125, 0.14960479736328125, 0.1631622314453125, 0.17671966552734375, 0.190277099609375, 0.20383453369140625, 0.2173919677734375, 0.23094940185546875, 0.2445068359375, 0.25806427001953125, 0.2716217041015625, 0.28517913818359375, 0.298736572265625, 0.31229400634765625, 0.3258514404296875, 0.33940887451171875, 0.35296630859375, 0.36652374267578125, 0.3800811767578125, 0.39363861083984375, 0.407196044921875, 0.42075347900390625, 0.4343109130859375, 0.44786834716796875, 0.46142578125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 2.0, 4.0, 6.0, 5.0, 10.0, 9.0, 9.0, 16.0, 13.0, 28.0, 21.0, 48.0, 38.0, 34.0, 50.0, 59.0, 55.0, 51.0, 47.0, 46.0, 53.0, 45.0, 38.0, 41.0, 43.0, 34.0, 32.0, 27.0, 20.0, 12.0, 22.0, 19.0, 8.0, 11.0, 14.0, 6.0, 4.0, 5.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.844499588012695e-05, -3.7321820855140686e-05, -3.619864583015442e-05, -3.507547080516815e-05, -3.3952295780181885e-05, -3.282912075519562e-05, -3.170594573020935e-05, -3.0582770705223083e-05, -2.9459595680236816e-05, -2.833642065525055e-05, -2.7213245630264282e-05, -2.6090070605278015e-05, -2.4966895580291748e-05, -2.384372055530548e-05, -2.2720545530319214e-05, -2.1597370505332947e-05, -2.047419548034668e-05, -1.9351020455360413e-05, -1.8227845430374146e-05, -1.710467040538788e-05, -1.598149538040161e-05, -1.4858320355415344e-05, -1.3735145330429077e-05, -1.261197030544281e-05, -1.1488795280456543e-05, -1.0365620255470276e-05, -9.242445230484009e-06, -8.119270205497742e-06, -6.996095180511475e-06, -5.8729201555252075e-06, -4.7497451305389404e-06, -3.6265701055526733e-06, -2.5033950805664062e-06, -1.3802200555801392e-06, -2.5704503059387207e-07, 8.66129994392395e-07, 1.989305019378662e-06, 3.112480044364929e-06, 4.235655069351196e-06, 5.358830094337463e-06, 6.4820051193237305e-06, 7.6051801443099976e-06, 8.728355169296265e-06, 9.851530194282532e-06, 1.0974705219268799e-05, 1.2097880244255066e-05, 1.3221055269241333e-05, 1.43442302942276e-05, 1.5467405319213867e-05, 1.6590580344200134e-05, 1.77137553691864e-05, 1.883693039417267e-05, 1.9960105419158936e-05, 2.1083280444145203e-05, 2.220645546913147e-05, 2.3329630494117737e-05, 2.4452805519104004e-05, 2.557598054409027e-05, 2.6699155569076538e-05, 2.7822330594062805e-05, 2.8945505619049072e-05, 3.006868064403534e-05, 3.1191855669021606e-05, 3.2315030694007874e-05, 3.343820571899414e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 11.0, 11.0, 21.0, 26.0, 37.0, 41.0, 69.0, 88.0, 164.0, 249.0, 349.0, 614.0, 921.0, 1516.0, 2693.0, 4766.0, 8619.0, 16370.0, 32713.0, 70501.0, 183938.0, 401025.0, 184120.0, 70471.0, 32466.0, 16421.0, 8746.0, 4712.0, 2687.0, 1544.0, 984.0, 554.0, 357.0, 243.0, 175.0, 103.0, 68.0, 49.0, 29.0, 32.0, 12.0, 7.0, 10.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.160888671875, -0.15608596801757812, -0.15128326416015625, -0.14648056030273438, -0.1416778564453125, -0.13687515258789062, -0.13207244873046875, -0.12726974487304688, -0.122467041015625, -0.11766433715820312, -0.11286163330078125, -0.10805892944335938, -0.1032562255859375, -0.09845352172851562, -0.09365081787109375, -0.08884811401367188, -0.08404541015625, -0.07924270629882812, -0.07444000244140625, -0.06963729858398438, -0.0648345947265625, -0.060031890869140625, -0.05522918701171875, -0.050426483154296875, -0.045623779296875, -0.040821075439453125, -0.03601837158203125, -0.031215667724609375, -0.0264129638671875, -0.021610260009765625, -0.01680755615234375, -0.012004852294921875, -0.0072021484375, -0.002399444580078125, 0.00240325927734375, 0.007205963134765625, 0.0120086669921875, 0.016811370849609375, 0.02161407470703125, 0.026416778564453125, 0.031219482421875, 0.036022186279296875, 0.04082489013671875, 0.045627593994140625, 0.0504302978515625, 0.055233001708984375, 0.06003570556640625, 0.06483840942382812, 0.06964111328125, 0.07444381713867188, 0.07924652099609375, 0.08404922485351562, 0.0888519287109375, 0.09365463256835938, 0.09845733642578125, 0.10326004028320312, 0.108062744140625, 0.11286544799804688, 0.11766815185546875, 0.12247085571289062, 0.1272735595703125, 0.13207626342773438, 0.13687896728515625, 0.14168167114257812, 0.146484375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 2.0, 3.0, 2.0, 7.0, 12.0, 19.0, 26.0, 37.0, 43.0, 82.0, 89.0, 145.0, 143.0, 119.0, 83.0, 56.0, 27.0, 28.0, 23.0, 17.0, 6.0, 2.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047149658203125, -0.0452113151550293, -0.043272972106933594, -0.04133462905883789, -0.03939628601074219, -0.037457942962646484, -0.03551959991455078, -0.03358125686645508, -0.031642913818359375, -0.029704570770263672, -0.02776622772216797, -0.025827884674072266, -0.023889541625976562, -0.02195119857788086, -0.020012855529785156, -0.018074512481689453, -0.01613616943359375, -0.014197826385498047, -0.012259483337402344, -0.01032114028930664, -0.008382797241210938, -0.006444454193115234, -0.004506111145019531, -0.002567768096923828, -0.000629425048828125, 0.0013089179992675781, 0.0032472610473632812, 0.005185604095458984, 0.0071239471435546875, 0.00906229019165039, 0.011000633239746094, 0.012938976287841797, 0.0148773193359375, 0.016815662384033203, 0.018754005432128906, 0.02069234848022461, 0.022630691528320312, 0.024569034576416016, 0.02650737762451172, 0.028445720672607422, 0.030384063720703125, 0.03232240676879883, 0.03426074981689453, 0.036199092864990234, 0.03813743591308594, 0.04007577896118164, 0.042014122009277344, 0.04395246505737305, 0.04589080810546875, 0.04782915115356445, 0.049767494201660156, 0.05170583724975586, 0.05364418029785156, 0.055582523345947266, 0.05752086639404297, 0.05945920944213867, 0.061397552490234375, 0.06333589553833008, 0.06527423858642578, 0.06721258163452148, 0.06915092468261719, 0.07108926773071289, 0.0730276107788086, 0.0749659538269043, 0.076904296875]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 0.0, 4.0, 2.0, 4.0, 5.0, 7.0, 10.0, 8.0, 12.0, 15.0, 17.0, 19.0, 31.0, 23.0, 40.0, 36.0, 41.0, 38.0, 48.0, 60.0, 52.0, 57.0, 63.0, 47.0, 53.0, 51.0, 32.0, 29.0, 33.0, 23.0, 27.0, 25.0, 19.0, 8.0, 9.0, 11.0, 7.0, 6.0, 7.0, 5.0, 2.0, 3.0, 0.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.286056995391846, -5.1129350662231445, -4.939813137054443, -4.766691207885742, -4.593569278717041, -4.42044734954834, -4.247325897216797, -4.074203968048096, -3.9010820388793945, -3.7279601097106934, -3.554838180541992, -3.381716251373291, -3.208594560623169, -3.0354726314544678, -2.8623507022857666, -2.6892290115356445, -2.5161068439483643, -2.342984914779663, -2.169862985610962, -1.9967411756515503, -1.8236193656921387, -1.6504974365234375, -1.4773755073547363, -1.3042536973953247, -1.1311317682266235, -0.9580098986625671, -0.7848880290985107, -0.6117660999298096, -0.4386442303657532, -0.2655223608016968, -0.0924004316329956, 0.08072137832641602, 0.2538433074951172, 0.4269651770591736, 0.60008704662323, 0.7732089757919312, 0.9463308453559875, 1.119452714920044, 1.2925746440887451, 1.4656964540481567, 1.638818383216858, 1.811940312385559, 1.9850621223449707, 2.158184051513672, 2.331305980682373, 2.504427909851074, 2.6775498390197754, 2.8506715297698975, 3.0237934589385986, 3.1969153881073, 3.370037317276001, 3.543159008026123, 3.716280937194824, 3.8894028663635254, 4.062524795532227, 4.235646724700928, 4.408768653869629, 4.58189058303833, 4.755012512207031, 4.928134441375732, 5.101256370544434, 5.274377822875977, 5.447500228881836, 5.620621681213379, 5.79374361038208]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 8.0, 9.0, 6.0, 8.0, 12.0, 13.0, 17.0, 28.0, 20.0, 25.0, 34.0, 33.0, 29.0, 32.0, 41.0, 48.0, 41.0, 61.0, 40.0, 40.0, 45.0, 39.0, 42.0, 41.0, 33.0, 35.0, 36.0, 36.0, 17.0, 23.0, 16.0, 15.0, 12.0, 14.0, 13.0, 9.0, 7.0, 4.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.474457263946533, -6.287167072296143, -6.099876403808594, -5.912586212158203, -5.7252960205078125, -5.538005828857422, -5.350715637207031, -5.163424968719482, -4.976134777069092, -4.788844585418701, -4.601553916931152, -4.414263725280762, -4.226973533630371, -4.0396833419799805, -3.8523929119110107, -3.665102481842041, -3.4778122901916504, -3.2905220985412598, -3.10323166847229, -2.9159412384033203, -2.7286510467529297, -2.541360855102539, -2.3540704250335693, -2.1667799949645996, -1.979489803314209, -1.7921994924545288, -1.6049091815948486, -1.4176188707351685, -1.2303285598754883, -1.043038249015808, -0.8557479381561279, -0.6684576272964478, -0.4811677932739258, -0.2938774824142456, -0.10658717155456543, 0.08070313930511475, 0.2679934501647949, 0.4552837610244751, 0.6425740718841553, 0.8298643827438354, 1.0171546936035156, 1.2044450044631958, 1.391735315322876, 1.5790256261825562, 1.7663159370422363, 1.9536062479019165, 2.1408965587615967, 2.3281869888305664, 2.515477180480957, 2.7027673721313477, 2.8900578022003174, 3.077348232269287, 3.2646384239196777, 3.4519286155700684, 3.639219045639038, 3.826509475708008, 4.013799667358398, 4.201089859008789, 4.38838005065918, 4.5756707191467285, 4.762960910797119, 4.95025110244751, 5.137541770935059, 5.324831962585449, 5.51212215423584]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 4.0, 3.0, 4.0, 8.0, 14.0, 25.0, 29.0, 33.0, 63.0, 99.0, 105.0, 223.0, 339.0, 559.0, 893.0, 1394.0, 2333.0, 3849.0, 6672.0, 11679.0, 20114.0, 34491.0, 60272.0, 101394.0, 154619.0, 187609.0, 170407.0, 119257.0, 72472.0, 41721.0, 23868.0, 13848.0, 8150.0, 4778.0, 2803.0, 1678.0, 983.0, 653.0, 366.0, 248.0, 172.0, 106.0, 58.0, 56.0, 36.0, 24.0, 14.0, 16.0, 9.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 4.0], "bins": [-4.765625, -4.62408447265625, -4.4825439453125, -4.34100341796875, -4.199462890625, -4.05792236328125, -3.9163818359375, -3.77484130859375, -3.63330078125, -3.49176025390625, -3.3502197265625, -3.20867919921875, -3.067138671875, -2.92559814453125, -2.7840576171875, -2.64251708984375, -2.5009765625, -2.35943603515625, -2.2178955078125, -2.07635498046875, -1.934814453125, -1.79327392578125, -1.6517333984375, -1.51019287109375, -1.36865234375, -1.22711181640625, -1.0855712890625, -0.94403076171875, -0.802490234375, -0.66094970703125, -0.5194091796875, -0.37786865234375, -0.236328125, -0.09478759765625, 0.0467529296875, 0.18829345703125, 0.329833984375, 0.47137451171875, 0.6129150390625, 0.75445556640625, 0.89599609375, 1.03753662109375, 1.1790771484375, 1.32061767578125, 1.462158203125, 1.60369873046875, 1.7452392578125, 1.88677978515625, 2.0283203125, 2.16986083984375, 2.3114013671875, 2.45294189453125, 2.594482421875, 2.73602294921875, 2.8775634765625, 3.01910400390625, 3.16064453125, 3.30218505859375, 3.4437255859375, 3.58526611328125, 3.726806640625, 3.86834716796875, 4.0098876953125, 4.15142822265625, 4.29296875]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 8.0, 4.0, 4.0, 10.0, 12.0, 14.0, 16.0, 25.0, 23.0, 32.0, 39.0, 31.0, 38.0, 37.0, 46.0, 48.0, 66.0, 60.0, 50.0, 59.0, 41.0, 51.0, 39.0, 47.0, 28.0, 43.0, 22.0, 17.0, 13.0, 21.0, 14.0, 16.0, 9.0, 6.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.32421875, -6.10333251953125, -5.8824462890625, -5.66156005859375, -5.440673828125, -5.21978759765625, -4.9989013671875, -4.77801513671875, -4.55712890625, -4.33624267578125, -4.1153564453125, -3.89447021484375, -3.673583984375, -3.45269775390625, -3.2318115234375, -3.01092529296875, -2.7900390625, -2.56915283203125, -2.3482666015625, -2.12738037109375, -1.906494140625, -1.68560791015625, -1.4647216796875, -1.24383544921875, -1.02294921875, -0.80206298828125, -0.5811767578125, -0.36029052734375, -0.139404296875, 0.08148193359375, 0.3023681640625, 0.52325439453125, 0.744140625, 0.96502685546875, 1.1859130859375, 1.40679931640625, 1.627685546875, 1.84857177734375, 2.0694580078125, 2.29034423828125, 2.51123046875, 2.73211669921875, 2.9530029296875, 3.17388916015625, 3.394775390625, 3.61566162109375, 3.8365478515625, 4.05743408203125, 4.2783203125, 4.49920654296875, 4.7200927734375, 4.94097900390625, 5.161865234375, 5.38275146484375, 5.6036376953125, 5.82452392578125, 6.04541015625, 6.26629638671875, 6.4871826171875, 6.70806884765625, 6.928955078125, 7.14984130859375, 7.3707275390625, 7.59161376953125, 7.8125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 11.0, 7.0, 9.0, 12.0, 22.0, 32.0, 62.0, 82.0, 135.0, 198.0, 289.0, 459.0, 676.0, 1046.0, 1661.0, 2550.0, 4047.0, 6349.0, 9965.0, 16191.0, 25937.0, 43199.0, 69250.0, 106732.0, 146684.0, 164754.0, 148422.0, 110615.0, 71637.0, 45160.0, 27090.0, 16701.0, 10439.0, 6520.0, 4146.0, 2624.0, 1707.0, 1145.0, 675.0, 444.0, 332.0, 184.0, 113.0, 98.0, 44.0, 41.0, 27.0, 17.0, 13.0, 7.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.900390625, -3.772674560546875, -3.64495849609375, -3.517242431640625, -3.3895263671875, -3.261810302734375, -3.13409423828125, -3.006378173828125, -2.878662109375, -2.750946044921875, -2.62322998046875, -2.495513916015625, -2.3677978515625, -2.240081787109375, -2.11236572265625, -1.984649658203125, -1.85693359375, -1.729217529296875, -1.60150146484375, -1.473785400390625, -1.3460693359375, -1.218353271484375, -1.09063720703125, -0.962921142578125, -0.835205078125, -0.707489013671875, -0.57977294921875, -0.452056884765625, -0.3243408203125, -0.196624755859375, -0.06890869140625, 0.058807373046875, 0.1865234375, 0.314239501953125, 0.44195556640625, 0.569671630859375, 0.6973876953125, 0.825103759765625, 0.95281982421875, 1.080535888671875, 1.208251953125, 1.335968017578125, 1.46368408203125, 1.591400146484375, 1.7191162109375, 1.846832275390625, 1.97454833984375, 2.102264404296875, 2.22998046875, 2.357696533203125, 2.48541259765625, 2.613128662109375, 2.7408447265625, 2.868560791015625, 2.99627685546875, 3.123992919921875, 3.251708984375, 3.379425048828125, 3.50714111328125, 3.634857177734375, 3.7625732421875, 3.890289306640625, 4.01800537109375, 4.145721435546875, 4.2734375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 2.0, 6.0, 5.0, 11.0, 6.0, 12.0, 10.0, 16.0, 11.0, 11.0, 12.0, 17.0, 26.0, 28.0, 18.0, 27.0, 47.0, 37.0, 28.0, 52.0, 39.0, 48.0, 39.0, 38.0, 38.0, 42.0, 45.0, 33.0, 31.0, 29.0, 35.0, 29.0, 21.0, 26.0, 14.0, 18.0, 20.0, 14.0, 9.0, 9.0, 14.0, 7.0, 5.0, 6.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.34765625, -3.244140625, -3.140625, -3.037109375, -2.93359375, -2.830078125, -2.7265625, -2.623046875, -2.51953125, -2.416015625, -2.3125, -2.208984375, -2.10546875, -2.001953125, -1.8984375, -1.794921875, -1.69140625, -1.587890625, -1.484375, -1.380859375, -1.27734375, -1.173828125, -1.0703125, -0.966796875, -0.86328125, -0.759765625, -0.65625, -0.552734375, -0.44921875, -0.345703125, -0.2421875, -0.138671875, -0.03515625, 0.068359375, 0.171875, 0.275390625, 0.37890625, 0.482421875, 0.5859375, 0.689453125, 0.79296875, 0.896484375, 1.0, 1.103515625, 1.20703125, 1.310546875, 1.4140625, 1.517578125, 1.62109375, 1.724609375, 1.828125, 1.931640625, 2.03515625, 2.138671875, 2.2421875, 2.345703125, 2.44921875, 2.552734375, 2.65625, 2.759765625, 2.86328125, 2.966796875, 3.0703125, 3.173828125, 3.27734375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 7.0, 5.0, 11.0, 13.0, 19.0, 32.0, 48.0, 56.0, 93.0, 145.0, 206.0, 307.0, 428.0, 595.0, 940.0, 1366.0, 2256.0, 3342.0, 5404.0, 8623.0, 13575.0, 21695.0, 34399.0, 53721.0, 80313.0, 111693.0, 137814.0, 146476.0, 130367.0, 100243.0, 69925.0, 45522.0, 28963.0, 18179.0, 11414.0, 7205.0, 4654.0, 2889.0, 1868.0, 1242.0, 832.0, 520.0, 356.0, 243.0, 159.0, 128.0, 85.0, 65.0, 44.0, 24.0, 27.0, 8.0, 8.0, 6.0, 6.0, 5.0], "bins": [-1.4873046875, -1.4451904296875, -1.403076171875, -1.3609619140625, -1.31884765625, -1.2767333984375, -1.234619140625, -1.1925048828125, -1.150390625, -1.1082763671875, -1.066162109375, -1.0240478515625, -0.98193359375, -0.9398193359375, -0.897705078125, -0.8555908203125, -0.8134765625, -0.7713623046875, -0.729248046875, -0.6871337890625, -0.64501953125, -0.6029052734375, -0.560791015625, -0.5186767578125, -0.4765625, -0.4344482421875, -0.392333984375, -0.3502197265625, -0.30810546875, -0.2659912109375, -0.223876953125, -0.1817626953125, -0.1396484375, -0.0975341796875, -0.055419921875, -0.0133056640625, 0.02880859375, 0.0709228515625, 0.113037109375, 0.1551513671875, 0.197265625, 0.2393798828125, 0.281494140625, 0.3236083984375, 0.36572265625, 0.4078369140625, 0.449951171875, 0.4920654296875, 0.5341796875, 0.5762939453125, 0.618408203125, 0.6605224609375, 0.70263671875, 0.7447509765625, 0.786865234375, 0.8289794921875, 0.87109375, 0.9132080078125, 0.955322265625, 0.9974365234375, 1.03955078125, 1.0816650390625, 1.123779296875, 1.1658935546875, 1.2080078125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 9.0, 11.0, 23.0, 26.0, 27.0, 23.0, 30.0, 22.0, 41.0, 48.0, 52.0, 40.0, 50.0, 53.0, 51.0, 52.0, 53.0, 47.0, 46.0, 48.0, 42.0, 35.0, 24.0, 22.0, 18.0, 19.0, 12.0, 13.0, 12.0, 9.0, 7.0, 5.0, 3.0, 3.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00014090538024902344, -0.00013705063611268997, -0.0001331958919763565, -0.00012934114784002304, -0.00012548640370368958, -0.00012163165956735611, -0.00011777691543102264, -0.00011392217129468918, -0.00011006742715835571, -0.00010621268302202225, -0.00010235793888568878, -9.850319474935532e-05, -9.464845061302185e-05, -9.079370647668839e-05, -8.693896234035492e-05, -8.308421820402145e-05, -7.922947406768799e-05, -7.537472993135452e-05, -7.151998579502106e-05, -6.766524165868759e-05, -6.381049752235413e-05, -5.995575338602066e-05, -5.6101009249687195e-05, -5.224626511335373e-05, -4.8391520977020264e-05, -4.45367768406868e-05, -4.068203270435333e-05, -3.682728856801987e-05, -3.29725444316864e-05, -2.9117800295352936e-05, -2.526305615901947e-05, -2.1408312022686005e-05, -1.755356788635254e-05, -1.3698823750019073e-05, -9.844079613685608e-06, -5.989335477352142e-06, -2.1345913410186768e-06, 1.7201527953147888e-06, 5.574896931648254e-06, 9.42964106798172e-06, 1.3284385204315186e-05, 1.713912934064865e-05, 2.0993873476982117e-05, 2.4848617613315582e-05, 2.8703361749649048e-05, 3.2558105885982513e-05, 3.641285002231598e-05, 4.0267594158649445e-05, 4.412233829498291e-05, 4.7977082431316376e-05, 5.183182656764984e-05, 5.568657070398331e-05, 5.954131484031677e-05, 6.339605897665024e-05, 6.72508031129837e-05, 7.110554724931717e-05, 7.496029138565063e-05, 7.88150355219841e-05, 8.266977965831757e-05, 8.652452379465103e-05, 9.03792679309845e-05, 9.423401206731796e-05, 9.808875620365143e-05, 0.0001019435003399849, 0.00010579824447631836]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 8.0, 9.0, 16.0, 24.0, 39.0, 45.0, 62.0, 101.0, 141.0, 226.0, 365.0, 546.0, 857.0, 1339.0, 2328.0, 3651.0, 6133.0, 10975.0, 19447.0, 34553.0, 60237.0, 99325.0, 147960.0, 178534.0, 167938.0, 125024.0, 79833.0, 46832.0, 26472.0, 14704.0, 8361.0, 4869.0, 2835.0, 1751.0, 1056.0, 683.0, 456.0, 259.0, 195.0, 108.0, 87.0, 63.0, 36.0, 27.0, 9.0, 13.0, 6.0, 5.0, 8.0, 0.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.5673828125, -1.5147247314453125, -1.462066650390625, -1.4094085693359375, -1.35675048828125, -1.3040924072265625, -1.251434326171875, -1.1987762451171875, -1.1461181640625, -1.0934600830078125, -1.040802001953125, -0.9881439208984375, -0.93548583984375, -0.8828277587890625, -0.830169677734375, -0.7775115966796875, -0.724853515625, -0.6721954345703125, -0.619537353515625, -0.5668792724609375, -0.51422119140625, -0.4615631103515625, -0.408905029296875, -0.3562469482421875, -0.3035888671875, -0.2509307861328125, -0.198272705078125, -0.1456146240234375, -0.09295654296875, -0.0402984619140625, 0.012359619140625, 0.0650177001953125, 0.11767578125, 0.1703338623046875, 0.222991943359375, 0.2756500244140625, 0.32830810546875, 0.3809661865234375, 0.433624267578125, 0.4862823486328125, 0.5389404296875, 0.5915985107421875, 0.644256591796875, 0.6969146728515625, 0.74957275390625, 0.8022308349609375, 0.854888916015625, 0.9075469970703125, 0.960205078125, 1.0128631591796875, 1.065521240234375, 1.1181793212890625, 1.17083740234375, 1.2234954833984375, 1.276153564453125, 1.3288116455078125, 1.3814697265625, 1.4341278076171875, 1.486785888671875, 1.5394439697265625, 1.59210205078125, 1.6447601318359375, 1.697418212890625, 1.7500762939453125, 1.802734375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 5.0, 11.0, 9.0, 11.0, 30.0, 29.0, 25.0, 49.0, 45.0, 47.0, 78.0, 61.0, 82.0, 68.0, 64.0, 66.0, 59.0, 54.0, 39.0, 41.0, 24.0, 18.0, 22.0, 15.0, 8.0, 12.0, 3.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69775390625, -0.6728363037109375, -0.647918701171875, -0.6230010986328125, -0.59808349609375, -0.5731658935546875, -0.548248291015625, -0.5233306884765625, -0.4984130859375, -0.4734954833984375, -0.448577880859375, -0.4236602783203125, -0.39874267578125, -0.3738250732421875, -0.348907470703125, -0.3239898681640625, -0.299072265625, -0.2741546630859375, -0.249237060546875, -0.2243194580078125, -0.19940185546875, -0.1744842529296875, -0.149566650390625, -0.1246490478515625, -0.0997314453125, -0.0748138427734375, -0.049896240234375, -0.0249786376953125, -6.103515625e-05, 0.0248565673828125, 0.049774169921875, 0.0746917724609375, 0.099609375, 0.1245269775390625, 0.149444580078125, 0.1743621826171875, 0.19927978515625, 0.2241973876953125, 0.249114990234375, 0.2740325927734375, 0.2989501953125, 0.3238677978515625, 0.348785400390625, 0.3737030029296875, 0.39862060546875, 0.4235382080078125, 0.448455810546875, 0.4733734130859375, 0.498291015625, 0.5232086181640625, 0.548126220703125, 0.5730438232421875, 0.59796142578125, 0.6228790283203125, 0.647796630859375, 0.6727142333984375, 0.6976318359375, 0.7225494384765625, 0.747467041015625, 0.7723846435546875, 0.79730224609375, 0.8222198486328125, 0.847137451171875, 0.8720550537109375, 0.89697265625]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 3.0, 4.0, 3.0, 3.0, 5.0, 4.0, 13.0, 17.0, 11.0, 19.0, 21.0, 24.0, 16.0, 29.0, 34.0, 36.0, 48.0, 36.0, 46.0, 48.0, 60.0, 65.0, 51.0, 40.0, 43.0, 42.0, 31.0, 38.0, 34.0, 28.0, 22.0, 21.0, 16.0, 14.0, 9.0, 12.0, 6.0, 7.0, 8.0, 6.0, 6.0, 3.0, 4.0, 3.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.806588649749756, -4.642242908477783, -4.477897644042969, -4.313551902770996, -4.149206638336182, -3.984860897064209, -3.8205153942108154, -3.656169891357422, -3.4918243885040283, -3.3274788856506348, -3.163133382797241, -2.9987878799438477, -2.834442138671875, -2.6700968742370605, -2.505751132965088, -2.3414056301116943, -2.177060127258301, -2.0127146244049072, -1.8483691215515137, -1.6840234994888306, -1.519677996635437, -1.3553324937820435, -1.1909868717193604, -1.0266413688659668, -0.8622958660125732, -0.6979503631591797, -0.5336048007011414, -0.3692592680454254, -0.20491373538970947, -0.04056823253631592, 0.12377732992172241, 0.28812289237976074, 0.4524679183959961, 0.6168134212493896, 0.781158983707428, 0.9455045461654663, 1.1098500490188599, 1.2741955518722534, 1.4385411739349365, 1.60288667678833, 1.7672321796417236, 1.9315776824951172, 2.0959231853485107, 2.2602686882019043, 2.424614429473877, 2.5889596939086914, 2.753305435180664, 2.9176509380340576, 3.081996440887451, 3.2463419437408447, 3.4106874465942383, 3.575032949447632, 3.7393784523010254, 3.903724193572998, 4.0680694580078125, 4.232415199279785, 4.396760940551758, 4.5611066818237305, 4.725451946258545, 4.889797687530518, 5.054142951965332, 5.218488693237305, 5.382833957672119, 5.547179698944092, 5.711524963378906]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 7.0, 5.0, 7.0, 8.0, 7.0, 13.0, 12.0, 17.0, 16.0, 24.0, 17.0, 27.0, 24.0, 31.0, 34.0, 29.0, 42.0, 32.0, 42.0, 37.0, 48.0, 38.0, 42.0, 41.0, 35.0, 41.0, 32.0, 40.0, 31.0, 28.0, 24.0, 28.0, 26.0, 14.0, 15.0, 25.0, 13.0, 8.0, 6.0, 10.0, 11.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0], "bins": [-6.309025287628174, -6.136289596557617, -5.9635539054870605, -5.790818214416504, -5.618082523345947, -5.445346832275391, -5.272611618041992, -5.099875450134277, -4.927140235900879, -4.754404544830322, -4.581668853759766, -4.408933162689209, -4.236197471618652, -4.063461780548096, -3.890726327896118, -3.7179906368255615, -3.545254707336426, -3.372519016265869, -3.1997833251953125, -3.027047634124756, -2.854311943054199, -2.6815762519836426, -2.508840799331665, -2.3361051082611084, -2.1633694171905518, -1.9906337261199951, -1.8178980350494385, -1.6451624631881714, -1.4724267721176147, -1.299691081047058, -1.126955509185791, -0.9542198181152344, -0.7814841270446777, -0.6087484359741211, -0.43601280450820923, -0.26327717304229736, -0.09054148197174072, 0.08219420909881592, 0.254929780960083, 0.42766547203063965, 0.6004011631011963, 0.7731368541717529, 0.9458724856376648, 1.1186081171035767, 1.2913438081741333, 1.46407949924469, 1.636815071105957, 1.8095507621765137, 1.9822864532470703, 2.155022144317627, 2.3277578353881836, 2.5004935264587402, 2.673229217529297, 2.8459649085998535, 3.018700361251831, 3.1914360523223877, 3.3641717433929443, 3.536907434463501, 3.7096431255340576, 3.882378578186035, 4.055114269256592, 4.227849960327148, 4.400585651397705, 4.573321342468262, 4.746057033538818]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 5.0, 4.0, 4.0, 7.0, 19.0, 26.0, 35.0, 50.0, 62.0, 93.0, 165.0, 238.0, 389.0, 585.0, 941.0, 1400.0, 2336.0, 3971.0, 6618.0, 11387.0, 20038.0, 36539.0, 67736.0, 126861.0, 238192.0, 434331.0, 697130.0, 845969.0, 709005.0, 449009.0, 250698.0, 133941.0, 71303.0, 38220.0, 20337.0, 11182.0, 6272.0, 3671.0, 2166.0, 1245.0, 804.0, 471.0, 315.0, 170.0, 114.0, 74.0, 50.0, 40.0, 17.0, 22.0, 9.0, 8.0, 9.0, 8.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.80859375, -5.6182861328125, -5.427978515625, -5.2376708984375, -5.04736328125, -4.8570556640625, -4.666748046875, -4.4764404296875, -4.2861328125, -4.0958251953125, -3.905517578125, -3.7152099609375, -3.52490234375, -3.3345947265625, -3.144287109375, -2.9539794921875, -2.763671875, -2.5733642578125, -2.383056640625, -2.1927490234375, -2.00244140625, -1.8121337890625, -1.621826171875, -1.4315185546875, -1.2412109375, -1.0509033203125, -0.860595703125, -0.6702880859375, -0.47998046875, -0.2896728515625, -0.099365234375, 0.0909423828125, 0.28125, 0.4715576171875, 0.661865234375, 0.8521728515625, 1.04248046875, 1.2327880859375, 1.423095703125, 1.6134033203125, 1.8037109375, 1.9940185546875, 2.184326171875, 2.3746337890625, 2.56494140625, 2.7552490234375, 2.945556640625, 3.1358642578125, 3.326171875, 3.5164794921875, 3.706787109375, 3.8970947265625, 4.08740234375, 4.2777099609375, 4.468017578125, 4.6583251953125, 4.8486328125, 5.0389404296875, 5.229248046875, 5.4195556640625, 5.60986328125, 5.8001708984375, 5.990478515625, 6.1807861328125, 6.37109375]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 3.0, 2.0, 8.0, 8.0, 12.0, 12.0, 9.0, 14.0, 14.0, 18.0, 24.0, 31.0, 37.0, 41.0, 25.0, 33.0, 33.0, 41.0, 27.0, 56.0, 45.0, 49.0, 44.0, 44.0, 37.0, 42.0, 34.0, 34.0, 31.0, 33.0, 30.0, 26.0, 14.0, 17.0, 15.0, 14.0, 10.0, 5.0, 8.0, 9.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.12109375, -4.97314453125, -4.8251953125, -4.67724609375, -4.529296875, -4.38134765625, -4.2333984375, -4.08544921875, -3.9375, -3.78955078125, -3.6416015625, -3.49365234375, -3.345703125, -3.19775390625, -3.0498046875, -2.90185546875, -2.75390625, -2.60595703125, -2.4580078125, -2.31005859375, -2.162109375, -2.01416015625, -1.8662109375, -1.71826171875, -1.5703125, -1.42236328125, -1.2744140625, -1.12646484375, -0.978515625, -0.83056640625, -0.6826171875, -0.53466796875, -0.38671875, -0.23876953125, -0.0908203125, 0.05712890625, 0.205078125, 0.35302734375, 0.5009765625, 0.64892578125, 0.796875, 0.94482421875, 1.0927734375, 1.24072265625, 1.388671875, 1.53662109375, 1.6845703125, 1.83251953125, 1.98046875, 2.12841796875, 2.2763671875, 2.42431640625, 2.572265625, 2.72021484375, 2.8681640625, 3.01611328125, 3.1640625, 3.31201171875, 3.4599609375, 3.60791015625, 3.755859375, 3.90380859375, 4.0517578125, 4.19970703125, 4.34765625]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 14.0, 11.0, 16.0, 22.0, 50.0, 80.0, 96.0, 159.0, 234.0, 391.0, 573.0, 861.0, 1449.0, 2427.0, 3800.0, 6052.0, 10154.0, 16903.0, 28136.0, 48053.0, 80307.0, 134169.0, 219741.0, 339168.0, 481229.0, 599746.0, 621705.0, 533272.0, 393541.0, 262705.0, 164058.0, 98710.0, 58401.0, 34850.0, 20577.0, 12538.0, 7666.0, 4624.0, 2950.0, 1687.0, 1147.0, 691.0, 454.0, 306.0, 206.0, 133.0, 67.0, 58.0, 43.0, 19.0, 11.0, 15.0, 8.0, 2.0, 2.0, 1.0, 3.0], "bins": [-5.5234375, -5.3570556640625, -5.190673828125, -5.0242919921875, -4.85791015625, -4.6915283203125, -4.525146484375, -4.3587646484375, -4.1923828125, -4.0260009765625, -3.859619140625, -3.6932373046875, -3.52685546875, -3.3604736328125, -3.194091796875, -3.0277099609375, -2.861328125, -2.6949462890625, -2.528564453125, -2.3621826171875, -2.19580078125, -2.0294189453125, -1.863037109375, -1.6966552734375, -1.5302734375, -1.3638916015625, -1.197509765625, -1.0311279296875, -0.86474609375, -0.6983642578125, -0.531982421875, -0.3656005859375, -0.19921875, -0.0328369140625, 0.133544921875, 0.2999267578125, 0.46630859375, 0.6326904296875, 0.799072265625, 0.9654541015625, 1.1318359375, 1.2982177734375, 1.464599609375, 1.6309814453125, 1.79736328125, 1.9637451171875, 2.130126953125, 2.2965087890625, 2.462890625, 2.6292724609375, 2.795654296875, 2.9620361328125, 3.12841796875, 3.2947998046875, 3.461181640625, 3.6275634765625, 3.7939453125, 3.9603271484375, 4.126708984375, 4.2930908203125, 4.45947265625, 4.6258544921875, 4.792236328125, 4.9586181640625, 5.125]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 10.0, 15.0, 10.0, 18.0, 25.0, 26.0, 34.0, 48.0, 60.0, 77.0, 81.0, 132.0, 131.0, 177.0, 167.0, 214.0, 222.0, 227.0, 272.0, 259.0, 237.0, 235.0, 199.0, 207.0, 152.0, 153.0, 117.0, 93.0, 88.0, 78.0, 72.0, 45.0, 40.0, 38.0, 23.0, 15.0, 14.0, 13.0, 9.0, 6.0, 7.0, 7.0, 4.0, 0.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.41015625, -2.328643798828125, -2.24713134765625, -2.165618896484375, -2.0841064453125, -2.002593994140625, -1.92108154296875, -1.839569091796875, -1.758056640625, -1.676544189453125, -1.59503173828125, -1.513519287109375, -1.4320068359375, -1.350494384765625, -1.26898193359375, -1.187469482421875, -1.10595703125, -1.024444580078125, -0.94293212890625, -0.861419677734375, -0.7799072265625, -0.698394775390625, -0.61688232421875, -0.535369873046875, -0.453857421875, -0.372344970703125, -0.29083251953125, -0.209320068359375, -0.1278076171875, -0.046295166015625, 0.03521728515625, 0.116729736328125, 0.1982421875, 0.279754638671875, 0.36126708984375, 0.442779541015625, 0.5242919921875, 0.605804443359375, 0.68731689453125, 0.768829345703125, 0.850341796875, 0.931854248046875, 1.01336669921875, 1.094879150390625, 1.1763916015625, 1.257904052734375, 1.33941650390625, 1.420928955078125, 1.50244140625, 1.583953857421875, 1.66546630859375, 1.746978759765625, 1.8284912109375, 1.910003662109375, 1.99151611328125, 2.073028564453125, 2.154541015625, 2.236053466796875, 2.31756591796875, 2.399078369140625, 2.4805908203125, 2.562103271484375, 2.64361572265625, 2.725128173828125, 2.806640625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 8.0, 13.0, 12.0, 17.0, 20.0, 25.0, 34.0, 42.0, 47.0, 49.0, 55.0, 55.0, 63.0, 55.0, 66.0, 64.0, 59.0, 47.0, 32.0, 40.0, 32.0, 38.0, 20.0, 15.0, 17.0, 11.0, 15.0, 9.0, 9.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.876069068908691, -6.6299662590026855, -6.3838629722595215, -6.137760162353516, -5.89165735244751, -5.645554542541504, -5.39945125579834, -5.153348445892334, -4.907245635986328, -4.661142826080322, -4.415039539337158, -4.168936729431152, -3.9228339195251465, -3.6767308712005615, -3.4306278228759766, -3.1845250129699707, -2.9384219646453857, -2.692318916320801, -2.446216106414795, -2.20011305809021, -1.954010248184204, -1.7079071998596191, -1.4618042707443237, -1.2157013416290283, -0.9695984125137329, -0.7234954833984375, -0.4773925244808197, -0.2312895655632019, 0.014813363552093506, 0.2609163522720337, 0.5070192813873291, 0.7531222105026245, 0.9992251396179199, 1.2453280687332153, 1.4914309978485107, 1.7375340461730957, 1.9836368560791016, 2.2297399044036865, 2.4758429527282715, 2.7219457626342773, 2.968048572540283, 3.214151620864868, 3.460254430770874, 3.706357479095459, 3.952460289001465, 4.198563575744629, 4.444666385650635, 4.690769195556641, 4.936872482299805, 5.1829752922058105, 5.429078578948975, 5.6751813888549805, 5.921284198760986, 6.167387008666992, 6.413490295410156, 6.659593105316162, 6.905695915222168, 7.151798725128174, 7.397902011871338, 7.644004821777344, 7.89010763168335, 8.136210441589355, 8.38231372833252, 8.628416061401367, 8.874519348144531]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 8.0, 2.0, 6.0, 9.0, 12.0, 13.0, 11.0, 12.0, 18.0, 25.0, 20.0, 26.0, 31.0, 29.0, 34.0, 28.0, 35.0, 45.0, 47.0, 34.0, 39.0, 40.0, 42.0, 38.0, 52.0, 45.0, 33.0, 33.0, 29.0, 30.0, 25.0, 30.0, 17.0, 26.0, 14.0, 14.0, 8.0, 11.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.3872480392456055, -7.169459342956543, -6.9516706466674805, -6.733881950378418, -6.5160932540893555, -6.298304557800293, -6.0805158615112305, -5.862727165222168, -5.6449384689331055, -5.427149772644043, -5.2093610763549805, -4.991572380065918, -4.7737836837768555, -4.555994987487793, -4.3382062911987305, -4.120417594909668, -3.9026284217834473, -3.6848397254943848, -3.4670510292053223, -3.2492623329162598, -3.0314736366271973, -2.8136849403381348, -2.595896005630493, -2.3781073093414307, -2.160318613052368, -1.9425299167633057, -1.7247412204742432, -1.5069524049758911, -1.2891637086868286, -1.0713750123977661, -0.8535861968994141, -0.6357975006103516, -0.41800832748413086, -0.20021960139274597, 0.017569124698638916, 0.2353578805923462, 0.4531465768814087, 0.6709352731704712, 0.8887240886688232, 1.1065127849578857, 1.3243014812469482, 1.5420901775360107, 1.7598788738250732, 1.9776676893234253, 2.1954565048217773, 2.41324520111084, 2.6310338973999023, 2.848822593688965, 3.0666112899780273, 3.28439998626709, 3.5021886825561523, 3.719977378845215, 3.9377660751342773, 4.15555477142334, 4.373343467712402, 4.591132164001465, 4.808920860290527, 5.02670955657959, 5.244498252868652, 5.462286949157715, 5.680075645446777, 5.89786434173584, 6.115653038024902, 6.333441734313965, 6.5512309074401855]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 11.0, 13.0, 18.0, 20.0, 32.0, 45.0, 74.0, 111.0, 147.0, 231.0, 364.0, 570.0, 886.0, 1410.0, 2350.0, 3871.0, 6198.0, 10186.0, 17294.0, 30449.0, 57081.0, 118576.0, 260300.0, 274578.0, 126129.0, 60394.0, 31630.0, 18151.0, 10392.0, 6357.0, 3850.0, 2429.0, 1549.0, 1028.0, 657.0, 390.0, 274.0, 179.0, 111.0, 60.0, 62.0, 35.0, 21.0, 15.0, 9.0, 4.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.271484375, -2.200592041015625, -2.12969970703125, -2.058807373046875, -1.9879150390625, -1.917022705078125, -1.84613037109375, -1.775238037109375, -1.704345703125, -1.633453369140625, -1.56256103515625, -1.491668701171875, -1.4207763671875, -1.349884033203125, -1.27899169921875, -1.208099365234375, -1.13720703125, -1.066314697265625, -0.99542236328125, -0.924530029296875, -0.8536376953125, -0.782745361328125, -0.71185302734375, -0.640960693359375, -0.570068359375, -0.499176025390625, -0.42828369140625, -0.357391357421875, -0.2864990234375, -0.215606689453125, -0.14471435546875, -0.073822021484375, -0.0029296875, 0.067962646484375, 0.13885498046875, 0.209747314453125, 0.2806396484375, 0.351531982421875, 0.42242431640625, 0.493316650390625, 0.564208984375, 0.635101318359375, 0.70599365234375, 0.776885986328125, 0.8477783203125, 0.918670654296875, 0.98956298828125, 1.060455322265625, 1.13134765625, 1.202239990234375, 1.27313232421875, 1.344024658203125, 1.4149169921875, 1.485809326171875, 1.55670166015625, 1.627593994140625, 1.698486328125, 1.769378662109375, 1.84027099609375, 1.911163330078125, 1.9820556640625, 2.052947998046875, 2.12384033203125, 2.194732666015625, 2.265625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 5.0, 6.0, 8.0, 11.0, 8.0, 5.0, 11.0, 13.0, 27.0, 18.0, 21.0, 20.0, 31.0, 22.0, 35.0, 21.0, 41.0, 34.0, 44.0, 45.0, 54.0, 39.0, 43.0, 39.0, 54.0, 37.0, 34.0, 36.0, 39.0, 26.0, 33.0, 21.0, 19.0, 25.0, 16.0, 17.0, 10.0, 10.0, 11.0, 7.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.3203125, -7.0867919921875, -6.853271484375, -6.6197509765625, -6.38623046875, -6.1527099609375, -5.919189453125, -5.6856689453125, -5.4521484375, -5.2186279296875, -4.985107421875, -4.7515869140625, -4.51806640625, -4.2845458984375, -4.051025390625, -3.8175048828125, -3.583984375, -3.3504638671875, -3.116943359375, -2.8834228515625, -2.64990234375, -2.4163818359375, -2.182861328125, -1.9493408203125, -1.7158203125, -1.4822998046875, -1.248779296875, -1.0152587890625, -0.78173828125, -0.5482177734375, -0.314697265625, -0.0811767578125, 0.15234375, 0.3858642578125, 0.619384765625, 0.8529052734375, 1.08642578125, 1.3199462890625, 1.553466796875, 1.7869873046875, 2.0205078125, 2.2540283203125, 2.487548828125, 2.7210693359375, 2.95458984375, 3.1881103515625, 3.421630859375, 3.6551513671875, 3.888671875, 4.1221923828125, 4.355712890625, 4.5892333984375, 4.82275390625, 5.0562744140625, 5.289794921875, 5.5233154296875, 5.7568359375, 5.9903564453125, 6.223876953125, 6.4573974609375, 6.69091796875, 6.9244384765625, 7.157958984375, 7.3914794921875, 7.625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 7.0, 13.0, 14.0, 15.0, 17.0, 19.0, 26.0, 42.0, 66.0, 80.0, 106.0, 123.0, 209.0, 308.0, 416.0, 720.0, 1138.0, 2038.0, 4429.0, 11565.0, 39010.0, 928033.0, 38827.0, 11617.0, 4296.0, 2102.0, 1117.0, 683.0, 461.0, 305.0, 183.0, 149.0, 126.0, 81.0, 60.0, 35.0, 32.0, 20.0, 20.0, 17.0, 7.0, 10.0, 5.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.82421875, -6.6004638671875, -6.376708984375, -6.1529541015625, -5.92919921875, -5.7054443359375, -5.481689453125, -5.2579345703125, -5.0341796875, -4.8104248046875, -4.586669921875, -4.3629150390625, -4.13916015625, -3.9154052734375, -3.691650390625, -3.4678955078125, -3.244140625, -3.0203857421875, -2.796630859375, -2.5728759765625, -2.34912109375, -2.1253662109375, -1.901611328125, -1.6778564453125, -1.4541015625, -1.2303466796875, -1.006591796875, -0.7828369140625, -0.55908203125, -0.3353271484375, -0.111572265625, 0.1121826171875, 0.3359375, 0.5596923828125, 0.783447265625, 1.0072021484375, 1.23095703125, 1.4547119140625, 1.678466796875, 1.9022216796875, 2.1259765625, 2.3497314453125, 2.573486328125, 2.7972412109375, 3.02099609375, 3.2447509765625, 3.468505859375, 3.6922607421875, 3.916015625, 4.1397705078125, 4.363525390625, 4.5872802734375, 4.81103515625, 5.0347900390625, 5.258544921875, 5.4822998046875, 5.7060546875, 5.9298095703125, 6.153564453125, 6.3773193359375, 6.60107421875, 6.8248291015625, 7.048583984375, 7.2723388671875, 7.49609375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 6.0, 7.0, 7.0, 7.0, 15.0, 15.0, 18.0, 15.0, 9.0, 19.0, 27.0, 25.0, 33.0, 31.0, 37.0, 45.0, 25.0, 32.0, 44.0, 43.0, 38.0, 23.0, 43.0, 51.0, 35.0, 49.0, 34.0, 32.0, 31.0, 34.0, 16.0, 27.0, 14.0, 22.0, 18.0, 11.0, 9.0, 10.0, 9.0, 9.0, 9.0, 5.0, 4.0, 2.0, 5.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0], "bins": [-4.4375, -4.3040771484375, -4.170654296875, -4.0372314453125, -3.90380859375, -3.7703857421875, -3.636962890625, -3.5035400390625, -3.3701171875, -3.2366943359375, -3.103271484375, -2.9698486328125, -2.83642578125, -2.7030029296875, -2.569580078125, -2.4361572265625, -2.302734375, -2.1693115234375, -2.035888671875, -1.9024658203125, -1.76904296875, -1.6356201171875, -1.502197265625, -1.3687744140625, -1.2353515625, -1.1019287109375, -0.968505859375, -0.8350830078125, -0.70166015625, -0.5682373046875, -0.434814453125, -0.3013916015625, -0.16796875, -0.0345458984375, 0.098876953125, 0.2322998046875, 0.36572265625, 0.4991455078125, 0.632568359375, 0.7659912109375, 0.8994140625, 1.0328369140625, 1.166259765625, 1.2996826171875, 1.43310546875, 1.5665283203125, 1.699951171875, 1.8333740234375, 1.966796875, 2.1002197265625, 2.233642578125, 2.3670654296875, 2.50048828125, 2.6339111328125, 2.767333984375, 2.9007568359375, 3.0341796875, 3.1676025390625, 3.301025390625, 3.4344482421875, 3.56787109375, 3.7012939453125, 3.834716796875, 3.9681396484375, 4.1015625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 2.0, 8.0, 7.0, 17.0, 14.0, 19.0, 36.0, 35.0, 55.0, 78.0, 103.0, 180.0, 266.0, 409.0, 722.0, 1229.0, 2360.0, 5257.0, 15125.0, 85274.0, 906711.0, 18379.0, 6201.0, 2620.0, 1342.0, 757.0, 464.0, 277.0, 178.0, 120.0, 109.0, 48.0, 40.0, 37.0, 21.0, 15.0, 11.0, 3.0, 7.0, 7.0, 2.0, 7.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.52490234375, -0.509033203125, -0.4931640625, -0.477294921875, -0.46142578125, -0.445556640625, -0.4296875, -0.413818359375, -0.39794921875, -0.382080078125, -0.3662109375, -0.350341796875, -0.33447265625, -0.318603515625, -0.302734375, -0.286865234375, -0.27099609375, -0.255126953125, -0.2392578125, -0.223388671875, -0.20751953125, -0.191650390625, -0.17578125, -0.159912109375, -0.14404296875, -0.128173828125, -0.1123046875, -0.096435546875, -0.08056640625, -0.064697265625, -0.048828125, -0.032958984375, -0.01708984375, -0.001220703125, 0.0146484375, 0.030517578125, 0.04638671875, 0.062255859375, 0.078125, 0.093994140625, 0.10986328125, 0.125732421875, 0.1416015625, 0.157470703125, 0.17333984375, 0.189208984375, 0.205078125, 0.220947265625, 0.23681640625, 0.252685546875, 0.2685546875, 0.284423828125, 0.30029296875, 0.316162109375, 0.33203125, 0.347900390625, 0.36376953125, 0.379638671875, 0.3955078125, 0.411376953125, 0.42724609375, 0.443115234375, 0.458984375, 0.474853515625, 0.49072265625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 0.0, 2.0, 10.0, 5.0, 11.0, 15.0, 19.0, 13.0, 30.0, 27.0, 29.0, 42.0, 49.0, 48.0, 61.0, 66.0, 57.0, 63.0, 54.0, 52.0, 39.0, 37.0, 43.0, 37.0, 36.0, 28.0, 19.0, 19.0, 18.0, 11.0, 14.0, 10.0, 7.0, 7.0, 8.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3974647521972656e-05, -3.2912008464336395e-05, -3.1849369406700134e-05, -3.078673034906387e-05, -2.9724091291427612e-05, -2.866145223379135e-05, -2.759881317615509e-05, -2.653617411851883e-05, -2.547353506088257e-05, -2.4410896003246307e-05, -2.3348256945610046e-05, -2.2285617887973785e-05, -2.1222978830337524e-05, -2.0160339772701263e-05, -1.9097700715065002e-05, -1.803506165742874e-05, -1.697242259979248e-05, -1.590978354215622e-05, -1.4847144484519958e-05, -1.3784505426883698e-05, -1.2721866369247437e-05, -1.1659227311611176e-05, -1.0596588253974915e-05, -9.533949196338654e-06, -8.471310138702393e-06, -7.408671081066132e-06, -6.346032023429871e-06, -5.28339296579361e-06, -4.220753908157349e-06, -3.1581148505210876e-06, -2.0954757928848267e-06, -1.0328367352485657e-06, 2.9802322387695312e-08, 1.0924413800239563e-06, 2.1550804376602173e-06, 3.2177194952964783e-06, 4.280358552932739e-06, 5.342997610569e-06, 6.405636668205261e-06, 7.468275725841522e-06, 8.530914783477783e-06, 9.593553841114044e-06, 1.0656192898750305e-05, 1.1718831956386566e-05, 1.2781471014022827e-05, 1.3844110071659088e-05, 1.4906749129295349e-05, 1.596938818693161e-05, 1.703202724456787e-05, 1.8094666302204132e-05, 1.9157305359840393e-05, 2.0219944417476654e-05, 2.1282583475112915e-05, 2.2345222532749176e-05, 2.3407861590385437e-05, 2.4470500648021698e-05, 2.553313970565796e-05, 2.659577876329422e-05, 2.765841782093048e-05, 2.8721056878566742e-05, 2.9783695936203003e-05, 3.0846334993839264e-05, 3.1908974051475525e-05, 3.2971613109111786e-05, 3.403425216674805e-05]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 8.0, 18.0, 14.0, 23.0, 30.0, 44.0, 70.0, 92.0, 125.0, 179.0, 261.0, 364.0, 483.0, 688.0, 1000.0, 1438.0, 2124.0, 3092.0, 4968.0, 7721.0, 12527.0, 21320.0, 37855.0, 72595.0, 158372.0, 318648.0, 203855.0, 89885.0, 45407.0, 24857.0, 14514.0, 8891.0, 5566.0, 3658.0, 2408.0, 1687.0, 1112.0, 783.0, 531.0, 408.0, 268.0, 163.0, 147.0, 120.0, 70.0, 61.0, 35.0, 21.0, 17.0, 12.0, 5.0, 4.0, 4.0, 7.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.153076171875, -0.1482391357421875, -0.143402099609375, -0.1385650634765625, -0.13372802734375, -0.1288909912109375, -0.124053955078125, -0.1192169189453125, -0.1143798828125, -0.1095428466796875, -0.104705810546875, -0.0998687744140625, -0.09503173828125, -0.0901947021484375, -0.085357666015625, -0.0805206298828125, -0.07568359375, -0.0708465576171875, -0.066009521484375, -0.0611724853515625, -0.05633544921875, -0.0514984130859375, -0.046661376953125, -0.0418243408203125, -0.0369873046875, -0.0321502685546875, -0.027313232421875, -0.0224761962890625, -0.01763916015625, -0.0128021240234375, -0.007965087890625, -0.0031280517578125, 0.001708984375, 0.0065460205078125, 0.011383056640625, 0.0162200927734375, 0.02105712890625, 0.0258941650390625, 0.030731201171875, 0.0355682373046875, 0.0404052734375, 0.0452423095703125, 0.050079345703125, 0.0549163818359375, 0.05975341796875, 0.0645904541015625, 0.069427490234375, 0.0742645263671875, 0.0791015625, 0.0839385986328125, 0.088775634765625, 0.0936126708984375, 0.09844970703125, 0.1032867431640625, 0.108123779296875, 0.1129608154296875, 0.1177978515625, 0.1226348876953125, 0.127471923828125, 0.1323089599609375, 0.13714599609375, 0.1419830322265625, 0.146820068359375, 0.1516571044921875, 0.156494140625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 8.0, 5.0, 4.0, 10.0, 13.0, 9.0, 17.0, 14.0, 29.0, 31.0, 45.0, 61.0, 61.0, 97.0, 89.0, 83.0, 81.0, 59.0, 47.0, 47.0, 25.0, 40.0, 24.0, 15.0, 8.0, 8.0, 10.0, 9.0, 8.0, 6.0, 3.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.046783447265625, -0.045262813568115234, -0.04374217987060547, -0.0422215461730957, -0.04070091247558594, -0.03918027877807617, -0.037659645080566406, -0.03613901138305664, -0.034618377685546875, -0.03309774398803711, -0.031577110290527344, -0.030056476593017578, -0.028535842895507812, -0.027015209197998047, -0.02549457550048828, -0.023973941802978516, -0.02245330810546875, -0.020932674407958984, -0.01941204071044922, -0.017891407012939453, -0.016370773315429688, -0.014850139617919922, -0.013329505920410156, -0.01180887222290039, -0.010288238525390625, -0.00876760482788086, -0.007246971130371094, -0.005726337432861328, -0.0042057037353515625, -0.002685070037841797, -0.0011644363403320312, 0.0003561973571777344, 0.0018768310546875, 0.0033974647521972656, 0.004918098449707031, 0.006438732147216797, 0.007959365844726562, 0.009479999542236328, 0.011000633239746094, 0.01252126693725586, 0.014041900634765625, 0.01556253433227539, 0.017083168029785156, 0.018603801727294922, 0.020124435424804688, 0.021645069122314453, 0.02316570281982422, 0.024686336517333984, 0.02620697021484375, 0.027727603912353516, 0.02924823760986328, 0.030768871307373047, 0.03228950500488281, 0.03381013870239258, 0.035330772399902344, 0.03685140609741211, 0.038372039794921875, 0.03989267349243164, 0.041413307189941406, 0.04293394088745117, 0.04445457458496094, 0.0459752082824707, 0.04749584197998047, 0.049016475677490234, 0.050537109375]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 8.0, 9.0, 5.0, 16.0, 16.0, 12.0, 30.0, 23.0, 45.0, 45.0, 53.0, 43.0, 56.0, 60.0, 55.0, 58.0, 60.0, 63.0, 58.0, 44.0, 27.0, 42.0, 33.0, 31.0, 12.0, 23.0, 16.0, 13.0, 9.0, 9.0, 9.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.894561767578125, -6.650949954986572, -6.407338619232178, -6.163726806640625, -5.920114994049072, -5.676503658294678, -5.432891845703125, -5.1892805099487305, -4.945668697357178, -4.702056884765625, -4.4584455490112305, -4.214833736419678, -3.971222162246704, -3.7276105880737305, -3.4839987754821777, -3.240387201309204, -2.9967753887176514, -2.7531638145446777, -2.509552001953125, -2.2659404277801514, -2.0223288536071777, -1.7787171602249146, -1.5351054668426514, -1.2914938926696777, -1.0478821992874146, -0.8042705655097961, -0.5606589317321777, -0.31704723834991455, -0.07343560457229614, 0.17017602920532227, 0.41378772258758545, 0.6573992967605591, 0.9010109901428223, 1.1446226835250854, 1.388234257698059, 1.6318459510803223, 1.875457525253296, 2.1190690994262695, 2.3626809120178223, 2.606292486190796, 2.8499040603637695, 3.093515634536743, 3.337127447128296, 3.5807390213012695, 3.824350595474243, 4.067962169647217, 4.3115739822387695, 4.555185317993164, 4.798797607421875, 5.042409420013428, 5.286020755767822, 5.529632568359375, 5.773244380950928, 6.016855716705322, 6.260467529296875, 6.5040788650512695, 6.747690677642822, 6.991302490234375, 7.2349138259887695, 7.478525638580322, 7.722137451171875, 7.9657487869262695, 8.209360122680664, 8.452972412109375, 8.69658374786377]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 2.0, 6.0, 8.0, 12.0, 14.0, 11.0, 12.0, 18.0, 24.0, 18.0, 26.0, 32.0, 30.0, 34.0, 26.0, 36.0, 46.0, 48.0, 31.0, 41.0, 42.0, 40.0, 36.0, 54.0, 44.0, 36.0, 31.0, 28.0, 31.0, 23.0, 32.0, 18.0, 25.0, 16.0, 13.0, 8.0, 13.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.366312503814697, -7.148375511169434, -6.93043851852417, -6.712501525878906, -6.494564056396484, -6.276627540588379, -6.058690071105957, -5.840753078460693, -5.62281608581543, -5.404879093170166, -5.186942100524902, -4.969005107879639, -4.751068115234375, -4.533130645751953, -4.3151936531066895, -4.097256660461426, -3.879319667816162, -3.6613826751708984, -3.4434456825256348, -3.225508451461792, -3.0075714588165283, -2.7896344661712646, -2.571697235107422, -2.353760242462158, -2.1358232498168945, -1.9178862571716309, -1.6999491453170776, -1.4820120334625244, -1.2640750408172607, -1.046138048171997, -0.8282009363174438, -0.6102638244628906, -0.39232730865478516, -0.1743902564048767, 0.04354679584503174, 0.2614838480949402, 0.47942090034484863, 0.6973578929901123, 0.9152950048446655, 1.1332321166992188, 1.3511691093444824, 1.569106101989746, 1.7870432138442993, 2.0049803256988525, 2.222917318344116, 2.44085431098938, 2.6587915420532227, 2.8767285346984863, 3.09466552734375, 3.3126025199890137, 3.5305395126342773, 3.74847674369812, 3.966413736343384, 4.184350967407227, 4.40228796005249, 4.620224952697754, 4.838161945343018, 5.056098937988281, 5.274035930633545, 5.491972923278809, 5.7099103927612305, 5.927846908569336, 6.145784378051758, 6.3637213706970215, 6.581658363342285]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 7.0, 4.0, 7.0, 17.0, 16.0, 29.0, 33.0, 61.0, 89.0, 125.0, 187.0, 241.0, 397.0, 508.0, 810.0, 1237.0, 1752.0, 2601.0, 4014.0, 6167.0, 9492.0, 14703.0, 22598.0, 34963.0, 52955.0, 77768.0, 106856.0, 133568.0, 143154.0, 127589.0, 99810.0, 70415.0, 47475.0, 30907.0, 20288.0, 13020.0, 8341.0, 5437.0, 3673.0, 2381.0, 1541.0, 1022.0, 745.0, 491.0, 296.0, 238.0, 174.0, 106.0, 79.0, 49.0, 37.0, 28.0, 18.0, 21.0, 7.0, 7.0, 2.0, 3.0, 3.0, 2.0], "bins": [-4.03515625, -3.910491943359375, -3.78582763671875, -3.661163330078125, -3.5364990234375, -3.411834716796875, -3.28717041015625, -3.162506103515625, -3.037841796875, -2.913177490234375, -2.78851318359375, -2.663848876953125, -2.5391845703125, -2.414520263671875, -2.28985595703125, -2.165191650390625, -2.04052734375, -1.915863037109375, -1.79119873046875, -1.666534423828125, -1.5418701171875, -1.417205810546875, -1.29254150390625, -1.167877197265625, -1.043212890625, -0.918548583984375, -0.79388427734375, -0.669219970703125, -0.5445556640625, -0.419891357421875, -0.29522705078125, -0.170562744140625, -0.0458984375, 0.078765869140625, 0.20343017578125, 0.328094482421875, 0.4527587890625, 0.577423095703125, 0.70208740234375, 0.826751708984375, 0.951416015625, 1.076080322265625, 1.20074462890625, 1.325408935546875, 1.4500732421875, 1.574737548828125, 1.69940185546875, 1.824066162109375, 1.94873046875, 2.073394775390625, 2.19805908203125, 2.322723388671875, 2.4473876953125, 2.572052001953125, 2.69671630859375, 2.821380615234375, 2.946044921875, 3.070709228515625, 3.19537353515625, 3.320037841796875, 3.4447021484375, 3.569366455078125, 3.69403076171875, 3.818695068359375, 3.943359375]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 8.0, 11.0, 7.0, 13.0, 14.0, 11.0, 10.0, 13.0, 15.0, 21.0, 22.0, 29.0, 21.0, 22.0, 27.0, 37.0, 37.0, 27.0, 37.0, 43.0, 44.0, 43.0, 43.0, 52.0, 38.0, 29.0, 23.0, 39.0, 28.0, 29.0, 33.0, 29.0, 28.0, 16.0, 18.0, 18.0, 10.0, 11.0, 13.0, 10.0, 3.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-7.17578125, -6.96746826171875, -6.7591552734375, -6.55084228515625, -6.342529296875, -6.13421630859375, -5.9259033203125, -5.71759033203125, -5.50927734375, -5.30096435546875, -5.0926513671875, -4.88433837890625, -4.676025390625, -4.46771240234375, -4.2593994140625, -4.05108642578125, -3.8427734375, -3.63446044921875, -3.4261474609375, -3.21783447265625, -3.009521484375, -2.80120849609375, -2.5928955078125, -2.38458251953125, -2.17626953125, -1.96795654296875, -1.7596435546875, -1.55133056640625, -1.343017578125, -1.13470458984375, -0.9263916015625, -0.71807861328125, -0.509765625, -0.30145263671875, -0.0931396484375, 0.11517333984375, 0.323486328125, 0.53179931640625, 0.7401123046875, 0.94842529296875, 1.15673828125, 1.36505126953125, 1.5733642578125, 1.78167724609375, 1.989990234375, 2.19830322265625, 2.4066162109375, 2.61492919921875, 2.8232421875, 3.03155517578125, 3.2398681640625, 3.44818115234375, 3.656494140625, 3.86480712890625, 4.0731201171875, 4.28143310546875, 4.48974609375, 4.69805908203125, 4.9063720703125, 5.11468505859375, 5.322998046875, 5.53131103515625, 5.7396240234375, 5.94793701171875, 6.15625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [6.0, 4.0, 3.0, 12.0, 16.0, 25.0, 25.0, 52.0, 75.0, 99.0, 131.0, 161.0, 272.0, 372.0, 497.0, 842.0, 1169.0, 1696.0, 2633.0, 3922.0, 6091.0, 9402.0, 14892.0, 23749.0, 37183.0, 58589.0, 87788.0, 122785.0, 147634.0, 148167.0, 124086.0, 90273.0, 60327.0, 38016.0, 24171.0, 15368.0, 9628.0, 6164.0, 4040.0, 2679.0, 1759.0, 1199.0, 797.0, 560.0, 379.0, 238.0, 188.0, 135.0, 94.0, 55.0, 44.0, 25.0, 17.0, 17.0, 11.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.994140625, -3.856536865234375, -3.71893310546875, -3.581329345703125, -3.4437255859375, -3.306121826171875, -3.16851806640625, -3.030914306640625, -2.893310546875, -2.755706787109375, -2.61810302734375, -2.480499267578125, -2.3428955078125, -2.205291748046875, -2.06768798828125, -1.930084228515625, -1.79248046875, -1.654876708984375, -1.51727294921875, -1.379669189453125, -1.2420654296875, -1.104461669921875, -0.96685791015625, -0.829254150390625, -0.691650390625, -0.554046630859375, -0.41644287109375, -0.278839111328125, -0.1412353515625, -0.003631591796875, 0.13397216796875, 0.271575927734375, 0.4091796875, 0.546783447265625, 0.68438720703125, 0.821990966796875, 0.9595947265625, 1.097198486328125, 1.23480224609375, 1.372406005859375, 1.510009765625, 1.647613525390625, 1.78521728515625, 1.922821044921875, 2.0604248046875, 2.198028564453125, 2.33563232421875, 2.473236083984375, 2.61083984375, 2.748443603515625, 2.88604736328125, 3.023651123046875, 3.1612548828125, 3.298858642578125, 3.43646240234375, 3.574066162109375, 3.711669921875, 3.849273681640625, 3.98687744140625, 4.124481201171875, 4.2620849609375, 4.399688720703125, 4.53729248046875, 4.674896240234375, 4.8125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 2.0, 2.0, 4.0, 6.0, 9.0, 4.0, 8.0, 9.0, 10.0, 13.0, 21.0, 14.0, 26.0, 26.0, 24.0, 24.0, 22.0, 27.0, 41.0, 38.0, 34.0, 38.0, 37.0, 37.0, 54.0, 31.0, 40.0, 43.0, 33.0, 44.0, 24.0, 36.0, 28.0, 30.0, 21.0, 16.0, 24.0, 18.0, 15.0, 19.0, 8.0, 7.0, 6.0, 6.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0], "bins": [-4.14453125, -4.018524169921875, -3.89251708984375, -3.766510009765625, -3.6405029296875, -3.514495849609375, -3.38848876953125, -3.262481689453125, -3.136474609375, -3.010467529296875, -2.88446044921875, -2.758453369140625, -2.6324462890625, -2.506439208984375, -2.38043212890625, -2.254425048828125, -2.12841796875, -2.002410888671875, -1.87640380859375, -1.750396728515625, -1.6243896484375, -1.498382568359375, -1.37237548828125, -1.246368408203125, -1.120361328125, -0.994354248046875, -0.86834716796875, -0.742340087890625, -0.6163330078125, -0.490325927734375, -0.36431884765625, -0.238311767578125, -0.1123046875, 0.013702392578125, 0.13970947265625, 0.265716552734375, 0.3917236328125, 0.517730712890625, 0.64373779296875, 0.769744873046875, 0.895751953125, 1.021759033203125, 1.14776611328125, 1.273773193359375, 1.3997802734375, 1.525787353515625, 1.65179443359375, 1.777801513671875, 1.90380859375, 2.029815673828125, 2.15582275390625, 2.281829833984375, 2.4078369140625, 2.533843994140625, 2.65985107421875, 2.785858154296875, 2.911865234375, 3.037872314453125, 3.16387939453125, 3.289886474609375, 3.4158935546875, 3.541900634765625, 3.66790771484375, 3.793914794921875, 3.919921875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 11.0, 19.0, 23.0, 48.0, 50.0, 99.0, 151.0, 202.0, 331.0, 474.0, 786.0, 1239.0, 2053.0, 3180.0, 5009.0, 7967.0, 12587.0, 19841.0, 30539.0, 45098.0, 64546.0, 86185.0, 106911.0, 119344.0, 121762.0, 111567.0, 92354.0, 70023.0, 50538.0, 34207.0, 22270.0, 14422.0, 9262.0, 5716.0, 3558.0, 2234.0, 1353.0, 946.0, 585.0, 387.0, 252.0, 147.0, 82.0, 69.0, 35.0, 28.0, 24.0, 19.0, 9.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.34765625, -1.3069915771484375, -1.266326904296875, -1.2256622314453125, -1.18499755859375, -1.1443328857421875, -1.103668212890625, -1.0630035400390625, -1.0223388671875, -0.9816741943359375, -0.941009521484375, -0.9003448486328125, -0.85968017578125, -0.8190155029296875, -0.778350830078125, -0.7376861572265625, -0.697021484375, -0.6563568115234375, -0.615692138671875, -0.5750274658203125, -0.53436279296875, -0.4936981201171875, -0.453033447265625, -0.4123687744140625, -0.3717041015625, -0.3310394287109375, -0.290374755859375, -0.2497100830078125, -0.20904541015625, -0.1683807373046875, -0.127716064453125, -0.0870513916015625, -0.04638671875, -0.0057220458984375, 0.034942626953125, 0.0756072998046875, 0.11627197265625, 0.1569366455078125, 0.197601318359375, 0.2382659912109375, 0.2789306640625, 0.3195953369140625, 0.360260009765625, 0.4009246826171875, 0.44158935546875, 0.4822540283203125, 0.522918701171875, 0.5635833740234375, 0.604248046875, 0.6449127197265625, 0.685577392578125, 0.7262420654296875, 0.76690673828125, 0.8075714111328125, 0.848236083984375, 0.8889007568359375, 0.9295654296875, 0.9702301025390625, 1.010894775390625, 1.0515594482421875, 1.09222412109375, 1.1328887939453125, 1.173553466796875, 1.2142181396484375, 1.2548828125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 2.0, 2.0, 6.0, 4.0, 6.0, 8.0, 12.0, 18.0, 22.0, 18.0, 17.0, 25.0, 29.0, 21.0, 41.0, 37.0, 40.0, 52.0, 39.0, 38.0, 41.0, 47.0, 46.0, 42.0, 36.0, 43.0, 45.0, 35.0, 22.0, 25.0, 13.0, 21.0, 25.0, 21.0, 17.0, 13.0, 16.0, 11.0, 8.0, 6.0, 7.0, 10.0, 3.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0001289844512939453, -0.00012513156980276108, -0.00012127868831157684, -0.00011742580682039261, -0.00011357292532920837, -0.00010972004383802414, -0.0001058671623468399, -0.00010201428085565567, -9.816139936447144e-05, -9.43085178732872e-05, -9.045563638210297e-05, -8.660275489091873e-05, -8.27498733997345e-05, -7.889699190855026e-05, -7.504411041736603e-05, -7.119122892618179e-05, -6.733834743499756e-05, -6.348546594381332e-05, -5.963258445262909e-05, -5.5779702961444855e-05, -5.192682147026062e-05, -4.8073939979076385e-05, -4.422105848789215e-05, -4.0368176996707916e-05, -3.651529550552368e-05, -3.266241401433945e-05, -2.8809532523155212e-05, -2.4956651031970978e-05, -2.1103769540786743e-05, -1.725088804960251e-05, -1.3398006558418274e-05, -9.54512506723404e-06, -5.692243576049805e-06, -1.83936208486557e-06, 2.0135194063186646e-06, 5.866400897502899e-06, 9.719282388687134e-06, 1.3572163879871368e-05, 1.7425045371055603e-05, 2.1277926862239838e-05, 2.5130808353424072e-05, 2.8983689844608307e-05, 3.283657133579254e-05, 3.6689452826976776e-05, 4.054233431816101e-05, 4.4395215809345245e-05, 4.824809730052948e-05, 5.2100978791713715e-05, 5.595386028289795e-05, 5.9806741774082184e-05, 6.365962326526642e-05, 6.751250475645065e-05, 7.136538624763489e-05, 7.521826773881912e-05, 7.907114923000336e-05, 8.292403072118759e-05, 8.677691221237183e-05, 9.062979370355606e-05, 9.44826751947403e-05, 9.833555668592453e-05, 0.00010218843817710876, 0.000106041319668293, 0.00010989420115947723, 0.00011374708265066147, 0.0001175999641418457]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 16.0, 10.0, 20.0, 32.0, 54.0, 79.0, 93.0, 168.0, 263.0, 413.0, 618.0, 998.0, 1509.0, 2354.0, 3659.0, 5930.0, 9606.0, 15296.0, 23894.0, 36632.0, 54765.0, 78218.0, 102260.0, 121652.0, 129406.0, 121977.0, 102502.0, 77862.0, 55462.0, 37069.0, 24230.0, 15099.0, 9638.0, 6157.0, 3832.0, 2469.0, 1464.0, 1010.0, 636.0, 412.0, 280.0, 179.0, 112.0, 77.0, 51.0, 26.0, 19.0, 20.0, 10.0, 14.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-1.431640625, -1.387603759765625, -1.34356689453125, -1.299530029296875, -1.2554931640625, -1.211456298828125, -1.16741943359375, -1.123382568359375, -1.079345703125, -1.035308837890625, -0.99127197265625, -0.947235107421875, -0.9031982421875, -0.859161376953125, -0.81512451171875, -0.771087646484375, -0.72705078125, -0.683013916015625, -0.63897705078125, -0.594940185546875, -0.5509033203125, -0.506866455078125, -0.46282958984375, -0.418792724609375, -0.374755859375, -0.330718994140625, -0.28668212890625, -0.242645263671875, -0.1986083984375, -0.154571533203125, -0.11053466796875, -0.066497802734375, -0.0224609375, 0.021575927734375, 0.06561279296875, 0.109649658203125, 0.1536865234375, 0.197723388671875, 0.24176025390625, 0.285797119140625, 0.329833984375, 0.373870849609375, 0.41790771484375, 0.461944580078125, 0.5059814453125, 0.550018310546875, 0.59405517578125, 0.638092041015625, 0.68212890625, 0.726165771484375, 0.77020263671875, 0.814239501953125, 0.8582763671875, 0.902313232421875, 0.94635009765625, 0.990386962890625, 1.034423828125, 1.078460693359375, 1.12249755859375, 1.166534423828125, 1.2105712890625, 1.254608154296875, 1.29864501953125, 1.342681884765625, 1.38671875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 4.0, 7.0, 6.0, 9.0, 13.0, 13.0, 14.0, 14.0, 17.0, 23.0, 39.0, 28.0, 46.0, 56.0, 44.0, 55.0, 56.0, 55.0, 50.0, 58.0, 67.0, 36.0, 39.0, 34.0, 29.0, 29.0, 32.0, 24.0, 18.0, 10.0, 10.0, 15.0, 14.0, 6.0, 6.0, 7.0, 4.0, 5.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.70654296875, -0.6869964599609375, -0.667449951171875, -0.6479034423828125, -0.62835693359375, -0.6088104248046875, -0.589263916015625, -0.5697174072265625, -0.5501708984375, -0.5306243896484375, -0.511077880859375, -0.4915313720703125, -0.47198486328125, -0.4524383544921875, -0.432891845703125, -0.4133453369140625, -0.393798828125, -0.3742523193359375, -0.354705810546875, -0.3351593017578125, -0.31561279296875, -0.2960662841796875, -0.276519775390625, -0.2569732666015625, -0.2374267578125, -0.2178802490234375, -0.198333740234375, -0.1787872314453125, -0.15924072265625, -0.1396942138671875, -0.120147705078125, -0.1006011962890625, -0.0810546875, -0.0615081787109375, -0.041961669921875, -0.0224151611328125, -0.00286865234375, 0.0166778564453125, 0.036224365234375, 0.0557708740234375, 0.0753173828125, 0.0948638916015625, 0.114410400390625, 0.1339569091796875, 0.15350341796875, 0.1730499267578125, 0.192596435546875, 0.2121429443359375, 0.231689453125, 0.2512359619140625, 0.270782470703125, 0.2903289794921875, 0.30987548828125, 0.3294219970703125, 0.348968505859375, 0.3685150146484375, 0.3880615234375, 0.4076080322265625, 0.427154541015625, 0.4467010498046875, 0.46624755859375, 0.4857940673828125, 0.505340576171875, 0.5248870849609375, 0.54443359375]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 6.0, 5.0, 11.0, 15.0, 15.0, 16.0, 24.0, 34.0, 39.0, 42.0, 52.0, 65.0, 49.0, 49.0, 53.0, 69.0, 67.0, 63.0, 47.0, 36.0, 39.0, 39.0, 36.0, 18.0, 22.0, 22.0, 15.0, 18.0, 4.0, 8.0, 6.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.499004364013672, -7.250592231750488, -7.002180099487305, -6.753767967224121, -6.5053558349609375, -6.256943702697754, -6.00853157043457, -5.760119438171387, -5.511707305908203, -5.2632951736450195, -5.014883041381836, -4.766470909118652, -4.518058776855469, -4.269646644592285, -4.021234512329102, -3.772822380065918, -3.5244104862213135, -3.27599835395813, -3.0275862216949463, -2.7791740894317627, -2.530761957168579, -2.2823500633239746, -2.033937931060791, -1.7855256795883179, -1.5371135473251343, -1.2887014150619507, -1.040289282798767, -0.7918772101402283, -0.5434650778770447, -0.29505300521850586, -0.046640872955322266, 0.20177125930786133, 0.4501833915710449, 0.6985955238342285, 0.9470076560974121, 1.1954197883605957, 1.4438319206237793, 1.6922439336776733, 1.940656065940857, 2.18906831741333, 2.4374804496765137, 2.6858925819396973, 2.934304714202881, 3.1827168464660645, 3.431128978729248, 3.6795411109924316, 3.9279532432556152, 4.176365375518799, 4.424777030944824, 4.673189163208008, 4.921601295471191, 5.170013427734375, 5.418425559997559, 5.666837692260742, 5.915249824523926, 6.163661956787109, 6.412074089050293, 6.660486221313477, 6.90889835357666, 7.157310485839844, 7.405722618103027, 7.654134750366211, 7.9025468826293945, 8.150959014892578, 8.399371147155762]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 4.0, 6.0, 3.0, 10.0, 8.0, 4.0, 18.0, 13.0, 11.0, 20.0, 11.0, 20.0, 21.0, 30.0, 28.0, 36.0, 30.0, 39.0, 47.0, 32.0, 40.0, 51.0, 49.0, 42.0, 55.0, 46.0, 35.0, 34.0, 27.0, 33.0, 38.0, 24.0, 29.0, 20.0, 12.0, 20.0, 11.0, 13.0, 6.0, 3.0, 3.0, 5.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.1265435218811035, -6.909689426422119, -6.692835330963135, -6.47598123550415, -6.259127140045166, -6.042273044586182, -5.8254194259643555, -5.608565330505371, -5.391711235046387, -5.174857139587402, -4.958003044128418, -4.741148948669434, -4.524294853210449, -4.307440757751465, -4.0905866622924805, -3.873732805252075, -3.6568784713745117, -3.4400243759155273, -3.223170280456543, -3.0063161849975586, -2.789462089538574, -2.57260799407959, -2.3557541370391846, -2.1389000415802, -1.9220459461212158, -1.7051918506622314, -1.488337755203247, -1.2714837789535522, -1.0546296834945679, -0.8377755880355835, -0.6209216117858887, -0.4040675163269043, -0.18721389770507812, 0.029640167951583862, 0.24649423360824585, 0.46334826946258545, 0.6802023649215698, 0.8970564603805542, 1.113910436630249, 1.3307645320892334, 1.5476186275482178, 1.7644727230072021, 1.9813268184661865, 2.198180675506592, 2.415034770965576, 2.6318888664245605, 2.848742961883545, 3.0655970573425293, 3.2824511528015137, 3.499305248260498, 3.7161593437194824, 3.933013439178467, 4.149867534637451, 4.3667216300964355, 4.583575248718262, 4.800429344177246, 5.0172834396362305, 5.234137535095215, 5.450991630554199, 5.667845726013184, 5.884699821472168, 6.101553916931152, 6.318408012390137, 6.535262107849121, 6.7521162033081055]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [3.0, 5.0, 7.0, 3.0, 13.0, 21.0, 27.0, 35.0, 63.0, 82.0, 125.0, 175.0, 251.0, 345.0, 516.0, 770.0, 1224.0, 1828.0, 3018.0, 4577.0, 7367.0, 11542.0, 18923.0, 30248.0, 49934.0, 81325.0, 132267.0, 213492.0, 331830.0, 479439.0, 606144.0, 629978.0, 533861.0, 386602.0, 255377.0, 161136.0, 99236.0, 59753.0, 36388.0, 22062.0, 13320.0, 7932.0, 4865.0, 3034.0, 1827.0, 1206.0, 715.0, 501.0, 298.0, 225.0, 119.0, 94.0, 63.0, 36.0, 21.0, 26.0, 17.0, 2.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.8359375, -5.6488037109375, -5.461669921875, -5.2745361328125, -5.08740234375, -4.9002685546875, -4.713134765625, -4.5260009765625, -4.3388671875, -4.1517333984375, -3.964599609375, -3.7774658203125, -3.59033203125, -3.4031982421875, -3.216064453125, -3.0289306640625, -2.841796875, -2.6546630859375, -2.467529296875, -2.2803955078125, -2.09326171875, -1.9061279296875, -1.718994140625, -1.5318603515625, -1.3447265625, -1.1575927734375, -0.970458984375, -0.7833251953125, -0.59619140625, -0.4090576171875, -0.221923828125, -0.0347900390625, 0.15234375, 0.3394775390625, 0.526611328125, 0.7137451171875, 0.90087890625, 1.0880126953125, 1.275146484375, 1.4622802734375, 1.6494140625, 1.8365478515625, 2.023681640625, 2.2108154296875, 2.39794921875, 2.5850830078125, 2.772216796875, 2.9593505859375, 3.146484375, 3.3336181640625, 3.520751953125, 3.7078857421875, 3.89501953125, 4.0821533203125, 4.269287109375, 4.4564208984375, 4.6435546875, 4.8306884765625, 5.017822265625, 5.2049560546875, 5.39208984375, 5.5792236328125, 5.766357421875, 5.9534912109375, 6.140625]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 3.0, 7.0, 8.0, 14.0, 7.0, 11.0, 13.0, 16.0, 13.0, 16.0, 21.0, 24.0, 33.0, 39.0, 26.0, 28.0, 48.0, 49.0, 40.0, 30.0, 41.0, 49.0, 51.0, 42.0, 38.0, 37.0, 45.0, 31.0, 28.0, 31.0, 29.0, 25.0, 19.0, 10.0, 17.0, 10.0, 11.0, 8.0, 3.0, 6.0, 4.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.73046875, -5.548828125, -5.3671875, -5.185546875, -5.00390625, -4.822265625, -4.640625, -4.458984375, -4.27734375, -4.095703125, -3.9140625, -3.732421875, -3.55078125, -3.369140625, -3.1875, -3.005859375, -2.82421875, -2.642578125, -2.4609375, -2.279296875, -2.09765625, -1.916015625, -1.734375, -1.552734375, -1.37109375, -1.189453125, -1.0078125, -0.826171875, -0.64453125, -0.462890625, -0.28125, -0.099609375, 0.08203125, 0.263671875, 0.4453125, 0.626953125, 0.80859375, 0.990234375, 1.171875, 1.353515625, 1.53515625, 1.716796875, 1.8984375, 2.080078125, 2.26171875, 2.443359375, 2.625, 2.806640625, 2.98828125, 3.169921875, 3.3515625, 3.533203125, 3.71484375, 3.896484375, 4.078125, 4.259765625, 4.44140625, 4.623046875, 4.8046875, 4.986328125, 5.16796875, 5.349609375, 5.53125, 5.712890625, 5.89453125]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 1.0, 5.0, 6.0, 8.0, 19.0, 22.0, 41.0, 61.0, 87.0, 153.0, 242.0, 359.0, 590.0, 999.0, 1649.0, 2815.0, 4514.0, 7554.0, 13054.0, 22543.0, 38150.0, 65439.0, 111610.0, 185243.0, 295539.0, 436727.0, 572392.0, 632455.0, 578500.0, 446520.0, 304723.0, 191391.0, 115704.0, 68474.0, 39745.0, 23289.0, 13764.0, 7928.0, 4689.0, 2880.0, 1720.0, 1016.0, 611.0, 393.0, 265.0, 153.0, 83.0, 65.0, 42.0, 23.0, 11.0, 11.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.91796875, -6.69140625, -6.46484375, -6.23828125, -6.01171875, -5.78515625, -5.55859375, -5.33203125, -5.10546875, -4.87890625, -4.65234375, -4.42578125, -4.19921875, -3.97265625, -3.74609375, -3.51953125, -3.29296875, -3.06640625, -2.83984375, -2.61328125, -2.38671875, -2.16015625, -1.93359375, -1.70703125, -1.48046875, -1.25390625, -1.02734375, -0.80078125, -0.57421875, -0.34765625, -0.12109375, 0.10546875, 0.33203125, 0.55859375, 0.78515625, 1.01171875, 1.23828125, 1.46484375, 1.69140625, 1.91796875, 2.14453125, 2.37109375, 2.59765625, 2.82421875, 3.05078125, 3.27734375, 3.50390625, 3.73046875, 3.95703125, 4.18359375, 4.41015625, 4.63671875, 4.86328125, 5.08984375, 5.31640625, 5.54296875, 5.76953125, 5.99609375, 6.22265625, 6.44921875, 6.67578125, 6.90234375, 7.12890625, 7.35546875, 7.58203125]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 7.0, 5.0, 16.0, 13.0, 15.0, 42.0, 40.0, 53.0, 76.0, 92.0, 121.0, 141.0, 136.0, 161.0, 194.0, 204.0, 250.0, 271.0, 255.0, 264.0, 277.0, 243.0, 202.0, 184.0, 153.0, 127.0, 92.0, 85.0, 73.0, 67.0, 42.0, 37.0, 25.0, 23.0, 15.0, 20.0, 10.0, 12.0, 6.0, 9.0, 3.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.197265625, -3.085723876953125, -2.97418212890625, -2.862640380859375, -2.7510986328125, -2.639556884765625, -2.52801513671875, -2.416473388671875, -2.304931640625, -2.193389892578125, -2.08184814453125, -1.970306396484375, -1.8587646484375, -1.747222900390625, -1.63568115234375, -1.524139404296875, -1.41259765625, -1.301055908203125, -1.18951416015625, -1.077972412109375, -0.9664306640625, -0.854888916015625, -0.74334716796875, -0.631805419921875, -0.520263671875, -0.408721923828125, -0.29718017578125, -0.185638427734375, -0.0740966796875, 0.037445068359375, 0.14898681640625, 0.260528564453125, 0.3720703125, 0.483612060546875, 0.59515380859375, 0.706695556640625, 0.8182373046875, 0.929779052734375, 1.04132080078125, 1.152862548828125, 1.264404296875, 1.375946044921875, 1.48748779296875, 1.599029541015625, 1.7105712890625, 1.822113037109375, 1.93365478515625, 2.045196533203125, 2.15673828125, 2.268280029296875, 2.37982177734375, 2.491363525390625, 2.6029052734375, 2.714447021484375, 2.82598876953125, 2.937530517578125, 3.049072265625, 3.160614013671875, 3.27215576171875, 3.383697509765625, 3.4952392578125, 3.606781005859375, 3.71832275390625, 3.829864501953125, 3.94140625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 11.0, 7.0, 8.0, 8.0, 13.0, 14.0, 12.0, 29.0, 31.0, 29.0, 27.0, 33.0, 30.0, 48.0, 58.0, 54.0, 61.0, 57.0, 55.0, 50.0, 46.0, 47.0, 41.0, 39.0, 38.0, 24.0, 33.0, 23.0, 11.0, 9.0, 11.0, 7.0, 7.0, 9.0, 6.0, 4.0, 5.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.383881568908691, -9.086286544799805, -8.788691520690918, -8.491096496582031, -8.193501472473145, -7.895906925201416, -7.598311901092529, -7.300717353820801, -7.003122329711914, -6.705527305603027, -6.407932281494141, -6.110337257385254, -5.812742710113525, -5.515147686004639, -5.217552661895752, -4.919958114624023, -4.6223626136779785, -4.324767589569092, -4.027172565460205, -3.7295777797698975, -3.43198299407959, -3.134387969970703, -2.8367929458618164, -2.539198160171509, -2.241603136062622, -1.944008231163025, -1.6464133262634277, -1.348818302154541, -1.0512233972549438, -0.7536284923553467, -0.45603346824645996, -0.15843868255615234, 0.13915634155273438, 0.43675127625465393, 0.7343462109565735, 1.0319411754608154, 1.3295360803604126, 1.6271309852600098, 1.9247260093688965, 2.222320795059204, 2.519915819168091, 2.8175108432769775, 3.115105628967285, 3.412700653076172, 3.7102956771850586, 4.007890701293945, 4.305485725402832, 4.6030802726745605, 4.900675296783447, 5.198270320892334, 5.495865345001221, 5.793459892272949, 6.091054916381836, 6.388649940490723, 6.686244964599609, 6.983839988708496, 7.281435012817383, 7.5790300369262695, 7.876625061035156, 8.174220085144043, 8.47181510925293, 8.7694091796875, 9.067005157470703, 9.364599227905273, 9.66219425201416]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 8.0, 4.0, 12.0, 10.0, 13.0, 14.0, 17.0, 20.0, 26.0, 24.0, 27.0, 34.0, 26.0, 34.0, 39.0, 57.0, 47.0, 46.0, 54.0, 48.0, 44.0, 41.0, 44.0, 38.0, 35.0, 39.0, 35.0, 26.0, 27.0, 22.0, 21.0, 11.0, 9.0, 13.0, 11.0, 3.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.729223251342773, -10.417200088500977, -10.105177879333496, -9.7931547164917, -9.481132507324219, -9.169109344482422, -8.857087135314941, -8.545063972473145, -8.233041763305664, -7.921019077301025, -7.608996391296387, -7.296973705291748, -6.984951019287109, -6.672928333282471, -6.360905647277832, -6.048882484436035, -5.7368597984313965, -5.424837112426758, -5.112814426422119, -4.8007917404174805, -4.488769054412842, -4.176746368408203, -3.8647234439849854, -3.5527007579803467, -3.240678071975708, -2.9286553859710693, -2.6166326999664307, -2.304609775543213, -1.9925872087478638, -1.680564522743225, -1.3685417175292969, -1.0565190315246582, -0.7444963455200195, -0.43247362971305847, -0.12045091390609741, 0.19157183170318604, 0.5035945177078247, 0.8156172037124634, 1.1276400089263916, 1.4396626949310303, 1.751685380935669, 2.0637080669403076, 2.3757307529449463, 2.687753677368164, 2.9997763633728027, 3.3117990493774414, 3.62382173538208, 3.9358444213867188, 4.247867107391357, 4.559889793395996, 4.871912479400635, 5.183935165405273, 5.495957851409912, 5.807980537414551, 6.120003700256348, 6.432025909423828, 6.744049072265625, 7.056071758270264, 7.368094444274902, 7.680117130279541, 7.99213981628418, 8.304162979125977, 8.616185188293457, 8.928208351135254, 9.240230560302734]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 7.0, 9.0, 21.0, 20.0, 28.0, 64.0, 98.0, 135.0, 190.0, 290.0, 476.0, 650.0, 974.0, 1587.0, 2374.0, 3554.0, 5632.0, 9099.0, 14983.0, 24748.0, 44190.0, 85103.0, 182522.0, 305572.0, 176511.0, 82767.0, 43079.0, 24435.0, 14439.0, 8989.0, 5700.0, 3610.0, 2234.0, 1497.0, 1051.0, 647.0, 444.0, 273.0, 188.0, 112.0, 90.0, 53.0, 38.0, 25.0, 18.0, 11.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.60546875, -2.51708984375, -2.4287109375, -2.34033203125, -2.251953125, -2.16357421875, -2.0751953125, -1.98681640625, -1.8984375, -1.81005859375, -1.7216796875, -1.63330078125, -1.544921875, -1.45654296875, -1.3681640625, -1.27978515625, -1.19140625, -1.10302734375, -1.0146484375, -0.92626953125, -0.837890625, -0.74951171875, -0.6611328125, -0.57275390625, -0.484375, -0.39599609375, -0.3076171875, -0.21923828125, -0.130859375, -0.04248046875, 0.0458984375, 0.13427734375, 0.22265625, 0.31103515625, 0.3994140625, 0.48779296875, 0.576171875, 0.66455078125, 0.7529296875, 0.84130859375, 0.9296875, 1.01806640625, 1.1064453125, 1.19482421875, 1.283203125, 1.37158203125, 1.4599609375, 1.54833984375, 1.63671875, 1.72509765625, 1.8134765625, 1.90185546875, 1.990234375, 2.07861328125, 2.1669921875, 2.25537109375, 2.34375, 2.43212890625, 2.5205078125, 2.60888671875, 2.697265625, 2.78564453125, 2.8740234375, 2.96240234375, 3.05078125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 8.0, 11.0, 5.0, 5.0, 15.0, 12.0, 20.0, 24.0, 25.0, 28.0, 32.0, 27.0, 33.0, 37.0, 34.0, 35.0, 44.0, 43.0, 43.0, 44.0, 55.0, 44.0, 37.0, 44.0, 33.0, 38.0, 27.0, 36.0, 37.0, 19.0, 18.0, 17.0, 16.0, 4.0, 8.0, 14.0, 3.0, 9.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-10.8984375, -10.593994140625, -10.28955078125, -9.985107421875, -9.6806640625, -9.376220703125, -9.07177734375, -8.767333984375, -8.462890625, -8.158447265625, -7.85400390625, -7.549560546875, -7.2451171875, -6.940673828125, -6.63623046875, -6.331787109375, -6.02734375, -5.722900390625, -5.41845703125, -5.114013671875, -4.8095703125, -4.505126953125, -4.20068359375, -3.896240234375, -3.591796875, -3.287353515625, -2.98291015625, -2.678466796875, -2.3740234375, -2.069580078125, -1.76513671875, -1.460693359375, -1.15625, -0.851806640625, -0.54736328125, -0.242919921875, 0.0615234375, 0.365966796875, 0.67041015625, 0.974853515625, 1.279296875, 1.583740234375, 1.88818359375, 2.192626953125, 2.4970703125, 2.801513671875, 3.10595703125, 3.410400390625, 3.71484375, 4.019287109375, 4.32373046875, 4.628173828125, 4.9326171875, 5.237060546875, 5.54150390625, 5.845947265625, 6.150390625, 6.454833984375, 6.75927734375, 7.063720703125, 7.3681640625, 7.672607421875, 7.97705078125, 8.281494140625, 8.5859375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 8.0, 9.0, 12.0, 6.0, 13.0, 31.0, 34.0, 30.0, 46.0, 61.0, 70.0, 93.0, 133.0, 168.0, 218.0, 280.0, 376.0, 592.0, 800.0, 1308.0, 2286.0, 4489.0, 9914.0, 25198.0, 881317.0, 80269.0, 21740.0, 8688.0, 4091.0, 2128.0, 1310.0, 813.0, 525.0, 387.0, 265.0, 178.0, 148.0, 121.0, 85.0, 68.0, 45.0, 45.0, 31.0, 22.0, 24.0, 20.0, 10.0, 8.0, 9.0, 10.0, 3.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0], "bins": [-7.1015625, -6.879150390625, -6.65673828125, -6.434326171875, -6.2119140625, -5.989501953125, -5.76708984375, -5.544677734375, -5.322265625, -5.099853515625, -4.87744140625, -4.655029296875, -4.4326171875, -4.210205078125, -3.98779296875, -3.765380859375, -3.54296875, -3.320556640625, -3.09814453125, -2.875732421875, -2.6533203125, -2.430908203125, -2.20849609375, -1.986083984375, -1.763671875, -1.541259765625, -1.31884765625, -1.096435546875, -0.8740234375, -0.651611328125, -0.42919921875, -0.206787109375, 0.015625, 0.238037109375, 0.46044921875, 0.682861328125, 0.9052734375, 1.127685546875, 1.35009765625, 1.572509765625, 1.794921875, 2.017333984375, 2.23974609375, 2.462158203125, 2.6845703125, 2.906982421875, 3.12939453125, 3.351806640625, 3.57421875, 3.796630859375, 4.01904296875, 4.241455078125, 4.4638671875, 4.686279296875, 4.90869140625, 5.131103515625, 5.353515625, 5.575927734375, 5.79833984375, 6.020751953125, 6.2431640625, 6.465576171875, 6.68798828125, 6.910400390625, 7.1328125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 11.0, 12.0, 6.0, 4.0, 8.0, 16.0, 19.0, 17.0, 24.0, 16.0, 19.0, 36.0, 28.0, 38.0, 39.0, 37.0, 48.0, 40.0, 34.0, 37.0, 38.0, 40.0, 34.0, 42.0, 36.0, 32.0, 31.0, 24.0, 28.0, 27.0, 29.0, 22.0, 21.0, 11.0, 20.0, 10.0, 10.0, 15.0, 9.0, 8.0, 9.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.41015625, -5.24261474609375, -5.0750732421875, -4.90753173828125, -4.739990234375, -4.57244873046875, -4.4049072265625, -4.23736572265625, -4.06982421875, -3.90228271484375, -3.7347412109375, -3.56719970703125, -3.399658203125, -3.23211669921875, -3.0645751953125, -2.89703369140625, -2.7294921875, -2.56195068359375, -2.3944091796875, -2.22686767578125, -2.059326171875, -1.89178466796875, -1.7242431640625, -1.55670166015625, -1.38916015625, -1.22161865234375, -1.0540771484375, -0.88653564453125, -0.718994140625, -0.55145263671875, -0.3839111328125, -0.21636962890625, -0.048828125, 0.11871337890625, 0.2862548828125, 0.45379638671875, 0.621337890625, 0.78887939453125, 0.9564208984375, 1.12396240234375, 1.29150390625, 1.45904541015625, 1.6265869140625, 1.79412841796875, 1.961669921875, 2.12921142578125, 2.2967529296875, 2.46429443359375, 2.6318359375, 2.79937744140625, 2.9669189453125, 3.13446044921875, 3.302001953125, 3.46954345703125, 3.6370849609375, 3.80462646484375, 3.97216796875, 4.13970947265625, 4.3072509765625, 4.47479248046875, 4.642333984375, 4.80987548828125, 4.9774169921875, 5.14495849609375, 5.3125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 9.0, 6.0, 15.0, 13.0, 13.0, 24.0, 28.0, 28.0, 61.0, 74.0, 87.0, 116.0, 170.0, 267.0, 318.0, 462.0, 771.0, 1151.0, 1953.0, 3517.0, 7145.0, 16554.0, 61671.0, 907214.0, 25610.0, 9833.0, 4597.0, 2513.0, 1445.0, 875.0, 566.0, 395.0, 304.0, 169.0, 141.0, 119.0, 83.0, 53.0, 47.0, 30.0, 23.0, 15.0, 17.0, 14.0, 6.0, 6.0, 5.0, 8.0, 5.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5068359375, -0.49059295654296875, -0.4743499755859375, -0.45810699462890625, -0.441864013671875, -0.42562103271484375, -0.4093780517578125, -0.39313507080078125, -0.37689208984375, -0.36064910888671875, -0.3444061279296875, -0.32816314697265625, -0.311920166015625, -0.29567718505859375, -0.2794342041015625, -0.26319122314453125, -0.2469482421875, -0.23070526123046875, -0.2144622802734375, -0.19821929931640625, -0.181976318359375, -0.16573333740234375, -0.1494903564453125, -0.13324737548828125, -0.11700439453125, -0.10076141357421875, -0.0845184326171875, -0.06827545166015625, -0.052032470703125, -0.03578948974609375, -0.0195465087890625, -0.00330352783203125, 0.012939453125, 0.02918243408203125, 0.0454254150390625, 0.06166839599609375, 0.077911376953125, 0.09415435791015625, 0.1103973388671875, 0.12664031982421875, 0.14288330078125, 0.15912628173828125, 0.1753692626953125, 0.19161224365234375, 0.207855224609375, 0.22409820556640625, 0.2403411865234375, 0.25658416748046875, 0.2728271484375, 0.28907012939453125, 0.3053131103515625, 0.32155609130859375, 0.337799072265625, 0.35404205322265625, 0.3702850341796875, 0.38652801513671875, 0.40277099609375, 0.41901397705078125, 0.4352569580078125, 0.45149993896484375, 0.467742919921875, 0.48398590087890625, 0.5002288818359375, 0.5164718627929688, 0.53271484375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 5.0, 6.0, 13.0, 16.0, 22.0, 21.0, 19.0, 30.0, 31.0, 40.0, 30.0, 45.0, 48.0, 55.0, 54.0, 53.0, 39.0, 48.0, 52.0, 40.0, 54.0, 43.0, 38.0, 30.0, 25.0, 28.0, 21.0, 17.0, 15.0, 17.0, 4.0, 9.0, 2.0, 8.0, 5.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.0040740966796875e-05, -2.9101967811584473e-05, -2.816319465637207e-05, -2.7224421501159668e-05, -2.6285648345947266e-05, -2.5346875190734863e-05, -2.440810203552246e-05, -2.346932888031006e-05, -2.2530555725097656e-05, -2.1591782569885254e-05, -2.065300941467285e-05, -1.971423625946045e-05, -1.8775463104248047e-05, -1.7836689949035645e-05, -1.6897916793823242e-05, -1.595914363861084e-05, -1.5020370483398438e-05, -1.4081597328186035e-05, -1.3142824172973633e-05, -1.220405101776123e-05, -1.1265277862548828e-05, -1.0326504707336426e-05, -9.387731552124023e-06, -8.448958396911621e-06, -7.510185241699219e-06, -6.571412086486816e-06, -5.632638931274414e-06, -4.693865776062012e-06, -3.7550926208496094e-06, -2.816319465637207e-06, -1.8775463104248047e-06, -9.387731552124023e-07, 0.0, 9.387731552124023e-07, 1.8775463104248047e-06, 2.816319465637207e-06, 3.7550926208496094e-06, 4.693865776062012e-06, 5.632638931274414e-06, 6.571412086486816e-06, 7.510185241699219e-06, 8.448958396911621e-06, 9.387731552124023e-06, 1.0326504707336426e-05, 1.1265277862548828e-05, 1.220405101776123e-05, 1.3142824172973633e-05, 1.4081597328186035e-05, 1.5020370483398438e-05, 1.595914363861084e-05, 1.6897916793823242e-05, 1.7836689949035645e-05, 1.8775463104248047e-05, 1.971423625946045e-05, 2.065300941467285e-05, 2.1591782569885254e-05, 2.2530555725097656e-05, 2.346932888031006e-05, 2.440810203552246e-05, 2.5346875190734863e-05, 2.6285648345947266e-05, 2.7224421501159668e-05, 2.816319465637207e-05, 2.9101967811584473e-05, 3.0040740966796875e-05]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 9.0, 12.0, 18.0, 41.0, 33.0, 62.0, 74.0, 120.0, 146.0, 198.0, 331.0, 504.0, 721.0, 1182.0, 1746.0, 2677.0, 4408.0, 7190.0, 11852.0, 20200.0, 36041.0, 69209.0, 150042.0, 313662.0, 219778.0, 95990.0, 47665.0, 25713.0, 14929.0, 8918.0, 5381.0, 3392.0, 2157.0, 1396.0, 906.0, 599.0, 394.0, 264.0, 188.0, 126.0, 81.0, 53.0, 43.0, 24.0, 28.0, 19.0, 10.0, 7.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.2294921875, -0.2222576141357422, -0.21502304077148438, -0.20778846740722656, -0.20055389404296875, -0.19331932067871094, -0.18608474731445312, -0.1788501739501953, -0.1716156005859375, -0.1643810272216797, -0.15714645385742188, -0.14991188049316406, -0.14267730712890625, -0.13544273376464844, -0.12820816040039062, -0.12097358703613281, -0.113739013671875, -0.10650444030761719, -0.09926986694335938, -0.09203529357910156, -0.08480072021484375, -0.07756614685058594, -0.07033157348632812, -0.06309700012207031, -0.0558624267578125, -0.04862785339355469, -0.041393280029296875, -0.03415870666503906, -0.02692413330078125, -0.019689559936523438, -0.012454986572265625, -0.0052204132080078125, 0.00201416015625, 0.009248733520507812, 0.016483306884765625, 0.023717880249023438, 0.03095245361328125, 0.03818702697753906, 0.045421600341796875, 0.05265617370605469, 0.0598907470703125, 0.06712532043457031, 0.07435989379882812, 0.08159446716308594, 0.08882904052734375, 0.09606361389160156, 0.10329818725585938, 0.11053276062011719, 0.117767333984375, 0.1250019073486328, 0.13223648071289062, 0.13947105407714844, 0.14670562744140625, 0.15394020080566406, 0.16117477416992188, 0.1684093475341797, 0.1756439208984375, 0.1828784942626953, 0.19011306762695312, 0.19734764099121094, 0.20458221435546875, 0.21181678771972656, 0.21905136108398438, 0.2262859344482422, 0.2335205078125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 8.0, 8.0, 3.0, 14.0, 12.0, 13.0, 24.0, 39.0, 65.0, 87.0, 157.0, 204.0, 133.0, 64.0, 34.0, 25.0, 20.0, 21.0, 16.0, 8.0, 13.0, 8.0, 3.0, 8.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.13671875, -0.133148193359375, -0.12957763671875, -0.126007080078125, -0.1224365234375, -0.118865966796875, -0.11529541015625, -0.111724853515625, -0.108154296875, -0.104583740234375, -0.10101318359375, -0.097442626953125, -0.0938720703125, -0.090301513671875, -0.08673095703125, -0.083160400390625, -0.07958984375, -0.076019287109375, -0.07244873046875, -0.068878173828125, -0.0653076171875, -0.061737060546875, -0.05816650390625, -0.054595947265625, -0.051025390625, -0.047454833984375, -0.04388427734375, -0.040313720703125, -0.0367431640625, -0.033172607421875, -0.02960205078125, -0.026031494140625, -0.0224609375, -0.018890380859375, -0.01531982421875, -0.011749267578125, -0.0081787109375, -0.004608154296875, -0.00103759765625, 0.002532958984375, 0.006103515625, 0.009674072265625, 0.01324462890625, 0.016815185546875, 0.0203857421875, 0.023956298828125, 0.02752685546875, 0.031097412109375, 0.03466796875, 0.038238525390625, 0.04180908203125, 0.045379638671875, 0.0489501953125, 0.052520751953125, 0.05609130859375, 0.059661865234375, 0.063232421875, 0.066802978515625, 0.07037353515625, 0.073944091796875, 0.0775146484375, 0.081085205078125, 0.08465576171875, 0.088226318359375, 0.091796875]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 12.0, 8.0, 11.0, 12.0, 11.0, 18.0, 28.0, 25.0, 27.0, 30.0, 36.0, 38.0, 40.0, 60.0, 58.0, 69.0, 59.0, 47.0, 51.0, 46.0, 54.0, 36.0, 38.0, 31.0, 33.0, 20.0, 31.0, 9.0, 10.0, 8.0, 10.0, 11.0, 6.0, 3.0, 6.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.887971878051758, -9.582518577575684, -9.277066230773926, -8.971612930297852, -8.666159629821777, -8.360706329345703, -8.055253982543945, -7.749800682067871, -7.444347858428955, -7.138895034790039, -6.833441734313965, -6.527988910675049, -6.222536087036133, -5.917082786560059, -5.611629962921143, -5.306177139282227, -5.000723838806152, -4.695271015167236, -4.389817714691162, -4.084364891052246, -3.778911828994751, -3.473458766937256, -3.16800594329834, -2.8625528812408447, -2.5570998191833496, -2.2516467571258545, -1.946193814277649, -1.6407408714294434, -1.3352878093719482, -1.0298347473144531, -0.7243818044662476, -0.418928861618042, -0.11347675323486328, 0.19197624921798706, 0.4974292516708374, 0.8028822541236877, 1.108335256576538, 1.4137883186340332, 1.7192412614822388, 2.0246942043304443, 2.3301472663879395, 2.6356003284454346, 2.9410533905029297, 3.2465062141418457, 3.551959276199341, 3.857412338256836, 4.162865161895752, 4.468317985534668, 4.773771286010742, 5.079224109649658, 5.384677410125732, 5.690130233764648, 5.995583534240723, 6.301036357879639, 6.606489181518555, 6.911942481994629, 7.217395305633545, 7.522848129272461, 7.828301429748535, 8.13375473022461, 8.439207077026367, 8.744660377502441, 9.050113677978516, 9.355566024780273, 9.661019325256348]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 7.0, 5.0, 12.0, 10.0, 13.0, 13.0, 19.0, 19.0, 26.0, 25.0, 29.0, 33.0, 27.0, 35.0, 40.0, 54.0, 46.0, 48.0, 57.0, 43.0, 47.0, 43.0, 44.0, 33.0, 35.0, 40.0, 37.0, 23.0, 30.0, 23.0, 17.0, 10.0, 10.0, 13.0, 10.0, 3.0, 4.0, 6.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.705666542053223, -10.393790245056152, -10.081913948059082, -9.770037651062012, -9.458161354064941, -9.146285057067871, -8.8344087600708, -8.522533416748047, -8.210657119750977, -7.898780822753906, -7.586904525756836, -7.275028228759766, -6.963151931762695, -6.651275634765625, -6.339399814605713, -6.027523517608643, -5.715646743774414, -5.403770446777344, -5.091894149780273, -4.780017852783203, -4.468141555786133, -4.1562652587890625, -3.8443894386291504, -3.53251314163208, -3.2206368446350098, -2.9087605476379395, -2.596884250640869, -2.285008192062378, -1.9731318950653076, -1.6612555980682373, -1.3493794202804565, -1.0375032424926758, -0.7256259918212891, -0.4137497544288635, -0.10187351703643799, 0.21000272035598755, 0.5218789577484131, 0.8337552547454834, 1.1456314325332642, 1.457507610321045, 1.7693839073181152, 2.0812602043151855, 2.393136501312256, 2.705012559890747, 3.0168888568878174, 3.3287651538848877, 3.640641212463379, 3.952517509460449, 4.2643938064575195, 4.57627010345459, 4.88814640045166, 5.2000226974487305, 5.511898994445801, 5.823775291442871, 6.135651111602783, 6.4475274085998535, 6.759403705596924, 7.071280002593994, 7.3831562995910645, 7.695032596588135, 8.006908416748047, 8.318784713745117, 8.630661010742188, 8.942537307739258, 9.254413604736328]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 6.0, 9.0, 10.0, 25.0, 25.0, 35.0, 58.0, 99.0, 166.0, 298.0, 484.0, 823.0, 1400.0, 2593.0, 4775.0, 9149.0, 17906.0, 36333.0, 72910.0, 136866.0, 211179.0, 222856.0, 157151.0, 85918.0, 43121.0, 21202.0, 10575.0, 5584.0, 3037.0, 1663.0, 947.0, 536.0, 312.0, 188.0, 122.0, 63.0, 43.0, 25.0, 25.0, 16.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-8.359375, -8.10699462890625, -7.8546142578125, -7.60223388671875, -7.349853515625, -7.09747314453125, -6.8450927734375, -6.59271240234375, -6.34033203125, -6.08795166015625, -5.8355712890625, -5.58319091796875, -5.330810546875, -5.07843017578125, -4.8260498046875, -4.57366943359375, -4.3212890625, -4.06890869140625, -3.8165283203125, -3.56414794921875, -3.311767578125, -3.05938720703125, -2.8070068359375, -2.55462646484375, -2.30224609375, -2.04986572265625, -1.7974853515625, -1.54510498046875, -1.292724609375, -1.04034423828125, -0.7879638671875, -0.53558349609375, -0.283203125, -0.03082275390625, 0.2215576171875, 0.47393798828125, 0.726318359375, 0.97869873046875, 1.2310791015625, 1.48345947265625, 1.73583984375, 1.98822021484375, 2.2406005859375, 2.49298095703125, 2.745361328125, 2.99774169921875, 3.2501220703125, 3.50250244140625, 3.7548828125, 4.00726318359375, 4.2596435546875, 4.51202392578125, 4.764404296875, 5.01678466796875, 5.2691650390625, 5.52154541015625, 5.77392578125, 6.02630615234375, 6.2786865234375, 6.53106689453125, 6.783447265625, 7.03582763671875, 7.2882080078125, 7.54058837890625, 7.79296875]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 4.0, 7.0, 8.0, 13.0, 14.0, 19.0, 9.0, 20.0, 34.0, 32.0, 42.0, 41.0, 48.0, 57.0, 50.0, 59.0, 61.0, 62.0, 59.0, 48.0, 44.0, 50.0, 40.0, 45.0, 35.0, 20.0, 20.0, 11.0, 13.0, 7.0, 11.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.984375, -10.596923828125, -10.20947265625, -9.822021484375, -9.4345703125, -9.047119140625, -8.65966796875, -8.272216796875, -7.884765625, -7.497314453125, -7.10986328125, -6.722412109375, -6.3349609375, -5.947509765625, -5.56005859375, -5.172607421875, -4.78515625, -4.397705078125, -4.01025390625, -3.622802734375, -3.2353515625, -2.847900390625, -2.46044921875, -2.072998046875, -1.685546875, -1.298095703125, -0.91064453125, -0.523193359375, -0.1357421875, 0.251708984375, 0.63916015625, 1.026611328125, 1.4140625, 1.801513671875, 2.18896484375, 2.576416015625, 2.9638671875, 3.351318359375, 3.73876953125, 4.126220703125, 4.513671875, 4.901123046875, 5.28857421875, 5.676025390625, 6.0634765625, 6.450927734375, 6.83837890625, 7.225830078125, 7.61328125, 8.000732421875, 8.38818359375, 8.775634765625, 9.1630859375, 9.550537109375, 9.93798828125, 10.325439453125, 10.712890625, 11.100341796875, 11.48779296875, 11.875244140625, 12.2626953125, 12.650146484375, 13.03759765625, 13.425048828125, 13.8125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 4.0, 4.0, 10.0, 14.0, 27.0, 22.0, 45.0, 71.0, 70.0, 118.0, 160.0, 273.0, 374.0, 510.0, 796.0, 1156.0, 1719.0, 2632.0, 3850.0, 6004.0, 8981.0, 14364.0, 22743.0, 36160.0, 56056.0, 85020.0, 118489.0, 144123.0, 147946.0, 127252.0, 93680.0, 63327.0, 40441.0, 25717.0, 16132.0, 10445.0, 6665.0, 4352.0, 2858.0, 1864.0, 1310.0, 898.0, 632.0, 380.0, 259.0, 194.0, 128.0, 85.0, 77.0, 34.0, 27.0, 20.0, 18.0, 10.0, 7.0, 7.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-5.1953125, -5.0284423828125, -4.861572265625, -4.6947021484375, -4.52783203125, -4.3609619140625, -4.194091796875, -4.0272216796875, -3.8603515625, -3.6934814453125, -3.526611328125, -3.3597412109375, -3.19287109375, -3.0260009765625, -2.859130859375, -2.6922607421875, -2.525390625, -2.3585205078125, -2.191650390625, -2.0247802734375, -1.85791015625, -1.6910400390625, -1.524169921875, -1.3572998046875, -1.1904296875, -1.0235595703125, -0.856689453125, -0.6898193359375, -0.52294921875, -0.3560791015625, -0.189208984375, -0.0223388671875, 0.14453125, 0.3114013671875, 0.478271484375, 0.6451416015625, 0.81201171875, 0.9788818359375, 1.145751953125, 1.3126220703125, 1.4794921875, 1.6463623046875, 1.813232421875, 1.9801025390625, 2.14697265625, 2.3138427734375, 2.480712890625, 2.6475830078125, 2.814453125, 2.9813232421875, 3.148193359375, 3.3150634765625, 3.48193359375, 3.6488037109375, 3.815673828125, 3.9825439453125, 4.1494140625, 4.3162841796875, 4.483154296875, 4.6500244140625, 4.81689453125, 4.9837646484375, 5.150634765625, 5.3175048828125, 5.484375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 4.0, 8.0, 12.0, 11.0, 14.0, 17.0, 14.0, 22.0, 23.0, 22.0, 33.0, 27.0, 33.0, 29.0, 40.0, 40.0, 33.0, 54.0, 43.0, 42.0, 40.0, 36.0, 34.0, 41.0, 46.0, 26.0, 31.0, 24.0, 32.0, 28.0, 23.0, 21.0, 14.0, 12.0, 17.0, 13.0, 5.0, 9.0, 3.0, 10.0, 1.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.80859375, -5.630126953125, -5.45166015625, -5.273193359375, -5.0947265625, -4.916259765625, -4.73779296875, -4.559326171875, -4.380859375, -4.202392578125, -4.02392578125, -3.845458984375, -3.6669921875, -3.488525390625, -3.31005859375, -3.131591796875, -2.953125, -2.774658203125, -2.59619140625, -2.417724609375, -2.2392578125, -2.060791015625, -1.88232421875, -1.703857421875, -1.525390625, -1.346923828125, -1.16845703125, -0.989990234375, -0.8115234375, -0.633056640625, -0.45458984375, -0.276123046875, -0.09765625, 0.080810546875, 0.25927734375, 0.437744140625, 0.6162109375, 0.794677734375, 0.97314453125, 1.151611328125, 1.330078125, 1.508544921875, 1.68701171875, 1.865478515625, 2.0439453125, 2.222412109375, 2.40087890625, 2.579345703125, 2.7578125, 2.936279296875, 3.11474609375, 3.293212890625, 3.4716796875, 3.650146484375, 3.82861328125, 4.007080078125, 4.185546875, 4.364013671875, 4.54248046875, 4.720947265625, 4.8994140625, 5.077880859375, 5.25634765625, 5.434814453125, 5.61328125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 4.0, 7.0, 15.0, 19.0, 49.0, 64.0, 87.0, 119.0, 183.0, 308.0, 488.0, 743.0, 1099.0, 1826.0, 2811.0, 4407.0, 7039.0, 10663.0, 16855.0, 25340.0, 37625.0, 52775.0, 71152.0, 89590.0, 103837.0, 112568.0, 110539.0, 100684.0, 84452.0, 66031.0, 48570.0, 33733.0, 23082.0, 14963.0, 9608.0, 6248.0, 4049.0, 2452.0, 1587.0, 1034.0, 666.0, 415.0, 262.0, 184.0, 123.0, 77.0, 42.0, 24.0, 19.0, 15.0, 4.0, 6.0, 6.0, 2.0, 3.0, 4.0], "bins": [-1.55859375, -1.5125732421875, -1.466552734375, -1.4205322265625, -1.37451171875, -1.3284912109375, -1.282470703125, -1.2364501953125, -1.1904296875, -1.1444091796875, -1.098388671875, -1.0523681640625, -1.00634765625, -0.9603271484375, -0.914306640625, -0.8682861328125, -0.822265625, -0.7762451171875, -0.730224609375, -0.6842041015625, -0.63818359375, -0.5921630859375, -0.546142578125, -0.5001220703125, -0.4541015625, -0.4080810546875, -0.362060546875, -0.3160400390625, -0.27001953125, -0.2239990234375, -0.177978515625, -0.1319580078125, -0.0859375, -0.0399169921875, 0.006103515625, 0.0521240234375, 0.09814453125, 0.1441650390625, 0.190185546875, 0.2362060546875, 0.2822265625, 0.3282470703125, 0.374267578125, 0.4202880859375, 0.46630859375, 0.5123291015625, 0.558349609375, 0.6043701171875, 0.650390625, 0.6964111328125, 0.742431640625, 0.7884521484375, 0.83447265625, 0.8804931640625, 0.926513671875, 0.9725341796875, 1.0185546875, 1.0645751953125, 1.110595703125, 1.1566162109375, 1.20263671875, 1.2486572265625, 1.294677734375, 1.3406982421875, 1.38671875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 8.0, 12.0, 10.0, 25.0, 21.0, 31.0, 28.0, 45.0, 43.0, 49.0, 71.0, 53.0, 45.0, 47.0, 48.0, 57.0, 54.0, 51.0, 62.0, 43.0, 34.0, 31.0, 25.0, 29.0, 20.0, 7.0, 12.0, 8.0, 6.0, 3.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022923946380615234, -0.00022248364984989166, -0.00021572783589363098, -0.0002089720219373703, -0.00020221620798110962, -0.00019546039402484894, -0.00018870458006858826, -0.00018194876611232758, -0.0001751929521560669, -0.0001684371381998062, -0.00016168132424354553, -0.00015492551028728485, -0.00014816969633102417, -0.0001414138823747635, -0.0001346580684185028, -0.00012790225446224213, -0.00012114644050598145, -0.00011439062654972076, -0.00010763481259346008, -0.0001008789986371994, -9.412318468093872e-05, -8.736737072467804e-05, -8.061155676841736e-05, -7.385574281215668e-05, -6.7099928855896e-05, -6.0344114899635315e-05, -5.3588300943374634e-05, -4.683248698711395e-05, -4.007667303085327e-05, -3.332085907459259e-05, -2.656504511833191e-05, -1.9809231162071228e-05, -1.3053417205810547e-05, -6.297603249549866e-06, 4.5821070671081543e-07, 7.214024662971497e-06, 1.3969838619232178e-05, 2.072565257549286e-05, 2.748146653175354e-05, 3.423728048801422e-05, 4.09930944442749e-05, 4.7748908400535583e-05, 5.4504722356796265e-05, 6.126053631305695e-05, 6.801635026931763e-05, 7.477216422557831e-05, 8.152797818183899e-05, 8.828379213809967e-05, 9.503960609436035e-05, 0.00010179542005062103, 0.00010855123400688171, 0.0001153070479631424, 0.00012206286191940308, 0.00012881867587566376, 0.00013557448983192444, 0.00014233030378818512, 0.0001490861177444458, 0.00015584193170070648, 0.00016259774565696716, 0.00016935355961322784, 0.00017610937356948853, 0.0001828651875257492, 0.0001896210014820099, 0.00019637681543827057, 0.00020313262939453125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 8.0, 33.0, 22.0, 49.0, 63.0, 84.0, 150.0, 236.0, 330.0, 547.0, 855.0, 1366.0, 2086.0, 3654.0, 5706.0, 9346.0, 15220.0, 24067.0, 37230.0, 54705.0, 75795.0, 98317.0, 115868.0, 123201.0, 119396.0, 103573.0, 81961.0, 60260.0, 41658.0, 27393.0, 17304.0, 10602.0, 6767.0, 3952.0, 2448.0, 1560.0, 997.0, 587.0, 392.0, 267.0, 156.0, 116.0, 77.0, 61.0, 28.0, 25.0, 12.0, 8.0, 8.0, 4.0, 3.0, 3.0, 2.0], "bins": [-1.794921875, -1.74310302734375, -1.6912841796875, -1.63946533203125, -1.587646484375, -1.53582763671875, -1.4840087890625, -1.43218994140625, -1.38037109375, -1.32855224609375, -1.2767333984375, -1.22491455078125, -1.173095703125, -1.12127685546875, -1.0694580078125, -1.01763916015625, -0.9658203125, -0.91400146484375, -0.8621826171875, -0.81036376953125, -0.758544921875, -0.70672607421875, -0.6549072265625, -0.60308837890625, -0.55126953125, -0.49945068359375, -0.4476318359375, -0.39581298828125, -0.343994140625, -0.29217529296875, -0.2403564453125, -0.18853759765625, -0.13671875, -0.08489990234375, -0.0330810546875, 0.01873779296875, 0.070556640625, 0.12237548828125, 0.1741943359375, 0.22601318359375, 0.27783203125, 0.32965087890625, 0.3814697265625, 0.43328857421875, 0.485107421875, 0.53692626953125, 0.5887451171875, 0.64056396484375, 0.6923828125, 0.74420166015625, 0.7960205078125, 0.84783935546875, 0.899658203125, 0.95147705078125, 1.0032958984375, 1.05511474609375, 1.10693359375, 1.15875244140625, 1.2105712890625, 1.26239013671875, 1.314208984375, 1.36602783203125, 1.4178466796875, 1.46966552734375, 1.521484375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 6.0, 5.0, 6.0, 13.0, 17.0, 16.0, 22.0, 24.0, 32.0, 31.0, 50.0, 47.0, 41.0, 63.0, 52.0, 57.0, 54.0, 65.0, 51.0, 45.0, 38.0, 42.0, 46.0, 36.0, 32.0, 27.0, 18.0, 21.0, 6.0, 15.0, 9.0, 10.0, 5.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7314453125, -0.7073135375976562, -0.6831817626953125, -0.6590499877929688, -0.634918212890625, -0.6107864379882812, -0.5866546630859375, -0.5625228881835938, -0.53839111328125, -0.5142593383789062, -0.4901275634765625, -0.46599578857421875, -0.441864013671875, -0.41773223876953125, -0.3936004638671875, -0.36946868896484375, -0.3453369140625, -0.32120513916015625, -0.2970733642578125, -0.27294158935546875, -0.248809814453125, -0.22467803955078125, -0.2005462646484375, -0.17641448974609375, -0.15228271484375, -0.12815093994140625, -0.1040191650390625, -0.07988739013671875, -0.055755615234375, -0.03162384033203125, -0.0074920654296875, 0.01663970947265625, 0.040771484375, 0.06490325927734375, 0.0890350341796875, 0.11316680908203125, 0.137298583984375, 0.16143035888671875, 0.1855621337890625, 0.20969390869140625, 0.23382568359375, 0.25795745849609375, 0.2820892333984375, 0.30622100830078125, 0.330352783203125, 0.35448455810546875, 0.3786163330078125, 0.40274810791015625, 0.4268798828125, 0.45101165771484375, 0.4751434326171875, 0.49927520751953125, 0.523406982421875, 0.5475387573242188, 0.5716705322265625, 0.5958023071289062, 0.61993408203125, 0.6440658569335938, 0.6681976318359375, 0.6923294067382812, 0.716461181640625, 0.7405929565429688, 0.7647247314453125, 0.7888565063476562, 0.81298828125]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 2.0, 3.0, 9.0, 9.0, 19.0, 11.0, 16.0, 19.0, 30.0, 26.0, 30.0, 35.0, 30.0, 40.0, 46.0, 60.0, 46.0, 63.0, 54.0, 57.0, 62.0, 46.0, 29.0, 40.0, 37.0, 26.0, 29.0, 21.0, 26.0, 13.0, 16.0, 13.0, 10.0, 5.0, 5.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-10.392475128173828, -10.096870422363281, -9.80126667022705, -9.505661964416504, -9.210058212280273, -8.914453506469727, -8.61884880065918, -8.323244094848633, -8.027640342712402, -7.732036113739014, -7.436431884765625, -7.140827178955078, -6.8452229499816895, -6.549618721008301, -6.254014015197754, -5.958409786224365, -5.662805557250977, -5.367201328277588, -5.071597099304199, -4.775992393493652, -4.480388164520264, -4.184783935546875, -3.8891794681549072, -3.5935750007629395, -3.297970771789551, -3.002366542816162, -2.7067620754241943, -2.4111576080322266, -2.115553379058838, -1.8199490308761597, -1.5243446826934814, -1.2287402153015137, -0.9331369400024414, -0.6375325918197632, -0.34192824363708496, -0.04632389545440674, 0.24928045272827148, 0.5448848009109497, 0.8404891490936279, 1.1360936164855957, 1.4316978454589844, 1.7273021936416626, 2.022906541824341, 2.3185110092163086, 2.6141152381896973, 2.909719467163086, 3.2053239345550537, 3.5009284019470215, 3.79653263092041, 4.092136859893799, 4.3877410888671875, 4.683345794677734, 4.978950023651123, 5.274554252624512, 5.570158958435059, 5.865763187408447, 6.161367416381836, 6.456971645355225, 6.752575874328613, 7.04818058013916, 7.343784809112549, 7.6393890380859375, 7.934993743896484, 8.230598449707031, 8.526202201843262]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 4.0, 9.0, 7.0, 9.0, 14.0, 11.0, 17.0, 20.0, 12.0, 24.0, 19.0, 32.0, 29.0, 29.0, 27.0, 36.0, 44.0, 39.0, 54.0, 38.0, 34.0, 42.0, 52.0, 37.0, 41.0, 42.0, 35.0, 27.0, 19.0, 38.0, 36.0, 25.0, 20.0, 15.0, 12.0, 6.0, 10.0, 5.0, 9.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-10.273642539978027, -9.980419158935547, -9.68719482421875, -9.39397144317627, -9.100748062133789, -8.807523727416992, -8.514300346374512, -8.221076965332031, -7.927852630615234, -7.634628772735596, -7.341404914855957, -7.048181533813477, -6.754957675933838, -6.461733818054199, -6.168510437011719, -5.87528657913208, -5.582062721252441, -5.288838863372803, -4.995615005493164, -4.702391624450684, -4.409167766571045, -4.115943908691406, -3.8227202892303467, -3.529496669769287, -3.2362728118896484, -2.9430489540100098, -2.64982533454895, -2.3566017150878906, -2.063377857208252, -1.7701541185379028, -1.4769303798675537, -1.1837067604064941, -0.8904819488525391, -0.5972582101821899, -0.3040344715118408, -0.0108107328414917, 0.2824130058288574, 0.5756367444992065, 0.8688604831695557, 1.1620841026306152, 1.455307960510254, 1.748531699180603, 2.041755437850952, 2.3349790573120117, 2.6282029151916504, 2.921426773071289, 3.2146503925323486, 3.507874011993408, 3.801097869873047, 4.0943217277526855, 4.387545585632324, 4.680768966674805, 4.973992824554443, 5.267216682434082, 5.5604400634765625, 5.853663921356201, 6.14688777923584, 6.4401116371154785, 6.733335494995117, 7.026558876037598, 7.319782733917236, 7.613006591796875, 7.9062299728393555, 8.199453353881836, 8.492677688598633]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 7.0, 2.0, 6.0, 6.0, 11.0, 32.0, 36.0, 67.0, 119.0, 177.0, 280.0, 474.0, 803.0, 1402.0, 2633.0, 4675.0, 8420.0, 15966.0, 29896.0, 57064.0, 109575.0, 207594.0, 380609.0, 624219.0, 823230.0, 762135.0, 521773.0, 301834.0, 162749.0, 85436.0, 44347.0, 22855.0, 11914.0, 6349.0, 3378.0, 1777.0, 982.0, 611.0, 350.0, 212.0, 98.0, 75.0, 46.0, 29.0, 18.0, 9.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0625, -9.713134765625, -9.36376953125, -9.014404296875, -8.6650390625, -8.315673828125, -7.96630859375, -7.616943359375, -7.267578125, -6.918212890625, -6.56884765625, -6.219482421875, -5.8701171875, -5.520751953125, -5.17138671875, -4.822021484375, -4.47265625, -4.123291015625, -3.77392578125, -3.424560546875, -3.0751953125, -2.725830078125, -2.37646484375, -2.027099609375, -1.677734375, -1.328369140625, -0.97900390625, -0.629638671875, -0.2802734375, 0.069091796875, 0.41845703125, 0.767822265625, 1.1171875, 1.466552734375, 1.81591796875, 2.165283203125, 2.5146484375, 2.864013671875, 3.21337890625, 3.562744140625, 3.912109375, 4.261474609375, 4.61083984375, 4.960205078125, 5.3095703125, 5.658935546875, 6.00830078125, 6.357666015625, 6.70703125, 7.056396484375, 7.40576171875, 7.755126953125, 8.1044921875, 8.453857421875, 8.80322265625, 9.152587890625, 9.501953125, 9.851318359375, 10.20068359375, 10.550048828125, 10.8994140625, 11.248779296875, 11.59814453125, 11.947509765625, 12.296875]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 5.0, 2.0, 5.0, 5.0, 10.0, 8.0, 14.0, 13.0, 16.0, 22.0, 24.0, 26.0, 16.0, 31.0, 28.0, 49.0, 35.0, 34.0, 41.0, 37.0, 45.0, 51.0, 37.0, 43.0, 51.0, 43.0, 43.0, 31.0, 47.0, 32.0, 24.0, 31.0, 19.0, 19.0, 16.0, 9.0, 10.0, 9.0, 2.0, 4.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0], "bins": [-10.6875, -10.40814208984375, -10.1287841796875, -9.84942626953125, -9.570068359375, -9.29071044921875, -9.0113525390625, -8.73199462890625, -8.45263671875, -8.17327880859375, -7.8939208984375, -7.61456298828125, -7.335205078125, -7.05584716796875, -6.7764892578125, -6.49713134765625, -6.2177734375, -5.93841552734375, -5.6590576171875, -5.37969970703125, -5.100341796875, -4.82098388671875, -4.5416259765625, -4.26226806640625, -3.98291015625, -3.70355224609375, -3.4241943359375, -3.14483642578125, -2.865478515625, -2.58612060546875, -2.3067626953125, -2.02740478515625, -1.748046875, -1.46868896484375, -1.1893310546875, -0.90997314453125, -0.630615234375, -0.35125732421875, -0.0718994140625, 0.20745849609375, 0.48681640625, 0.76617431640625, 1.0455322265625, 1.32489013671875, 1.604248046875, 1.88360595703125, 2.1629638671875, 2.44232177734375, 2.7216796875, 3.00103759765625, 3.2803955078125, 3.55975341796875, 3.839111328125, 4.11846923828125, 4.3978271484375, 4.67718505859375, 4.95654296875, 5.23590087890625, 5.5152587890625, 5.79461669921875, 6.073974609375, 6.35333251953125, 6.6326904296875, 6.91204833984375, 7.19140625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 3.0, 5.0, 10.0, 21.0, 26.0, 24.0, 67.0, 86.0, 142.0, 226.0, 331.0, 554.0, 857.0, 1344.0, 2067.0, 3316.0, 5182.0, 8255.0, 13420.0, 21944.0, 35755.0, 57860.0, 94262.0, 150174.0, 231926.0, 339537.0, 459145.0, 551103.0, 569952.0, 502725.0, 389679.0, 273925.0, 180434.0, 114760.0, 71085.0, 43691.0, 27045.0, 16209.0, 10198.0, 6291.0, 3932.0, 2524.0, 1594.0, 915.0, 636.0, 382.0, 238.0, 182.0, 103.0, 67.0, 31.0, 32.0, 6.0, 10.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-9.78125, -9.4775390625, -9.173828125, -8.8701171875, -8.56640625, -8.2626953125, -7.958984375, -7.6552734375, -7.3515625, -7.0478515625, -6.744140625, -6.4404296875, -6.13671875, -5.8330078125, -5.529296875, -5.2255859375, -4.921875, -4.6181640625, -4.314453125, -4.0107421875, -3.70703125, -3.4033203125, -3.099609375, -2.7958984375, -2.4921875, -2.1884765625, -1.884765625, -1.5810546875, -1.27734375, -0.9736328125, -0.669921875, -0.3662109375, -0.0625, 0.2412109375, 0.544921875, 0.8486328125, 1.15234375, 1.4560546875, 1.759765625, 2.0634765625, 2.3671875, 2.6708984375, 2.974609375, 3.2783203125, 3.58203125, 3.8857421875, 4.189453125, 4.4931640625, 4.796875, 5.1005859375, 5.404296875, 5.7080078125, 6.01171875, 6.3154296875, 6.619140625, 6.9228515625, 7.2265625, 7.5302734375, 7.833984375, 8.1376953125, 8.44140625, 8.7451171875, 9.048828125, 9.3525390625, 9.65625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 4.0, 2.0, 4.0, 12.0, 16.0, 11.0, 20.0, 22.0, 27.0, 39.0, 34.0, 59.0, 91.0, 89.0, 98.0, 130.0, 155.0, 169.0, 203.0, 210.0, 223.0, 241.0, 234.0, 237.0, 208.0, 225.0, 206.0, 178.0, 163.0, 159.0, 117.0, 90.0, 74.0, 68.0, 51.0, 43.0, 34.0, 24.0, 29.0, 13.0, 16.0, 11.0, 11.0, 9.0, 9.0, 3.0, 1.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.7421875, -4.59283447265625, -4.4434814453125, -4.29412841796875, -4.144775390625, -3.99542236328125, -3.8460693359375, -3.69671630859375, -3.54736328125, -3.39801025390625, -3.2486572265625, -3.09930419921875, -2.949951171875, -2.80059814453125, -2.6512451171875, -2.50189208984375, -2.3525390625, -2.20318603515625, -2.0538330078125, -1.90447998046875, -1.755126953125, -1.60577392578125, -1.4564208984375, -1.30706787109375, -1.15771484375, -1.00836181640625, -0.8590087890625, -0.70965576171875, -0.560302734375, -0.41094970703125, -0.2615966796875, -0.11224365234375, 0.037109375, 0.18646240234375, 0.3358154296875, 0.48516845703125, 0.634521484375, 0.78387451171875, 0.9332275390625, 1.08258056640625, 1.23193359375, 1.38128662109375, 1.5306396484375, 1.67999267578125, 1.829345703125, 1.97869873046875, 2.1280517578125, 2.27740478515625, 2.4267578125, 2.57611083984375, 2.7254638671875, 2.87481689453125, 3.024169921875, 3.17352294921875, 3.3228759765625, 3.47222900390625, 3.62158203125, 3.77093505859375, 3.9202880859375, 4.06964111328125, 4.218994140625, 4.36834716796875, 4.5177001953125, 4.66705322265625, 4.81640625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 6.0, 9.0, 18.0, 7.0, 23.0, 24.0, 35.0, 48.0, 36.0, 48.0, 48.0, 70.0, 101.0, 77.0, 99.0, 46.0, 51.0, 57.0, 37.0, 26.0, 24.0, 19.0, 25.0, 15.0, 6.0, 7.0, 6.0, 7.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.40118980407715, -20.827768325805664, -20.254348754882812, -19.680927276611328, -19.107505798339844, -18.534086227416992, -17.960664749145508, -17.387245178222656, -16.813823699951172, -16.240402221679688, -15.66698169708252, -15.093561172485352, -14.520140647888184, -13.946720123291016, -13.373298645019531, -12.799878120422363, -12.226456642150879, -11.653036117553711, -11.079614639282227, -10.506194114685059, -9.93277359008789, -9.359352111816406, -8.785931587219238, -8.21251106262207, -7.639090061187744, -7.065669059753418, -6.49224853515625, -5.918827533721924, -5.345406532287598, -4.77198600769043, -4.1985650062561035, -3.6251444816589355, -3.051722526550293, -2.478301763534546, -1.9048808813095093, -1.3314599990844727, -0.7580392360687256, -0.18461847305297852, 0.38880252838134766, 0.9622230529785156, 1.5356440544128418, 2.109064817428589, 2.682485580444336, 3.255906581878662, 3.829327344894409, 4.402748107910156, 4.976169109344482, 5.54958963394165, 6.123010635375977, 6.696431636810303, 7.269852161407471, 7.843273162841797, 8.416693687438965, 8.990114212036133, 9.563535690307617, 10.136956214904785, 10.710376739501953, 11.283797264099121, 11.857218742370605, 12.430639266967773, 13.004059791564941, 13.57748031616211, 14.150901794433594, 14.724322319030762, 15.297743797302246]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 1.0, 4.0, 8.0, 7.0, 3.0, 10.0, 6.0, 15.0, 12.0, 19.0, 14.0, 15.0, 14.0, 23.0, 23.0, 29.0, 29.0, 31.0, 37.0, 47.0, 26.0, 42.0, 41.0, 55.0, 41.0, 35.0, 47.0, 42.0, 34.0, 30.0, 33.0, 31.0, 25.0, 25.0, 26.0, 15.0, 21.0, 18.0, 12.0, 13.0, 10.0, 4.0, 6.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.436731338500977, -13.021175384521484, -12.605618476867676, -12.190061569213867, -11.774505615234375, -11.358949661254883, -10.943392753601074, -10.527835845947266, -10.112279891967773, -9.696723937988281, -9.281167030334473, -8.865610122680664, -8.450054168701172, -8.03449821472168, -7.618941307067871, -7.203384876251221, -6.78782844543457, -6.37227201461792, -5.9567155838012695, -5.541159152984619, -5.125602722167969, -4.710046291351318, -4.294489860534668, -3.8789334297180176, -3.463376998901367, -3.047820568084717, -2.6322641372680664, -2.216707706451416, -1.8011512756347656, -1.3855948448181152, -0.9700384140014648, -0.5544819831848145, -0.13892459869384766, 0.27663183212280273, 0.6921882629394531, 1.1077446937561035, 1.523301124572754, 1.9388575553894043, 2.3544139862060547, 2.769970417022705, 3.1855268478393555, 3.601083278656006, 4.016639709472656, 4.432196140289307, 4.847752571105957, 5.263309001922607, 5.678865432739258, 6.094421863555908, 6.509978294372559, 6.925534725189209, 7.341091156005859, 7.75664758682251, 8.17220401763916, 8.587760925292969, 9.003316879272461, 9.418872833251953, 9.834429740905762, 10.24998664855957, 10.665542602539062, 11.081098556518555, 11.496655464172363, 11.912212371826172, 12.327768325805664, 12.743324279785156, 13.158881187438965]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 6.0, 10.0, 11.0, 25.0, 26.0, 41.0, 59.0, 88.0, 117.0, 197.0, 314.0, 458.0, 740.0, 1155.0, 1784.0, 2948.0, 5142.0, 8603.0, 15772.0, 30414.0, 64522.0, 157406.0, 358491.0, 226405.0, 87794.0, 39693.0, 19682.0, 10640.0, 6140.0, 3661.0, 2224.0, 1406.0, 881.0, 557.0, 384.0, 253.0, 159.0, 105.0, 78.0, 61.0, 36.0, 19.0, 21.0, 12.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.546875, -5.3822021484375, -5.217529296875, -5.0528564453125, -4.88818359375, -4.7235107421875, -4.558837890625, -4.3941650390625, -4.2294921875, -4.0648193359375, -3.900146484375, -3.7354736328125, -3.57080078125, -3.4061279296875, -3.241455078125, -3.0767822265625, -2.912109375, -2.7474365234375, -2.582763671875, -2.4180908203125, -2.25341796875, -2.0887451171875, -1.924072265625, -1.7593994140625, -1.5947265625, -1.4300537109375, -1.265380859375, -1.1007080078125, -0.93603515625, -0.7713623046875, -0.606689453125, -0.4420166015625, -0.27734375, -0.1126708984375, 0.052001953125, 0.2166748046875, 0.38134765625, 0.5460205078125, 0.710693359375, 0.8753662109375, 1.0400390625, 1.2047119140625, 1.369384765625, 1.5340576171875, 1.69873046875, 1.8634033203125, 2.028076171875, 2.1927490234375, 2.357421875, 2.5220947265625, 2.686767578125, 2.8514404296875, 3.01611328125, 3.1807861328125, 3.345458984375, 3.5101318359375, 3.6748046875, 3.8394775390625, 4.004150390625, 4.1688232421875, 4.33349609375, 4.4981689453125, 4.662841796875, 4.8275146484375, 4.9921875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 10.0, 11.0, 9.0, 17.0, 9.0, 12.0, 19.0, 21.0, 21.0, 20.0, 35.0, 24.0, 30.0, 39.0, 36.0, 38.0, 56.0, 49.0, 44.0, 57.0, 46.0, 38.0, 44.0, 31.0, 36.0, 30.0, 35.0, 27.0, 29.0, 21.0, 16.0, 17.0, 9.0, 14.0, 9.0, 5.0, 7.0, 6.0, 2.0, 6.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.6640625, -15.1962890625, -14.728515625, -14.2607421875, -13.79296875, -13.3251953125, -12.857421875, -12.3896484375, -11.921875, -11.4541015625, -10.986328125, -10.5185546875, -10.05078125, -9.5830078125, -9.115234375, -8.6474609375, -8.1796875, -7.7119140625, -7.244140625, -6.7763671875, -6.30859375, -5.8408203125, -5.373046875, -4.9052734375, -4.4375, -3.9697265625, -3.501953125, -3.0341796875, -2.56640625, -2.0986328125, -1.630859375, -1.1630859375, -0.6953125, -0.2275390625, 0.240234375, 0.7080078125, 1.17578125, 1.6435546875, 2.111328125, 2.5791015625, 3.046875, 3.5146484375, 3.982421875, 4.4501953125, 4.91796875, 5.3857421875, 5.853515625, 6.3212890625, 6.7890625, 7.2568359375, 7.724609375, 8.1923828125, 8.66015625, 9.1279296875, 9.595703125, 10.0634765625, 10.53125, 10.9990234375, 11.466796875, 11.9345703125, 12.40234375, 12.8701171875, 13.337890625, 13.8056640625, 14.2734375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 1.0, 12.0, 13.0, 15.0, 23.0, 33.0, 33.0, 57.0, 39.0, 65.0, 89.0, 121.0, 155.0, 204.0, 264.0, 405.0, 604.0, 829.0, 1435.0, 2512.0, 5000.0, 11254.0, 32360.0, 909639.0, 51810.0, 16726.0, 6629.0, 3157.0, 1638.0, 1035.0, 669.0, 447.0, 284.0, 237.0, 196.0, 129.0, 85.0, 88.0, 53.0, 45.0, 41.0, 31.0, 20.0, 23.0, 13.0, 8.0, 9.0, 6.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0, 3.0], "bins": [-12.296875, -11.920654296875, -11.54443359375, -11.168212890625, -10.7919921875, -10.415771484375, -10.03955078125, -9.663330078125, -9.287109375, -8.910888671875, -8.53466796875, -8.158447265625, -7.7822265625, -7.406005859375, -7.02978515625, -6.653564453125, -6.27734375, -5.901123046875, -5.52490234375, -5.148681640625, -4.7724609375, -4.396240234375, -4.02001953125, -3.643798828125, -3.267578125, -2.891357421875, -2.51513671875, -2.138916015625, -1.7626953125, -1.386474609375, -1.01025390625, -0.634033203125, -0.2578125, 0.118408203125, 0.49462890625, 0.870849609375, 1.2470703125, 1.623291015625, 1.99951171875, 2.375732421875, 2.751953125, 3.128173828125, 3.50439453125, 3.880615234375, 4.2568359375, 4.633056640625, 5.00927734375, 5.385498046875, 5.76171875, 6.137939453125, 6.51416015625, 6.890380859375, 7.2666015625, 7.642822265625, 8.01904296875, 8.395263671875, 8.771484375, 9.147705078125, 9.52392578125, 9.900146484375, 10.2763671875, 10.652587890625, 11.02880859375, 11.405029296875, 11.78125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 5.0, 7.0, 7.0, 11.0, 8.0, 16.0, 15.0, 16.0, 16.0, 17.0, 18.0, 23.0, 26.0, 36.0, 28.0, 31.0, 33.0, 37.0, 39.0, 28.0, 42.0, 43.0, 34.0, 33.0, 39.0, 32.0, 30.0, 36.0, 41.0, 38.0, 35.0, 26.0, 33.0, 18.0, 14.0, 14.0, 14.0, 8.0, 5.0, 13.0, 7.0, 8.0, 5.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.625, -8.3592529296875, -8.093505859375, -7.8277587890625, -7.56201171875, -7.2962646484375, -7.030517578125, -6.7647705078125, -6.4990234375, -6.2332763671875, -5.967529296875, -5.7017822265625, -5.43603515625, -5.1702880859375, -4.904541015625, -4.6387939453125, -4.373046875, -4.1072998046875, -3.841552734375, -3.5758056640625, -3.31005859375, -3.0443115234375, -2.778564453125, -2.5128173828125, -2.2470703125, -1.9813232421875, -1.715576171875, -1.4498291015625, -1.18408203125, -0.9183349609375, -0.652587890625, -0.3868408203125, -0.12109375, 0.1446533203125, 0.410400390625, 0.6761474609375, 0.94189453125, 1.2076416015625, 1.473388671875, 1.7391357421875, 2.0048828125, 2.2706298828125, 2.536376953125, 2.8021240234375, 3.06787109375, 3.3336181640625, 3.599365234375, 3.8651123046875, 4.130859375, 4.3966064453125, 4.662353515625, 4.9281005859375, 5.19384765625, 5.4595947265625, 5.725341796875, 5.9910888671875, 6.2568359375, 6.5225830078125, 6.788330078125, 7.0540771484375, 7.31982421875, 7.5855712890625, 7.851318359375, 8.1170654296875, 8.3828125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 7.0, 7.0, 6.0, 9.0, 25.0, 23.0, 26.0, 46.0, 58.0, 52.0, 106.0, 140.0, 190.0, 320.0, 514.0, 787.0, 1273.0, 2531.0, 5565.0, 14643.0, 80842.0, 909322.0, 18682.0, 6515.0, 2891.0, 1478.0, 860.0, 514.0, 363.0, 207.0, 146.0, 109.0, 89.0, 55.0, 44.0, 26.0, 22.0, 14.0, 10.0, 12.0, 4.0, 8.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0], "bins": [-1.1845703125, -1.148773193359375, -1.11297607421875, -1.077178955078125, -1.0413818359375, -1.005584716796875, -0.96978759765625, -0.933990478515625, -0.898193359375, -0.862396240234375, -0.82659912109375, -0.790802001953125, -0.7550048828125, -0.719207763671875, -0.68341064453125, -0.647613525390625, -0.61181640625, -0.576019287109375, -0.54022216796875, -0.504425048828125, -0.4686279296875, -0.432830810546875, -0.39703369140625, -0.361236572265625, -0.325439453125, -0.289642333984375, -0.25384521484375, -0.218048095703125, -0.1822509765625, -0.146453857421875, -0.11065673828125, -0.074859619140625, -0.0390625, -0.003265380859375, 0.03253173828125, 0.068328857421875, 0.1041259765625, 0.139923095703125, 0.17572021484375, 0.211517333984375, 0.247314453125, 0.283111572265625, 0.31890869140625, 0.354705810546875, 0.3905029296875, 0.426300048828125, 0.46209716796875, 0.497894287109375, 0.53369140625, 0.569488525390625, 0.60528564453125, 0.641082763671875, 0.6768798828125, 0.712677001953125, 0.74847412109375, 0.784271240234375, 0.820068359375, 0.855865478515625, 0.89166259765625, 0.927459716796875, 0.9632568359375, 0.999053955078125, 1.03485107421875, 1.070648193359375, 1.1064453125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 8.0, 4.0, 9.0, 11.0, 12.0, 12.0, 22.0, 15.0, 10.0, 11.0, 21.0, 24.0, 24.0, 27.0, 28.0, 25.0, 41.0, 37.0, 42.0, 25.0, 49.0, 48.0, 37.0, 36.0, 36.0, 36.0, 23.0, 34.0, 33.0, 28.0, 27.0, 26.0, 22.0, 29.0, 20.0, 26.0, 8.0, 16.0, 11.0, 7.0, 10.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 6.0, 1.0, 3.0], "bins": [-2.282857894897461e-05, -2.2178515791893005e-05, -2.15284526348114e-05, -2.0878389477729797e-05, -2.0228326320648193e-05, -1.957826316356659e-05, -1.8928200006484985e-05, -1.827813684940338e-05, -1.7628073692321777e-05, -1.6978010535240173e-05, -1.632794737815857e-05, -1.5677884221076965e-05, -1.5027821063995361e-05, -1.4377757906913757e-05, -1.3727694749832153e-05, -1.307763159275055e-05, -1.2427568435668945e-05, -1.1777505278587341e-05, -1.1127442121505737e-05, -1.0477378964424133e-05, -9.82731580734253e-06, -9.177252650260925e-06, -8.527189493179321e-06, -7.877126336097717e-06, -7.227063179016113e-06, -6.577000021934509e-06, -5.926936864852905e-06, -5.276873707771301e-06, -4.626810550689697e-06, -3.976747393608093e-06, -3.3266842365264893e-06, -2.6766210794448853e-06, -2.0265579223632812e-06, -1.3764947652816772e-06, -7.264316082000732e-07, -7.636845111846924e-08, 5.736947059631348e-07, 1.2237578630447388e-06, 1.8738210201263428e-06, 2.5238841772079468e-06, 3.1739473342895508e-06, 3.824010491371155e-06, 4.474073648452759e-06, 5.124136805534363e-06, 5.774199962615967e-06, 6.424263119697571e-06, 7.074326276779175e-06, 7.724389433860779e-06, 8.374452590942383e-06, 9.024515748023987e-06, 9.67457890510559e-06, 1.0324642062187195e-05, 1.0974705219268799e-05, 1.1624768376350403e-05, 1.2274831533432007e-05, 1.292489469051361e-05, 1.3574957847595215e-05, 1.4225021004676819e-05, 1.4875084161758423e-05, 1.5525147318840027e-05, 1.617521047592163e-05, 1.6825273633003235e-05, 1.747533679008484e-05, 1.8125399947166443e-05, 1.8775463104248047e-05]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 5.0, 5.0, 7.0, 15.0, 22.0, 32.0, 49.0, 82.0, 89.0, 153.0, 223.0, 330.0, 445.0, 583.0, 904.0, 1287.0, 1860.0, 2644.0, 4021.0, 5895.0, 9596.0, 15460.0, 26351.0, 48647.0, 102386.0, 255437.0, 307743.0, 127007.0, 57732.0, 30567.0, 17582.0, 10702.0, 6749.0, 4454.0, 2986.0, 1915.0, 1379.0, 949.0, 656.0, 511.0, 328.0, 212.0, 179.0, 113.0, 97.0, 51.0, 34.0, 27.0, 26.0, 10.0, 15.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.40966796875, -0.39730072021484375, -0.3849334716796875, -0.37256622314453125, -0.360198974609375, -0.34783172607421875, -0.3354644775390625, -0.32309722900390625, -0.31072998046875, -0.29836273193359375, -0.2859954833984375, -0.27362823486328125, -0.261260986328125, -0.24889373779296875, -0.2365264892578125, -0.22415924072265625, -0.2117919921875, -0.19942474365234375, -0.1870574951171875, -0.17469024658203125, -0.162322998046875, -0.14995574951171875, -0.1375885009765625, -0.12522125244140625, -0.11285400390625, -0.10048675537109375, -0.0881195068359375, -0.07575225830078125, -0.063385009765625, -0.05101776123046875, -0.0386505126953125, -0.02628326416015625, -0.013916015625, -0.00154876708984375, 0.0108184814453125, 0.02318572998046875, 0.035552978515625, 0.04792022705078125, 0.0602874755859375, 0.07265472412109375, 0.08502197265625, 0.09738922119140625, 0.1097564697265625, 0.12212371826171875, 0.134490966796875, 0.14685821533203125, 0.1592254638671875, 0.17159271240234375, 0.1839599609375, 0.19632720947265625, 0.2086944580078125, 0.22106170654296875, 0.233428955078125, 0.24579620361328125, 0.2581634521484375, 0.27053070068359375, 0.28289794921875, 0.29526519775390625, 0.3076324462890625, 0.31999969482421875, 0.332366943359375, 0.34473419189453125, 0.3571014404296875, 0.36946868896484375, 0.3818359375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 1.0, 8.0, 7.0, 8.0, 17.0, 16.0, 19.0, 20.0, 35.0, 31.0, 40.0, 39.0, 87.0, 125.0, 127.0, 99.0, 78.0, 47.0, 39.0, 30.0, 18.0, 17.0, 17.0, 15.0, 13.0, 8.0, 10.0, 5.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.1962890625, -0.19086456298828125, -0.1854400634765625, -0.18001556396484375, -0.174591064453125, -0.16916656494140625, -0.1637420654296875, -0.15831756591796875, -0.15289306640625, -0.14746856689453125, -0.1420440673828125, -0.13661956787109375, -0.131195068359375, -0.12577056884765625, -0.1203460693359375, -0.11492156982421875, -0.1094970703125, -0.10407257080078125, -0.0986480712890625, -0.09322357177734375, -0.087799072265625, -0.08237457275390625, -0.0769500732421875, -0.07152557373046875, -0.06610107421875, -0.06067657470703125, -0.0552520751953125, -0.04982757568359375, -0.044403076171875, -0.03897857666015625, -0.0335540771484375, -0.02812957763671875, -0.022705078125, -0.01728057861328125, -0.0118560791015625, -0.00643157958984375, -0.001007080078125, 0.00441741943359375, 0.0098419189453125, 0.01526641845703125, 0.02069091796875, 0.02611541748046875, 0.0315399169921875, 0.03696441650390625, 0.042388916015625, 0.04781341552734375, 0.0532379150390625, 0.05866241455078125, 0.0640869140625, 0.06951141357421875, 0.0749359130859375, 0.08036041259765625, 0.085784912109375, 0.09120941162109375, 0.0966339111328125, 0.10205841064453125, 0.10748291015625, 0.11290740966796875, 0.1183319091796875, 0.12375640869140625, 0.129180908203125, 0.13460540771484375, 0.1400299072265625, 0.14545440673828125, 0.15087890625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 4.0, 8.0, 7.0, 15.0, 10.0, 22.0, 22.0, 36.0, 35.0, 47.0, 43.0, 51.0, 54.0, 78.0, 89.0, 87.0, 74.0, 46.0, 53.0, 50.0, 30.0, 23.0, 16.0, 22.0, 25.0, 11.0, 4.0, 9.0, 6.0, 6.0, 5.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.133127212524414, -20.571903228759766, -20.010679244995117, -19.4494571685791, -18.888233184814453, -18.327009201049805, -17.765785217285156, -17.204561233520508, -16.64333724975586, -16.08211326599121, -15.520890235900879, -14.95966625213623, -14.398443222045898, -13.83721923828125, -13.275995254516602, -12.714771270751953, -12.153549194335938, -11.592325210571289, -11.031102180480957, -10.469878196716309, -9.908655166625977, -9.347431182861328, -8.78620719909668, -8.224983215332031, -7.663760185241699, -7.102536678314209, -6.541313171386719, -5.98008918762207, -5.41886568069458, -4.85764217376709, -4.296418190002441, -3.735194683074951, -3.1739721298217773, -2.612748622894287, -2.0515248775482178, -1.490301251411438, -0.9290776252746582, -0.36785411834716797, 0.19336962699890137, 0.7545933723449707, 1.315816879272461, 1.8770405054092407, 2.4382641315460205, 2.99948787689209, 3.56071138381958, 4.12193489074707, 4.683158874511719, 5.244382381439209, 5.805605888366699, 6.3668293952941895, 6.92805290222168, 7.489276885986328, 8.050500869750977, 8.611723899841309, 9.172947883605957, 9.734170913696289, 10.295394897460938, 10.856618881225586, 11.417841911315918, 11.979065895080566, 12.540288925170898, 13.101512908935547, 13.662736892700195, 14.223960876464844, 14.785183906555176]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 5.0, 1.0, 3.0, 9.0, 7.0, 3.0, 10.0, 7.0, 14.0, 10.0, 22.0, 12.0, 16.0, 15.0, 20.0, 26.0, 26.0, 30.0, 35.0, 32.0, 50.0, 24.0, 48.0, 35.0, 58.0, 40.0, 38.0, 43.0, 40.0, 36.0, 29.0, 35.0, 27.0, 27.0, 25.0, 26.0, 15.0, 24.0, 15.0, 11.0, 16.0, 9.0, 4.0, 6.0, 8.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.479781150817871, -13.064188957214355, -12.648597717285156, -12.23300552368164, -11.817413330078125, -11.40182113647461, -10.98622989654541, -10.570637702941895, -10.155045509338379, -9.739453315734863, -9.323862075805664, -8.908269882202148, -8.492677688598633, -8.077085494995117, -7.661494255065918, -7.245902061462402, -6.830310344696045, -6.4147186279296875, -5.999126434326172, -5.5835347175598145, -5.167942523956299, -4.752350807189941, -4.336758613586426, -3.9211668968200684, -3.505574941635132, -3.0899829864501953, -2.674391031265259, -2.2587990760803223, -1.8432072401046753, -1.4276154041290283, -1.0120234489440918, -0.5964314937591553, -0.18083953857421875, 0.23475238680839539, 0.6503443121910095, 1.0659362077713013, 1.4815281629562378, 1.8971199989318848, 2.3127119541168213, 2.728303909301758, 3.1438958644866943, 3.559487819671631, 3.9750797748565674, 4.390671730041504, 4.806263446807861, 5.221855163574219, 5.637447357177734, 6.05303955078125, 6.468631267547607, 6.884222984313965, 7.2998151779174805, 7.715406894683838, 8.130998611450195, 8.546590805053711, 8.962182998657227, 9.377775192260742, 9.793366432189941, 10.208958625793457, 10.624549865722656, 11.040142059326172, 11.455734252929688, 11.871326446533203, 12.286917686462402, 12.702509880065918, 13.118102073669434]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 7.0, 8.0, 6.0, 11.0, 18.0, 26.0, 38.0, 61.0, 90.0, 125.0, 175.0, 284.0, 435.0, 646.0, 957.0, 1504.0, 2236.0, 3363.0, 5369.0, 8602.0, 13594.0, 21669.0, 35592.0, 57895.0, 91865.0, 132534.0, 163275.0, 159681.0, 124625.0, 84560.0, 52711.0, 32318.0, 19885.0, 12360.0, 7666.0, 4937.0, 3122.0, 2123.0, 1375.0, 898.0, 607.0, 432.0, 269.0, 197.0, 149.0, 99.0, 58.0, 34.0, 26.0, 10.0, 14.0, 8.0, 3.0, 5.0, 2.0, 1.0, 2.0], "bins": [-8.84375, -8.5828857421875, -8.322021484375, -8.0611572265625, -7.80029296875, -7.5394287109375, -7.278564453125, -7.0177001953125, -6.7568359375, -6.4959716796875, -6.235107421875, -5.9742431640625, -5.71337890625, -5.4525146484375, -5.191650390625, -4.9307861328125, -4.669921875, -4.4090576171875, -4.148193359375, -3.8873291015625, -3.62646484375, -3.3656005859375, -3.104736328125, -2.8438720703125, -2.5830078125, -2.3221435546875, -2.061279296875, -1.8004150390625, -1.53955078125, -1.2786865234375, -1.017822265625, -0.7569580078125, -0.49609375, -0.2352294921875, 0.025634765625, 0.2864990234375, 0.54736328125, 0.8082275390625, 1.069091796875, 1.3299560546875, 1.5908203125, 1.8516845703125, 2.112548828125, 2.3734130859375, 2.63427734375, 2.8951416015625, 3.156005859375, 3.4168701171875, 3.677734375, 3.9385986328125, 4.199462890625, 4.4603271484375, 4.72119140625, 4.9820556640625, 5.242919921875, 5.5037841796875, 5.7646484375, 6.0255126953125, 6.286376953125, 6.5472412109375, 6.80810546875, 7.0689697265625, 7.329833984375, 7.5906982421875, 7.8515625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 6.0, 2.0, 1.0, 4.0, 3.0, 7.0, 11.0, 13.0, 9.0, 10.0, 16.0, 17.0, 17.0, 13.0, 20.0, 28.0, 24.0, 26.0, 40.0, 27.0, 29.0, 51.0, 48.0, 40.0, 53.0, 45.0, 50.0, 52.0, 36.0, 38.0, 28.0, 33.0, 33.0, 21.0, 22.0, 30.0, 16.0, 18.0, 14.0, 7.0, 9.0, 12.0, 3.0, 6.0, 8.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.453125, -14.0091552734375, -13.565185546875, -13.1212158203125, -12.67724609375, -12.2332763671875, -11.789306640625, -11.3453369140625, -10.9013671875, -10.4573974609375, -10.013427734375, -9.5694580078125, -9.12548828125, -8.6815185546875, -8.237548828125, -7.7935791015625, -7.349609375, -6.9056396484375, -6.461669921875, -6.0177001953125, -5.57373046875, -5.1297607421875, -4.685791015625, -4.2418212890625, -3.7978515625, -3.3538818359375, -2.909912109375, -2.4659423828125, -2.02197265625, -1.5780029296875, -1.134033203125, -0.6900634765625, -0.24609375, 0.1978759765625, 0.641845703125, 1.0858154296875, 1.52978515625, 1.9737548828125, 2.417724609375, 2.8616943359375, 3.3056640625, 3.7496337890625, 4.193603515625, 4.6375732421875, 5.08154296875, 5.5255126953125, 5.969482421875, 6.4134521484375, 6.857421875, 7.3013916015625, 7.745361328125, 8.1893310546875, 8.63330078125, 9.0772705078125, 9.521240234375, 9.9652099609375, 10.4091796875, 10.8531494140625, 11.297119140625, 11.7410888671875, 12.18505859375, 12.6290283203125, 13.072998046875, 13.5169677734375, 13.9609375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 4.0, 14.0, 15.0, 38.0, 40.0, 55.0, 98.0, 101.0, 216.0, 386.0, 555.0, 922.0, 1454.0, 2318.0, 3838.0, 6450.0, 10905.0, 18679.0, 32986.0, 58719.0, 103056.0, 161289.0, 198323.0, 174574.0, 115837.0, 66808.0, 38171.0, 21669.0, 12523.0, 7249.0, 4388.0, 2592.0, 1591.0, 1024.0, 623.0, 348.0, 251.0, 154.0, 94.0, 67.0, 47.0, 37.0, 16.0, 11.0, 6.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-11.109375, -10.768798828125, -10.42822265625, -10.087646484375, -9.7470703125, -9.406494140625, -9.06591796875, -8.725341796875, -8.384765625, -8.044189453125, -7.70361328125, -7.363037109375, -7.0224609375, -6.681884765625, -6.34130859375, -6.000732421875, -5.66015625, -5.319580078125, -4.97900390625, -4.638427734375, -4.2978515625, -3.957275390625, -3.61669921875, -3.276123046875, -2.935546875, -2.594970703125, -2.25439453125, -1.913818359375, -1.5732421875, -1.232666015625, -0.89208984375, -0.551513671875, -0.2109375, 0.129638671875, 0.47021484375, 0.810791015625, 1.1513671875, 1.491943359375, 1.83251953125, 2.173095703125, 2.513671875, 2.854248046875, 3.19482421875, 3.535400390625, 3.8759765625, 4.216552734375, 4.55712890625, 4.897705078125, 5.23828125, 5.578857421875, 5.91943359375, 6.260009765625, 6.6005859375, 6.941162109375, 7.28173828125, 7.622314453125, 7.962890625, 8.303466796875, 8.64404296875, 8.984619140625, 9.3251953125, 9.665771484375, 10.00634765625, 10.346923828125, 10.6875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 4.0, 6.0, 9.0, 9.0, 10.0, 17.0, 21.0, 19.0, 25.0, 25.0, 32.0, 29.0, 26.0, 44.0, 31.0, 37.0, 43.0, 43.0, 50.0, 42.0, 34.0, 45.0, 39.0, 27.0, 37.0, 22.0, 39.0, 38.0, 19.0, 22.0, 23.0, 20.0, 20.0, 10.0, 17.0, 16.0, 15.0, 10.0, 9.0, 4.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.61328125, -7.34197998046875, -7.0706787109375, -6.79937744140625, -6.528076171875, -6.25677490234375, -5.9854736328125, -5.71417236328125, -5.44287109375, -5.17156982421875, -4.9002685546875, -4.62896728515625, -4.357666015625, -4.08636474609375, -3.8150634765625, -3.54376220703125, -3.2724609375, -3.00115966796875, -2.7298583984375, -2.45855712890625, -2.187255859375, -1.91595458984375, -1.6446533203125, -1.37335205078125, -1.10205078125, -0.83074951171875, -0.5594482421875, -0.28814697265625, -0.016845703125, 0.25445556640625, 0.5257568359375, 0.79705810546875, 1.068359375, 1.33966064453125, 1.6109619140625, 1.88226318359375, 2.153564453125, 2.42486572265625, 2.6961669921875, 2.96746826171875, 3.23876953125, 3.51007080078125, 3.7813720703125, 4.05267333984375, 4.323974609375, 4.59527587890625, 4.8665771484375, 5.13787841796875, 5.4091796875, 5.68048095703125, 5.9517822265625, 6.22308349609375, 6.494384765625, 6.76568603515625, 7.0369873046875, 7.30828857421875, 7.57958984375, 7.85089111328125, 8.1221923828125, 8.39349365234375, 8.664794921875, 8.93609619140625, 9.2073974609375, 9.47869873046875, 9.75]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 15.0, 15.0, 12.0, 18.0, 36.0, 66.0, 68.0, 105.0, 153.0, 255.0, 354.0, 573.0, 824.0, 1245.0, 1982.0, 3221.0, 6012.0, 11701.0, 25496.0, 56272.0, 111484.0, 179921.0, 217882.0, 188733.0, 121412.0, 62679.0, 28805.0, 13091.0, 6571.0, 3525.0, 2083.0, 1320.0, 890.0, 614.0, 336.0, 222.0, 175.0, 104.0, 80.0, 66.0, 50.0, 22.0, 16.0, 19.0, 14.0, 5.0, 5.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.66796875, -4.524658203125, -4.38134765625, -4.238037109375, -4.0947265625, -3.951416015625, -3.80810546875, -3.664794921875, -3.521484375, -3.378173828125, -3.23486328125, -3.091552734375, -2.9482421875, -2.804931640625, -2.66162109375, -2.518310546875, -2.375, -2.231689453125, -2.08837890625, -1.945068359375, -1.8017578125, -1.658447265625, -1.51513671875, -1.371826171875, -1.228515625, -1.085205078125, -0.94189453125, -0.798583984375, -0.6552734375, -0.511962890625, -0.36865234375, -0.225341796875, -0.08203125, 0.061279296875, 0.20458984375, 0.347900390625, 0.4912109375, 0.634521484375, 0.77783203125, 0.921142578125, 1.064453125, 1.207763671875, 1.35107421875, 1.494384765625, 1.6376953125, 1.781005859375, 1.92431640625, 2.067626953125, 2.2109375, 2.354248046875, 2.49755859375, 2.640869140625, 2.7841796875, 2.927490234375, 3.07080078125, 3.214111328125, 3.357421875, 3.500732421875, 3.64404296875, 3.787353515625, 3.9306640625, 4.073974609375, 4.21728515625, 4.360595703125, 4.50390625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 8.0, 10.0, 15.0, 11.0, 12.0, 17.0, 32.0, 25.0, 38.0, 44.0, 50.0, 58.0, 73.0, 58.0, 57.0, 61.0, 58.0, 63.0, 44.0, 50.0, 38.0, 25.0, 28.0, 26.0, 19.0, 19.0, 15.0, 6.0, 7.0, 3.0, 5.0, 6.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00034427642822265625, -0.00033221393823623657, -0.0003201514482498169, -0.0003080889582633972, -0.00029602646827697754, -0.00028396397829055786, -0.0002719014883041382, -0.0002598389983177185, -0.00024777650833129883, -0.00023571401834487915, -0.00022365152835845947, -0.0002115890383720398, -0.00019952654838562012, -0.00018746405839920044, -0.00017540156841278076, -0.00016333907842636108, -0.0001512765884399414, -0.00013921409845352173, -0.00012715160846710205, -0.00011508911848068237, -0.0001030266284942627, -9.096413850784302e-05, -7.890164852142334e-05, -6.683915853500366e-05, -5.4776668548583984e-05, -4.271417856216431e-05, -3.065168857574463e-05, -1.858919858932495e-05, -6.5267086029052734e-06, 5.535781383514404e-06, 1.7598271369934082e-05, 2.966076135635376e-05, 4.172325134277344e-05, 5.3785741329193115e-05, 6.584823131561279e-05, 7.791072130203247e-05, 8.997321128845215e-05, 0.00010203570127487183, 0.0001140981912612915, 0.00012616068124771118, 0.00013822317123413086, 0.00015028566122055054, 0.00016234815120697021, 0.0001744106411933899, 0.00018647313117980957, 0.00019853562116622925, 0.00021059811115264893, 0.0002226606011390686, 0.00023472309112548828, 0.00024678558111190796, 0.00025884807109832764, 0.0002709105610847473, 0.000282973051071167, 0.00029503554105758667, 0.00030709803104400635, 0.000319160521030426, 0.0003312230110168457, 0.0003432855010032654, 0.00035534799098968506, 0.00036741048097610474, 0.0003794729709625244, 0.0003915354609489441, 0.00040359795093536377, 0.00041566044092178345, 0.0004277229309082031]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 6.0, 1.0, 5.0, 10.0, 14.0, 22.0, 24.0, 33.0, 43.0, 69.0, 88.0, 156.0, 184.0, 239.0, 366.0, 567.0, 799.0, 1113.0, 1584.0, 2524.0, 4062.0, 7145.0, 14828.0, 36548.0, 88090.0, 179040.0, 253858.0, 224315.0, 129213.0, 55951.0, 22719.0, 10118.0, 5205.0, 3147.0, 2036.0, 1325.0, 1006.0, 643.0, 480.0, 279.0, 192.0, 150.0, 101.0, 84.0, 59.0, 36.0, 29.0, 17.0, 15.0, 8.0, 7.0, 7.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.4453125, -5.2681884765625, -5.091064453125, -4.9139404296875, -4.73681640625, -4.5596923828125, -4.382568359375, -4.2054443359375, -4.0283203125, -3.8511962890625, -3.674072265625, -3.4969482421875, -3.31982421875, -3.1427001953125, -2.965576171875, -2.7884521484375, -2.611328125, -2.4342041015625, -2.257080078125, -2.0799560546875, -1.90283203125, -1.7257080078125, -1.548583984375, -1.3714599609375, -1.1943359375, -1.0172119140625, -0.840087890625, -0.6629638671875, -0.48583984375, -0.3087158203125, -0.131591796875, 0.0455322265625, 0.22265625, 0.3997802734375, 0.576904296875, 0.7540283203125, 0.93115234375, 1.1082763671875, 1.285400390625, 1.4625244140625, 1.6396484375, 1.8167724609375, 1.993896484375, 2.1710205078125, 2.34814453125, 2.5252685546875, 2.702392578125, 2.8795166015625, 3.056640625, 3.2337646484375, 3.410888671875, 3.5880126953125, 3.76513671875, 3.9422607421875, 4.119384765625, 4.2965087890625, 4.4736328125, 4.6507568359375, 4.827880859375, 5.0050048828125, 5.18212890625, 5.3592529296875, 5.536376953125, 5.7135009765625, 5.890625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 8.0, 4.0, 3.0, 6.0, 14.0, 23.0, 21.0, 31.0, 35.0, 36.0, 71.0, 77.0, 75.0, 85.0, 70.0, 75.0, 73.0, 52.0, 61.0, 39.0, 37.0, 37.0, 22.0, 15.0, 11.0, 9.0, 8.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.03515625, -1.982177734375, -1.92919921875, -1.876220703125, -1.8232421875, -1.770263671875, -1.71728515625, -1.664306640625, -1.611328125, -1.558349609375, -1.50537109375, -1.452392578125, -1.3994140625, -1.346435546875, -1.29345703125, -1.240478515625, -1.1875, -1.134521484375, -1.08154296875, -1.028564453125, -0.9755859375, -0.922607421875, -0.86962890625, -0.816650390625, -0.763671875, -0.710693359375, -0.65771484375, -0.604736328125, -0.5517578125, -0.498779296875, -0.44580078125, -0.392822265625, -0.33984375, -0.286865234375, -0.23388671875, -0.180908203125, -0.1279296875, -0.074951171875, -0.02197265625, 0.031005859375, 0.083984375, 0.136962890625, 0.18994140625, 0.242919921875, 0.2958984375, 0.348876953125, 0.40185546875, 0.454833984375, 0.5078125, 0.560791015625, 0.61376953125, 0.666748046875, 0.7197265625, 0.772705078125, 0.82568359375, 0.878662109375, 0.931640625, 0.984619140625, 1.03759765625, 1.090576171875, 1.1435546875, 1.196533203125, 1.24951171875, 1.302490234375, 1.35546875]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 6.0, 8.0, 16.0, 14.0, 16.0, 23.0, 28.0, 33.0, 57.0, 42.0, 46.0, 54.0, 70.0, 81.0, 60.0, 71.0, 67.0, 42.0, 45.0, 46.0, 38.0, 28.0, 16.0, 15.0, 13.0, 19.0, 8.0, 5.0, 8.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.636537551879883, -20.080068588256836, -19.52359962463379, -18.967130661010742, -18.410659790039062, -17.854190826416016, -17.29772186279297, -16.741252899169922, -16.184783935546875, -15.628314971923828, -15.071846008300781, -14.515376091003418, -13.958907127380371, -13.402438163757324, -12.845968246459961, -12.289499282836914, -11.733030319213867, -11.17656135559082, -10.620092391967773, -10.06362247467041, -9.507153511047363, -8.950684547424316, -8.394214630126953, -7.837745666503906, -7.281276702880859, -6.7248077392578125, -6.168338298797607, -5.611868858337402, -5.0553998947143555, -4.498930931091309, -3.9424614906311035, -3.3859922885894775, -2.829522132873535, -2.273052930831909, -1.7165837287902832, -1.1601145267486572, -0.6036453247070312, -0.04717612266540527, 0.5092930793762207, 1.0657622814178467, 1.6222314834594727, 2.1787006855010986, 2.7351698875427246, 3.2916390895843506, 3.8481082916259766, 4.404577255249023, 4.9610466957092285, 5.517516136169434, 6.0739850997924805, 6.630454063415527, 7.186923503875732, 7.7433929443359375, 8.299861907958984, 8.856330871582031, 9.412799835205078, 9.969269752502441, 10.525738716125488, 11.082207679748535, 11.638677597045898, 12.195146560668945, 12.751615524291992, 13.308084487915039, 13.864553451538086, 14.42102336883545, 14.977492332458496]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 5.0, 2.0, 10.0, 6.0, 11.0, 8.0, 14.0, 12.0, 12.0, 12.0, 11.0, 14.0, 16.0, 21.0, 26.0, 24.0, 27.0, 31.0, 32.0, 43.0, 47.0, 41.0, 33.0, 50.0, 49.0, 31.0, 39.0, 41.0, 35.0, 28.0, 33.0, 29.0, 22.0, 31.0, 28.0, 14.0, 17.0, 14.0, 16.0, 11.0, 8.0, 8.0, 8.0, 9.0, 9.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 4.0, 2.0], "bins": [-15.908041000366211, -15.446867942810059, -14.985694885253906, -14.524521827697754, -14.063348770141602, -13.602176666259766, -13.141003608703613, -12.679830551147461, -12.218657493591309, -11.757484436035156, -11.296311378479004, -10.835138320922852, -10.373966217041016, -9.912792205810547, -9.451620101928711, -8.990447044372559, -8.529273986816406, -8.068100929260254, -7.606927871704102, -7.145755290985107, -6.684582233428955, -6.223409175872803, -5.762236595153809, -5.301063537597656, -4.839890480041504, -4.378717422485352, -3.9175446033477783, -3.456371784210205, -2.9951987266540527, -2.5340256690979004, -2.072852849960327, -1.611680030822754, -1.150507926940918, -0.6893349885940552, -0.22816205024719238, 0.2330108880996704, 0.6941838264465332, 1.1553568840026855, 1.6165297031402588, 2.077702522277832, 2.5388755798339844, 3.0000486373901367, 3.46122145652771, 3.922394275665283, 4.3835673332214355, 4.844740390777588, 5.305912971496582, 5.767086029052734, 6.228259086608887, 6.689432144165039, 7.150605201721191, 7.6117777824401855, 8.07295036315918, 8.534124374389648, 8.995296478271484, 9.456469535827637, 9.917642593383789, 10.378815650939941, 10.839988708496094, 11.301161766052246, 11.762334823608398, 12.223506927490234, 12.684679985046387, 13.145853042602539, 13.607026100158691]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 7.0, 13.0, 22.0, 34.0, 41.0, 71.0, 84.0, 160.0, 218.0, 340.0, 428.0, 742.0, 1106.0, 1623.0, 2599.0, 4156.0, 6929.0, 11072.0, 19117.0, 33296.0, 60213.0, 111689.0, 211171.0, 407807.0, 726239.0, 946140.0, 739165.0, 418800.0, 221564.0, 118278.0, 64595.0, 35756.0, 20580.0, 11913.0, 7126.0, 4354.0, 2527.0, 1628.0, 982.0, 626.0, 371.0, 261.0, 140.0, 111.0, 70.0, 41.0, 28.0, 16.0, 10.0, 13.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0], "bins": [-19.90625, -19.3125, -18.71875, -18.125, -17.53125, -16.9375, -16.34375, -15.75, -15.15625, -14.5625, -13.96875, -13.375, -12.78125, -12.1875, -11.59375, -11.0, -10.40625, -9.8125, -9.21875, -8.625, -8.03125, -7.4375, -6.84375, -6.25, -5.65625, -5.0625, -4.46875, -3.875, -3.28125, -2.6875, -2.09375, -1.5, -0.90625, -0.3125, 0.28125, 0.875, 1.46875, 2.0625, 2.65625, 3.25, 3.84375, 4.4375, 5.03125, 5.625, 6.21875, 6.8125, 7.40625, 8.0, 8.59375, 9.1875, 9.78125, 10.375, 10.96875, 11.5625, 12.15625, 12.75, 13.34375, 13.9375, 14.53125, 15.125, 15.71875, 16.3125, 16.90625, 17.5, 18.09375]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 0.0, 0.0, 4.0, 2.0, 5.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 13.0, 12.0, 6.0, 20.0, 15.0, 10.0, 17.0, 19.0, 18.0, 28.0, 26.0, 32.0, 35.0, 43.0, 41.0, 39.0, 40.0, 46.0, 41.0, 48.0, 39.0, 38.0, 38.0, 35.0, 44.0, 34.0, 19.0, 34.0, 18.0, 19.0, 24.0, 10.0, 16.0, 10.0, 11.0, 6.0, 7.0, 6.0, 5.0, 7.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.3125, -14.836669921875, -14.36083984375, -13.885009765625, -13.4091796875, -12.933349609375, -12.45751953125, -11.981689453125, -11.505859375, -11.030029296875, -10.55419921875, -10.078369140625, -9.6025390625, -9.126708984375, -8.65087890625, -8.175048828125, -7.69921875, -7.223388671875, -6.74755859375, -6.271728515625, -5.7958984375, -5.320068359375, -4.84423828125, -4.368408203125, -3.892578125, -3.416748046875, -2.94091796875, -2.465087890625, -1.9892578125, -1.513427734375, -1.03759765625, -0.561767578125, -0.0859375, 0.389892578125, 0.86572265625, 1.341552734375, 1.8173828125, 2.293212890625, 2.76904296875, 3.244873046875, 3.720703125, 4.196533203125, 4.67236328125, 5.148193359375, 5.6240234375, 6.099853515625, 6.57568359375, 7.051513671875, 7.52734375, 8.003173828125, 8.47900390625, 8.954833984375, 9.4306640625, 9.906494140625, 10.38232421875, 10.858154296875, 11.333984375, 11.809814453125, 12.28564453125, 12.761474609375, 13.2373046875, 13.713134765625, 14.18896484375, 14.664794921875, 15.140625]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 11.0, 15.0, 17.0, 33.0, 36.0, 63.0, 76.0, 119.0, 177.0, 259.0, 376.0, 548.0, 886.0, 1414.0, 2278.0, 3485.0, 5821.0, 9161.0, 14940.0, 25183.0, 42409.0, 72601.0, 125076.0, 213366.0, 357469.0, 560352.0, 746569.0, 716289.0, 514824.0, 319850.0, 189991.0, 110325.0, 64247.0, 37718.0, 22718.0, 13295.0, 8307.0, 5089.0, 3165.0, 2048.0, 1324.0, 794.0, 558.0, 338.0, 233.0, 138.0, 94.0, 79.0, 44.0, 21.0, 21.0, 10.0, 7.0, 8.0, 5.0, 3.0, 2.0, 3.0], "bins": [-21.390625, -20.740234375, -20.08984375, -19.439453125, -18.7890625, -18.138671875, -17.48828125, -16.837890625, -16.1875, -15.537109375, -14.88671875, -14.236328125, -13.5859375, -12.935546875, -12.28515625, -11.634765625, -10.984375, -10.333984375, -9.68359375, -9.033203125, -8.3828125, -7.732421875, -7.08203125, -6.431640625, -5.78125, -5.130859375, -4.48046875, -3.830078125, -3.1796875, -2.529296875, -1.87890625, -1.228515625, -0.578125, 0.072265625, 0.72265625, 1.373046875, 2.0234375, 2.673828125, 3.32421875, 3.974609375, 4.625, 5.275390625, 5.92578125, 6.576171875, 7.2265625, 7.876953125, 8.52734375, 9.177734375, 9.828125, 10.478515625, 11.12890625, 11.779296875, 12.4296875, 13.080078125, 13.73046875, 14.380859375, 15.03125, 15.681640625, 16.33203125, 16.982421875, 17.6328125, 18.283203125, 18.93359375, 19.583984375, 20.234375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 5.0, 6.0, 8.0, 7.0, 12.0, 14.0, 26.0, 18.0, 26.0, 36.0, 40.0, 68.0, 76.0, 101.0, 96.0, 138.0, 196.0, 208.0, 218.0, 262.0, 293.0, 305.0, 270.0, 263.0, 220.0, 204.0, 179.0, 165.0, 129.0, 101.0, 84.0, 56.0, 61.0, 36.0, 31.0, 23.0, 17.0, 20.0, 13.0, 12.0, 9.0, 9.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.15625, -9.83837890625, -9.5205078125, -9.20263671875, -8.884765625, -8.56689453125, -8.2490234375, -7.93115234375, -7.61328125, -7.29541015625, -6.9775390625, -6.65966796875, -6.341796875, -6.02392578125, -5.7060546875, -5.38818359375, -5.0703125, -4.75244140625, -4.4345703125, -4.11669921875, -3.798828125, -3.48095703125, -3.1630859375, -2.84521484375, -2.52734375, -2.20947265625, -1.8916015625, -1.57373046875, -1.255859375, -0.93798828125, -0.6201171875, -0.30224609375, 0.015625, 0.33349609375, 0.6513671875, 0.96923828125, 1.287109375, 1.60498046875, 1.9228515625, 2.24072265625, 2.55859375, 2.87646484375, 3.1943359375, 3.51220703125, 3.830078125, 4.14794921875, 4.4658203125, 4.78369140625, 5.1015625, 5.41943359375, 5.7373046875, 6.05517578125, 6.373046875, 6.69091796875, 7.0087890625, 7.32666015625, 7.64453125, 7.96240234375, 8.2802734375, 8.59814453125, 8.916015625, 9.23388671875, 9.5517578125, 9.86962890625, 10.1875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 8.0, 12.0, 22.0, 10.0, 15.0, 23.0, 18.0, 37.0, 30.0, 47.0, 55.0, 50.0, 60.0, 73.0, 65.0, 66.0, 64.0, 51.0, 53.0, 32.0, 25.0, 28.0, 33.0, 18.0, 21.0, 9.0, 12.0, 10.0, 9.0, 7.0, 8.0, 5.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.463420867919922, -28.552867889404297, -27.64231300354004, -26.731760025024414, -25.82120704650879, -24.91065216064453, -24.000099182128906, -23.08954620361328, -22.178991317749023, -21.2684383392334, -20.35788345336914, -19.447330474853516, -18.53677749633789, -17.626222610473633, -16.715669631958008, -15.805115699768066, -14.894562721252441, -13.9840087890625, -13.073455810546875, -12.162901878356934, -11.252347946166992, -10.341794967651367, -9.431241035461426, -8.520687103271484, -7.610133647918701, -6.699580192565918, -5.789026260375977, -4.878472805023193, -3.967919111251831, -3.0573654174804688, -2.1468119621276855, -1.2362580299377441, -0.32570457458496094, 0.5848490595817566, 1.4954026937484741, 2.405956268310547, 3.316509962081909, 4.2270636558532715, 5.137617111206055, 6.048171043395996, 6.958724498748779, 7.8692779541015625, 8.779831886291504, 9.690385818481445, 10.60093879699707, 11.511492729187012, 12.422046661376953, 13.332599639892578, 14.24315357208252, 15.153707504272461, 16.064260482788086, 16.974815368652344, 17.88536834716797, 18.795921325683594, 19.70647430419922, 20.617029190063477, 21.5275821685791, 22.438135147094727, 23.348690032958984, 24.25924301147461, 25.169795989990234, 26.080350875854492, 26.990903854370117, 27.901458740234375, 28.81201171875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 7.0, 6.0, 7.0, 7.0, 4.0, 9.0, 9.0, 16.0, 10.0, 19.0, 16.0, 21.0, 16.0, 40.0, 26.0, 38.0, 33.0, 36.0, 41.0, 41.0, 47.0, 55.0, 51.0, 43.0, 52.0, 39.0, 46.0, 32.0, 29.0, 35.0, 30.0, 18.0, 16.0, 12.0, 15.0, 10.0, 15.0, 6.0, 11.0, 7.0, 13.0, 7.0, 6.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.3554744720459, -29.37089729309082, -28.386320114135742, -27.401742935180664, -26.41716766357422, -25.43259048461914, -24.448013305664062, -23.463436126708984, -22.478858947753906, -21.494281768798828, -20.50970458984375, -19.525127410888672, -18.540550231933594, -17.555973052978516, -16.57139778137207, -15.586820602416992, -14.602243423461914, -13.617666244506836, -12.633089065551758, -11.648512840270996, -10.663935661315918, -9.67935848236084, -8.694782257080078, -7.710205078125, -6.725627899169922, -5.741050720214844, -4.756474018096924, -3.771897077560425, -2.787320137023926, -1.8027429580688477, -0.8181662559509277, 0.1664104461669922, 1.1509857177734375, 2.1355626583099365, 3.1201395988464355, 4.1047163009643555, 5.089293479919434, 6.073870658874512, 7.058447360992432, 8.043024063110352, 9.02760124206543, 10.012178421020508, 10.996755599975586, 11.981331825256348, 12.965909004211426, 13.950486183166504, 14.935062408447266, 15.919639587402344, 16.904216766357422, 17.8887939453125, 18.873371124267578, 19.857948303222656, 20.842525482177734, 21.827102661132812, 22.811677932739258, 23.796255111694336, 24.780832290649414, 25.765409469604492, 26.74998664855957, 27.73456382751465, 28.719139099121094, 29.703716278076172, 30.68829345703125, 31.672870635986328, 32.657447814941406]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 4.0, 3.0, 4.0, 5.0, 1.0, 14.0, 14.0, 31.0, 30.0, 34.0, 53.0, 90.0, 122.0, 167.0, 232.0, 306.0, 457.0, 648.0, 844.0, 1258.0, 1850.0, 2716.0, 3891.0, 5955.0, 9117.0, 14109.0, 22521.0, 38462.0, 69470.0, 151684.0, 316608.0, 199964.0, 87906.0, 45639.0, 26407.0, 16367.0, 10360.0, 6759.0, 4533.0, 3023.0, 2010.0, 1479.0, 1012.0, 688.0, 498.0, 351.0, 251.0, 166.0, 138.0, 92.0, 66.0, 51.0, 26.0, 18.0, 17.0, 20.0, 9.0, 5.0, 5.0, 2.0, 7.0, 1.0, 2.0], "bins": [-8.6875, -8.4130859375, -8.138671875, -7.8642578125, -7.58984375, -7.3154296875, -7.041015625, -6.7666015625, -6.4921875, -6.2177734375, -5.943359375, -5.6689453125, -5.39453125, -5.1201171875, -4.845703125, -4.5712890625, -4.296875, -4.0224609375, -3.748046875, -3.4736328125, -3.19921875, -2.9248046875, -2.650390625, -2.3759765625, -2.1015625, -1.8271484375, -1.552734375, -1.2783203125, -1.00390625, -0.7294921875, -0.455078125, -0.1806640625, 0.09375, 0.3681640625, 0.642578125, 0.9169921875, 1.19140625, 1.4658203125, 1.740234375, 2.0146484375, 2.2890625, 2.5634765625, 2.837890625, 3.1123046875, 3.38671875, 3.6611328125, 3.935546875, 4.2099609375, 4.484375, 4.7587890625, 5.033203125, 5.3076171875, 5.58203125, 5.8564453125, 6.130859375, 6.4052734375, 6.6796875, 6.9541015625, 7.228515625, 7.5029296875, 7.77734375, 8.0517578125, 8.326171875, 8.6005859375, 8.875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 11.0, 10.0, 9.0, 14.0, 9.0, 20.0, 16.0, 26.0, 22.0, 23.0, 29.0, 41.0, 25.0, 45.0, 47.0, 37.0, 59.0, 49.0, 58.0, 54.0, 40.0, 49.0, 49.0, 39.0, 27.0, 28.0, 17.0, 20.0, 18.0, 13.0, 18.0, 9.0, 11.0, 10.0, 3.0, 12.0, 3.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-32.59375, -31.529296875, -30.46484375, -29.400390625, -28.3359375, -27.271484375, -26.20703125, -25.142578125, -24.078125, -23.013671875, -21.94921875, -20.884765625, -19.8203125, -18.755859375, -17.69140625, -16.626953125, -15.5625, -14.498046875, -13.43359375, -12.369140625, -11.3046875, -10.240234375, -9.17578125, -8.111328125, -7.046875, -5.982421875, -4.91796875, -3.853515625, -2.7890625, -1.724609375, -0.66015625, 0.404296875, 1.46875, 2.533203125, 3.59765625, 4.662109375, 5.7265625, 6.791015625, 7.85546875, 8.919921875, 9.984375, 11.048828125, 12.11328125, 13.177734375, 14.2421875, 15.306640625, 16.37109375, 17.435546875, 18.5, 19.564453125, 20.62890625, 21.693359375, 22.7578125, 23.822265625, 24.88671875, 25.951171875, 27.015625, 28.080078125, 29.14453125, 30.208984375, 31.2734375, 32.337890625, 33.40234375, 34.466796875, 35.53125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 10.0, 18.0, 22.0, 25.0, 28.0, 26.0, 29.0, 51.0, 89.0, 99.0, 130.0, 177.0, 233.0, 379.0, 493.0, 803.0, 1359.0, 2467.0, 5331.0, 14164.0, 50353.0, 921918.0, 30995.0, 9843.0, 4073.0, 2033.0, 1081.0, 752.0, 424.0, 313.0, 206.0, 152.0, 131.0, 98.0, 54.0, 50.0, 34.0, 21.0, 18.0, 24.0, 15.0, 14.0, 8.0, 6.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-30.734375, -29.812255859375, -28.89013671875, -27.968017578125, -27.0458984375, -26.123779296875, -25.20166015625, -24.279541015625, -23.357421875, -22.435302734375, -21.51318359375, -20.591064453125, -19.6689453125, -18.746826171875, -17.82470703125, -16.902587890625, -15.98046875, -15.058349609375, -14.13623046875, -13.214111328125, -12.2919921875, -11.369873046875, -10.44775390625, -9.525634765625, -8.603515625, -7.681396484375, -6.75927734375, -5.837158203125, -4.9150390625, -3.992919921875, -3.07080078125, -2.148681640625, -1.2265625, -0.304443359375, 0.61767578125, 1.539794921875, 2.4619140625, 3.384033203125, 4.30615234375, 5.228271484375, 6.150390625, 7.072509765625, 7.99462890625, 8.916748046875, 9.8388671875, 10.760986328125, 11.68310546875, 12.605224609375, 13.52734375, 14.449462890625, 15.37158203125, 16.293701171875, 17.2158203125, 18.137939453125, 19.06005859375, 19.982177734375, 20.904296875, 21.826416015625, 22.74853515625, 23.670654296875, 24.5927734375, 25.514892578125, 26.43701171875, 27.359130859375, 28.28125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 6.0, 9.0, 9.0, 16.0, 13.0, 20.0, 19.0, 23.0, 23.0, 23.0, 32.0, 23.0, 34.0, 36.0, 30.0, 40.0, 33.0, 42.0, 37.0, 29.0, 38.0, 41.0, 29.0, 32.0, 33.0, 39.0, 35.0, 27.0, 26.0, 14.0, 24.0, 27.0, 17.0, 21.0, 13.0, 15.0, 17.0, 3.0, 12.0, 5.0, 13.0, 6.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-17.84375, -17.29736328125, -16.7509765625, -16.20458984375, -15.658203125, -15.11181640625, -14.5654296875, -14.01904296875, -13.47265625, -12.92626953125, -12.3798828125, -11.83349609375, -11.287109375, -10.74072265625, -10.1943359375, -9.64794921875, -9.1015625, -8.55517578125, -8.0087890625, -7.46240234375, -6.916015625, -6.36962890625, -5.8232421875, -5.27685546875, -4.73046875, -4.18408203125, -3.6376953125, -3.09130859375, -2.544921875, -1.99853515625, -1.4521484375, -0.90576171875, -0.359375, 0.18701171875, 0.7333984375, 1.27978515625, 1.826171875, 2.37255859375, 2.9189453125, 3.46533203125, 4.01171875, 4.55810546875, 5.1044921875, 5.65087890625, 6.197265625, 6.74365234375, 7.2900390625, 7.83642578125, 8.3828125, 8.92919921875, 9.4755859375, 10.02197265625, 10.568359375, 11.11474609375, 11.6611328125, 12.20751953125, 12.75390625, 13.30029296875, 13.8466796875, 14.39306640625, 14.939453125, 15.48583984375, 16.0322265625, 16.57861328125, 17.125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 7.0, 10.0, 6.0, 16.0, 12.0, 15.0, 34.0, 33.0, 58.0, 63.0, 114.0, 158.0, 226.0, 302.0, 454.0, 726.0, 1250.0, 2123.0, 4169.0, 8939.0, 24975.0, 918234.0, 58372.0, 14666.0, 6232.0, 2940.0, 1590.0, 950.0, 617.0, 379.0, 269.0, 171.0, 134.0, 94.0, 52.0, 36.0, 37.0, 29.0, 18.0, 13.0, 10.0, 9.0, 3.0, 8.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.884765625, -1.828948974609375, -1.77313232421875, -1.717315673828125, -1.6614990234375, -1.605682373046875, -1.54986572265625, -1.494049072265625, -1.438232421875, -1.382415771484375, -1.32659912109375, -1.270782470703125, -1.2149658203125, -1.159149169921875, -1.10333251953125, -1.047515869140625, -0.99169921875, -0.935882568359375, -0.88006591796875, -0.824249267578125, -0.7684326171875, -0.712615966796875, -0.65679931640625, -0.600982666015625, -0.545166015625, -0.489349365234375, -0.43353271484375, -0.377716064453125, -0.3218994140625, -0.266082763671875, -0.21026611328125, -0.154449462890625, -0.0986328125, -0.042816162109375, 0.01300048828125, 0.068817138671875, 0.1246337890625, 0.180450439453125, 0.23626708984375, 0.292083740234375, 0.347900390625, 0.403717041015625, 0.45953369140625, 0.515350341796875, 0.5711669921875, 0.626983642578125, 0.68280029296875, 0.738616943359375, 0.79443359375, 0.850250244140625, 0.90606689453125, 0.961883544921875, 1.0177001953125, 1.073516845703125, 1.12933349609375, 1.185150146484375, 1.240966796875, 1.296783447265625, 1.35260009765625, 1.408416748046875, 1.4642333984375, 1.520050048828125, 1.57586669921875, 1.631683349609375, 1.6875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 7.0, 7.0, 4.0, 9.0, 8.0, 7.0, 15.0, 12.0, 17.0, 20.0, 21.0, 25.0, 19.0, 32.0, 27.0, 35.0, 34.0, 34.0, 40.0, 46.0, 36.0, 40.0, 45.0, 48.0, 39.0, 38.0, 41.0, 33.0, 36.0, 28.0, 22.0, 22.0, 27.0, 22.0, 18.0, 11.0, 9.0, 15.0, 12.0, 13.0, 5.0, 3.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2590160369873047e-05, -2.188514918088913e-05, -2.1180137991905212e-05, -2.0475126802921295e-05, -1.9770115613937378e-05, -1.906510442495346e-05, -1.8360093235969543e-05, -1.7655082046985626e-05, -1.695007085800171e-05, -1.6245059669017792e-05, -1.5540048480033875e-05, -1.4835037291049957e-05, -1.413002610206604e-05, -1.3425014913082123e-05, -1.2720003724098206e-05, -1.2014992535114288e-05, -1.1309981346130371e-05, -1.0604970157146454e-05, -9.899958968162537e-06, -9.19494777917862e-06, -8.489936590194702e-06, -7.784925401210785e-06, -7.079914212226868e-06, -6.3749030232429504e-06, -5.669891834259033e-06, -4.964880645275116e-06, -4.259869456291199e-06, -3.5548582673072815e-06, -2.8498470783233643e-06, -2.144835889339447e-06, -1.4398247003555298e-06, -7.348135113716125e-07, -2.9802322387695312e-08, 6.752088665962219e-07, 1.3802200555801392e-06, 2.0852312445640564e-06, 2.7902424335479736e-06, 3.495253622531891e-06, 4.200264811515808e-06, 4.905276000499725e-06, 5.610287189483643e-06, 6.31529837846756e-06, 7.020309567451477e-06, 7.725320756435394e-06, 8.430331945419312e-06, 9.135343134403229e-06, 9.840354323387146e-06, 1.0545365512371063e-05, 1.125037670135498e-05, 1.1955387890338898e-05, 1.2660399079322815e-05, 1.3365410268306732e-05, 1.407042145729065e-05, 1.4775432646274567e-05, 1.5480443835258484e-05, 1.61854550242424e-05, 1.689046621322632e-05, 1.7595477402210236e-05, 1.8300488591194153e-05, 1.900549978017807e-05, 1.9710510969161987e-05, 2.0415522158145905e-05, 2.1120533347129822e-05, 2.182554453611374e-05, 2.2530555725097656e-05]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 14.0, 8.0, 16.0, 27.0, 42.0, 61.0, 73.0, 135.0, 191.0, 289.0, 406.0, 650.0, 965.0, 1435.0, 2219.0, 3398.0, 5520.0, 8627.0, 13668.0, 22902.0, 40407.0, 77361.0, 175134.0, 330003.0, 182142.0, 79433.0, 41174.0, 23525.0, 14306.0, 8832.0, 5528.0, 3404.0, 2262.0, 1499.0, 938.0, 631.0, 457.0, 291.0, 194.0, 139.0, 92.0, 59.0, 40.0, 20.0, 19.0, 10.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.66455078125, -0.6412506103515625, -0.617950439453125, -0.5946502685546875, -0.57135009765625, -0.5480499267578125, -0.524749755859375, -0.5014495849609375, -0.4781494140625, -0.4548492431640625, -0.431549072265625, -0.4082489013671875, -0.38494873046875, -0.3616485595703125, -0.338348388671875, -0.3150482177734375, -0.291748046875, -0.2684478759765625, -0.245147705078125, -0.2218475341796875, -0.19854736328125, -0.1752471923828125, -0.151947021484375, -0.1286468505859375, -0.1053466796875, -0.0820465087890625, -0.058746337890625, -0.0354461669921875, -0.01214599609375, 0.0111541748046875, 0.034454345703125, 0.0577545166015625, 0.0810546875, 0.1043548583984375, 0.127655029296875, 0.1509552001953125, 0.17425537109375, 0.1975555419921875, 0.220855712890625, 0.2441558837890625, 0.2674560546875, 0.2907562255859375, 0.314056396484375, 0.3373565673828125, 0.36065673828125, 0.3839569091796875, 0.407257080078125, 0.4305572509765625, 0.453857421875, 0.4771575927734375, 0.500457763671875, 0.5237579345703125, 0.54705810546875, 0.5703582763671875, 0.593658447265625, 0.6169586181640625, 0.6402587890625, 0.6635589599609375, 0.686859130859375, 0.7101593017578125, 0.73345947265625, 0.7567596435546875, 0.780059814453125, 0.8033599853515625, 0.82666015625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 9.0, 4.0, 9.0, 8.0, 15.0, 10.0, 17.0, 14.0, 32.0, 32.0, 46.0, 62.0, 92.0, 129.0, 109.0, 98.0, 80.0, 47.0, 29.0, 20.0, 20.0, 14.0, 18.0, 11.0, 9.0, 4.0, 7.0, 11.0, 8.0, 9.0, 1.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.296142578125, -0.2874183654785156, -0.27869415283203125, -0.2699699401855469, -0.2612457275390625, -0.2525215148925781, -0.24379730224609375, -0.23507308959960938, -0.226348876953125, -0.21762466430664062, -0.20890045166015625, -0.20017623901367188, -0.1914520263671875, -0.18272781372070312, -0.17400360107421875, -0.16527938842773438, -0.15655517578125, -0.14783096313476562, -0.13910675048828125, -0.13038253784179688, -0.1216583251953125, -0.11293411254882812, -0.10420989990234375, -0.09548568725585938, -0.086761474609375, -0.07803726196289062, -0.06931304931640625, -0.060588836669921875, -0.0518646240234375, -0.043140411376953125, -0.03441619873046875, -0.025691986083984375, -0.0169677734375, -0.008243560791015625, 0.00048065185546875, 0.009204864501953125, 0.0179290771484375, 0.026653289794921875, 0.03537750244140625, 0.044101715087890625, 0.052825927734375, 0.061550140380859375, 0.07027435302734375, 0.07899856567382812, 0.0877227783203125, 0.09644699096679688, 0.10517120361328125, 0.11389541625976562, 0.12261962890625, 0.13134384155273438, 0.14006805419921875, 0.14879226684570312, 0.1575164794921875, 0.16624069213867188, 0.17496490478515625, 0.18368911743164062, 0.192413330078125, 0.20113754272460938, 0.20986175537109375, 0.21858596801757812, 0.2273101806640625, 0.23603439331054688, 0.24475860595703125, 0.2534828186035156, 0.26220703125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 7.0, 6.0, 13.0, 15.0, 13.0, 15.0, 23.0, 21.0, 21.0, 38.0, 40.0, 42.0, 61.0, 55.0, 71.0, 71.0, 62.0, 59.0, 51.0, 54.0, 48.0, 35.0, 26.0, 27.0, 21.0, 22.0, 9.0, 17.0, 10.0, 8.0, 8.0, 13.0, 3.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.527950286865234, -28.597877502441406, -27.667802810668945, -26.737730026245117, -25.80765724182129, -24.877582550048828, -23.947509765625, -23.017436981201172, -22.087364196777344, -21.157291412353516, -20.227216720581055, -19.297143936157227, -18.3670711517334, -17.436996459960938, -16.50692367553711, -15.576850891113281, -14.64677619934082, -13.716702461242676, -12.786629676818848, -11.856555938720703, -10.926483154296875, -9.99640941619873, -9.066335678100586, -8.136262893676758, -7.206189155578613, -6.276115894317627, -5.346042633056641, -4.415968894958496, -3.4858956336975098, -2.5558223724365234, -1.625748634338379, -0.6956753730773926, 0.23439598083496094, 1.1644693613052368, 2.0945427417755127, 3.024616241455078, 3.9546895027160645, 4.884762763977051, 5.814836502075195, 6.744909763336182, 7.674983024597168, 8.605056762695312, 9.53512954711914, 10.465203285217285, 11.39527702331543, 12.325349807739258, 13.255423545837402, 14.185497283935547, 15.115570068359375, 16.045642852783203, 16.975717544555664, 17.905790328979492, 18.83586311340332, 19.76593780517578, 20.69601058959961, 21.626083374023438, 22.556156158447266, 23.486228942871094, 24.416303634643555, 25.346376419067383, 26.27644920349121, 27.206523895263672, 28.1365966796875, 29.066669464111328, 29.99674415588379]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 9.0, 5.0, 7.0, 7.0, 4.0, 9.0, 7.0, 17.0, 10.0, 18.0, 16.0, 20.0, 18.0, 37.0, 28.0, 40.0, 31.0, 35.0, 43.0, 37.0, 52.0, 49.0, 55.0, 41.0, 55.0, 42.0, 42.0, 35.0, 27.0, 38.0, 29.0, 18.0, 14.0, 13.0, 15.0, 10.0, 15.0, 6.0, 12.0, 6.0, 13.0, 7.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.054454803466797, -30.05168342590332, -29.04891014099121, -28.046138763427734, -27.043365478515625, -26.04059410095215, -25.037822723388672, -24.035049438476562, -23.032278060913086, -22.02950668334961, -21.0267333984375, -20.023962020874023, -19.021190643310547, -18.018417358398438, -17.01564598083496, -16.012874603271484, -15.010101318359375, -14.007328987121582, -13.004556655883789, -12.001785278320312, -10.99901294708252, -9.996240615844727, -8.99346923828125, -7.990696907043457, -6.987924575805664, -5.985152244567871, -4.982380390167236, -3.9796082973480225, -2.9768362045288086, -1.9740638732910156, -0.9712920188903809, 0.031479835510253906, 1.0342483520507812, 2.037020444869995, 3.039792537689209, 4.042564392089844, 5.045336723327637, 6.04810905456543, 7.0508809089660645, 8.0536527633667, 9.056425094604492, 10.059197425842285, 11.061969757080078, 12.064741134643555, 13.067513465881348, 14.07028579711914, 15.073057174682617, 16.075828552246094, 17.078601837158203, 18.08137321472168, 19.08414649963379, 20.086917877197266, 21.089691162109375, 22.09246253967285, 23.095233917236328, 24.098007202148438, 25.100778579711914, 26.10354995727539, 27.1063232421875, 28.109094619750977, 29.111865997314453, 30.114639282226562, 31.11741065979004, 32.120182037353516, 33.122955322265625]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 6.0, 5.0, 8.0, 5.0, 8.0, 14.0, 18.0, 32.0, 38.0, 59.0, 101.0, 125.0, 168.0, 241.0, 356.0, 517.0, 743.0, 1101.0, 1646.0, 2553.0, 3772.0, 5981.0, 9526.0, 14960.0, 25416.0, 48818.0, 105068.0, 240339.0, 292407.0, 147427.0, 64287.0, 32696.0, 18212.0, 11225.0, 7089.0, 4593.0, 2906.0, 1980.0, 1311.0, 860.0, 573.0, 422.0, 301.0, 185.0, 143.0, 92.0, 78.0, 39.0, 37.0, 20.0, 22.0, 12.0, 6.0, 11.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-32.0625, -31.03466796875, -30.0068359375, -28.97900390625, -27.951171875, -26.92333984375, -25.8955078125, -24.86767578125, -23.83984375, -22.81201171875, -21.7841796875, -20.75634765625, -19.728515625, -18.70068359375, -17.6728515625, -16.64501953125, -15.6171875, -14.58935546875, -13.5615234375, -12.53369140625, -11.505859375, -10.47802734375, -9.4501953125, -8.42236328125, -7.39453125, -6.36669921875, -5.3388671875, -4.31103515625, -3.283203125, -2.25537109375, -1.2275390625, -0.19970703125, 0.828125, 1.85595703125, 2.8837890625, 3.91162109375, 4.939453125, 5.96728515625, 6.9951171875, 8.02294921875, 9.05078125, 10.07861328125, 11.1064453125, 12.13427734375, 13.162109375, 14.18994140625, 15.2177734375, 16.24560546875, 17.2734375, 18.30126953125, 19.3291015625, 20.35693359375, 21.384765625, 22.41259765625, 23.4404296875, 24.46826171875, 25.49609375, 26.52392578125, 27.5517578125, 28.57958984375, 29.607421875, 30.63525390625, 31.6630859375, 32.69091796875, 33.71875]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 3.0, 7.0, 6.0, 13.0, 10.0, 12.0, 14.0, 17.0, 22.0, 19.0, 26.0, 31.0, 29.0, 32.0, 42.0, 44.0, 40.0, 46.0, 51.0, 63.0, 50.0, 42.0, 56.0, 34.0, 39.0, 31.0, 33.0, 22.0, 26.0, 17.0, 19.0, 14.0, 15.0, 11.0, 7.0, 9.0, 12.0, 9.0, 5.0, 7.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-34.15625, -33.1005859375, -32.044921875, -30.9892578125, -29.93359375, -28.8779296875, -27.822265625, -26.7666015625, -25.7109375, -24.6552734375, -23.599609375, -22.5439453125, -21.48828125, -20.4326171875, -19.376953125, -18.3212890625, -17.265625, -16.2099609375, -15.154296875, -14.0986328125, -13.04296875, -11.9873046875, -10.931640625, -9.8759765625, -8.8203125, -7.7646484375, -6.708984375, -5.6533203125, -4.59765625, -3.5419921875, -2.486328125, -1.4306640625, -0.375, 0.6806640625, 1.736328125, 2.7919921875, 3.84765625, 4.9033203125, 5.958984375, 7.0146484375, 8.0703125, 9.1259765625, 10.181640625, 11.2373046875, 12.29296875, 13.3486328125, 14.404296875, 15.4599609375, 16.515625, 17.5712890625, 18.626953125, 19.6826171875, 20.73828125, 21.7939453125, 22.849609375, 23.9052734375, 24.9609375, 26.0166015625, 27.072265625, 28.1279296875, 29.18359375, 30.2392578125, 31.294921875, 32.3505859375, 33.40625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 17.0, 17.0, 16.0, 29.0, 47.0, 50.0, 118.0, 138.0, 249.0, 353.0, 557.0, 880.0, 1354.0, 2270.0, 3489.0, 5766.0, 9485.0, 16972.0, 30826.0, 59804.0, 131418.0, 295401.0, 261038.0, 111128.0, 52370.0, 27178.0, 14942.0, 8773.0, 5140.0, 3155.0, 2016.0, 1257.0, 792.0, 521.0, 339.0, 211.0, 136.0, 103.0, 63.0, 45.0, 32.0, 14.0, 12.0, 8.0, 9.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.5625, -45.0556640625, -43.548828125, -42.0419921875, -40.53515625, -39.0283203125, -37.521484375, -36.0146484375, -34.5078125, -33.0009765625, -31.494140625, -29.9873046875, -28.48046875, -26.9736328125, -25.466796875, -23.9599609375, -22.453125, -20.9462890625, -19.439453125, -17.9326171875, -16.42578125, -14.9189453125, -13.412109375, -11.9052734375, -10.3984375, -8.8916015625, -7.384765625, -5.8779296875, -4.37109375, -2.8642578125, -1.357421875, 0.1494140625, 1.65625, 3.1630859375, 4.669921875, 6.1767578125, 7.68359375, 9.1904296875, 10.697265625, 12.2041015625, 13.7109375, 15.2177734375, 16.724609375, 18.2314453125, 19.73828125, 21.2451171875, 22.751953125, 24.2587890625, 25.765625, 27.2724609375, 28.779296875, 30.2861328125, 31.79296875, 33.2998046875, 34.806640625, 36.3134765625, 37.8203125, 39.3271484375, 40.833984375, 42.3408203125, 43.84765625, 45.3544921875, 46.861328125, 48.3681640625, 49.875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 8.0, 7.0, 14.0, 15.0, 9.0, 12.0, 21.0, 25.0, 28.0, 30.0, 20.0, 50.0, 48.0, 41.0, 50.0, 65.0, 59.0, 46.0, 45.0, 51.0, 38.0, 41.0, 44.0, 44.0, 34.0, 33.0, 19.0, 15.0, 16.0, 13.0, 11.0, 12.0, 8.0, 9.0, 4.0, 1.0, 1.0, 5.0, 1.0, 5.0, 0.0, 2.0, 2.0], "bins": [-25.921875, -25.244140625, -24.56640625, -23.888671875, -23.2109375, -22.533203125, -21.85546875, -21.177734375, -20.5, -19.822265625, -19.14453125, -18.466796875, -17.7890625, -17.111328125, -16.43359375, -15.755859375, -15.078125, -14.400390625, -13.72265625, -13.044921875, -12.3671875, -11.689453125, -11.01171875, -10.333984375, -9.65625, -8.978515625, -8.30078125, -7.623046875, -6.9453125, -6.267578125, -5.58984375, -4.912109375, -4.234375, -3.556640625, -2.87890625, -2.201171875, -1.5234375, -0.845703125, -0.16796875, 0.509765625, 1.1875, 1.865234375, 2.54296875, 3.220703125, 3.8984375, 4.576171875, 5.25390625, 5.931640625, 6.609375, 7.287109375, 7.96484375, 8.642578125, 9.3203125, 9.998046875, 10.67578125, 11.353515625, 12.03125, 12.708984375, 13.38671875, 14.064453125, 14.7421875, 15.419921875, 16.09765625, 16.775390625, 17.453125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 5.0, 9.0, 5.0, 11.0, 15.0, 21.0, 34.0, 41.0, 67.0, 88.0, 153.0, 241.0, 397.0, 596.0, 1017.0, 1642.0, 2805.0, 4820.0, 8408.0, 15542.0, 27817.0, 48380.0, 80549.0, 119576.0, 153512.0, 163416.0, 145554.0, 108224.0, 70120.0, 41680.0, 23395.0, 12969.0, 7094.0, 4094.0, 2399.0, 1423.0, 846.0, 559.0, 356.0, 233.0, 162.0, 91.0, 58.0, 40.0, 23.0, 17.0, 24.0, 14.0, 11.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.6640625, -4.50518798828125, -4.3463134765625, -4.18743896484375, -4.028564453125, -3.86968994140625, -3.7108154296875, -3.55194091796875, -3.39306640625, -3.23419189453125, -3.0753173828125, -2.91644287109375, -2.757568359375, -2.59869384765625, -2.4398193359375, -2.28094482421875, -2.1220703125, -1.96319580078125, -1.8043212890625, -1.64544677734375, -1.486572265625, -1.32769775390625, -1.1688232421875, -1.00994873046875, -0.85107421875, -0.69219970703125, -0.5333251953125, -0.37445068359375, -0.215576171875, -0.05670166015625, 0.1021728515625, 0.26104736328125, 0.419921875, 0.57879638671875, 0.7376708984375, 0.89654541015625, 1.055419921875, 1.21429443359375, 1.3731689453125, 1.53204345703125, 1.69091796875, 1.84979248046875, 2.0086669921875, 2.16754150390625, 2.326416015625, 2.48529052734375, 2.6441650390625, 2.80303955078125, 2.9619140625, 3.12078857421875, 3.2796630859375, 3.43853759765625, 3.597412109375, 3.75628662109375, 3.9151611328125, 4.07403564453125, 4.23291015625, 4.39178466796875, 4.5506591796875, 4.70953369140625, 4.868408203125, 5.02728271484375, 5.1861572265625, 5.34503173828125, 5.50390625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 7.0, 12.0, 13.0, 11.0, 13.0, 17.0, 35.0, 19.0, 29.0, 48.0, 54.0, 54.0, 52.0, 70.0, 43.0, 57.0, 57.0, 42.0, 42.0, 42.0, 44.0, 44.0, 32.0, 32.0, 20.0, 21.0, 25.0, 13.0, 10.0, 11.0, 2.0, 3.0, 4.0, 7.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 3.0], "bins": [-0.0007028579711914062, -0.0006839483976364136, -0.0006650388240814209, -0.0006461292505264282, -0.0006272196769714355, -0.0006083101034164429, -0.0005894005298614502, -0.0005704909563064575, -0.0005515813827514648, -0.0005326718091964722, -0.0005137622356414795, -0.0004948526620864868, -0.00047594308853149414, -0.00045703351497650146, -0.0004381239414215088, -0.0004192143678665161, -0.00040030479431152344, -0.00038139522075653076, -0.0003624856472015381, -0.0003435760736465454, -0.00032466650009155273, -0.00030575692653656006, -0.0002868473529815674, -0.0002679377794265747, -0.00024902820587158203, -0.00023011863231658936, -0.00021120905876159668, -0.000192299485206604, -0.00017338991165161133, -0.00015448033809661865, -0.00013557076454162598, -0.0001166611909866333, -9.775161743164062e-05, -7.884204387664795e-05, -5.9932470321655273e-05, -4.10228967666626e-05, -2.2113323211669922e-05, -3.203749656677246e-06, 1.570582389831543e-05, 3.4615397453308105e-05, 5.352497100830078e-05, 7.243454456329346e-05, 9.134411811828613e-05, 0.00011025369167327881, 0.00012916326522827148, 0.00014807283878326416, 0.00016698241233825684, 0.0001858919858932495, 0.0002048015594482422, 0.00022371113300323486, 0.00024262070655822754, 0.0002615302801132202, 0.0002804398536682129, 0.00029934942722320557, 0.00031825900077819824, 0.0003371685743331909, 0.0003560781478881836, 0.00037498772144317627, 0.00039389729499816895, 0.0004128068685531616, 0.0004317164421081543, 0.00045062601566314697, 0.00046953558921813965, 0.0004884451627731323, 0.000507354736328125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 5.0, 4.0, 5.0, 6.0, 8.0, 13.0, 27.0, 29.0, 56.0, 62.0, 97.0, 134.0, 207.0, 271.0, 403.0, 687.0, 1057.0, 1704.0, 2725.0, 4635.0, 7976.0, 14259.0, 24647.0, 42698.0, 69872.0, 104805.0, 138766.0, 156467.0, 148825.0, 119152.0, 82871.0, 53025.0, 30931.0, 17576.0, 9941.0, 5751.0, 3246.0, 2004.0, 1294.0, 830.0, 494.0, 314.0, 227.0, 142.0, 97.0, 79.0, 38.0, 31.0, 26.0, 18.0, 13.0, 7.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.7421875, -4.59259033203125, -4.4429931640625, -4.29339599609375, -4.143798828125, -3.99420166015625, -3.8446044921875, -3.69500732421875, -3.54541015625, -3.39581298828125, -3.2462158203125, -3.09661865234375, -2.947021484375, -2.79742431640625, -2.6478271484375, -2.49822998046875, -2.3486328125, -2.19903564453125, -2.0494384765625, -1.89984130859375, -1.750244140625, -1.60064697265625, -1.4510498046875, -1.30145263671875, -1.15185546875, -1.00225830078125, -0.8526611328125, -0.70306396484375, -0.553466796875, -0.40386962890625, -0.2542724609375, -0.10467529296875, 0.044921875, 0.19451904296875, 0.3441162109375, 0.49371337890625, 0.643310546875, 0.79290771484375, 0.9425048828125, 1.09210205078125, 1.24169921875, 1.39129638671875, 1.5408935546875, 1.69049072265625, 1.840087890625, 1.98968505859375, 2.1392822265625, 2.28887939453125, 2.4384765625, 2.58807373046875, 2.7376708984375, 2.88726806640625, 3.036865234375, 3.18646240234375, 3.3360595703125, 3.48565673828125, 3.63525390625, 3.78485107421875, 3.9344482421875, 4.08404541015625, 4.233642578125, 4.38323974609375, 4.5328369140625, 4.68243408203125, 4.83203125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 9.0, 4.0, 10.0, 9.0, 12.0, 16.0, 18.0, 26.0, 30.0, 36.0, 31.0, 40.0, 52.0, 54.0, 44.0, 55.0, 51.0, 63.0, 38.0, 55.0, 41.0, 62.0, 45.0, 33.0, 38.0, 34.0, 21.0, 25.0, 6.0, 9.0, 7.0, 11.0, 5.0, 6.0, 1.0, 4.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.93359375, -1.88006591796875, -1.8265380859375, -1.77301025390625, -1.719482421875, -1.66595458984375, -1.6124267578125, -1.55889892578125, -1.50537109375, -1.45184326171875, -1.3983154296875, -1.34478759765625, -1.291259765625, -1.23773193359375, -1.1842041015625, -1.13067626953125, -1.0771484375, -1.02362060546875, -0.9700927734375, -0.91656494140625, -0.863037109375, -0.80950927734375, -0.7559814453125, -0.70245361328125, -0.64892578125, -0.59539794921875, -0.5418701171875, -0.48834228515625, -0.434814453125, -0.38128662109375, -0.3277587890625, -0.27423095703125, -0.220703125, -0.16717529296875, -0.1136474609375, -0.06011962890625, -0.006591796875, 0.04693603515625, 0.1004638671875, 0.15399169921875, 0.20751953125, 0.26104736328125, 0.3145751953125, 0.36810302734375, 0.421630859375, 0.47515869140625, 0.5286865234375, 0.58221435546875, 0.6357421875, 0.68927001953125, 0.7427978515625, 0.79632568359375, 0.849853515625, 0.90338134765625, 0.9569091796875, 1.01043701171875, 1.06396484375, 1.11749267578125, 1.1710205078125, 1.22454833984375, 1.278076171875, 1.33160400390625, 1.3851318359375, 1.43865966796875, 1.4921875]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 10.0, 3.0, 5.0, 8.0, 11.0, 14.0, 20.0, 30.0, 25.0, 35.0, 40.0, 47.0, 48.0, 59.0, 64.0, 83.0, 69.0, 59.0, 70.0, 56.0, 35.0, 32.0, 30.0, 28.0, 24.0, 23.0, 8.0, 9.0, 14.0, 11.0, 14.0, 8.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-43.41062927246094, -42.239784240722656, -41.068939208984375, -39.89809036254883, -38.72724533081055, -37.556400299072266, -36.385555267333984, -35.21470642089844, -34.043861389160156, -32.873016357421875, -31.70216941833496, -30.53132438659668, -29.360477447509766, -28.189632415771484, -27.018787384033203, -25.84794044494629, -24.677095413208008, -23.506250381469727, -22.335403442382812, -21.16455841064453, -19.993711471557617, -18.822866439819336, -17.652019500732422, -16.48117446899414, -15.310328483581543, -14.139482498168945, -12.968636512756348, -11.79779052734375, -10.626945495605469, -9.456098556518555, -8.285253524780273, -7.114407539367676, -5.943563461303711, -4.772717475891113, -3.6018717288970947, -2.431025981903076, -1.2601799964904785, -0.08933401107788086, 1.0815114974975586, 2.2523574829101562, 3.423203468322754, 4.594049453735352, 5.764895439147949, 6.935740947723389, 8.106586456298828, 9.277433395385742, 10.448278427124023, 11.619124412536621, 12.789970397949219, 13.960816383361816, 15.131662368774414, 16.302507400512695, 17.47335433959961, 18.64419937133789, 19.815044403076172, 20.985891342163086, 22.15673828125, 23.32758331298828, 24.498430252075195, 25.669275283813477, 26.84012222290039, 28.010967254638672, 29.181812286376953, 30.352659225463867, 31.52350425720215]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 8.0, 8.0, 6.0, 11.0, 8.0, 10.0, 10.0, 24.0, 23.0, 33.0, 33.0, 36.0, 45.0, 42.0, 44.0, 70.0, 57.0, 48.0, 44.0, 64.0, 52.0, 40.0, 41.0, 41.0, 35.0, 27.0, 31.0, 17.0, 22.0, 12.0, 19.0, 8.0, 5.0, 9.0, 7.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.582157135009766, -43.029502868652344, -41.47685241699219, -39.92420196533203, -38.37154769897461, -36.81889343261719, -35.26624298095703, -33.713592529296875, -32.16093826293945, -30.608285903930664, -29.055633544921875, -27.502981185913086, -25.950328826904297, -24.397676467895508, -22.84502410888672, -21.29237174987793, -19.73971939086914, -18.18706703186035, -16.634414672851562, -15.081762313842773, -13.529109954833984, -11.976457595825195, -10.423805236816406, -8.871152877807617, -7.318500518798828, -5.765848159790039, -4.21319580078125, -2.660543441772461, -1.1078910827636719, 0.4447612762451172, 1.9974136352539062, 3.5500659942626953, 5.102718353271484, 6.655370712280273, 8.208023071289062, 9.760675430297852, 11.31332778930664, 12.86598014831543, 14.418632507324219, 15.971284866333008, 17.523937225341797, 19.076589584350586, 20.629241943359375, 22.181894302368164, 23.734546661376953, 25.287199020385742, 26.83985137939453, 28.39250373840332, 29.94515609741211, 31.4978084564209, 33.05046081542969, 34.603111267089844, 36.155765533447266, 37.70841979980469, 39.261070251464844, 40.813720703125, 42.36637496948242, 43.919029235839844, 45.4716796875, 47.024330139160156, 48.57698440551758, 50.129638671875, 51.682289123535156, 53.23493957519531, 54.787593841552734]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 10.0, 14.0, 26.0, 32.0, 37.0, 37.0, 63.0, 95.0, 120.0, 155.0, 218.0, 333.0, 442.0, 715.0, 1110.0, 1809.0, 2827.0, 4963.0, 8043.0, 483571.0, 7481.0, 4581.0, 2681.0, 1675.0, 1007.0, 625.0, 472.0, 309.0, 194.0, 164.0, 127.0, 73.0, 61.0, 50.0, 32.0, 27.0, 27.0, 12.0, 11.0, 9.0, 5.0, 5.0, 4.0, 6.0, 0.0, 2.0, 0.0, 2.0], "bins": [-348.1280212402344, -338.3028259277344, -328.4776306152344, -318.6524658203125, -308.8272705078125, -299.0020751953125, -289.1768798828125, -279.3516845703125, -269.5265197753906, -259.7013244628906, -249.8761444091797, -240.0509490966797, -230.22576904296875, -220.40057373046875, -210.57537841796875, -200.7501983642578, -190.9250030517578, -181.0998077392578, -171.27462768554688, -161.44943237304688, -151.62425231933594, -141.79905700683594, -131.973876953125, -122.148681640625, -112.32349395751953, -102.49830627441406, -92.6731185913086, -82.84793090820312, -73.02273559570312, -63.19755172729492, -53.37236022949219, -43.54717254638672, -33.72198486328125, -23.89679718017578, -14.07160758972168, -4.246417999267578, 5.578769683837891, 15.40395736694336, 25.229148864746094, 35.05433654785156, 44.87952423095703, 54.7047119140625, 64.52989959716797, 74.35508728027344, 84.18028259277344, 94.00546264648438, 103.83065795898438, 113.65584564208984, 123.48103332519531, 133.3062286376953, 143.13140869140625, 152.95660400390625, 162.7817840576172, 172.6069793701172, 182.43215942382812, 192.25735473632812, 202.08255004882812, 211.90774536132812, 221.73292541503906, 231.55812072753906, 241.38330078125, 251.20849609375, 261.03369140625, 270.85888671875, 280.6840515136719]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 9.0, 8.0, 4.0, 12.0, 7.0, 9.0, 12.0, 25.0, 21.0, 32.0, 34.0, 32.0, 49.0, 43.0, 43.0, 72.0, 56.0, 1072.0, 48.0, 63.0, 50.0, 40.0, 40.0, 38.0, 37.0, 27.0, 33.0, 18.0, 22.0, 12.0, 16.0, 9.0, 5.0, 9.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1329.7415771484375, -1283.6824951171875, -1237.6234130859375, -1191.5643310546875, -1145.5052490234375, -1099.4461669921875, -1053.3870849609375, -1007.3280029296875, -961.2689208984375, -915.2098388671875, -869.1507568359375, -823.0916748046875, -777.0325927734375, -730.9735107421875, -684.9144287109375, -638.8553466796875, -592.7962036132812, -546.7371215820312, -500.67803955078125, -454.61895751953125, -408.55987548828125, -362.50079345703125, -316.4416809082031, -270.3825988769531, -224.32351684570312, -178.26443481445312, -132.20535278320312, -86.14625549316406, -40.08717346191406, 5.9719085693359375, 52.031005859375, 98.090087890625, 144.149169921875, 190.208251953125, 236.267333984375, 282.326416015625, 328.385498046875, 374.444580078125, 420.5036926269531, 466.5627746582031, 512.621826171875, 558.680908203125, 604.739990234375, 650.799072265625, 696.858154296875, 742.917236328125, 788.976318359375, 835.035400390625, 881.0945434570312, 927.1536254882812, 973.2127075195312, 1019.2717895507812, 1065.3309326171875, 1111.3900146484375, 1157.4490966796875, 1203.5081787109375, 1249.5672607421875, 1295.6263427734375, 1341.6854248046875, 1387.7445068359375, 1433.8035888671875, 1479.8626708984375, 1525.9217529296875, 1571.9808349609375, 1618.0399169921875]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 10.0, 11.0, 18.0, 23.0, 43.0, 75.0, 83.0, 121.0, 204.0, 287.0, 563.0, 726.0, 963.0, 1404.0, 2184.0, 3749.0, 6074.0, 9754.0, 13289.0, 18621.0, 38198.0, 31013724.0, 70807.0, 41137.0, 15300.0, 7032.0, 3803.0, 2438.0, 1429.0, 792.0, 442.0, 334.0, 204.0, 141.0, 110.0, 93.0, 56.0, 48.0, 36.0, 35.0, 25.0, 15.0, 17.0, 18.0, 17.0, 17.0, 12.0, 8.0, 4.0, 4.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-299.2801818847656, -288.4181213378906, -277.5560607910156, -266.6940002441406, -255.83193969726562, -244.96987915039062, -234.10781860351562, -223.24575805664062, -212.38369750976562, -201.52163696289062, -190.65957641601562, -179.79751586914062, -168.93545532226562, -158.07339477539062, -147.21133422851562, -136.34927368164062, -125.48721313476562, -114.62515258789062, -103.76309204101562, -92.90103149414062, -82.03897094726562, -71.17691040039062, -60.314849853515625, -49.452789306640625, -38.590728759765625, -27.728668212890625, -16.866607666015625, -6.004547119140625, 4.857513427734375, 15.719573974609375, 26.581634521484375, 37.443695068359375, 48.305755615234375, 59.167816162109375, 70.02987670898438, 80.89193725585938, 91.75399780273438, 102.61605834960938, 113.47811889648438, 124.34017944335938, 135.20223999023438, 146.06430053710938, 156.92636108398438, 167.78842163085938, 178.65048217773438, 189.51254272460938, 200.37460327148438, 211.23666381835938, 222.09872436523438, 232.96078491210938, 243.82284545898438, 254.68490600585938, 265.5469665527344, 276.4090270996094, 287.2710876464844, 298.1331481933594, 308.9952087402344, 319.8572692871094, 330.7193298339844, 341.5813903808594, 352.4434509277344, 363.3055114746094, 374.1675720214844, 385.0296325683594, 395.8916931152344]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 6.0, 10.0, 22.0, 91.0, 470.0, 291.0, 53.0, 28.0, 13.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.5965576171875, -143.79571533203125, -139.994873046875, -136.1940155029297, -132.39317321777344, -128.5923309326172, -124.79148864746094, -120.99063873291016, -117.1897964477539, -113.38895416259766, -109.58810424804688, -105.78726196289062, -101.98641204833984, -98.1855697631836, -94.38471984863281, -90.58387756347656, -86.78303527832031, -82.98219299316406, -79.18134307861328, -75.38050079345703, -71.57965087890625, -67.77880859375, -63.977962493896484, -60.17711639404297, -56.37626647949219, -52.57542037963867, -48.774574279785156, -44.973731994628906, -41.17288589477539, -37.372039794921875, -33.57119369506836, -29.770349502563477, -25.969505310058594, -22.168659210205078, -18.367815017700195, -14.56696891784668, -10.76612377166748, -6.965278625488281, -3.1644325256347656, 0.6364116668701172, 4.437257766723633, 8.238102912902832, 12.038948059082031, 15.839794158935547, 19.640640258789062, 23.441484451293945, 27.24233055114746, 31.043174743652344, 34.84402084350586, 38.644866943359375, 42.44571304321289, 46.246559143066406, 50.047401428222656, 53.84824752807617, 57.64909362792969, 61.44993591308594, 65.25078582763672, 69.05162811279297, 72.85247802734375, 76.6533203125, 80.45417022705078, 84.25501251220703, 88.05586242675781, 91.85670471191406, 95.65754699707031]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 8.0, 15.0, 11.0, 16.0, 27.0, 72.0, 131.0, 201.0, 192.0, 135.0, 86.0, 40.0, 28.0, 9.0, 6.0, 9.0, 4.0, 2.0, 3.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.42645263671875, -153.40916442871094, -149.3918914794922, -145.37460327148438, -141.35733032226562, -137.3400421142578, -133.32276916503906, -129.30548095703125, -125.28820037841797, -121.27091979980469, -117.2536392211914, -113.23635864257812, -109.21907043457031, -105.20179748535156, -101.18450927734375, -97.16722869873047, -93.14994812011719, -89.1326675415039, -85.11538696289062, -81.09810638427734, -77.08082580566406, -73.06353759765625, -69.04625701904297, -65.02897644042969, -61.011695861816406, -56.994415283203125, -52.977134704589844, -48.9598503112793, -44.942569732666016, -40.925289154052734, -36.90800476074219, -32.890724182128906, -28.873443603515625, -24.856163024902344, -20.83888053894043, -16.821598052978516, -12.804317474365234, -8.787036895751953, -4.769754409790039, -0.752471923828125, 3.2648086547851562, 7.282090187072754, 11.299371719360352, 15.31665325164795, 19.333934783935547, 23.351215362548828, 27.368497848510742, 31.385780334472656, 35.40306091308594, 39.42034149169922, 43.4376220703125, 47.45490646362305, 51.47218704223633, 55.48946762084961, 59.506752014160156, 63.52403259277344, 67.54131317138672, 71.55859375, 75.57587432861328, 79.59315490722656, 83.61044311523438, 87.62771606445312, 91.64500427246094, 95.66228485107422, 99.6795654296875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 6.0, 2.0, 6.0, 4.0, 4.0, 7.0, 14.0, 19.0, 29.0, 17.0, 29.0, 33.0, 20.0, 39.0, 29.0, 57.0, 56.0, 56.0, 73.0, 85.0, 117.0, 155.0, 190.0, 247.0, 319.0, 452.0, 722.0, 1164.0, 2176.0, 3980.0, 8557.0, 21086.0, 63934.0, 3314800.0, 693299.0, 48108.0, 17932.0, 7990.0, 3779.0, 2071.0, 1221.0, 667.0, 326.0, 187.0, 109.0, 54.0, 30.0, 18.0, 10.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.755859375, -1.7167816162109375, -1.677703857421875, -1.6386260986328125, -1.59954833984375, -1.5604705810546875, -1.521392822265625, -1.4823150634765625, -1.4432373046875, -1.4041595458984375, -1.365081787109375, -1.3260040283203125, -1.28692626953125, -1.2478485107421875, -1.208770751953125, -1.1696929931640625, -1.130615234375, -1.0915374755859375, -1.052459716796875, -1.0133819580078125, -0.97430419921875, -0.9352264404296875, -0.896148681640625, -0.8570709228515625, -0.8179931640625, -0.7789154052734375, -0.739837646484375, -0.7007598876953125, -0.66168212890625, -0.6226043701171875, -0.583526611328125, -0.5444488525390625, -0.50537109375, -0.4662933349609375, -0.427215576171875, -0.3881378173828125, -0.34906005859375, -0.3099822998046875, -0.270904541015625, -0.2318267822265625, -0.1927490234375, -0.1536712646484375, -0.114593505859375, -0.0755157470703125, -0.03643798828125, 0.0026397705078125, 0.041717529296875, 0.0807952880859375, 0.119873046875, 0.1589508056640625, 0.198028564453125, 0.2371063232421875, 0.27618408203125, 0.3152618408203125, 0.354339599609375, 0.3934173583984375, 0.4324951171875, 0.4715728759765625, 0.510650634765625, 0.5497283935546875, 0.58880615234375, 0.6278839111328125, 0.666961669921875, 0.7060394287109375, 0.7451171875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 7.0, 10.0, 22.0, 18.0, 19.0, 53.0, 747.0, 45.0, 29.0, 11.0, 8.0, 8.0, 9.0, 8.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.3857421875, -0.37792110443115234, -0.3701000213623047, -0.36227893829345703, -0.3544578552246094, -0.3466367721557617, -0.33881568908691406, -0.3309946060180664, -0.32317352294921875, -0.3153524398803711, -0.30753135681152344, -0.2997102737426758, -0.2918891906738281, -0.28406810760498047, -0.2762470245361328, -0.26842594146728516, -0.2606048583984375, -0.25278377532958984, -0.2449626922607422, -0.23714160919189453, -0.22932052612304688, -0.22149944305419922, -0.21367835998535156, -0.2058572769165039, -0.19803619384765625, -0.1902151107788086, -0.18239402770996094, -0.17457294464111328, -0.16675186157226562, -0.15893077850341797, -0.1511096954345703, -0.14328861236572266, -0.135467529296875, -0.12764644622802734, -0.11982536315917969, -0.11200428009033203, -0.10418319702148438, -0.09636211395263672, -0.08854103088378906, -0.0807199478149414, -0.07289886474609375, -0.0650777816772461, -0.05725669860839844, -0.04943561553955078, -0.041614532470703125, -0.03379344940185547, -0.025972366333007812, -0.018151283264160156, -0.0103302001953125, -0.0025091171264648438, 0.0053119659423828125, 0.013133049011230469, 0.020954132080078125, 0.02877521514892578, 0.03659629821777344, 0.044417381286621094, 0.05223846435546875, 0.060059547424316406, 0.06788063049316406, 0.07570171356201172, 0.08352279663085938, 0.09134387969970703, 0.09916496276855469, 0.10698604583740234, 0.11480712890625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 8.0, 12.0, 16.0, 21.0, 30.0, 28.0, 45.0, 62.0, 87.0, 156.0, 271.0, 378.0, 587.0, 943.0, 1669.0, 2921.0, 5647.0, 12505.0, 30769.0, 95484.0, 431295.0, 2904333.0, 527034.0, 112617.0, 36648.0, 14821.0, 6976.0, 3581.0, 2002.0, 1207.0, 693.0, 448.0, 306.0, 203.0, 156.0, 84.0, 63.0, 42.0, 43.0, 22.0, 25.0, 15.0, 6.0, 7.0, 8.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.77978515625, -0.7565460205078125, -0.733306884765625, -0.7100677490234375, -0.68682861328125, -0.6635894775390625, -0.640350341796875, -0.6171112060546875, -0.5938720703125, -0.5706329345703125, -0.547393798828125, -0.5241546630859375, -0.50091552734375, -0.4776763916015625, -0.454437255859375, -0.4311981201171875, -0.407958984375, -0.3847198486328125, -0.361480712890625, -0.3382415771484375, -0.31500244140625, -0.2917633056640625, -0.268524169921875, -0.2452850341796875, -0.2220458984375, -0.1988067626953125, -0.175567626953125, -0.1523284912109375, -0.12908935546875, -0.1058502197265625, -0.082611083984375, -0.0593719482421875, -0.0361328125, -0.0128936767578125, 0.010345458984375, 0.0335845947265625, 0.05682373046875, 0.0800628662109375, 0.103302001953125, 0.1265411376953125, 0.1497802734375, 0.1730194091796875, 0.196258544921875, 0.2194976806640625, 0.24273681640625, 0.2659759521484375, 0.289215087890625, 0.3124542236328125, 0.335693359375, 0.3589324951171875, 0.382171630859375, 0.4054107666015625, 0.42864990234375, 0.4518890380859375, 0.475128173828125, 0.4983673095703125, 0.5216064453125, 0.5448455810546875, 0.568084716796875, 0.5913238525390625, 0.61456298828125, 0.6378021240234375, 0.661041259765625, 0.6842803955078125, 0.70751953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 15.0, 15.0, 21.0, 37.0, 34.0, 35.0, 54.0, 70.0, 85.0, 113.0, 149.0, 190.0, 215.0, 282.0, 461.0, 722.0, 349.0, 233.0, 211.0, 155.0, 109.0, 121.0, 65.0, 66.0, 55.0, 43.0, 29.0, 21.0, 27.0, 14.0, 15.0, 17.0, 17.0, 5.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19921875, -0.19218063354492188, -0.18514251708984375, -0.17810440063476562, -0.1710662841796875, -0.16402816772460938, -0.15699005126953125, -0.14995193481445312, -0.142913818359375, -0.13587570190429688, -0.12883758544921875, -0.12179946899414062, -0.1147613525390625, -0.10772323608398438, -0.10068511962890625, -0.09364700317382812, -0.08660888671875, -0.07957077026367188, -0.07253265380859375, -0.06549453735351562, -0.0584564208984375, -0.051418304443359375, -0.04438018798828125, -0.037342071533203125, -0.030303955078125, -0.023265838623046875, -0.01622772216796875, -0.009189605712890625, -0.0021514892578125, 0.004886627197265625, 0.01192474365234375, 0.018962860107421875, 0.0260009765625, 0.033039093017578125, 0.04007720947265625, 0.047115325927734375, 0.0541534423828125, 0.061191558837890625, 0.06822967529296875, 0.07526779174804688, 0.082305908203125, 0.08934402465820312, 0.09638214111328125, 0.10342025756835938, 0.1104583740234375, 0.11749649047851562, 0.12453460693359375, 0.13157272338867188, 0.13861083984375, 0.14564895629882812, 0.15268707275390625, 0.15972518920898438, 0.1667633056640625, 0.17380142211914062, 0.18083953857421875, 0.18787765502929688, 0.194915771484375, 0.20195388793945312, 0.20899200439453125, 0.21603012084960938, 0.2230682373046875, 0.23010635375976562, 0.23714447021484375, 0.24418258666992188, 0.251220703125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 11.0, 47.0, 118.0, 347.0, 279.0, 112.0, 54.0, 25.0, 6.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.027087688446045, -2.856955051422119, -2.6868224143981934, -2.5166897773742676, -2.346557140350342, -2.176424503326416, -2.0062918663024902, -1.836159348487854, -1.6660267114639282, -1.4958940744400024, -1.3257614374160767, -1.1556289196014404, -0.9854962229728699, -0.8153635859489441, -0.6452310085296631, -0.4750983715057373, -0.3049657344818115, -0.13483311235904694, 0.03529950976371765, 0.20543211698532104, 0.3755647540092468, 0.5456973910331726, 0.7158299684524536, 0.8859626054763794, 1.0560952425003052, 1.226227879524231, 1.3963605165481567, 1.566493034362793, 1.7366256713867188, 1.9067583084106445, 2.0768909454345703, 2.247023582458496, 2.417156219482422, 2.5872888565063477, 2.7574214935302734, 2.927554130554199, 3.097686767578125, 3.267819404602051, 3.4379520416259766, 3.6080846786499023, 3.778217315673828, 3.948349952697754, 4.11848258972168, 4.2886152267456055, 4.458747863769531, 4.628880500793457, 4.799013137817383, 4.969145774841309, 5.139278411865234, 5.30941104888916, 5.479543685913086, 5.649676322937012, 5.8198089599609375, 5.989941596984863, 6.160074234008789, 6.330206871032715, 6.500339031219482, 6.670471668243408, 6.840604305267334, 7.01073694229126, 7.1808695793151855, 7.351002216339111, 7.521134853363037, 7.691267490386963, 7.861400127410889]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 9.0, 7.0, 22.0, 29.0, 30.0, 30.0, 61.0, 61.0, 65.0, 70.0, 88.0, 62.0, 67.0, 77.0, 72.0, 64.0, 51.0, 38.0, 31.0, 23.0, 14.0, 12.0, 6.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.032721519470215, -1.9488803148269653, -1.8650391101837158, -1.7811980247497559, -1.6973568201065063, -1.6135156154632568, -1.5296745300292969, -1.4458333253860474, -1.3619921207427979, -1.2781509160995483, -1.1943097114562988, -1.1104686260223389, -1.0266274213790894, -0.9427862167358398, -0.8589450716972351, -0.7751039266586304, -0.6912627220153809, -0.6074215173721313, -0.5235803723335266, -0.4397391974925995, -0.35589802265167236, -0.27205684781074524, -0.18821567296981812, -0.10437452793121338, -0.020533323287963867, 0.06330785155296326, 0.14714902639389038, 0.2309902012348175, 0.31483137607574463, 0.39867255091667175, 0.4825137257575989, 0.5663548707962036, 0.6501960754394531, 0.7340372800827026, 0.8178784251213074, 0.9017195701599121, 0.9855607748031616, 1.0694019794464111, 1.153243064880371, 1.2370842695236206, 1.3209254741668701, 1.4047666788101196, 1.4886078834533691, 1.572448968887329, 1.6562901735305786, 1.7401313781738281, 1.823972463607788, 1.9078136682510376, 1.991654872894287, 2.075495958328247, 2.159337282180786, 2.243178367614746, 2.327019691467285, 2.410860776901245, 2.494701862335205, 2.578543186187744, 2.662384271621704, 2.746225357055664, 2.830066680908203, 2.913907766342163, 2.997748851776123, 3.081590175628662, 3.165431261062622, 3.249272346496582, 3.333113670349121]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 5.0, 3.0, 5.0, 6.0, 8.0, 7.0, 9.0, 13.0, 11.0, 14.0, 24.0, 38.0, 56.0, 70.0, 117.0, 207.0, 389.0, 804.0, 1816.0, 4403.0, 11903.0, 59108.0, 870084.0, 77505.0, 13331.0, 4767.0, 1957.0, 870.0, 434.0, 220.0, 123.0, 69.0, 44.0, 40.0, 23.0, 14.0, 17.0, 5.0, 7.0, 10.0, 6.0, 6.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3369140625, -1.29315185546875, -1.2493896484375, -1.20562744140625, -1.161865234375, -1.11810302734375, -1.0743408203125, -1.03057861328125, -0.98681640625, -0.94305419921875, -0.8992919921875, -0.85552978515625, -0.811767578125, -0.76800537109375, -0.7242431640625, -0.68048095703125, -0.63671875, -0.59295654296875, -0.5491943359375, -0.50543212890625, -0.461669921875, -0.41790771484375, -0.3741455078125, -0.33038330078125, -0.28662109375, -0.24285888671875, -0.1990966796875, -0.15533447265625, -0.111572265625, -0.06781005859375, -0.0240478515625, 0.01971435546875, 0.0634765625, 0.10723876953125, 0.1510009765625, 0.19476318359375, 0.238525390625, 0.28228759765625, 0.3260498046875, 0.36981201171875, 0.41357421875, 0.45733642578125, 0.5010986328125, 0.54486083984375, 0.588623046875, 0.63238525390625, 0.6761474609375, 0.71990966796875, 0.763671875, 0.80743408203125, 0.8511962890625, 0.89495849609375, 0.938720703125, 0.98248291015625, 1.0262451171875, 1.07000732421875, 1.11376953125, 1.15753173828125, 1.2012939453125, 1.24505615234375, 1.288818359375, 1.33258056640625, 1.3763427734375, 1.42010498046875, 1.4638671875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 8.0, 7.0, 8.0, 13.0, 30.0, 79.0, 175.0, 276.0, 219.0, 91.0, 33.0, 8.0, 10.0, 8.0, 11.0, 8.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.301513671875, -0.2948894500732422, -0.2882652282714844, -0.28164100646972656, -0.27501678466796875, -0.26839256286621094, -0.2617683410644531, -0.2551441192626953, -0.2485198974609375, -0.2418956756591797, -0.23527145385742188, -0.22864723205566406, -0.22202301025390625, -0.21539878845214844, -0.20877456665039062, -0.2021503448486328, -0.195526123046875, -0.1889019012451172, -0.18227767944335938, -0.17565345764160156, -0.16902923583984375, -0.16240501403808594, -0.15578079223632812, -0.1491565704345703, -0.1425323486328125, -0.1359081268310547, -0.12928390502929688, -0.12265968322753906, -0.11603546142578125, -0.10941123962402344, -0.10278701782226562, -0.09616279602050781, -0.08953857421875, -0.08291435241699219, -0.07629013061523438, -0.06966590881347656, -0.06304168701171875, -0.05641746520996094, -0.049793243408203125, -0.04316902160644531, -0.0365447998046875, -0.029920578002929688, -0.023296356201171875, -0.016672134399414062, -0.01004791259765625, -0.0034236907958984375, 0.003200531005859375, 0.009824752807617188, 0.016448974609375, 0.023073196411132812, 0.029697418212890625, 0.03632164001464844, 0.04294586181640625, 0.04957008361816406, 0.056194305419921875, 0.06281852722167969, 0.0694427490234375, 0.07606697082519531, 0.08269119262695312, 0.08931541442871094, 0.09593963623046875, 0.10256385803222656, 0.10918807983398438, 0.11581230163574219, 0.1224365234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 8.0, 5.0, 11.0, 12.0, 23.0, 25.0, 34.0, 51.0, 75.0, 124.0, 222.0, 400.0, 727.0, 1536.0, 3703.0, 11878.0, 71322.0, 787010.0, 144571.0, 18065.0, 4936.0, 1844.0, 858.0, 450.0, 234.0, 160.0, 84.0, 68.0, 35.0, 25.0, 14.0, 17.0, 7.0, 8.0, 9.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6259765625, -1.572906494140625, -1.51983642578125, -1.466766357421875, -1.4136962890625, -1.360626220703125, -1.30755615234375, -1.254486083984375, -1.201416015625, -1.148345947265625, -1.09527587890625, -1.042205810546875, -0.9891357421875, -0.936065673828125, -0.88299560546875, -0.829925537109375, -0.77685546875, -0.723785400390625, -0.67071533203125, -0.617645263671875, -0.5645751953125, -0.511505126953125, -0.45843505859375, -0.405364990234375, -0.352294921875, -0.299224853515625, -0.24615478515625, -0.193084716796875, -0.1400146484375, -0.086944580078125, -0.03387451171875, 0.019195556640625, 0.072265625, 0.125335693359375, 0.17840576171875, 0.231475830078125, 0.2845458984375, 0.337615966796875, 0.39068603515625, 0.443756103515625, 0.496826171875, 0.549896240234375, 0.60296630859375, 0.656036376953125, 0.7091064453125, 0.762176513671875, 0.81524658203125, 0.868316650390625, 0.92138671875, 0.974456787109375, 1.02752685546875, 1.080596923828125, 1.1336669921875, 1.186737060546875, 1.23980712890625, 1.292877197265625, 1.345947265625, 1.399017333984375, 1.45208740234375, 1.505157470703125, 1.5582275390625, 1.611297607421875, 1.66436767578125, 1.717437744140625, 1.7705078125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 5.0, 5.0, 4.0, 8.0, 8.0, 13.0, 9.0, 15.0, 14.0, 23.0, 27.0, 20.0, 28.0, 33.0, 33.0, 35.0, 34.0, 36.0, 30.0, 38.0, 37.0, 43.0, 47.0, 33.0, 46.0, 41.0, 42.0, 35.0, 26.0, 35.0, 33.0, 16.0, 18.0, 21.0, 19.0, 15.0, 19.0, 10.0, 9.0, 9.0, 3.0, 5.0, 6.0, 4.0, 1.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5771484375, -0.557952880859375, -0.53875732421875, -0.519561767578125, -0.5003662109375, -0.481170654296875, -0.46197509765625, -0.442779541015625, -0.423583984375, -0.404388427734375, -0.38519287109375, -0.365997314453125, -0.3468017578125, -0.327606201171875, -0.30841064453125, -0.289215087890625, -0.27001953125, -0.250823974609375, -0.23162841796875, -0.212432861328125, -0.1932373046875, -0.174041748046875, -0.15484619140625, -0.135650634765625, -0.116455078125, -0.097259521484375, -0.07806396484375, -0.058868408203125, -0.0396728515625, -0.020477294921875, -0.00128173828125, 0.017913818359375, 0.037109375, 0.056304931640625, 0.07550048828125, 0.094696044921875, 0.1138916015625, 0.133087158203125, 0.15228271484375, 0.171478271484375, 0.190673828125, 0.209869384765625, 0.22906494140625, 0.248260498046875, 0.2674560546875, 0.286651611328125, 0.30584716796875, 0.325042724609375, 0.34423828125, 0.363433837890625, 0.38262939453125, 0.401824951171875, 0.4210205078125, 0.440216064453125, 0.45941162109375, 0.478607177734375, 0.497802734375, 0.516998291015625, 0.53619384765625, 0.555389404296875, 0.5745849609375, 0.593780517578125, 0.61297607421875, 0.632171630859375, 0.6513671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 2.0, 3.0, 8.0, 12.0, 15.0, 17.0, 19.0, 29.0, 58.0, 78.0, 119.0, 198.0, 402.0, 792.0, 1924.0, 7612.0, 489965.0, 535964.0, 7625.0, 1941.0, 785.0, 400.0, 217.0, 114.0, 82.0, 62.0, 28.0, 26.0, 14.0, 14.0, 6.0, 11.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.609375, -4.47381591796875, -4.3382568359375, -4.20269775390625, -4.067138671875, -3.93157958984375, -3.7960205078125, -3.66046142578125, -3.52490234375, -3.38934326171875, -3.2537841796875, -3.11822509765625, -2.982666015625, -2.84710693359375, -2.7115478515625, -2.57598876953125, -2.4404296875, -2.30487060546875, -2.1693115234375, -2.03375244140625, -1.898193359375, -1.76263427734375, -1.6270751953125, -1.49151611328125, -1.35595703125, -1.22039794921875, -1.0848388671875, -0.94927978515625, -0.813720703125, -0.67816162109375, -0.5426025390625, -0.40704345703125, -0.271484375, -0.13592529296875, -0.0003662109375, 0.13519287109375, 0.270751953125, 0.40631103515625, 0.5418701171875, 0.67742919921875, 0.81298828125, 0.94854736328125, 1.0841064453125, 1.21966552734375, 1.355224609375, 1.49078369140625, 1.6263427734375, 1.76190185546875, 1.8974609375, 2.03302001953125, 2.1685791015625, 2.30413818359375, 2.439697265625, 2.57525634765625, 2.7108154296875, 2.84637451171875, 2.98193359375, 3.11749267578125, 3.2530517578125, 3.38861083984375, 3.524169921875, 3.65972900390625, 3.7952880859375, 3.93084716796875, 4.06640625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 8.0, 3.0, 5.0, 3.0, 5.0, 12.0, 14.0, 26.0, 23.0, 43.0, 50.0, 66.0, 105.0, 166.0, 127.0, 102.0, 52.0, 50.0, 37.0, 29.0, 17.0, 11.0, 13.0, 9.0, 8.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001953125, -0.0018971562385559082, -0.0018411874771118164, -0.0017852187156677246, -0.0017292499542236328, -0.001673281192779541, -0.0016173124313354492, -0.0015613436698913574, -0.0015053749084472656, -0.0014494061470031738, -0.001393437385559082, -0.0013374686241149902, -0.0012814998626708984, -0.0012255311012268066, -0.0011695623397827148, -0.001113593578338623, -0.0010576248168945312, -0.0010016560554504395, -0.0009456872940063477, -0.0008897185325622559, -0.0008337497711181641, -0.0007777810096740723, -0.0007218122482299805, -0.0006658434867858887, -0.0006098747253417969, -0.0005539059638977051, -0.0004979372024536133, -0.0004419684410095215, -0.0003859996795654297, -0.0003300309181213379, -0.0002740621566772461, -0.0002180933952331543, -0.0001621246337890625, -0.0001061558723449707, -5.0187110900878906e-05, 5.781650543212891e-06, 6.175041198730469e-05, 0.00011771917343139648, 0.00017368793487548828, 0.00022965669631958008, 0.0002856254577636719, 0.00034159421920776367, 0.00039756298065185547, 0.00045353174209594727, 0.0005095005035400391, 0.0005654692649841309, 0.0006214380264282227, 0.0006774067878723145, 0.0007333755493164062, 0.000789344310760498, 0.0008453130722045898, 0.0009012818336486816, 0.0009572505950927734, 0.0010132193565368652, 0.001069188117980957, 0.0011251568794250488, 0.0011811256408691406, 0.0012370944023132324, 0.0012930631637573242, 0.001349031925201416, 0.0014050006866455078, 0.0014609694480895996, 0.0015169382095336914, 0.0015729069709777832, 0.001628875732421875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 6.0, 8.0, 14.0, 25.0, 25.0, 34.0, 37.0, 56.0, 95.0, 118.0, 204.0, 316.0, 606.0, 1143.0, 2501.0, 6925.0, 43408.0, 926568.0, 53086.0, 8013.0, 2536.0, 1174.0, 598.0, 371.0, 196.0, 147.0, 107.0, 55.0, 49.0, 24.0, 21.0, 22.0, 8.0, 9.0, 10.0, 11.0, 4.0, 2.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.83203125, -2.750030517578125, -2.66802978515625, -2.586029052734375, -2.5040283203125, -2.422027587890625, -2.34002685546875, -2.258026123046875, -2.176025390625, -2.094024658203125, -2.01202392578125, -1.930023193359375, -1.8480224609375, -1.766021728515625, -1.68402099609375, -1.602020263671875, -1.52001953125, -1.438018798828125, -1.35601806640625, -1.274017333984375, -1.1920166015625, -1.110015869140625, -1.02801513671875, -0.946014404296875, -0.864013671875, -0.782012939453125, -0.70001220703125, -0.618011474609375, -0.5360107421875, -0.454010009765625, -0.37200927734375, -0.290008544921875, -0.2080078125, -0.126007080078125, -0.04400634765625, 0.037994384765625, 0.1199951171875, 0.201995849609375, 0.28399658203125, 0.365997314453125, 0.447998046875, 0.529998779296875, 0.61199951171875, 0.694000244140625, 0.7760009765625, 0.858001708984375, 0.94000244140625, 1.022003173828125, 1.10400390625, 1.186004638671875, 1.26800537109375, 1.350006103515625, 1.4320068359375, 1.514007568359375, 1.59600830078125, 1.678009033203125, 1.760009765625, 1.842010498046875, 1.92401123046875, 2.006011962890625, 2.0880126953125, 2.170013427734375, 2.25201416015625, 2.334014892578125, 2.416015625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 7.0, 10.0, 19.0, 28.0, 57.0, 94.0, 226.0, 254.0, 134.0, 72.0, 37.0, 20.0, 9.0, 10.0, 2.0, 7.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5576171875, -1.502288818359375, -1.44696044921875, -1.391632080078125, -1.3363037109375, -1.280975341796875, -1.22564697265625, -1.170318603515625, -1.114990234375, -1.059661865234375, -1.00433349609375, -0.949005126953125, -0.8936767578125, -0.838348388671875, -0.78302001953125, -0.727691650390625, -0.67236328125, -0.617034912109375, -0.56170654296875, -0.506378173828125, -0.4510498046875, -0.395721435546875, -0.34039306640625, -0.285064697265625, -0.229736328125, -0.174407958984375, -0.11907958984375, -0.063751220703125, -0.0084228515625, 0.046905517578125, 0.10223388671875, 0.157562255859375, 0.212890625, 0.268218994140625, 0.32354736328125, 0.378875732421875, 0.4342041015625, 0.489532470703125, 0.54486083984375, 0.600189208984375, 0.655517578125, 0.710845947265625, 0.76617431640625, 0.821502685546875, 0.8768310546875, 0.932159423828125, 0.98748779296875, 1.042816162109375, 1.09814453125, 1.153472900390625, 1.20880126953125, 1.264129638671875, 1.3194580078125, 1.374786376953125, 1.43011474609375, 1.485443115234375, 1.540771484375, 1.596099853515625, 1.65142822265625, 1.706756591796875, 1.7620849609375, 1.817413330078125, 1.87274169921875, 1.928070068359375, 1.9833984375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 6.0, 19.0, 29.0, 85.0, 335.0, 351.0, 107.0, 38.0, 18.0, 3.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.749229431152344, -28.12420082092285, -27.49917221069336, -26.874141693115234, -26.249113082885742, -25.62408447265625, -24.999053955078125, -24.374025344848633, -23.74899673461914, -23.12396812438965, -22.498939514160156, -21.87390899658203, -21.24888038635254, -20.623851776123047, -19.998821258544922, -19.37379264831543, -18.748764038085938, -18.123735427856445, -17.498706817626953, -16.873676300048828, -16.248647689819336, -15.623619079589844, -14.998589515686035, -14.373559951782227, -13.748531341552734, -13.123502731323242, -12.498473167419434, -11.873443603515625, -11.248414993286133, -10.62338638305664, -9.998356819152832, -9.373327255249023, -8.748298645019531, -8.123270034790039, -7.4982404708862305, -6.87321138381958, -6.24818229675293, -5.623153209686279, -4.998124122619629, -4.3730950355529785, -3.748065948486328, -3.1230368614196777, -2.4980077743530273, -1.872978687286377, -1.2479496002197266, -0.6229205131530762, 0.0021085739135742188, 0.6271376609802246, 1.252166748046875, 1.8771958351135254, 2.502224922180176, 3.127254009246826, 3.7522830963134766, 4.377312183380127, 5.002341270446777, 5.627370357513428, 6.252399444580078, 6.8774285316467285, 7.502457618713379, 8.127487182617188, 8.75251579284668, 9.377544403076172, 10.00257396697998, 10.627603530883789, 11.252632141113281]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 4.0, 7.0, 11.0, 5.0, 13.0, 20.0, 27.0, 41.0, 39.0, 67.0, 68.0, 84.0, 99.0, 114.0, 86.0, 80.0, 61.0, 44.0, 34.0, 24.0, 15.0, 10.0, 8.0, 6.0, 6.0, 2.0, 1.0, 5.0, 0.0, 5.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.137675285339355, -9.785412788391113, -9.433150291442871, -9.080886840820312, -8.72862434387207, -8.376361846923828, -8.024099349975586, -7.671836853027344, -7.319573879241943, -6.967311382293701, -6.615048408508301, -6.262785911560059, -5.910523414611816, -5.558260440826416, -5.205997943878174, -4.853734970092773, -4.501472473144531, -4.149209976196289, -3.7969470024108887, -3.4446845054626465, -3.092421770095825, -2.740159034729004, -2.3878965377807617, -2.0356338024139404, -1.6833710670471191, -1.3311083316802979, -0.9788457155227661, -0.6265830993652344, -0.2743203639984131, 0.0779423713684082, 0.4302048683166504, 0.7824676036834717, 1.134730339050293, 1.4869930744171143, 1.839255690574646, 2.1915183067321777, 2.543781042098999, 2.8960437774658203, 3.2483062744140625, 3.600569009780884, 3.952831745147705, 4.305094242095947, 4.657357215881348, 5.00961971282959, 5.361882209777832, 5.714145183563232, 6.066407680511475, 6.418670654296875, 6.770933151245117, 7.123195648193359, 7.47545862197876, 7.827721118927002, 8.179984092712402, 8.532246589660645, 8.884509086608887, 9.236771583557129, 9.589035034179688, 9.94129753112793, 10.293560028076172, 10.645822525024414, 10.998085975646973, 11.350348472595215, 11.702610969543457, 12.0548734664917, 12.407135963439941]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 2.0, 5.0, 14.0, 30.0, 53.0, 204.0, 1110.0, 11250.0, 4123863.0, 54811.0, 2348.0, 417.0, 99.0, 35.0, 17.0, 11.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0390625, -13.71783447265625, -13.3966064453125, -13.07537841796875, -12.754150390625, -12.43292236328125, -12.1116943359375, -11.79046630859375, -11.46923828125, -11.14801025390625, -10.8267822265625, -10.50555419921875, -10.184326171875, -9.86309814453125, -9.5418701171875, -9.22064208984375, -8.8994140625, -8.57818603515625, -8.2569580078125, -7.93572998046875, -7.614501953125, -7.29327392578125, -6.9720458984375, -6.65081787109375, -6.32958984375, -6.00836181640625, -5.6871337890625, -5.36590576171875, -5.044677734375, -4.72344970703125, -4.4022216796875, -4.08099365234375, -3.759765625, -3.43853759765625, -3.1173095703125, -2.79608154296875, -2.474853515625, -2.15362548828125, -1.8323974609375, -1.51116943359375, -1.18994140625, -0.86871337890625, -0.5474853515625, -0.22625732421875, 0.094970703125, 0.41619873046875, 0.7374267578125, 1.05865478515625, 1.3798828125, 1.70111083984375, 2.0223388671875, 2.34356689453125, 2.664794921875, 2.98602294921875, 3.3072509765625, 3.62847900390625, 3.94970703125, 4.27093505859375, 4.5921630859375, 4.91339111328125, 5.234619140625, 5.55584716796875, 5.8770751953125, 6.19830322265625, 6.51953125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 7.0, 0.0, 5.0, 6.0, 4.0, 10.0, 14.0, 13.0, 28.0, 25.0, 53.0, 69.0, 107.0, 136.0, 129.0, 115.0, 82.0, 61.0, 45.0, 20.0, 21.0, 12.0, 8.0, 4.0, 3.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11541748046875, -0.11159038543701172, -0.10776329040527344, -0.10393619537353516, -0.10010910034179688, -0.0962820053100586, -0.09245491027832031, -0.08862781524658203, -0.08480072021484375, -0.08097362518310547, -0.07714653015136719, -0.0733194351196289, -0.06949234008789062, -0.06566524505615234, -0.06183815002441406, -0.05801105499267578, -0.0541839599609375, -0.05035686492919922, -0.04652976989746094, -0.042702674865722656, -0.038875579833984375, -0.035048484802246094, -0.031221389770507812, -0.02739429473876953, -0.02356719970703125, -0.01974010467529297, -0.015913009643554688, -0.012085914611816406, -0.008258819580078125, -0.004431724548339844, -0.0006046295166015625, 0.0032224655151367188, 0.007049560546875, 0.010876655578613281, 0.014703750610351562, 0.018530845642089844, 0.022357940673828125, 0.026185035705566406, 0.030012130737304688, 0.03383922576904297, 0.03766632080078125, 0.04149341583251953, 0.04532051086425781, 0.049147605895996094, 0.052974700927734375, 0.056801795959472656, 0.06062889099121094, 0.06445598602294922, 0.0682830810546875, 0.07211017608642578, 0.07593727111816406, 0.07976436614990234, 0.08359146118164062, 0.0874185562133789, 0.09124565124511719, 0.09507274627685547, 0.09889984130859375, 0.10272693634033203, 0.10655403137207031, 0.1103811264038086, 0.11420822143554688, 0.11803531646728516, 0.12186241149902344, 0.12568950653076172, 0.1295166015625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 6.0, 11.0, 20.0, 24.0, 40.0, 46.0, 76.0, 126.0, 206.0, 327.0, 503.0, 855.0, 1800.0, 3747.0, 8462.0, 22581.0, 84643.0, 2176142.0, 1777216.0, 81053.0, 21296.0, 7709.0, 3421.0, 1649.0, 912.0, 515.0, 326.0, 160.0, 134.0, 71.0, 55.0, 43.0, 25.0, 29.0, 9.0, 11.0, 8.0, 6.0, 5.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5703125, -1.51422119140625, -1.4581298828125, -1.40203857421875, -1.345947265625, -1.28985595703125, -1.2337646484375, -1.17767333984375, -1.12158203125, -1.06549072265625, -1.0093994140625, -0.95330810546875, -0.897216796875, -0.84112548828125, -0.7850341796875, -0.72894287109375, -0.6728515625, -0.61676025390625, -0.5606689453125, -0.50457763671875, -0.448486328125, -0.39239501953125, -0.3363037109375, -0.28021240234375, -0.22412109375, -0.16802978515625, -0.1119384765625, -0.05584716796875, 0.000244140625, 0.05633544921875, 0.1124267578125, 0.16851806640625, 0.224609375, 0.28070068359375, 0.3367919921875, 0.39288330078125, 0.448974609375, 0.50506591796875, 0.5611572265625, 0.61724853515625, 0.67333984375, 0.72943115234375, 0.7855224609375, 0.84161376953125, 0.897705078125, 0.95379638671875, 1.0098876953125, 1.06597900390625, 1.1220703125, 1.17816162109375, 1.2342529296875, 1.29034423828125, 1.346435546875, 1.40252685546875, 1.4586181640625, 1.51470947265625, 1.57080078125, 1.62689208984375, 1.6829833984375, 1.73907470703125, 1.795166015625, 1.85125732421875, 1.9073486328125, 1.96343994140625, 2.01953125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 6.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 10.0, 8.0, 10.0, 12.0, 12.0, 21.0, 25.0, 29.0, 47.0, 60.0, 69.0, 82.0, 174.0, 349.0, 1870.0, 707.0, 203.0, 107.0, 58.0, 52.0, 28.0, 34.0, 25.0, 15.0, 12.0, 7.0, 4.0, 7.0, 5.0, 5.0, 6.0, 2.0, 0.0, 2.0], "bins": [-0.322998046875, -0.31577301025390625, -0.3085479736328125, -0.30132293701171875, -0.294097900390625, -0.28687286376953125, -0.2796478271484375, -0.27242279052734375, -0.26519775390625, -0.25797271728515625, -0.2507476806640625, -0.24352264404296875, -0.236297607421875, -0.22907257080078125, -0.2218475341796875, -0.21462249755859375, -0.2073974609375, -0.20017242431640625, -0.1929473876953125, -0.18572235107421875, -0.178497314453125, -0.17127227783203125, -0.1640472412109375, -0.15682220458984375, -0.14959716796875, -0.14237213134765625, -0.1351470947265625, -0.12792205810546875, -0.120697021484375, -0.11347198486328125, -0.1062469482421875, -0.09902191162109375, -0.091796875, -0.08457183837890625, -0.0773468017578125, -0.07012176513671875, -0.062896728515625, -0.05567169189453125, -0.0484466552734375, -0.04122161865234375, -0.03399658203125, -0.02677154541015625, -0.0195465087890625, -0.01232147216796875, -0.005096435546875, 0.00212860107421875, 0.0093536376953125, 0.01657867431640625, 0.0238037109375, 0.03102874755859375, 0.0382537841796875, 0.04547882080078125, 0.052703857421875, 0.05992889404296875, 0.0671539306640625, 0.07437896728515625, 0.08160400390625, 0.08882904052734375, 0.0960540771484375, 0.10327911376953125, 0.110504150390625, 0.11772918701171875, 0.1249542236328125, 0.13217926025390625, 0.139404296875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 8.0, 13.0, 27.0, 84.0, 325.0, 446.0, 77.0, 20.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.641535758972168, -5.375361442565918, -5.10918664932251, -4.84301233291626, -4.576837539672852, -4.310663223266602, -4.044488906860352, -3.7783141136169434, -3.5121395587921143, -3.245965003967285, -2.979790449142456, -2.713615894317627, -2.447441577911377, -2.1812667846679688, -1.9150924682617188, -1.6489179134368896, -1.3827433586120605, -1.1165688037872314, -0.8503943085670471, -0.5842198133468628, -0.3180452585220337, -0.05187070369720459, 0.21430373191833496, 0.48047828674316406, 0.7466528415679932, 1.0128273963928223, 1.2790019512176514, 1.545176386833191, 1.81135094165802, 2.0775256156921387, 2.3436999320983887, 2.6098744869232178, 2.876049041748047, 3.142223596572876, 3.408398151397705, 3.674572467803955, 3.9407472610473633, 4.206921577453613, 4.473095893859863, 4.7392706871032715, 5.00544548034668, 5.27161979675293, 5.537794589996338, 5.803968906402588, 6.070143699645996, 6.336318016052246, 6.602492332458496, 6.868667125701904, 7.134841442108154, 7.401015758514404, 7.6671905517578125, 7.9333648681640625, 8.199539184570312, 8.465714454650879, 8.731888771057129, 8.998063087463379, 9.264237403869629, 9.530411720275879, 9.796586036682129, 10.062761306762695, 10.328935623168945, 10.595109939575195, 10.861284255981445, 11.127458572387695, 11.393633842468262]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 2.0, 4.0, 1.0, 10.0, 7.0, 8.0, 9.0, 11.0, 14.0, 26.0, 31.0, 32.0, 27.0, 38.0, 32.0, 51.0, 52.0, 51.0, 59.0, 63.0, 48.0, 56.0, 52.0, 54.0, 41.0, 28.0, 43.0, 27.0, 21.0, 22.0, 18.0, 11.0, 11.0, 12.0, 6.0, 8.0, 3.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3520337343215942, -1.3066585063934326, -1.2612833976745605, -1.215908169746399, -1.1705330610275269, -1.1251578330993652, -1.0797827243804932, -1.0344074964523315, -0.9890323281288147, -0.9436571598052979, -0.898281991481781, -0.8529068231582642, -0.8075315952301025, -0.7621564865112305, -0.7167812585830688, -0.671406090259552, -0.6260309219360352, -0.5806557536125183, -0.5352805852890015, -0.48990538716316223, -0.4445302188396454, -0.39915505051612854, -0.3537798523902893, -0.30840468406677246, -0.2630295157432556, -0.21765434741973877, -0.17227916419506073, -0.1269039809703827, -0.08152881264686584, -0.036153644323349, 0.009221553802490234, 0.05459672212600708, 0.09997189044952393, 0.14534705877304077, 0.1907222419977188, 0.23609742522239685, 0.2814725935459137, 0.32684776186943054, 0.3722229599952698, 0.4175981283187866, 0.46297329664230347, 0.5083484649658203, 0.5537236332893372, 0.599098801612854, 0.6444740295410156, 0.6898491382598877, 0.7352243661880493, 0.7805995345115662, 0.825974702835083, 0.8713498711585999, 0.9167250394821167, 0.9621002674102783, 1.0074753761291504, 1.052850604057312, 1.0982258319854736, 1.1436009407043457, 1.1889760494232178, 1.2343512773513794, 1.2797263860702515, 1.325101613998413, 1.3704767227172852, 1.4158519506454468, 1.4612271785736084, 1.5066022872924805, 1.551977515220642]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 3.0, 9.0, 12.0, 15.0, 28.0, 40.0, 54.0, 79.0, 123.0, 175.0, 259.0, 397.0, 653.0, 1115.0, 1865.0, 3826.0, 8393.0, 20782.0, 71547.0, 562574.0, 298908.0, 47954.0, 15710.0, 6510.0, 3180.0, 1684.0, 984.0, 563.0, 370.0, 227.0, 151.0, 111.0, 87.0, 48.0, 32.0, 23.0, 22.0, 17.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1328125, -2.06982421875, -2.0068359375, -1.94384765625, -1.880859375, -1.81787109375, -1.7548828125, -1.69189453125, -1.62890625, -1.56591796875, -1.5029296875, -1.43994140625, -1.376953125, -1.31396484375, -1.2509765625, -1.18798828125, -1.125, -1.06201171875, -0.9990234375, -0.93603515625, -0.873046875, -0.81005859375, -0.7470703125, -0.68408203125, -0.62109375, -0.55810546875, -0.4951171875, -0.43212890625, -0.369140625, -0.30615234375, -0.2431640625, -0.18017578125, -0.1171875, -0.05419921875, 0.0087890625, 0.07177734375, 0.134765625, 0.19775390625, 0.2607421875, 0.32373046875, 0.38671875, 0.44970703125, 0.5126953125, 0.57568359375, 0.638671875, 0.70166015625, 0.7646484375, 0.82763671875, 0.890625, 0.95361328125, 1.0166015625, 1.07958984375, 1.142578125, 1.20556640625, 1.2685546875, 1.33154296875, 1.39453125, 1.45751953125, 1.5205078125, 1.58349609375, 1.646484375, 1.70947265625, 1.7724609375, 1.83544921875, 1.8984375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 1.0, 4.0, 8.0, 13.0, 15.0, 15.0, 11.0, 31.0, 37.0, 54.0, 65.0, 86.0, 84.0, 96.0, 93.0, 70.0, 77.0, 54.0, 53.0, 37.0, 27.0, 18.0, 13.0, 9.0, 2.0, 5.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.134033203125, -0.12993431091308594, -0.12583541870117188, -0.12173652648925781, -0.11763763427734375, -0.11353874206542969, -0.10943984985351562, -0.10534095764160156, -0.1012420654296875, -0.09714317321777344, -0.09304428100585938, -0.08894538879394531, -0.08484649658203125, -0.08074760437011719, -0.07664871215820312, -0.07254981994628906, -0.068450927734375, -0.06435203552246094, -0.060253143310546875, -0.05615425109863281, -0.05205535888671875, -0.04795646667480469, -0.043857574462890625, -0.03975868225097656, -0.0356597900390625, -0.03156089782714844, -0.027462005615234375, -0.023363113403320312, -0.01926422119140625, -0.015165328979492188, -0.011066436767578125, -0.0069675445556640625, -0.00286865234375, 0.0012302398681640625, 0.005329132080078125, 0.009428024291992188, 0.01352691650390625, 0.017625808715820312, 0.021724700927734375, 0.025823593139648438, 0.0299224853515625, 0.03402137756347656, 0.038120269775390625, 0.04221916198730469, 0.04631805419921875, 0.05041694641113281, 0.054515838623046875, 0.05861473083496094, 0.062713623046875, 0.06681251525878906, 0.07091140747070312, 0.07501029968261719, 0.07910919189453125, 0.08320808410644531, 0.08730697631835938, 0.09140586853027344, 0.0955047607421875, 0.09960365295410156, 0.10370254516601562, 0.10780143737792969, 0.11190032958984375, 0.11599922180175781, 0.12009811401367188, 0.12419700622558594, 0.1282958984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 3.0, 7.0, 6.0, 4.0, 8.0, 3.0, 19.0, 12.0, 12.0, 19.0, 53.0, 279.0, 1582.0, 137152.0, 905616.0, 3204.0, 369.0, 81.0, 24.0, 13.0, 16.0, 7.0, 9.0, 11.0, 3.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-7.796875, -7.55426025390625, -7.3116455078125, -7.06903076171875, -6.826416015625, -6.58380126953125, -6.3411865234375, -6.09857177734375, -5.85595703125, -5.61334228515625, -5.3707275390625, -5.12811279296875, -4.885498046875, -4.64288330078125, -4.4002685546875, -4.15765380859375, -3.9150390625, -3.67242431640625, -3.4298095703125, -3.18719482421875, -2.944580078125, -2.70196533203125, -2.4593505859375, -2.21673583984375, -1.97412109375, -1.73150634765625, -1.4888916015625, -1.24627685546875, -1.003662109375, -0.76104736328125, -0.5184326171875, -0.27581787109375, -0.033203125, 0.20941162109375, 0.4520263671875, 0.69464111328125, 0.937255859375, 1.17987060546875, 1.4224853515625, 1.66510009765625, 1.90771484375, 2.15032958984375, 2.3929443359375, 2.63555908203125, 2.878173828125, 3.12078857421875, 3.3634033203125, 3.60601806640625, 3.8486328125, 4.09124755859375, 4.3338623046875, 4.57647705078125, 4.819091796875, 5.06170654296875, 5.3043212890625, 5.54693603515625, 5.78955078125, 6.03216552734375, 6.2747802734375, 6.51739501953125, 6.760009765625, 7.00262451171875, 7.2452392578125, 7.48785400390625, 7.73046875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 7.0, 7.0, 2.0, 9.0, 12.0, 11.0, 8.0, 25.0, 18.0, 41.0, 29.0, 37.0, 38.0, 29.0, 44.0, 46.0, 47.0, 54.0, 49.0, 49.0, 53.0, 50.0, 48.0, 41.0, 35.0, 32.0, 36.0, 27.0, 25.0, 15.0, 13.0, 18.0, 10.0, 13.0, 6.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.6318359375, -0.6139297485351562, -0.5960235595703125, -0.5781173706054688, -0.560211181640625, -0.5423049926757812, -0.5243988037109375, -0.5064926147460938, -0.48858642578125, -0.47068023681640625, -0.4527740478515625, -0.43486785888671875, -0.416961669921875, -0.39905548095703125, -0.3811492919921875, -0.36324310302734375, -0.3453369140625, -0.32743072509765625, -0.3095245361328125, -0.29161834716796875, -0.273712158203125, -0.25580596923828125, -0.2378997802734375, -0.21999359130859375, -0.20208740234375, -0.18418121337890625, -0.1662750244140625, -0.14836883544921875, -0.130462646484375, -0.11255645751953125, -0.0946502685546875, -0.07674407958984375, -0.058837890625, -0.04093170166015625, -0.0230255126953125, -0.00511932373046875, 0.012786865234375, 0.03069305419921875, 0.0485992431640625, 0.06650543212890625, 0.08441162109375, 0.10231781005859375, 0.1202239990234375, 0.13813018798828125, 0.156036376953125, 0.17394256591796875, 0.1918487548828125, 0.20975494384765625, 0.2276611328125, 0.24556732177734375, 0.2634735107421875, 0.28137969970703125, 0.299285888671875, 0.31719207763671875, 0.3350982666015625, 0.35300445556640625, 0.37091064453125, 0.38881683349609375, 0.4067230224609375, 0.42462921142578125, 0.442535400390625, 0.46044158935546875, 0.4783477783203125, 0.49625396728515625, 0.51416015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 6.0, 0.0, 3.0, 4.0, 6.0, 8.0, 10.0, 3.0, 9.0, 12.0, 10.0, 21.0, 32.0, 68.0, 350.0, 2747.0, 102046.0, 936975.0, 5350.0, 618.0, 123.0, 49.0, 24.0, 12.0, 11.0, 5.0, 10.0, 7.0, 8.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7421875, -13.2357177734375, -12.729248046875, -12.2227783203125, -11.71630859375, -11.2098388671875, -10.703369140625, -10.1968994140625, -9.6904296875, -9.1839599609375, -8.677490234375, -8.1710205078125, -7.66455078125, -7.1580810546875, -6.651611328125, -6.1451416015625, -5.638671875, -5.1322021484375, -4.625732421875, -4.1192626953125, -3.61279296875, -3.1063232421875, -2.599853515625, -2.0933837890625, -1.5869140625, -1.0804443359375, -0.573974609375, -0.0675048828125, 0.43896484375, 0.9454345703125, 1.451904296875, 1.9583740234375, 2.46484375, 2.9713134765625, 3.477783203125, 3.9842529296875, 4.49072265625, 4.9971923828125, 5.503662109375, 6.0101318359375, 6.5166015625, 7.0230712890625, 7.529541015625, 8.0360107421875, 8.54248046875, 9.0489501953125, 9.555419921875, 10.0618896484375, 10.568359375, 11.0748291015625, 11.581298828125, 12.0877685546875, 12.59423828125, 13.1007080078125, 13.607177734375, 14.1136474609375, 14.6201171875, 15.1265869140625, 15.633056640625, 16.1395263671875, 16.64599609375, 17.1524658203125, 17.658935546875, 18.1654052734375, 18.671875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 7.0, 11.0, 18.0, 76.0, 657.0, 171.0, 21.0, 9.0, 4.0, 4.0, 3.0, 3.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00762176513671875, -0.007269620895385742, -0.006917476654052734, -0.0065653324127197266, -0.006213188171386719, -0.005861043930053711, -0.005508899688720703, -0.005156755447387695, -0.0048046112060546875, -0.00445246696472168, -0.004100322723388672, -0.003748178482055664, -0.0033960342407226562, -0.0030438899993896484, -0.0026917457580566406, -0.002339601516723633, -0.001987457275390625, -0.0016353130340576172, -0.0012831687927246094, -0.0009310245513916016, -0.0005788803100585938, -0.00022673606872558594, 0.00012540817260742188, 0.0004775524139404297, 0.0008296966552734375, 0.0011818408966064453, 0.0015339851379394531, 0.001886129379272461, 0.0022382736206054688, 0.0025904178619384766, 0.0029425621032714844, 0.003294706344604492, 0.0036468505859375, 0.003998994827270508, 0.004351139068603516, 0.0047032833099365234, 0.005055427551269531, 0.005407571792602539, 0.005759716033935547, 0.006111860275268555, 0.0064640045166015625, 0.00681614875793457, 0.007168292999267578, 0.007520437240600586, 0.007872581481933594, 0.008224725723266602, 0.00857686996459961, 0.008929014205932617, 0.009281158447265625, 0.009633302688598633, 0.00998544692993164, 0.010337591171264648, 0.010689735412597656, 0.011041879653930664, 0.011394023895263672, 0.01174616813659668, 0.012098312377929688, 0.012450456619262695, 0.012802600860595703, 0.013154745101928711, 0.013506889343261719, 0.013859033584594727, 0.014211177825927734, 0.014563322067260742, 0.01491546630859375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 6.0, 5.0, 7.0, 11.0, 23.0, 39.0, 50.0, 96.0, 175.0, 315.0, 662.0, 1396.0, 3645.0, 11576.0, 59623.0, 882201.0, 70547.0, 11936.0, 3596.0, 1413.0, 587.0, 291.0, 152.0, 82.0, 48.0, 25.0, 17.0, 13.0, 8.0, 5.0, 4.0, 4.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.91796875, -6.67559814453125, -6.4332275390625, -6.19085693359375, -5.948486328125, -5.70611572265625, -5.4637451171875, -5.22137451171875, -4.97900390625, -4.73663330078125, -4.4942626953125, -4.25189208984375, -4.009521484375, -3.76715087890625, -3.5247802734375, -3.28240966796875, -3.0400390625, -2.79766845703125, -2.5552978515625, -2.31292724609375, -2.070556640625, -1.82818603515625, -1.5858154296875, -1.34344482421875, -1.10107421875, -0.85870361328125, -0.6163330078125, -0.37396240234375, -0.131591796875, 0.11077880859375, 0.3531494140625, 0.59552001953125, 0.837890625, 1.08026123046875, 1.3226318359375, 1.56500244140625, 1.807373046875, 2.04974365234375, 2.2921142578125, 2.53448486328125, 2.77685546875, 3.01922607421875, 3.2615966796875, 3.50396728515625, 3.746337890625, 3.98870849609375, 4.2310791015625, 4.47344970703125, 4.7158203125, 4.95819091796875, 5.2005615234375, 5.44293212890625, 5.685302734375, 5.92767333984375, 6.1700439453125, 6.41241455078125, 6.65478515625, 6.89715576171875, 7.1395263671875, 7.38189697265625, 7.624267578125, 7.86663818359375, 8.1090087890625, 8.35137939453125, 8.59375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 2.0, 4.0, 3.0, 4.0, 7.0, 7.0, 14.0, 14.0, 21.0, 23.0, 43.0, 74.0, 185.0, 352.0, 102.0, 52.0, 24.0, 21.0, 6.0, 11.0, 10.0, 7.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.43359375, -4.29150390625, -4.1494140625, -4.00732421875, -3.865234375, -3.72314453125, -3.5810546875, -3.43896484375, -3.296875, -3.15478515625, -3.0126953125, -2.87060546875, -2.728515625, -2.58642578125, -2.4443359375, -2.30224609375, -2.16015625, -2.01806640625, -1.8759765625, -1.73388671875, -1.591796875, -1.44970703125, -1.3076171875, -1.16552734375, -1.0234375, -0.88134765625, -0.7392578125, -0.59716796875, -0.455078125, -0.31298828125, -0.1708984375, -0.02880859375, 0.11328125, 0.25537109375, 0.3974609375, 0.53955078125, 0.681640625, 0.82373046875, 0.9658203125, 1.10791015625, 1.25, 1.39208984375, 1.5341796875, 1.67626953125, 1.818359375, 1.96044921875, 2.1025390625, 2.24462890625, 2.38671875, 2.52880859375, 2.6708984375, 2.81298828125, 2.955078125, 3.09716796875, 3.2392578125, 3.38134765625, 3.5234375, 3.66552734375, 3.8076171875, 3.94970703125, 4.091796875, 4.23388671875, 4.3759765625, 4.51806640625, 4.66015625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 28.0, 125.0, 513.0, 277.0, 48.0, 14.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.82943344116211, -31.38722801208496, -29.94502067565918, -28.50281524658203, -27.06060791015625, -25.6184024810791, -24.176197052001953, -22.733989715576172, -21.291784286499023, -19.849578857421875, -18.407371520996094, -16.965166091918945, -15.52295970916748, -14.080753326416016, -12.638547897338867, -11.196341514587402, -9.754135131835938, -8.311928749084473, -6.869722843170166, -5.427516937255859, -3.9853105545043945, -2.5431041717529297, -1.1008987426757812, 0.3413076400756836, 1.7835140228271484, 3.225720167160034, 4.66792631149292, 6.110132217407227, 7.552338600158691, 8.994544982910156, 10.436750411987305, 11.87895679473877, 13.3211669921875, 14.763373374938965, 16.20557975769043, 17.647785186767578, 19.08999252319336, 20.532197952270508, 21.974403381347656, 23.416610717773438, 24.858816146850586, 26.301021575927734, 27.743228912353516, 29.185434341430664, 30.627639770507812, 32.069847106933594, 33.512054443359375, 34.95425796508789, 36.39646530151367, 37.83867263793945, 39.28087615966797, 40.72308349609375, 42.16529083251953, 43.60749816894531, 45.04970169067383, 46.49190902709961, 47.934112548828125, 49.376319885253906, 50.81852340698242, 52.2607307434082, 53.702938079833984, 55.1451416015625, 56.58734893798828, 58.02955627441406, 59.471763610839844]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 4.0, 4.0, 5.0, 11.0, 13.0, 25.0, 43.0, 43.0, 57.0, 69.0, 88.0, 117.0, 105.0, 83.0, 89.0, 91.0, 56.0, 30.0, 29.0, 17.0, 12.0, 11.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.269424915313721, -6.881467819213867, -6.493511199951172, -6.105554103851318, -5.717597007751465, -5.329639911651611, -4.941682815551758, -4.5537261962890625, -4.165769100189209, -3.7778120040893555, -3.389855146408081, -3.0018982887268066, -2.613941192626953, -2.2259840965270996, -1.8380272388458252, -1.4500703811645508, -1.0621132850646973, -0.6741563081741333, -0.28619933128356934, 0.10175764560699463, 0.4897146224975586, 0.8776715993881226, 1.2656285762786865, 1.653585433959961, 2.0415425300598145, 2.429499626159668, 2.8174564838409424, 3.205413341522217, 3.5933704376220703, 3.981327533721924, 4.369284629821777, 4.757241249084473, 5.145198822021484, 5.533155918121338, 5.921113014221191, 6.309069633483887, 6.69702672958374, 7.084983825683594, 7.472940444946289, 7.860897541046143, 8.248854637145996, 8.636811256408691, 9.024768829345703, 9.412725448608398, 9.800682067871094, 10.188639640808105, 10.5765962600708, 10.964553833007812, 11.352510452270508, 11.740467071533203, 12.128424644470215, 12.51638126373291, 12.904338836669922, 13.292295455932617, 13.680252075195312, 14.068208694458008, 14.45616626739502, 14.844122886657715, 15.232080459594727, 15.620037078857422, 16.007993698120117, 16.395950317382812, 16.78390884399414, 17.171865463256836, 17.55982208251953]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 8.0, 8.0, 12.0, 32.0, 100.0, 319.0, 1037.0, 5057.0, 47186.0, 4029228.0, 101174.0, 7391.0, 1508.0, 455.0, 194.0, 136.0, 96.0, 61.0, 54.0, 33.0, 37.0, 27.0, 22.0, 10.0, 15.0, 9.0, 11.0, 7.0, 10.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 5.0, 6.0, 2.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.2578125, -4.040771484375, -3.82373046875, -3.606689453125, -3.3896484375, -3.172607421875, -2.95556640625, -2.738525390625, -2.521484375, -2.304443359375, -2.08740234375, -1.870361328125, -1.6533203125, -1.436279296875, -1.21923828125, -1.002197265625, -0.78515625, -0.568115234375, -0.35107421875, -0.134033203125, 0.0830078125, 0.300048828125, 0.51708984375, 0.734130859375, 0.951171875, 1.168212890625, 1.38525390625, 1.602294921875, 1.8193359375, 2.036376953125, 2.25341796875, 2.470458984375, 2.6875, 2.904541015625, 3.12158203125, 3.338623046875, 3.5556640625, 3.772705078125, 3.98974609375, 4.206787109375, 4.423828125, 4.640869140625, 4.85791015625, 5.074951171875, 5.2919921875, 5.509033203125, 5.72607421875, 5.943115234375, 6.16015625, 6.377197265625, 6.59423828125, 6.811279296875, 7.0283203125, 7.245361328125, 7.46240234375, 7.679443359375, 7.896484375, 8.113525390625, 8.33056640625, 8.547607421875, 8.7646484375, 8.981689453125, 9.19873046875, 9.415771484375, 9.6328125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 6.0, 6.0, 11.0, 23.0, 50.0, 96.0, 134.0, 201.0, 183.0, 139.0, 87.0, 45.0, 24.0, 8.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.102294921875, -0.09087753295898438, -0.07946014404296875, -0.06804275512695312, -0.0566253662109375, -0.045207977294921875, -0.03379058837890625, -0.022373199462890625, -0.010955810546875, 0.000461578369140625, 0.01187896728515625, 0.023296356201171875, 0.0347137451171875, 0.046131134033203125, 0.05754852294921875, 0.06896591186523438, 0.08038330078125, 0.09180068969726562, 0.10321807861328125, 0.11463546752929688, 0.1260528564453125, 0.13747024536132812, 0.14888763427734375, 0.16030502319335938, 0.171722412109375, 0.18313980102539062, 0.19455718994140625, 0.20597457885742188, 0.2173919677734375, 0.22880935668945312, 0.24022674560546875, 0.2516441345214844, 0.2630615234375, 0.2744789123535156, 0.28589630126953125, 0.2973136901855469, 0.3087310791015625, 0.3201484680175781, 0.33156585693359375, 0.3429832458496094, 0.354400634765625, 0.3658180236816406, 0.37723541259765625, 0.3886528015136719, 0.4000701904296875, 0.4114875793457031, 0.42290496826171875, 0.4343223571777344, 0.44573974609375, 0.4571571350097656, 0.46857452392578125, 0.4799919128417969, 0.4914093017578125, 0.5028266906738281, 0.5142440795898438, 0.5256614685058594, 0.537078857421875, 0.5484962463378906, 0.5599136352539062, 0.5713310241699219, 0.5827484130859375, 0.5941658020019531, 0.6055831909179688, 0.6170005798339844, 0.62841796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 10.0, 14.0, 16.0, 23.0, 46.0, 66.0, 160.0, 419.0, 1463.0, 11225.0, 801411.0, 3361747.0, 14988.0, 1814.0, 460.0, 190.0, 95.0, 42.0, 25.0, 17.0, 14.0, 8.0, 7.0, 6.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5546875, -7.33917236328125, -7.1236572265625, -6.90814208984375, -6.692626953125, -6.47711181640625, -6.2615966796875, -6.04608154296875, -5.83056640625, -5.61505126953125, -5.3995361328125, -5.18402099609375, -4.968505859375, -4.75299072265625, -4.5374755859375, -4.32196044921875, -4.1064453125, -3.89093017578125, -3.6754150390625, -3.45989990234375, -3.244384765625, -3.02886962890625, -2.8133544921875, -2.59783935546875, -2.38232421875, -2.16680908203125, -1.9512939453125, -1.73577880859375, -1.520263671875, -1.30474853515625, -1.0892333984375, -0.87371826171875, -0.658203125, -0.44268798828125, -0.2271728515625, -0.01165771484375, 0.203857421875, 0.41937255859375, 0.6348876953125, 0.85040283203125, 1.06591796875, 1.28143310546875, 1.4969482421875, 1.71246337890625, 1.927978515625, 2.14349365234375, 2.3590087890625, 2.57452392578125, 2.7900390625, 3.00555419921875, 3.2210693359375, 3.43658447265625, 3.652099609375, 3.86761474609375, 4.0831298828125, 4.29864501953125, 4.51416015625, 4.72967529296875, 4.9451904296875, 5.16070556640625, 5.376220703125, 5.59173583984375, 5.8072509765625, 6.02276611328125, 6.23828125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 3.0, 14.0, 13.0, 13.0, 36.0, 46.0, 65.0, 137.0, 262.0, 830.0, 1976.0, 343.0, 130.0, 82.0, 45.0, 30.0, 14.0, 14.0, 5.0, 4.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52490234375, -0.5069198608398438, -0.4889373779296875, -0.47095489501953125, -0.452972412109375, -0.43498992919921875, -0.4170074462890625, -0.39902496337890625, -0.38104248046875, -0.36305999755859375, -0.3450775146484375, -0.32709503173828125, -0.309112548828125, -0.29113006591796875, -0.2731475830078125, -0.25516510009765625, -0.2371826171875, -0.21920013427734375, -0.2012176513671875, -0.18323516845703125, -0.165252685546875, -0.14727020263671875, -0.1292877197265625, -0.11130523681640625, -0.09332275390625, -0.07534027099609375, -0.0573577880859375, -0.03937530517578125, -0.021392822265625, -0.00341033935546875, 0.0145721435546875, 0.03255462646484375, 0.050537109375, 0.06851959228515625, 0.0865020751953125, 0.10448455810546875, 0.122467041015625, 0.14044952392578125, 0.1584320068359375, 0.17641448974609375, 0.19439697265625, 0.21237945556640625, 0.2303619384765625, 0.24834442138671875, 0.266326904296875, 0.28430938720703125, 0.3022918701171875, 0.32027435302734375, 0.3382568359375, 0.35623931884765625, 0.3742218017578125, 0.39220428466796875, 0.410186767578125, 0.42816925048828125, 0.4461517333984375, 0.46413421630859375, 0.48211669921875, 0.5000991821289062, 0.5180816650390625, 0.5360641479492188, 0.554046630859375, 0.5720291137695312, 0.5900115966796875, 0.6079940795898438, 0.6259765625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 33.0, 136.0, 492.0, 269.0, 59.0, 12.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.613971710205078, -16.29903221130371, -15.984094619750977, -15.66915512084961, -15.354216575622559, -15.039278030395508, -14.724339485168457, -14.409400939941406, -14.094462394714355, -13.779523849487305, -13.464585304260254, -13.149646759033203, -12.834707260131836, -12.519768714904785, -12.204830169677734, -11.889891624450684, -11.574953079223633, -11.260014533996582, -10.945075988769531, -10.630136489868164, -10.315197944641113, -10.000259399414062, -9.685320854187012, -9.370382308959961, -9.055442810058594, -8.740504264831543, -8.425565719604492, -8.110626220703125, -7.795688152313232, -7.480749130249023, -7.165810585021973, -6.850872039794922, -6.535933971405029, -6.2209954261779785, -5.9060564041137695, -5.591117858886719, -5.276179313659668, -4.961240768432617, -4.646301746368408, -4.331363201141357, -4.016424179077148, -3.7014853954315186, -3.3865468502044678, -3.071608066558838, -2.756669521331787, -2.4417307376861572, -2.1267919540405273, -1.8118534088134766, -1.4969148635864258, -1.1819761991500854, -0.8670374751091003, -0.5520987510681152, -0.2371600866317749, 0.07777857780456543, 0.3927173614501953, 0.7076559066772461, 1.022594690322876, 1.3375333547592163, 1.6524720191955566, 1.9674108028411865, 2.2823495864868164, 2.597288131713867, 2.912226915359497, 3.227165460586548, 3.5421042442321777]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 9.0, 12.0, 33.0, 48.0, 90.0, 134.0, 132.0, 156.0, 149.0, 112.0, 64.0, 43.0, 14.0, 9.0, 6.0, 1.0, 0.0, 0.0, 3.0], "bins": [-7.740879535675049, -7.592033386230469, -7.4431867599487305, -7.29434061050415, -7.14549446105957, -6.996647834777832, -6.847801685333252, -6.698955535888672, -6.550108909606934, -6.4012627601623535, -6.252416133880615, -6.103569984436035, -5.954723834991455, -5.805877208709717, -5.657031059265137, -5.508184432983398, -5.359338760375977, -5.2104926109313965, -5.061645984649658, -4.912799835205078, -4.763953685760498, -4.61510705947876, -4.46626091003418, -4.317414283752441, -4.168568134307861, -4.019721984863281, -3.870875597000122, -3.722029209136963, -3.5731828212738037, -3.4243364334106445, -3.2754902839660645, -3.1266438961029053, -2.977797746658325, -2.828951358795166, -2.680105209350586, -2.5312588214874268, -2.3824124336242676, -2.2335662841796875, -2.0847198963165283, -1.9358735084533691, -1.7870272397994995, -1.6381809711456299, -1.4893345832824707, -1.340488314628601, -1.1916420459747314, -1.0427956581115723, -0.8939493894577026, -0.7451030015945435, -0.5962567329406738, -0.4474104046821594, -0.2985641062259674, -0.1497178077697754, -0.0008714795112609863, 0.14797484874725342, 0.29682111740112305, 0.4456675052642822, 0.5945137739181519, 0.7433601021766663, 0.8922064304351807, 1.0410526990890503, 1.18989896774292, 1.338745355606079, 1.4875916242599487, 1.636438012123108, 1.7852842807769775]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 6.0, 10.0, 10.0, 7.0, 9.0, 10.0, 15.0, 17.0, 11.0, 13.0, 20.0, 28.0, 19.0, 29.0, 37.0, 33.0, 29.0, 58.0, 298.0, 10341.0, 816411.0, 217979.0, 2627.0, 132.0, 45.0, 44.0, 29.0, 35.0, 30.0, 18.0, 38.0, 29.0, 32.0, 24.0, 16.0, 8.0, 5.0, 14.0, 13.0, 10.0, 6.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-5.94921875, -5.77838134765625, -5.6075439453125, -5.43670654296875, -5.265869140625, -5.09503173828125, -4.9241943359375, -4.75335693359375, -4.58251953125, -4.41168212890625, -4.2408447265625, -4.07000732421875, -3.899169921875, -3.72833251953125, -3.5574951171875, -3.38665771484375, -3.2158203125, -3.04498291015625, -2.8741455078125, -2.70330810546875, -2.532470703125, -2.36163330078125, -2.1907958984375, -2.01995849609375, -1.84912109375, -1.67828369140625, -1.5074462890625, -1.33660888671875, -1.165771484375, -0.99493408203125, -0.8240966796875, -0.65325927734375, -0.482421875, -0.31158447265625, -0.1407470703125, 0.03009033203125, 0.200927734375, 0.37176513671875, 0.5426025390625, 0.71343994140625, 0.88427734375, 1.05511474609375, 1.2259521484375, 1.39678955078125, 1.567626953125, 1.73846435546875, 1.9093017578125, 2.08013916015625, 2.2509765625, 2.42181396484375, 2.5926513671875, 2.76348876953125, 2.934326171875, 3.10516357421875, 3.2760009765625, 3.44683837890625, 3.61767578125, 3.78851318359375, 3.9593505859375, 4.13018798828125, 4.301025390625, 4.47186279296875, 4.6427001953125, 4.81353759765625, 4.984375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 11.0, 12.0, 5.0, 27.0, 57.0, 61.0, 92.0, 105.0, 134.0, 150.0, 122.0, 94.0, 51.0, 38.0, 32.0, 19.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.46142578125, -0.45235633850097656, -0.4432868957519531, -0.4342174530029297, -0.42514801025390625, -0.4160785675048828, -0.4070091247558594, -0.39793968200683594, -0.3888702392578125, -0.37980079650878906, -0.3707313537597656, -0.3616619110107422, -0.35259246826171875, -0.3435230255126953, -0.3344535827636719, -0.32538414001464844, -0.316314697265625, -0.30724525451660156, -0.2981758117675781, -0.2891063690185547, -0.28003692626953125, -0.2709674835205078, -0.2618980407714844, -0.25282859802246094, -0.2437591552734375, -0.23468971252441406, -0.22562026977539062, -0.2165508270263672, -0.20748138427734375, -0.1984119415283203, -0.18934249877929688, -0.18027305603027344, -0.17120361328125, -0.16213417053222656, -0.15306472778320312, -0.1439952850341797, -0.13492584228515625, -0.1258563995361328, -0.11678695678710938, -0.10771751403808594, -0.0986480712890625, -0.08957862854003906, -0.08050918579101562, -0.07143974304199219, -0.06237030029296875, -0.05330085754394531, -0.044231414794921875, -0.03516197204589844, -0.026092529296875, -0.017023086547851562, -0.007953643798828125, 0.0011157989501953125, 0.01018524169921875, 0.019254684448242188, 0.028324127197265625, 0.03739356994628906, 0.0464630126953125, 0.05553245544433594, 0.06460189819335938, 0.07367134094238281, 0.08274078369140625, 0.09181022644042969, 0.10087966918945312, 0.10994911193847656, 0.1190185546875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 5.0, 5.0, 12.0, 20.0, 24.0, 37.0, 44.0, 68.0, 98.0, 132.0, 188.0, 287.0, 387.0, 587.0, 1132.0, 2009.0, 4050.0, 9456.0, 23492.0, 64527.0, 190299.0, 378572.0, 238212.0, 83135.0, 29456.0, 11413.0, 4944.0, 2478.0, 1301.0, 729.0, 454.0, 317.0, 211.0, 130.0, 81.0, 65.0, 53.0, 47.0, 20.0, 19.0, 12.0, 11.0, 7.0, 7.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.3720703125, -1.3300018310546875, -1.287933349609375, -1.2458648681640625, -1.20379638671875, -1.1617279052734375, -1.119659423828125, -1.0775909423828125, -1.0355224609375, -0.9934539794921875, -0.951385498046875, -0.9093170166015625, -0.86724853515625, -0.8251800537109375, -0.783111572265625, -0.7410430908203125, -0.698974609375, -0.6569061279296875, -0.614837646484375, -0.5727691650390625, -0.53070068359375, -0.4886322021484375, -0.446563720703125, -0.4044952392578125, -0.3624267578125, -0.3203582763671875, -0.278289794921875, -0.2362213134765625, -0.19415283203125, -0.1520843505859375, -0.110015869140625, -0.0679473876953125, -0.02587890625, 0.0161895751953125, 0.058258056640625, 0.1003265380859375, 0.14239501953125, 0.1844635009765625, 0.226531982421875, 0.2686004638671875, 0.3106689453125, 0.3527374267578125, 0.394805908203125, 0.4368743896484375, 0.47894287109375, 0.5210113525390625, 0.563079833984375, 0.6051483154296875, 0.647216796875, 0.6892852783203125, 0.731353759765625, 0.7734222412109375, 0.81549072265625, 0.8575592041015625, 0.899627685546875, 0.9416961669921875, 0.9837646484375, 1.0258331298828125, 1.067901611328125, 1.1099700927734375, 1.15203857421875, 1.1941070556640625, 1.236175537109375, 1.2782440185546875, 1.3203125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 10.0, 10.0, 13.0, 10.0, 25.0, 20.0, 18.0, 25.0, 30.0, 35.0, 28.0, 34.0, 35.0, 37.0, 46.0, 42.0, 45.0, 60.0, 36.0, 52.0, 48.0, 32.0, 46.0, 32.0, 40.0, 29.0, 28.0, 16.0, 16.0, 20.0, 13.0, 14.0, 11.0, 8.0, 6.0, 7.0, 3.0, 4.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.68701171875, -0.6637496948242188, -0.6404876708984375, -0.6172256469726562, -0.593963623046875, -0.5707015991210938, -0.5474395751953125, -0.5241775512695312, -0.50091552734375, -0.47765350341796875, -0.4543914794921875, -0.43112945556640625, -0.407867431640625, -0.38460540771484375, -0.3613433837890625, -0.33808135986328125, -0.3148193359375, -0.29155731201171875, -0.2682952880859375, -0.24503326416015625, -0.221771240234375, -0.19850921630859375, -0.1752471923828125, -0.15198516845703125, -0.12872314453125, -0.10546112060546875, -0.0821990966796875, -0.05893707275390625, -0.035675048828125, -0.01241302490234375, 0.0108489990234375, 0.03411102294921875, 0.057373046875, 0.08063507080078125, 0.1038970947265625, 0.12715911865234375, 0.150421142578125, 0.17368316650390625, 0.1969451904296875, 0.22020721435546875, 0.24346923828125, 0.26673126220703125, 0.2899932861328125, 0.31325531005859375, 0.336517333984375, 0.35977935791015625, 0.3830413818359375, 0.40630340576171875, 0.4295654296875, 0.45282745361328125, 0.4760894775390625, 0.49935150146484375, 0.522613525390625, 0.5458755493164062, 0.5691375732421875, 0.5923995971679688, 0.61566162109375, 0.6389236450195312, 0.6621856689453125, 0.6854476928710938, 0.708709716796875, 0.7319717407226562, 0.7552337646484375, 0.7784957885742188, 0.8017578125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 9.0, 8.0, 19.0, 23.0, 28.0, 36.0, 72.0, 105.0, 197.0, 350.0, 590.0, 1242.0, 2739.0, 6955.0, 21991.0, 95236.0, 483431.0, 346353.0, 63281.0, 16031.0, 5439.0, 2121.0, 1017.0, 537.0, 299.0, 165.0, 104.0, 61.0, 40.0, 20.0, 21.0, 11.0, 7.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.0859375, -2.01837158203125, -1.9508056640625, -1.88323974609375, -1.815673828125, -1.74810791015625, -1.6805419921875, -1.61297607421875, -1.54541015625, -1.47784423828125, -1.4102783203125, -1.34271240234375, -1.275146484375, -1.20758056640625, -1.1400146484375, -1.07244873046875, -1.0048828125, -0.93731689453125, -0.8697509765625, -0.80218505859375, -0.734619140625, -0.66705322265625, -0.5994873046875, -0.53192138671875, -0.46435546875, -0.39678955078125, -0.3292236328125, -0.26165771484375, -0.194091796875, -0.12652587890625, -0.0589599609375, 0.00860595703125, 0.076171875, 0.14373779296875, 0.2113037109375, 0.27886962890625, 0.346435546875, 0.41400146484375, 0.4815673828125, 0.54913330078125, 0.61669921875, 0.68426513671875, 0.7518310546875, 0.81939697265625, 0.886962890625, 0.95452880859375, 1.0220947265625, 1.08966064453125, 1.1572265625, 1.22479248046875, 1.2923583984375, 1.35992431640625, 1.427490234375, 1.49505615234375, 1.5626220703125, 1.63018798828125, 1.69775390625, 1.76531982421875, 1.8328857421875, 1.90045166015625, 1.968017578125, 2.03558349609375, 2.1031494140625, 2.17071533203125, 2.23828125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 10.0, 10.0, 18.0, 21.0, 42.0, 38.0, 52.0, 82.0, 86.0, 120.0, 111.0, 110.0, 96.0, 57.0, 37.0, 25.0, 31.0, 18.0, 13.0, 7.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0004458427429199219, -0.0004310011863708496, -0.00041615962982177734, -0.0004013180732727051, -0.0003864765167236328, -0.00037163496017456055, -0.0003567934036254883, -0.000341951847076416, -0.00032711029052734375, -0.0003122687339782715, -0.0002974271774291992, -0.00028258562088012695, -0.0002677440643310547, -0.0002529025077819824, -0.00023806095123291016, -0.0002232193946838379, -0.00020837783813476562, -0.00019353628158569336, -0.0001786947250366211, -0.00016385316848754883, -0.00014901161193847656, -0.0001341700553894043, -0.00011932849884033203, -0.00010448694229125977, -8.96453857421875e-05, -7.480382919311523e-05, -5.996227264404297e-05, -4.51207160949707e-05, -3.0279159545898438e-05, -1.5437602996826172e-05, -5.960464477539062e-07, 1.424551010131836e-05, 2.9087066650390625e-05, 4.392862319946289e-05, 5.8770179748535156e-05, 7.361173629760742e-05, 8.845329284667969e-05, 0.00010329484939575195, 0.00011813640594482422, 0.00013297796249389648, 0.00014781951904296875, 0.00016266107559204102, 0.00017750263214111328, 0.00019234418869018555, 0.0002071857452392578, 0.00022202730178833008, 0.00023686885833740234, 0.0002517104148864746, 0.0002665519714355469, 0.00028139352798461914, 0.0002962350845336914, 0.00031107664108276367, 0.00032591819763183594, 0.0003407597541809082, 0.00035560131072998047, 0.00037044286727905273, 0.000385284423828125, 0.00040012598037719727, 0.00041496753692626953, 0.0004298090934753418, 0.00044465065002441406, 0.00045949220657348633, 0.0004743337631225586, 0.0004891753196716309, 0.0005040168762207031]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 5.0, 8.0, 21.0, 19.0, 49.0, 53.0, 100.0, 175.0, 315.0, 567.0, 1205.0, 2758.0, 7936.0, 30676.0, 187465.0, 632570.0, 147717.0, 25769.0, 6647.0, 2255.0, 1090.0, 479.0, 251.0, 159.0, 98.0, 54.0, 43.0, 20.0, 10.0, 7.0, 10.0, 4.0, 6.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.11328125, -2.03021240234375, -1.9471435546875, -1.86407470703125, -1.781005859375, -1.69793701171875, -1.6148681640625, -1.53179931640625, -1.44873046875, -1.36566162109375, -1.2825927734375, -1.19952392578125, -1.116455078125, -1.03338623046875, -0.9503173828125, -0.86724853515625, -0.7841796875, -0.70111083984375, -0.6180419921875, -0.53497314453125, -0.451904296875, -0.36883544921875, -0.2857666015625, -0.20269775390625, -0.11962890625, -0.03656005859375, 0.0465087890625, 0.12957763671875, 0.212646484375, 0.29571533203125, 0.3787841796875, 0.46185302734375, 0.544921875, 0.62799072265625, 0.7110595703125, 0.79412841796875, 0.877197265625, 0.96026611328125, 1.0433349609375, 1.12640380859375, 1.20947265625, 1.29254150390625, 1.3756103515625, 1.45867919921875, 1.541748046875, 1.62481689453125, 1.7078857421875, 1.79095458984375, 1.8740234375, 1.95709228515625, 2.0401611328125, 2.12322998046875, 2.206298828125, 2.28936767578125, 2.3724365234375, 2.45550537109375, 2.53857421875, 2.62164306640625, 2.7047119140625, 2.78778076171875, 2.870849609375, 2.95391845703125, 3.0369873046875, 3.12005615234375, 3.203125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 9.0, 10.0, 17.0, 10.0, 14.0, 33.0, 36.0, 50.0, 78.0, 84.0, 107.0, 121.0, 115.0, 94.0, 64.0, 54.0, 39.0, 27.0, 11.0, 9.0, 6.0, 8.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.66015625, -1.617828369140625, -1.57550048828125, -1.533172607421875, -1.4908447265625, -1.448516845703125, -1.40618896484375, -1.363861083984375, -1.321533203125, -1.279205322265625, -1.23687744140625, -1.194549560546875, -1.1522216796875, -1.109893798828125, -1.06756591796875, -1.025238037109375, -0.98291015625, -0.940582275390625, -0.89825439453125, -0.855926513671875, -0.8135986328125, -0.771270751953125, -0.72894287109375, -0.686614990234375, -0.644287109375, -0.601959228515625, -0.55963134765625, -0.517303466796875, -0.4749755859375, -0.432647705078125, -0.39031982421875, -0.347991943359375, -0.3056640625, -0.263336181640625, -0.22100830078125, -0.178680419921875, -0.1363525390625, -0.094024658203125, -0.05169677734375, -0.009368896484375, 0.032958984375, 0.075286865234375, 0.11761474609375, 0.159942626953125, 0.2022705078125, 0.244598388671875, 0.28692626953125, 0.329254150390625, 0.37158203125, 0.413909912109375, 0.45623779296875, 0.498565673828125, 0.5408935546875, 0.583221435546875, 0.62554931640625, 0.667877197265625, 0.710205078125, 0.752532958984375, 0.79486083984375, 0.837188720703125, 0.8795166015625, 0.921844482421875, 0.96417236328125, 1.006500244140625, 1.048828125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 35.0, 582.0, 358.0, 25.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-102.9710464477539, -101.02095794677734, -99.07086181640625, -97.12077331542969, -95.1706771850586, -93.22058868408203, -91.27049255371094, -89.32040405273438, -87.37031555175781, -85.42022705078125, -83.47013092041016, -81.5200424194336, -79.5699462890625, -77.61985778808594, -75.66976928710938, -73.71967315673828, -71.76957702636719, -69.81948852539062, -67.86939239501953, -65.91930389404297, -63.96921157836914, -62.01911926269531, -60.069026947021484, -58.118934631347656, -56.168846130371094, -54.218753814697266, -52.26866149902344, -50.318572998046875, -48.36848068237305, -46.41838836669922, -44.46829605102539, -42.51820373535156, -40.56810760498047, -38.61801528930664, -36.66792297363281, -34.71783447265625, -32.76774215698242, -30.817649841308594, -28.867557525634766, -26.917465209960938, -24.967376708984375, -23.017284393310547, -21.06719398498535, -19.117101669311523, -17.167009353637695, -15.216917991638184, -13.266826629638672, -11.316734313964844, -9.366641998291016, -7.416550159454346, -5.466458320617676, -3.516366958618164, -1.5662751197814941, 0.3838167190551758, 2.3339080810546875, 4.284000396728516, 6.234091758728027, 8.184183120727539, 10.134275436401367, 12.084366798400879, 14.03445816040039, 15.984550476074219, 17.934642791748047, 19.884735107421875, 21.83482551574707]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 2.0, 5.0, 3.0, 8.0, 7.0, 14.0, 13.0, 13.0, 25.0, 27.0, 30.0, 46.0, 55.0, 56.0, 42.0, 55.0, 56.0, 69.0, 48.0, 66.0, 41.0, 44.0, 35.0, 48.0, 33.0, 31.0, 27.0, 19.0, 13.0, 12.0, 12.0, 9.0, 10.0, 7.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.199690818786621, -5.981070518493652, -5.762450218200684, -5.543830394744873, -5.325210094451904, -5.1065897941589355, -4.887969970703125, -4.669349670410156, -4.4507293701171875, -4.232109069824219, -4.01348876953125, -3.7948689460754395, -3.5762486457824707, -3.357628345489502, -3.1390082836151123, -2.9203882217407227, -2.701767921447754, -2.483147621154785, -2.2645275592803955, -2.045907497406006, -1.827287197113037, -1.608667016029358, -1.3900468349456787, -1.1714266538619995, -0.9528064727783203, -0.7341862916946411, -0.5155661106109619, -0.2969459295272827, -0.07832574844360352, 0.14029443264007568, 0.3589146137237549, 0.5775347948074341, 0.7961544990539551, 1.0147746801376343, 1.2333948612213135, 1.4520150423049927, 1.6706352233886719, 1.889255404472351, 2.1078755855560303, 2.32649564743042, 2.5451159477233887, 2.7637362480163574, 2.982356309890747, 3.2009763717651367, 3.4195966720581055, 3.638216972351074, 3.856837034225464, 4.0754570960998535, 4.294077396392822, 4.512697696685791, 4.731317520141602, 4.94993782043457, 5.168558120727539, 5.387178421020508, 5.605798721313477, 5.824418544769287, 6.043038845062256, 6.261659145355225, 6.480278968811035, 6.698899269104004, 6.917519569396973, 7.136139869689941, 7.35476016998291, 7.573379993438721, 7.7920002937316895]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 8.0, 5.0, 15.0, 18.0, 13.0, 32.0, 43.0, 62.0, 97.0, 161.0, 255.0, 1252.0, 35023.0, 4129691.0, 25622.0, 1222.0, 314.0, 150.0, 101.0, 61.0, 41.0, 23.0, 12.0, 20.0, 12.0, 6.0, 9.0, 2.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-17.953125, -17.5093994140625, -17.065673828125, -16.6219482421875, -16.17822265625, -15.7344970703125, -15.290771484375, -14.8470458984375, -14.4033203125, -13.9595947265625, -13.515869140625, -13.0721435546875, -12.62841796875, -12.1846923828125, -11.740966796875, -11.2972412109375, -10.853515625, -10.4097900390625, -9.966064453125, -9.5223388671875, -9.07861328125, -8.6348876953125, -8.191162109375, -7.7474365234375, -7.3037109375, -6.8599853515625, -6.416259765625, -5.9725341796875, -5.52880859375, -5.0850830078125, -4.641357421875, -4.1976318359375, -3.75390625, -3.3101806640625, -2.866455078125, -2.4227294921875, -1.97900390625, -1.5352783203125, -1.091552734375, -0.6478271484375, -0.2041015625, 0.2396240234375, 0.683349609375, 1.1270751953125, 1.57080078125, 2.0145263671875, 2.458251953125, 2.9019775390625, 3.345703125, 3.7894287109375, 4.233154296875, 4.6768798828125, 5.12060546875, 5.5643310546875, 6.008056640625, 6.4517822265625, 6.8955078125, 7.3392333984375, 7.782958984375, 8.2266845703125, 8.67041015625, 9.1141357421875, 9.557861328125, 10.0015869140625, 10.4453125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 10.0, 12.0, 16.0, 39.0, 48.0, 74.0, 100.0, 118.0, 123.0, 114.0, 99.0, 75.0, 71.0, 44.0, 32.0, 12.0, 9.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.50537109375, -0.4932708740234375, -0.481170654296875, -0.4690704345703125, -0.45697021484375, -0.4448699951171875, -0.432769775390625, -0.4206695556640625, -0.4085693359375, -0.3964691162109375, -0.384368896484375, -0.3722686767578125, -0.36016845703125, -0.3480682373046875, -0.335968017578125, -0.3238677978515625, -0.311767578125, -0.2996673583984375, -0.287567138671875, -0.2754669189453125, -0.26336669921875, -0.2512664794921875, -0.239166259765625, -0.2270660400390625, -0.2149658203125, -0.2028656005859375, -0.190765380859375, -0.1786651611328125, -0.16656494140625, -0.1544647216796875, -0.142364501953125, -0.1302642822265625, -0.1181640625, -0.1060638427734375, -0.093963623046875, -0.0818634033203125, -0.06976318359375, -0.0576629638671875, -0.045562744140625, -0.0334625244140625, -0.0213623046875, -0.0092620849609375, 0.002838134765625, 0.0149383544921875, 0.02703857421875, 0.0391387939453125, 0.051239013671875, 0.0633392333984375, 0.075439453125, 0.0875396728515625, 0.099639892578125, 0.1117401123046875, 0.12384033203125, 0.1359405517578125, 0.148040771484375, 0.1601409912109375, 0.1722412109375, 0.1843414306640625, 0.196441650390625, 0.2085418701171875, 0.22064208984375, 0.2327423095703125, 0.244842529296875, 0.2569427490234375, 0.26904296875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 10.0, 3.0, 8.0, 15.0, 21.0, 27.0, 31.0, 43.0, 51.0, 77.0, 97.0, 160.0, 313.0, 948.0, 18122.0, 4149694.0, 23101.0, 940.0, 252.0, 122.0, 60.0, 55.0, 44.0, 20.0, 22.0, 15.0, 12.0, 11.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.90625, -19.3612060546875, -18.816162109375, -18.2711181640625, -17.72607421875, -17.1810302734375, -16.635986328125, -16.0909423828125, -15.5458984375, -15.0008544921875, -14.455810546875, -13.9107666015625, -13.36572265625, -12.8206787109375, -12.275634765625, -11.7305908203125, -11.185546875, -10.6405029296875, -10.095458984375, -9.5504150390625, -9.00537109375, -8.4603271484375, -7.915283203125, -7.3702392578125, -6.8251953125, -6.2801513671875, -5.735107421875, -5.1900634765625, -4.64501953125, -4.0999755859375, -3.554931640625, -3.0098876953125, -2.46484375, -1.9197998046875, -1.374755859375, -0.8297119140625, -0.28466796875, 0.2603759765625, 0.805419921875, 1.3504638671875, 1.8955078125, 2.4405517578125, 2.985595703125, 3.5306396484375, 4.07568359375, 4.6207275390625, 5.165771484375, 5.7108154296875, 6.255859375, 6.8009033203125, 7.345947265625, 7.8909912109375, 8.43603515625, 8.9810791015625, 9.526123046875, 10.0711669921875, 10.6162109375, 11.1612548828125, 11.706298828125, 12.2513427734375, 12.79638671875, 13.3414306640625, 13.886474609375, 14.4315185546875, 14.9765625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 16.0, 46.0, 209.0, 2967.0, 673.0, 128.0, 32.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.421875, -4.339630126953125, -4.25738525390625, -4.175140380859375, -4.0928955078125, -4.010650634765625, -3.92840576171875, -3.846160888671875, -3.763916015625, -3.681671142578125, -3.59942626953125, -3.517181396484375, -3.4349365234375, -3.352691650390625, -3.27044677734375, -3.188201904296875, -3.10595703125, -3.023712158203125, -2.94146728515625, -2.859222412109375, -2.7769775390625, -2.694732666015625, -2.61248779296875, -2.530242919921875, -2.447998046875, -2.365753173828125, -2.28350830078125, -2.201263427734375, -2.1190185546875, -2.036773681640625, -1.95452880859375, -1.872283935546875, -1.7900390625, -1.707794189453125, -1.62554931640625, -1.543304443359375, -1.4610595703125, -1.378814697265625, -1.29656982421875, -1.214324951171875, -1.132080078125, -1.049835205078125, -0.96759033203125, -0.885345458984375, -0.8031005859375, -0.720855712890625, -0.63861083984375, -0.556365966796875, -0.47412109375, -0.391876220703125, -0.30963134765625, -0.227386474609375, -0.1451416015625, -0.062896728515625, 0.01934814453125, 0.101593017578125, 0.183837890625, 0.266082763671875, 0.34832763671875, 0.430572509765625, 0.5128173828125, 0.595062255859375, 0.67730712890625, 0.759552001953125, 0.841796875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 15.0, 305.0, 606.0, 68.0, 10.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.55258560180664, -48.3507194519043, -47.14885711669922, -45.946990966796875, -44.7451286315918, -43.54326248168945, -42.341400146484375, -41.13953399658203, -39.93766784667969, -38.735801696777344, -37.533939361572266, -36.33207321166992, -35.130210876464844, -33.9283447265625, -32.72648239135742, -31.524616241455078, -30.32275390625, -29.12088966369629, -27.919025421142578, -26.717161178588867, -25.515296936035156, -24.313430786132812, -23.1115665435791, -21.90970230102539, -20.70783805847168, -19.50597381591797, -18.304109573364258, -17.102245330810547, -15.90038013458252, -14.698515892028809, -13.496650695800781, -12.29478645324707, -11.092924118041992, -9.891059875488281, -8.68919563293457, -7.487330436706543, -6.285466194152832, -5.083601951599121, -3.881737232208252, -2.679872512817383, -1.4780082702636719, -0.27614378929138184, 0.9257206916809082, 2.1275851726531982, 3.3294496536254883, 4.531313896179199, 5.733178615570068, 6.9350433349609375, 8.136907577514648, 9.33877182006836, 10.54063606262207, 11.742501258850098, 12.944365501403809, 14.14622974395752, 15.348094940185547, 16.549959182739258, 17.75182342529297, 18.95368766784668, 20.15555191040039, 21.3574161529541, 22.559280395507812, 23.761146545410156, 24.963010787963867, 26.164875030517578, 27.36673927307129]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 15.0, 25.0, 40.0, 79.0, 97.0, 133.0, 139.0, 131.0, 125.0, 81.0, 67.0, 33.0, 14.0, 9.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.94870376586914, -10.590127944946289, -10.231553077697754, -9.872977256774902, -9.514402389526367, -9.155826568603516, -8.797250747680664, -8.438675880432129, -8.080100059509277, -7.721524715423584, -7.362949371337891, -7.004373550415039, -6.645798206329346, -6.287222862243652, -5.928647518157959, -5.570072174072266, -5.211496829986572, -4.852921485900879, -4.4943461418151855, -4.135770797729492, -3.7771949768066406, -3.4186196327209473, -3.060044288635254, -2.7014687061309814, -2.342893362045288, -1.9843178987503052, -1.6257424354553223, -1.267167091369629, -0.908591628074646, -0.5500161647796631, -0.19144082069396973, 0.16713476181030273, 0.5257101058959961, 0.884285569190979, 1.242861032485962, 1.6014363765716553, 1.9600118398666382, 2.318587303161621, 2.6771626472473145, 3.035738229751587, 3.3943135738372803, 3.7528889179229736, 4.111464500427246, 4.4700398445129395, 4.828615188598633, 5.187191009521484, 5.5457658767700195, 5.904341697692871, 6.2629170417785645, 6.621492385864258, 6.980067729949951, 7.3386430740356445, 7.697218894958496, 8.055793762207031, 8.414369583129883, 8.772945404052734, 9.13152027130127, 9.490096092224121, 9.848670959472656, 10.207246780395508, 10.565821647644043, 10.924397468566895, 11.28297233581543, 11.641548156738281, 12.000123977661133]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 4.0, 12.0, 5.0, 10.0, 6.0, 11.0, 19.0, 19.0, 38.0, 41.0, 40.0, 56.0, 122.0, 174.0, 308.0, 573.0, 1472.0, 5043.0, 36163.0, 557834.0, 413298.0, 26547.0, 4162.0, 1259.0, 521.0, 282.0, 142.0, 120.0, 62.0, 32.0, 36.0, 26.0, 16.0, 19.0, 9.0, 14.0, 13.0, 7.0, 7.0, 5.0, 11.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-5.75, -5.5699462890625, -5.389892578125, -5.2098388671875, -5.02978515625, -4.8497314453125, -4.669677734375, -4.4896240234375, -4.3095703125, -4.1295166015625, -3.949462890625, -3.7694091796875, -3.58935546875, -3.4093017578125, -3.229248046875, -3.0491943359375, -2.869140625, -2.6890869140625, -2.509033203125, -2.3289794921875, -2.14892578125, -1.9688720703125, -1.788818359375, -1.6087646484375, -1.4287109375, -1.2486572265625, -1.068603515625, -0.8885498046875, -0.70849609375, -0.5284423828125, -0.348388671875, -0.1683349609375, 0.01171875, 0.1917724609375, 0.371826171875, 0.5518798828125, 0.73193359375, 0.9119873046875, 1.092041015625, 1.2720947265625, 1.4521484375, 1.6322021484375, 1.812255859375, 1.9923095703125, 2.17236328125, 2.3524169921875, 2.532470703125, 2.7125244140625, 2.892578125, 3.0726318359375, 3.252685546875, 3.4327392578125, 3.61279296875, 3.7928466796875, 3.972900390625, 4.1529541015625, 4.3330078125, 4.5130615234375, 4.693115234375, 4.8731689453125, 5.05322265625, 5.2332763671875, 5.413330078125, 5.5933837890625, 5.7734375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 10.0, 21.0, 23.0, 41.0, 58.0, 81.0, 104.0, 115.0, 110.0, 112.0, 94.0, 66.0, 57.0, 49.0, 30.0, 14.0, 5.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.79443359375, -0.7747688293457031, -0.7551040649414062, -0.7354393005371094, -0.7157745361328125, -0.6961097717285156, -0.6764450073242188, -0.6567802429199219, -0.637115478515625, -0.6174507141113281, -0.5977859497070312, -0.5781211853027344, -0.5584564208984375, -0.5387916564941406, -0.5191268920898438, -0.4994621276855469, -0.47979736328125, -0.4601325988769531, -0.44046783447265625, -0.4208030700683594, -0.4011383056640625, -0.3814735412597656, -0.36180877685546875, -0.3421440124511719, -0.322479248046875, -0.3028144836425781, -0.28314971923828125, -0.2634849548339844, -0.2438201904296875, -0.22415542602539062, -0.20449066162109375, -0.18482589721679688, -0.1651611328125, -0.14549636840820312, -0.12583160400390625, -0.10616683959960938, -0.0865020751953125, -0.06683731079101562, -0.04717254638671875, -0.027507781982421875, -0.007843017578125, 0.011821746826171875, 0.03148651123046875, 0.051151275634765625, 0.0708160400390625, 0.09048080444335938, 0.11014556884765625, 0.12981033325195312, 0.14947509765625, 0.16913986206054688, 0.18880462646484375, 0.20846939086914062, 0.2281341552734375, 0.24779891967773438, 0.26746368408203125, 0.2871284484863281, 0.306793212890625, 0.3264579772949219, 0.34612274169921875, 0.3657875061035156, 0.3854522705078125, 0.4051170349121094, 0.42478179931640625, 0.4444465637207031, 0.464111328125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 4.0, 12.0, 10.0, 14.0, 32.0, 49.0, 70.0, 146.0, 255.0, 517.0, 1122.0, 2847.0, 9761.0, 56379.0, 498559.0, 420520.0, 45493.0, 8238.0, 2560.0, 956.0, 457.0, 241.0, 127.0, 65.0, 42.0, 19.0, 19.0, 9.0, 9.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.42578125, -3.3114013671875, -3.197021484375, -3.0826416015625, -2.96826171875, -2.8538818359375, -2.739501953125, -2.6251220703125, -2.5107421875, -2.3963623046875, -2.281982421875, -2.1676025390625, -2.05322265625, -1.9388427734375, -1.824462890625, -1.7100830078125, -1.595703125, -1.4813232421875, -1.366943359375, -1.2525634765625, -1.13818359375, -1.0238037109375, -0.909423828125, -0.7950439453125, -0.6806640625, -0.5662841796875, -0.451904296875, -0.3375244140625, -0.22314453125, -0.1087646484375, 0.005615234375, 0.1199951171875, 0.234375, 0.3487548828125, 0.463134765625, 0.5775146484375, 0.69189453125, 0.8062744140625, 0.920654296875, 1.0350341796875, 1.1494140625, 1.2637939453125, 1.378173828125, 1.4925537109375, 1.60693359375, 1.7213134765625, 1.835693359375, 1.9500732421875, 2.064453125, 2.1788330078125, 2.293212890625, 2.4075927734375, 2.52197265625, 2.6363525390625, 2.750732421875, 2.8651123046875, 2.9794921875, 3.0938720703125, 3.208251953125, 3.3226318359375, 3.43701171875, 3.5513916015625, 3.665771484375, 3.7801513671875, 3.89453125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 2.0, 4.0, 8.0, 9.0, 11.0, 14.0, 29.0, 33.0, 34.0, 42.0, 59.0, 64.0, 73.0, 74.0, 74.0, 78.0, 66.0, 55.0, 48.0, 60.0, 46.0, 33.0, 20.0, 18.0, 9.0, 16.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.32421875, -2.2550048828125, -2.185791015625, -2.1165771484375, -2.04736328125, -1.9781494140625, -1.908935546875, -1.8397216796875, -1.7705078125, -1.7012939453125, -1.632080078125, -1.5628662109375, -1.49365234375, -1.4244384765625, -1.355224609375, -1.2860107421875, -1.216796875, -1.1475830078125, -1.078369140625, -1.0091552734375, -0.93994140625, -0.8707275390625, -0.801513671875, -0.7322998046875, -0.6630859375, -0.5938720703125, -0.524658203125, -0.4554443359375, -0.38623046875, -0.3170166015625, -0.247802734375, -0.1785888671875, -0.109375, -0.0401611328125, 0.029052734375, 0.0982666015625, 0.16748046875, 0.2366943359375, 0.305908203125, 0.3751220703125, 0.4443359375, 0.5135498046875, 0.582763671875, 0.6519775390625, 0.72119140625, 0.7904052734375, 0.859619140625, 0.9288330078125, 0.998046875, 1.0672607421875, 1.136474609375, 1.2056884765625, 1.27490234375, 1.3441162109375, 1.413330078125, 1.4825439453125, 1.5517578125, 1.6209716796875, 1.690185546875, 1.7593994140625, 1.82861328125, 1.8978271484375, 1.967041015625, 2.0362548828125, 2.10546875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 3.0, 4.0, 8.0, 12.0, 9.0, 14.0, 14.0, 38.0, 35.0, 58.0, 101.0, 150.0, 233.0, 452.0, 754.0, 1603.0, 4056.0, 13503.0, 78664.0, 646727.0, 260777.0, 29322.0, 6945.0, 2527.0, 1148.0, 537.0, 319.0, 191.0, 103.0, 54.0, 58.0, 38.0, 26.0, 15.0, 16.0, 7.0, 1.0, 8.0, 3.0, 9.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.36328125, -2.274932861328125, -2.18658447265625, -2.098236083984375, -2.0098876953125, -1.921539306640625, -1.83319091796875, -1.744842529296875, -1.656494140625, -1.568145751953125, -1.47979736328125, -1.391448974609375, -1.3031005859375, -1.214752197265625, -1.12640380859375, -1.038055419921875, -0.94970703125, -0.861358642578125, -0.77301025390625, -0.684661865234375, -0.5963134765625, -0.507965087890625, -0.41961669921875, -0.331268310546875, -0.242919921875, -0.154571533203125, -0.06622314453125, 0.022125244140625, 0.1104736328125, 0.198822021484375, 0.28717041015625, 0.375518798828125, 0.4638671875, 0.552215576171875, 0.64056396484375, 0.728912353515625, 0.8172607421875, 0.905609130859375, 0.99395751953125, 1.082305908203125, 1.170654296875, 1.259002685546875, 1.34735107421875, 1.435699462890625, 1.5240478515625, 1.612396240234375, 1.70074462890625, 1.789093017578125, 1.87744140625, 1.965789794921875, 2.05413818359375, 2.142486572265625, 2.2308349609375, 2.319183349609375, 2.40753173828125, 2.495880126953125, 2.584228515625, 2.672576904296875, 2.76092529296875, 2.849273681640625, 2.9376220703125, 3.025970458984375, 3.11431884765625, 3.202667236328125, 3.291015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 2.0, 8.0, 4.0, 6.0, 14.0, 9.0, 30.0, 23.0, 21.0, 23.0, 36.0, 41.0, 53.0, 41.0, 55.0, 80.0, 66.0, 68.0, 72.0, 53.0, 62.0, 36.0, 34.0, 33.0, 21.0, 22.0, 21.0, 13.0, 8.0, 12.0, 5.0, 9.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0002872943878173828, -0.00027914345264434814, -0.0002709925174713135, -0.0002628415822982788, -0.00025469064712524414, -0.00024653971195220947, -0.0002383887767791748, -0.00023023784160614014, -0.00022208690643310547, -0.0002139359712600708, -0.00020578503608703613, -0.00019763410091400146, -0.0001894831657409668, -0.00018133223056793213, -0.00017318129539489746, -0.0001650303602218628, -0.00015687942504882812, -0.00014872848987579346, -0.0001405775547027588, -0.00013242661952972412, -0.00012427568435668945, -0.00011612474918365479, -0.00010797381401062012, -9.982287883758545e-05, -9.167194366455078e-05, -8.352100849151611e-05, -7.537007331848145e-05, -6.721913814544678e-05, -5.906820297241211e-05, -5.091726779937744e-05, -4.2766332626342773e-05, -3.4615397453308105e-05, -2.6464462280273438e-05, -1.831352710723877e-05, -1.0162591934204102e-05, -2.0116567611694336e-06, 6.139278411865234e-06, 1.4290213584899902e-05, 2.244114875793457e-05, 3.059208393096924e-05, 3.8743019104003906e-05, 4.6893954277038574e-05, 5.504488945007324e-05, 6.319582462310791e-05, 7.134675979614258e-05, 7.949769496917725e-05, 8.764863014221191e-05, 9.579956531524658e-05, 0.00010395050048828125, 0.00011210143566131592, 0.00012025237083435059, 0.00012840330600738525, 0.00013655424118041992, 0.0001447051763534546, 0.00015285611152648926, 0.00016100704669952393, 0.0001691579818725586, 0.00017730891704559326, 0.00018545985221862793, 0.0001936107873916626, 0.00020176172256469727, 0.00020991265773773193, 0.0002180635929107666, 0.00022621452808380127, 0.00023436546325683594]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 9.0, 6.0, 3.0, 10.0, 9.0, 19.0, 21.0, 21.0, 44.0, 48.0, 93.0, 162.0, 255.0, 552.0, 978.0, 2304.0, 6021.0, 21363.0, 129889.0, 625098.0, 216672.0, 31858.0, 7933.0, 2789.0, 1118.0, 553.0, 271.0, 161.0, 94.0, 61.0, 36.0, 36.0, 18.0, 12.0, 13.0, 7.0, 4.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.529296875, -2.44390869140625, -2.3585205078125, -2.27313232421875, -2.187744140625, -2.10235595703125, -2.0169677734375, -1.93157958984375, -1.84619140625, -1.76080322265625, -1.6754150390625, -1.59002685546875, -1.504638671875, -1.41925048828125, -1.3338623046875, -1.24847412109375, -1.1630859375, -1.07769775390625, -0.9923095703125, -0.90692138671875, -0.821533203125, -0.73614501953125, -0.6507568359375, -0.56536865234375, -0.47998046875, -0.39459228515625, -0.3092041015625, -0.22381591796875, -0.138427734375, -0.05303955078125, 0.0323486328125, 0.11773681640625, 0.203125, 0.28851318359375, 0.3739013671875, 0.45928955078125, 0.544677734375, 0.63006591796875, 0.7154541015625, 0.80084228515625, 0.88623046875, 0.97161865234375, 1.0570068359375, 1.14239501953125, 1.227783203125, 1.31317138671875, 1.3985595703125, 1.48394775390625, 1.5693359375, 1.65472412109375, 1.7401123046875, 1.82550048828125, 1.910888671875, 1.99627685546875, 2.0816650390625, 2.16705322265625, 2.25244140625, 2.33782958984375, 2.4232177734375, 2.50860595703125, 2.593994140625, 2.67938232421875, 2.7647705078125, 2.85015869140625, 2.935546875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 8.0, 7.0, 11.0, 13.0, 26.0, 20.0, 30.0, 51.0, 38.0, 63.0, 57.0, 79.0, 83.0, 60.0, 85.0, 73.0, 62.0, 49.0, 35.0, 38.0, 29.0, 17.0, 12.0, 15.0, 6.0, 9.0, 1.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.388671875, -1.35101318359375, -1.3133544921875, -1.27569580078125, -1.238037109375, -1.20037841796875, -1.1627197265625, -1.12506103515625, -1.08740234375, -1.04974365234375, -1.0120849609375, -0.97442626953125, -0.936767578125, -0.89910888671875, -0.8614501953125, -0.82379150390625, -0.7861328125, -0.74847412109375, -0.7108154296875, -0.67315673828125, -0.635498046875, -0.59783935546875, -0.5601806640625, -0.52252197265625, -0.48486328125, -0.44720458984375, -0.4095458984375, -0.37188720703125, -0.334228515625, -0.29656982421875, -0.2589111328125, -0.22125244140625, -0.18359375, -0.14593505859375, -0.1082763671875, -0.07061767578125, -0.032958984375, 0.00469970703125, 0.0423583984375, 0.08001708984375, 0.11767578125, 0.15533447265625, 0.1929931640625, 0.23065185546875, 0.268310546875, 0.30596923828125, 0.3436279296875, 0.38128662109375, 0.4189453125, 0.45660400390625, 0.4942626953125, 0.53192138671875, 0.569580078125, 0.60723876953125, 0.6448974609375, 0.68255615234375, 0.72021484375, 0.75787353515625, 0.7955322265625, 0.83319091796875, 0.870849609375, 0.90850830078125, 0.9461669921875, 0.98382568359375, 1.021484375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 6.0, 10.0, 34.0, 52.0, 94.0, 181.0, 245.0, 166.0, 90.0, 53.0, 27.0, 21.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.711803436279297, -26.016265869140625, -25.320730209350586, -24.625192642211914, -23.929655075073242, -23.234119415283203, -22.53858184814453, -21.84304428100586, -21.147506713867188, -20.451969146728516, -19.756433486938477, -19.060895919799805, -18.365358352661133, -17.669822692871094, -16.974285125732422, -16.27874755859375, -15.583211898803711, -14.887675285339355, -14.192137718200684, -13.496601104736328, -12.801063537597656, -12.1055269241333, -11.409990310668945, -10.714452743530273, -10.018916130065918, -9.323379516601562, -8.62784194946289, -7.932305335998535, -7.2367682456970215, -6.541231155395508, -5.845694541931152, -5.150157451629639, -4.454618453979492, -3.7590813636779785, -3.063544511795044, -2.3680076599121094, -1.6724705696105957, -0.976933479309082, -0.28139686584472656, 0.4141402244567871, 1.1096773147583008, 1.805214285850525, 2.500751256942749, 3.1962881088256836, 3.8918251991271973, 4.587362289428711, 5.282898902893066, 5.97843599319458, 6.673973083496094, 7.369510173797607, 8.065047264099121, 8.760583877563477, 9.456121444702148, 10.151658058166504, 10.84719467163086, 11.542732238769531, 12.238268852233887, 12.933805465698242, 13.629343032836914, 14.32487964630127, 15.020416259765625, 15.715953826904297, 16.41149139404297, 17.107027053833008, 17.80256462097168]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 6.0, 6.0, 10.0, 19.0, 28.0, 32.0, 32.0, 36.0, 51.0, 65.0, 62.0, 70.0, 83.0, 70.0, 71.0, 61.0, 61.0, 56.0, 38.0, 35.0, 25.0, 27.0, 18.0, 12.0, 11.0, 3.0, 7.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.241382598876953, -16.69890594482422, -16.156431198120117, -15.6139554977417, -15.071479797363281, -14.529004096984863, -13.986528396606445, -13.444052696228027, -12.90157699584961, -12.359101295471191, -11.816625595092773, -11.274149894714355, -10.731674194335938, -10.18919849395752, -9.646722793579102, -9.104247093200684, -8.561771392822266, -8.019295692443848, -7.47681999206543, -6.934344291687012, -6.391868591308594, -5.849392890930176, -5.306917190551758, -4.76444149017334, -4.221965789794922, -3.679490089416504, -3.137014389038086, -2.594538688659668, -2.05206298828125, -1.509587287902832, -0.9671115875244141, -0.4246358871459961, 0.11783981323242188, 0.6603155136108398, 1.2027912139892578, 1.7452669143676758, 2.2877426147460938, 2.8302183151245117, 3.3726940155029297, 3.9151697158813477, 4.457645416259766, 5.000121116638184, 5.542596817016602, 6.0850725173950195, 6.6275482177734375, 7.1700239181518555, 7.712499618530273, 8.254975318908691, 8.79745101928711, 9.339926719665527, 9.882402420043945, 10.424878120422363, 10.967353820800781, 11.5098295211792, 12.052305221557617, 12.594780921936035, 13.137256622314453, 13.679732322692871, 14.222208023071289, 14.764683723449707, 15.307159423828125, 15.849635124206543, 16.39211082458496, 16.934585571289062, 17.477062225341797]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 4.0, 8.0, 7.0, 18.0, 9.0, 15.0, 24.0, 36.0, 45.0, 71.0, 113.0, 159.0, 290.0, 556.0, 1662.0, 6641.0, 54926.0, 3933573.0, 177954.0, 13804.0, 2685.0, 887.0, 343.0, 187.0, 92.0, 52.0, 35.0, 17.0, 10.0, 11.0, 5.0, 7.0, 7.0, 5.0, 3.0, 4.0, 0.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.796875, -8.53570556640625, -8.2745361328125, -8.01336669921875, -7.752197265625, -7.49102783203125, -7.2298583984375, -6.96868896484375, -6.70751953125, -6.44635009765625, -6.1851806640625, -5.92401123046875, -5.662841796875, -5.40167236328125, -5.1405029296875, -4.87933349609375, -4.6181640625, -4.35699462890625, -4.0958251953125, -3.83465576171875, -3.573486328125, -3.31231689453125, -3.0511474609375, -2.78997802734375, -2.52880859375, -2.26763916015625, -2.0064697265625, -1.74530029296875, -1.484130859375, -1.22296142578125, -0.9617919921875, -0.70062255859375, -0.439453125, -0.17828369140625, 0.0828857421875, 0.34405517578125, 0.605224609375, 0.86639404296875, 1.1275634765625, 1.38873291015625, 1.64990234375, 1.91107177734375, 2.1722412109375, 2.43341064453125, 2.694580078125, 2.95574951171875, 3.2169189453125, 3.47808837890625, 3.7392578125, 4.00042724609375, 4.2615966796875, 4.52276611328125, 4.783935546875, 5.04510498046875, 5.3062744140625, 5.56744384765625, 5.82861328125, 6.08978271484375, 6.3509521484375, 6.61212158203125, 6.873291015625, 7.13446044921875, 7.3956298828125, 7.65679931640625, 7.91796875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 4.0, 6.0, 5.0, 16.0, 20.0, 39.0, 48.0, 66.0, 68.0, 109.0, 92.0, 91.0, 97.0, 90.0, 64.0, 59.0, 41.0, 32.0, 21.0, 9.0, 14.0, 2.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7646484375, -0.7436370849609375, -0.722625732421875, -0.7016143798828125, -0.68060302734375, -0.6595916748046875, -0.638580322265625, -0.6175689697265625, -0.5965576171875, -0.5755462646484375, -0.554534912109375, -0.5335235595703125, -0.51251220703125, -0.4915008544921875, -0.470489501953125, -0.4494781494140625, -0.428466796875, -0.4074554443359375, -0.386444091796875, -0.3654327392578125, -0.34442138671875, -0.3234100341796875, -0.302398681640625, -0.2813873291015625, -0.2603759765625, -0.2393646240234375, -0.218353271484375, -0.1973419189453125, -0.17633056640625, -0.1553192138671875, -0.134307861328125, -0.1132965087890625, -0.09228515625, -0.0712738037109375, -0.050262451171875, -0.0292510986328125, -0.00823974609375, 0.0127716064453125, 0.033782958984375, 0.0547943115234375, 0.0758056640625, 0.0968170166015625, 0.117828369140625, 0.1388397216796875, 0.15985107421875, 0.1808624267578125, 0.201873779296875, 0.2228851318359375, 0.243896484375, 0.2649078369140625, 0.285919189453125, 0.3069305419921875, 0.32794189453125, 0.3489532470703125, 0.369964599609375, 0.3909759521484375, 0.4119873046875, 0.4329986572265625, 0.454010009765625, 0.4750213623046875, 0.49603271484375, 0.5170440673828125, 0.538055419921875, 0.5590667724609375, 0.580078125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 8.0, 4.0, 7.0, 13.0, 32.0, 43.0, 59.0, 93.0, 91.0, 194.0, 686.0, 6619.0, 4173346.0, 12034.0, 689.0, 175.0, 61.0, 50.0, 35.0, 18.0, 14.0, 12.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.125, -34.3707275390625, -33.616455078125, -32.8621826171875, -32.10791015625, -31.3536376953125, -30.599365234375, -29.8450927734375, -29.0908203125, -28.3365478515625, -27.582275390625, -26.8280029296875, -26.07373046875, -25.3194580078125, -24.565185546875, -23.8109130859375, -23.056640625, -22.3023681640625, -21.548095703125, -20.7938232421875, -20.03955078125, -19.2852783203125, -18.531005859375, -17.7767333984375, -17.0224609375, -16.2681884765625, -15.513916015625, -14.7596435546875, -14.00537109375, -13.2510986328125, -12.496826171875, -11.7425537109375, -10.98828125, -10.2340087890625, -9.479736328125, -8.7254638671875, -7.97119140625, -7.2169189453125, -6.462646484375, -5.7083740234375, -4.9541015625, -4.1998291015625, -3.445556640625, -2.6912841796875, -1.93701171875, -1.1827392578125, -0.428466796875, 0.3258056640625, 1.080078125, 1.8343505859375, 2.588623046875, 3.3428955078125, 4.09716796875, 4.8514404296875, 5.605712890625, 6.3599853515625, 7.1142578125, 7.8685302734375, 8.622802734375, 9.3770751953125, 10.13134765625, 10.8856201171875, 11.639892578125, 12.3941650390625, 13.1484375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 15.0, 47.0, 135.0, 2587.0, 1132.0, 122.0, 25.0, 10.0, 3.0, 3.0, 1.0, 2.0], "bins": [-6.5625, -6.445121765136719, -6.3277435302734375, -6.210365295410156, -6.092987060546875, -5.975608825683594, -5.8582305908203125, -5.740852355957031, -5.62347412109375, -5.506095886230469, -5.3887176513671875, -5.271339416503906, -5.153961181640625, -5.036582946777344, -4.9192047119140625, -4.801826477050781, -4.6844482421875, -4.567070007324219, -4.4496917724609375, -4.332313537597656, -4.214935302734375, -4.097557067871094, -3.9801788330078125, -3.8628005981445312, -3.74542236328125, -3.6280441284179688, -3.5106658935546875, -3.3932876586914062, -3.275909423828125, -3.1585311889648438, -3.0411529541015625, -2.9237747192382812, -2.806396484375, -2.6890182495117188, -2.5716400146484375, -2.4542617797851562, -2.336883544921875, -2.2195053100585938, -2.1021270751953125, -1.9847488403320312, -1.86737060546875, -1.7499923706054688, -1.6326141357421875, -1.5152359008789062, -1.397857666015625, -1.2804794311523438, -1.1631011962890625, -1.0457229614257812, -0.9283447265625, -0.8109664916992188, -0.6935882568359375, -0.5762100219726562, -0.458831787109375, -0.34145355224609375, -0.2240753173828125, -0.10669708251953125, 0.01068115234375, 0.12805938720703125, 0.2454376220703125, 0.36281585693359375, 0.480194091796875, 0.5975723266601562, 0.7149505615234375, 0.8323287963867188, 0.94970703125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 11.0, 24.0, 91.0, 431.0, 360.0, 62.0, 17.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.955703735351562, -30.11815643310547, -29.280609130859375, -28.44306182861328, -27.60551643371582, -26.767969131469727, -25.930421829223633, -25.09287452697754, -24.255329132080078, -23.417781829833984, -22.58023452758789, -21.742687225341797, -20.905141830444336, -20.067594528198242, -19.23004722595215, -18.392499923706055, -17.55495262145996, -16.717405319213867, -15.87985897064209, -15.042311668395996, -14.204765319824219, -13.367218017578125, -12.529670715332031, -11.692123413085938, -10.85457706451416, -10.017029762268066, -9.179483413696289, -8.341936111450195, -7.50438928604126, -6.666842460632324, -5.8292951583862305, -4.991748332977295, -4.154201507568359, -3.316654682159424, -2.479107618331909, -1.6415605545043945, -0.804013729095459, 0.03353309631347656, 0.8710803985595703, 1.7086272239685059, 2.5461740493774414, 3.383720874786377, 4.2212677001953125, 5.058815002441406, 5.896361827850342, 6.733908653259277, 7.571455955505371, 8.409002304077148, 9.246549606323242, 10.084096908569336, 10.921643257141113, 11.759190559387207, 12.596736907958984, 13.434284210205078, 14.271831512451172, 15.109378814697266, 15.946925163269043, 16.78447151184082, 17.622018814086914, 18.459566116333008, 19.2971134185791, 20.134658813476562, 20.972206115722656, 21.80975341796875, 22.647300720214844]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 8.0, 13.0, 23.0, 40.0, 53.0, 72.0, 87.0, 86.0, 105.0, 101.0, 95.0, 86.0, 81.0, 55.0, 31.0, 22.0, 14.0, 11.0, 10.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.575103759765625, -12.224360466003418, -11.873616218566895, -11.522872924804688, -11.17212963104248, -10.821386337280273, -10.47064208984375, -10.119898796081543, -9.769155502319336, -9.418412208557129, -9.067667961120605, -8.716924667358398, -8.366181373596191, -8.015438079833984, -7.664693832397461, -7.313950538635254, -6.9632062911987305, -6.612462520599365, -6.261719226837158, -5.910975456237793, -5.560232162475586, -5.209488391876221, -4.8587446212768555, -4.508001327514648, -4.157257556915283, -3.806514024734497, -3.455770492553711, -3.1050267219543457, -2.7542831897735596, -2.4035396575927734, -2.052795886993408, -1.702052354812622, -1.3513097763061523, -1.0005662441253662, -0.6498225927352905, -0.29907894134521484, 0.05166459083557129, 0.4024081230163574, 0.7531518936157227, 1.1038954257965088, 1.454638957977295, 1.805382490158081, 2.156126022338867, 2.5068697929382324, 2.8576133251190186, 3.2083568572998047, 3.55910062789917, 3.909844160079956, 4.260587692260742, 4.611331462860107, 4.9620747566223145, 5.31281852722168, 5.663561820983887, 6.014305591583252, 6.365049362182617, 6.715792655944824, 7.0665364265441895, 7.417280197143555, 7.768023490905762, 8.118766784667969, 8.469511032104492, 8.8202543258667, 9.170997619628906, 9.52174186706543, 9.872485160827637]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 6.0, 11.0, 12.0, 19.0, 21.0, 35.0, 42.0, 85.0, 104.0, 179.0, 319.0, 657.0, 1709.0, 7081.0, 49570.0, 541945.0, 402861.0, 35454.0, 5527.0, 1540.0, 591.0, 293.0, 160.0, 103.0, 79.0, 38.0, 44.0, 22.0, 14.0, 8.0, 8.0, 8.0, 1.0, 1.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.81640625, -5.63421630859375, -5.4520263671875, -5.26983642578125, -5.087646484375, -4.90545654296875, -4.7232666015625, -4.54107666015625, -4.35888671875, -4.17669677734375, -3.9945068359375, -3.81231689453125, -3.630126953125, -3.44793701171875, -3.2657470703125, -3.08355712890625, -2.9013671875, -2.71917724609375, -2.5369873046875, -2.35479736328125, -2.172607421875, -1.99041748046875, -1.8082275390625, -1.62603759765625, -1.44384765625, -1.26165771484375, -1.0794677734375, -0.89727783203125, -0.715087890625, -0.53289794921875, -0.3507080078125, -0.16851806640625, 0.013671875, 0.19586181640625, 0.3780517578125, 0.56024169921875, 0.742431640625, 0.92462158203125, 1.1068115234375, 1.28900146484375, 1.47119140625, 1.65338134765625, 1.8355712890625, 2.01776123046875, 2.199951171875, 2.38214111328125, 2.5643310546875, 2.74652099609375, 2.9287109375, 3.11090087890625, 3.2930908203125, 3.47528076171875, 3.657470703125, 3.83966064453125, 4.0218505859375, 4.20404052734375, 4.38623046875, 4.56842041015625, 4.7506103515625, 4.93280029296875, 5.114990234375, 5.29718017578125, 5.4793701171875, 5.66156005859375, 5.84375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 13.0, 15.0, 20.0, 32.0, 41.0, 63.0, 67.0, 86.0, 91.0, 116.0, 88.0, 80.0, 75.0, 66.0, 43.0, 49.0, 18.0, 14.0, 8.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.310546875, -1.2790603637695312, -1.2475738525390625, -1.2160873413085938, -1.184600830078125, -1.1531143188476562, -1.1216278076171875, -1.0901412963867188, -1.05865478515625, -1.0271682739257812, -0.9956817626953125, -0.9641952514648438, -0.932708740234375, -0.9012222290039062, -0.8697357177734375, -0.8382492065429688, -0.8067626953125, -0.7752761840820312, -0.7437896728515625, -0.7123031616210938, -0.680816650390625, -0.6493301391601562, -0.6178436279296875, -0.5863571166992188, -0.55487060546875, -0.5233840942382812, -0.4918975830078125, -0.46041107177734375, -0.428924560546875, -0.39743804931640625, -0.3659515380859375, -0.33446502685546875, -0.302978515625, -0.27149200439453125, -0.2400054931640625, -0.20851898193359375, -0.177032470703125, -0.14554595947265625, -0.1140594482421875, -0.08257293701171875, -0.05108642578125, -0.01959991455078125, 0.0118865966796875, 0.04337310791015625, 0.074859619140625, 0.10634613037109375, 0.1378326416015625, 0.16931915283203125, 0.2008056640625, 0.23229217529296875, 0.2637786865234375, 0.29526519775390625, 0.326751708984375, 0.35823822021484375, 0.3897247314453125, 0.42121124267578125, 0.45269775390625, 0.48418426513671875, 0.5156707763671875, 0.5471572875976562, 0.578643798828125, 0.6101303100585938, 0.6416168212890625, 0.6731033325195312, 0.70458984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 15.0, 11.0, 10.0, 15.0, 28.0, 33.0, 43.0, 54.0, 83.0, 131.0, 215.0, 322.0, 535.0, 904.0, 1704.0, 3586.0, 8720.0, 27867.0, 115205.0, 467625.0, 321868.0, 68711.0, 18402.0, 6237.0, 2755.0, 1376.0, 795.0, 437.0, 283.0, 159.0, 104.0, 95.0, 44.0, 38.0, 23.0, 22.0, 17.0, 17.0, 12.0, 10.0, 4.0, 5.0, 5.0, 5.0, 2.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.78125, -2.6910400390625, -2.600830078125, -2.5106201171875, -2.42041015625, -2.3302001953125, -2.239990234375, -2.1497802734375, -2.0595703125, -1.9693603515625, -1.879150390625, -1.7889404296875, -1.69873046875, -1.6085205078125, -1.518310546875, -1.4281005859375, -1.337890625, -1.2476806640625, -1.157470703125, -1.0672607421875, -0.97705078125, -0.8868408203125, -0.796630859375, -0.7064208984375, -0.6162109375, -0.5260009765625, -0.435791015625, -0.3455810546875, -0.25537109375, -0.1651611328125, -0.074951171875, 0.0152587890625, 0.10546875, 0.1956787109375, 0.285888671875, 0.3760986328125, 0.46630859375, 0.5565185546875, 0.646728515625, 0.7369384765625, 0.8271484375, 0.9173583984375, 1.007568359375, 1.0977783203125, 1.18798828125, 1.2781982421875, 1.368408203125, 1.4586181640625, 1.548828125, 1.6390380859375, 1.729248046875, 1.8194580078125, 1.90966796875, 1.9998779296875, 2.090087890625, 2.1802978515625, 2.2705078125, 2.3607177734375, 2.450927734375, 2.5411376953125, 2.63134765625, 2.7215576171875, 2.811767578125, 2.9019775390625, 2.9921875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 7.0, 7.0, 9.0, 13.0, 13.0, 21.0, 28.0, 32.0, 38.0, 40.0, 45.0, 50.0, 52.0, 60.0, 60.0, 50.0, 50.0, 62.0, 51.0, 50.0, 45.0, 40.0, 38.0, 27.0, 19.0, 21.0, 13.0, 13.0, 10.0, 8.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.66015625, -2.572052001953125, -2.48394775390625, -2.395843505859375, -2.3077392578125, -2.219635009765625, -2.13153076171875, -2.043426513671875, -1.955322265625, -1.867218017578125, -1.77911376953125, -1.691009521484375, -1.6029052734375, -1.514801025390625, -1.42669677734375, -1.338592529296875, -1.25048828125, -1.162384033203125, -1.07427978515625, -0.986175537109375, -0.8980712890625, -0.809967041015625, -0.72186279296875, -0.633758544921875, -0.545654296875, -0.457550048828125, -0.36944580078125, -0.281341552734375, -0.1932373046875, -0.105133056640625, -0.01702880859375, 0.071075439453125, 0.1591796875, 0.247283935546875, 0.33538818359375, 0.423492431640625, 0.5115966796875, 0.599700927734375, 0.68780517578125, 0.775909423828125, 0.864013671875, 0.952117919921875, 1.04022216796875, 1.128326416015625, 1.2164306640625, 1.304534912109375, 1.39263916015625, 1.480743408203125, 1.56884765625, 1.656951904296875, 1.74505615234375, 1.833160400390625, 1.9212646484375, 2.009368896484375, 2.09747314453125, 2.185577392578125, 2.273681640625, 2.361785888671875, 2.44989013671875, 2.537994384765625, 2.6260986328125, 2.714202880859375, 2.80230712890625, 2.890411376953125, 2.978515625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 4.0, 6.0, 11.0, 18.0, 28.0, 32.0, 43.0, 74.0, 121.0, 253.0, 481.0, 994.0, 2463.0, 6694.0, 20547.0, 81553.0, 408741.0, 411963.0, 82426.0, 20755.0, 6707.0, 2453.0, 1070.0, 465.0, 251.0, 136.0, 86.0, 57.0, 48.0, 19.0, 17.0, 10.0, 9.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.96875, -1.912506103515625, -1.85626220703125, -1.800018310546875, -1.7437744140625, -1.687530517578125, -1.63128662109375, -1.575042724609375, -1.518798828125, -1.462554931640625, -1.40631103515625, -1.350067138671875, -1.2938232421875, -1.237579345703125, -1.18133544921875, -1.125091552734375, -1.06884765625, -1.012603759765625, -0.95635986328125, -0.900115966796875, -0.8438720703125, -0.787628173828125, -0.73138427734375, -0.675140380859375, -0.618896484375, -0.562652587890625, -0.50640869140625, -0.450164794921875, -0.3939208984375, -0.337677001953125, -0.28143310546875, -0.225189208984375, -0.1689453125, -0.112701416015625, -0.05645751953125, -0.000213623046875, 0.0560302734375, 0.112274169921875, 0.16851806640625, 0.224761962890625, 0.281005859375, 0.337249755859375, 0.39349365234375, 0.449737548828125, 0.5059814453125, 0.562225341796875, 0.61846923828125, 0.674713134765625, 0.73095703125, 0.787200927734375, 0.84344482421875, 0.899688720703125, 0.9559326171875, 1.012176513671875, 1.06842041015625, 1.124664306640625, 1.180908203125, 1.237152099609375, 1.29339599609375, 1.349639892578125, 1.4058837890625, 1.462127685546875, 1.51837158203125, 1.574615478515625, 1.630859375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 6.0, 10.0, 9.0, 9.0, 17.0, 18.0, 19.0, 37.0, 33.0, 46.0, 65.0, 68.0, 100.0, 106.0, 90.0, 85.0, 59.0, 48.0, 39.0, 28.0, 21.0, 14.0, 19.0, 10.0, 9.0, 9.0, 3.0, 6.0, 6.0, 2.0, 1.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019550323486328125, -0.0001872330904006958, -0.00017896294593811035, -0.0001706928014755249, -0.00016242265701293945, -0.000154152512550354, -0.00014588236808776855, -0.0001376122236251831, -0.00012934207916259766, -0.00012107193470001221, -0.00011280179023742676, -0.00010453164577484131, -9.626150131225586e-05, -8.799135684967041e-05, -7.972121238708496e-05, -7.145106792449951e-05, -6.318092346191406e-05, -5.491077899932861e-05, -4.6640634536743164e-05, -3.8370490074157715e-05, -3.0100345611572266e-05, -2.1830201148986816e-05, -1.3560056686401367e-05, -5.289912223815918e-06, 2.9802322387695312e-06, 1.125037670135498e-05, 1.952052116394043e-05, 2.779066562652588e-05, 3.606081008911133e-05, 4.433095455169678e-05, 5.2601099014282227e-05, 6.0871243476867676e-05, 6.914138793945312e-05, 7.741153240203857e-05, 8.568167686462402e-05, 9.395182132720947e-05, 0.00010222196578979492, 0.00011049211025238037, 0.00011876225471496582, 0.00012703239917755127, 0.00013530254364013672, 0.00014357268810272217, 0.00015184283256530762, 0.00016011297702789307, 0.00016838312149047852, 0.00017665326595306396, 0.00018492341041564941, 0.00019319355487823486, 0.0002014636993408203, 0.00020973384380340576, 0.0002180039882659912, 0.00022627413272857666, 0.0002345442771911621, 0.00024281442165374756, 0.000251084566116333, 0.00025935471057891846, 0.0002676248550415039, 0.00027589499950408936, 0.0002841651439666748, 0.00029243528842926025, 0.0003007054328918457, 0.00030897557735443115, 0.0003172457218170166, 0.00032551586627960205, 0.0003337860107421875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 16.0, 7.0, 16.0, 20.0, 32.0, 36.0, 52.0, 83.0, 99.0, 113.0, 213.0, 317.0, 454.0, 756.0, 1238.0, 2213.0, 4159.0, 8386.0, 18359.0, 44699.0, 127580.0, 357887.0, 308432.0, 103850.0, 37726.0, 15546.0, 7179.0, 3735.0, 2059.0, 1159.0, 688.0, 469.0, 275.0, 182.0, 152.0, 108.0, 63.0, 48.0, 32.0, 27.0, 17.0, 17.0, 7.0, 9.0, 8.0, 7.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.3359375, -1.2940673828125, -1.252197265625, -1.2103271484375, -1.16845703125, -1.1265869140625, -1.084716796875, -1.0428466796875, -1.0009765625, -0.9591064453125, -0.917236328125, -0.8753662109375, -0.83349609375, -0.7916259765625, -0.749755859375, -0.7078857421875, -0.666015625, -0.6241455078125, -0.582275390625, -0.5404052734375, -0.49853515625, -0.4566650390625, -0.414794921875, -0.3729248046875, -0.3310546875, -0.2891845703125, -0.247314453125, -0.2054443359375, -0.16357421875, -0.1217041015625, -0.079833984375, -0.0379638671875, 0.00390625, 0.0457763671875, 0.087646484375, 0.1295166015625, 0.17138671875, 0.2132568359375, 0.255126953125, 0.2969970703125, 0.3388671875, 0.3807373046875, 0.422607421875, 0.4644775390625, 0.50634765625, 0.5482177734375, 0.590087890625, 0.6319580078125, 0.673828125, 0.7156982421875, 0.757568359375, 0.7994384765625, 0.84130859375, 0.8831787109375, 0.925048828125, 0.9669189453125, 1.0087890625, 1.0506591796875, 1.092529296875, 1.1343994140625, 1.17626953125, 1.2181396484375, 1.260009765625, 1.3018798828125, 1.34375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 6.0, 8.0, 9.0, 20.0, 14.0, 10.0, 32.0, 34.0, 28.0, 49.0, 47.0, 59.0, 63.0, 53.0, 74.0, 70.0, 67.0, 52.0, 56.0, 35.0, 39.0, 23.0, 22.0, 22.0, 18.0, 15.0, 17.0, 16.0, 14.0, 6.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.23828125, -1.2015380859375, -1.164794921875, -1.1280517578125, -1.09130859375, -1.0545654296875, -1.017822265625, -0.9810791015625, -0.9443359375, -0.9075927734375, -0.870849609375, -0.8341064453125, -0.79736328125, -0.7606201171875, -0.723876953125, -0.6871337890625, -0.650390625, -0.6136474609375, -0.576904296875, -0.5401611328125, -0.50341796875, -0.4666748046875, -0.429931640625, -0.3931884765625, -0.3564453125, -0.3197021484375, -0.282958984375, -0.2462158203125, -0.20947265625, -0.1727294921875, -0.135986328125, -0.0992431640625, -0.0625, -0.0257568359375, 0.010986328125, 0.0477294921875, 0.08447265625, 0.1212158203125, 0.157958984375, 0.1947021484375, 0.2314453125, 0.2681884765625, 0.304931640625, 0.3416748046875, 0.37841796875, 0.4151611328125, 0.451904296875, 0.4886474609375, 0.525390625, 0.5621337890625, 0.598876953125, 0.6356201171875, 0.67236328125, 0.7091064453125, 0.745849609375, 0.7825927734375, 0.8193359375, 0.8560791015625, 0.892822265625, 0.9295654296875, 0.96630859375, 1.0030517578125, 1.039794921875, 1.0765380859375, 1.11328125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 9.0, 15.0, 35.0, 93.0, 161.0, 251.0, 214.0, 103.0, 55.0, 27.0, 16.0, 10.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.63908386230469, -33.74003601074219, -32.84098434448242, -31.94193458557129, -31.042884826660156, -30.143835067749023, -29.24478530883789, -28.34573745727539, -27.446685791015625, -26.547636032104492, -25.64858627319336, -24.749536514282227, -23.850486755371094, -22.95143699645996, -22.052387237548828, -21.153339385986328, -20.254289627075195, -19.355239868164062, -18.45619010925293, -17.557140350341797, -16.658090591430664, -15.759040832519531, -14.859992027282715, -13.960942268371582, -13.06189250946045, -12.162842750549316, -11.263792991638184, -10.364744186401367, -9.465694427490234, -8.566644668579102, -7.667594909667969, -6.768545150756836, -5.869497299194336, -4.970447540283203, -4.07139778137207, -3.1723484992980957, -2.273298740386963, -1.37424898147583, -0.47519969940185547, 0.42385005950927734, 1.3228998184204102, 2.221949577331543, 3.1209990978240967, 4.02004861831665, 4.919098377227783, 5.818148136138916, 6.717197418212891, 7.616247177124023, 8.515296936035156, 9.414346694946289, 10.313396453857422, 11.212446212768555, 12.111495971679688, 13.01054573059082, 13.909594535827637, 14.80864429473877, 15.707694053649902, 16.60674285888672, 17.50579261779785, 18.404842376708984, 19.303892135620117, 20.20294189453125, 21.101991653442383, 22.001041412353516, 22.90009117126465]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 8.0, 16.0, 12.0, 15.0, 15.0, 15.0, 17.0, 18.0, 21.0, 17.0, 30.0, 28.0, 42.0, 42.0, 22.0, 36.0, 44.0, 35.0, 46.0, 48.0, 39.0, 56.0, 29.0, 32.0, 40.0, 32.0, 31.0, 28.0, 27.0, 19.0, 24.0, 15.0, 23.0, 16.0, 11.0, 11.0, 7.0, 8.0, 2.0, 6.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.455320358276367, -11.079195022583008, -10.703069686889648, -10.326943397521973, -9.950818061828613, -9.574692726135254, -9.198567390441895, -8.822441101074219, -8.44631576538086, -8.0701904296875, -7.694064617156982, -7.317939281463623, -6.9418134689331055, -6.565688133239746, -6.189562797546387, -5.813436985015869, -5.43731164932251, -5.06118631362915, -4.685060501098633, -4.308935165405273, -3.932809352874756, -3.5566840171813965, -3.180558443069458, -2.8044328689575195, -2.428307294845581, -2.0521817207336426, -1.676056146621704, -1.2999306917190552, -0.9238051176071167, -0.5476795434951782, -0.1715540885925293, 0.20457148551940918, 0.5806970596313477, 0.9568226337432861, 1.3329482078552246, 1.7090736627578735, 2.0851993560791016, 2.461324691772461, 2.8374502658843994, 3.213575839996338, 3.5897014141082764, 3.965826988220215, 4.341952323913574, 4.718078136444092, 5.094203472137451, 5.470329284667969, 5.846454620361328, 6.2225799560546875, 6.598705768585205, 6.9748311042785645, 7.350956916809082, 7.727082252502441, 8.1032075881958, 8.479333877563477, 8.855459213256836, 9.231584548950195, 9.607709884643555, 9.983835220336914, 10.359960556030273, 10.73608684539795, 11.112212181091309, 11.488337516784668, 11.864462852478027, 12.240589141845703, 12.616714477539062]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 13.0, 6.0, 14.0, 16.0, 17.0, 30.0, 28.0, 52.0, 47.0, 94.0, 181.0, 317.0, 612.0, 1604.0, 5502.0, 31841.0, 3745154.0, 384572.0, 17969.0, 3863.0, 1272.0, 500.0, 229.0, 113.0, 76.0, 43.0, 34.0, 21.0, 10.0, 14.0, 8.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.79296875, -6.586181640625, -6.37939453125, -6.172607421875, -5.9658203125, -5.759033203125, -5.55224609375, -5.345458984375, -5.138671875, -4.931884765625, -4.72509765625, -4.518310546875, -4.3115234375, -4.104736328125, -3.89794921875, -3.691162109375, -3.484375, -3.277587890625, -3.07080078125, -2.864013671875, -2.6572265625, -2.450439453125, -2.24365234375, -2.036865234375, -1.830078125, -1.623291015625, -1.41650390625, -1.209716796875, -1.0029296875, -0.796142578125, -0.58935546875, -0.382568359375, -0.17578125, 0.031005859375, 0.23779296875, 0.444580078125, 0.6513671875, 0.858154296875, 1.06494140625, 1.271728515625, 1.478515625, 1.685302734375, 1.89208984375, 2.098876953125, 2.3056640625, 2.512451171875, 2.71923828125, 2.926025390625, 3.1328125, 3.339599609375, 3.54638671875, 3.753173828125, 3.9599609375, 4.166748046875, 4.37353515625, 4.580322265625, 4.787109375, 4.993896484375, 5.20068359375, 5.407470703125, 5.6142578125, 5.821044921875, 6.02783203125, 6.234619140625, 6.44140625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 9.0, 7.0, 22.0, 13.0, 43.0, 31.0, 47.0, 67.0, 83.0, 73.0, 104.0, 86.0, 76.0, 75.0, 69.0, 48.0, 48.0, 24.0, 23.0, 24.0, 12.0, 5.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.21484375, -1.1837844848632812, -1.1527252197265625, -1.1216659545898438, -1.090606689453125, -1.0595474243164062, -1.0284881591796875, -0.9974288940429688, -0.96636962890625, -0.9353103637695312, -0.9042510986328125, -0.8731918334960938, -0.842132568359375, -0.8110733032226562, -0.7800140380859375, -0.7489547729492188, -0.7178955078125, -0.6868362426757812, -0.6557769775390625, -0.6247177124023438, -0.593658447265625, -0.5625991821289062, -0.5315399169921875, -0.5004806518554688, -0.46942138671875, -0.43836212158203125, -0.4073028564453125, -0.37624359130859375, -0.345184326171875, -0.31412506103515625, -0.2830657958984375, -0.25200653076171875, -0.220947265625, -0.18988800048828125, -0.1588287353515625, -0.12776947021484375, -0.096710205078125, -0.06565093994140625, -0.0345916748046875, -0.00353240966796875, 0.02752685546875, 0.05858612060546875, 0.0896453857421875, 0.12070465087890625, 0.151763916015625, 0.18282318115234375, 0.2138824462890625, 0.24494171142578125, 0.2760009765625, 0.30706024169921875, 0.3381195068359375, 0.36917877197265625, 0.400238037109375, 0.43129730224609375, 0.4623565673828125, 0.49341583251953125, 0.52447509765625, 0.5555343627929688, 0.5865936279296875, 0.6176528930664062, 0.648712158203125, 0.6797714233398438, 0.7108306884765625, 0.7418899536132812, 0.77294921875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 7.0, 5.0, 25.0, 18.0, 34.0, 79.0, 114.0, 160.0, 249.0, 394.0, 713.0, 1379.0, 3243.0, 11272.0, 68594.0, 3639672.0, 428526.0, 28558.0, 6317.0, 2246.0, 1053.0, 566.0, 362.0, 222.0, 174.0, 112.0, 54.0, 39.0, 32.0, 23.0, 8.0, 9.0, 8.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5859375, -4.446044921875, -4.30615234375, -4.166259765625, -4.0263671875, -3.886474609375, -3.74658203125, -3.606689453125, -3.466796875, -3.326904296875, -3.18701171875, -3.047119140625, -2.9072265625, -2.767333984375, -2.62744140625, -2.487548828125, -2.34765625, -2.207763671875, -2.06787109375, -1.927978515625, -1.7880859375, -1.648193359375, -1.50830078125, -1.368408203125, -1.228515625, -1.088623046875, -0.94873046875, -0.808837890625, -0.6689453125, -0.529052734375, -0.38916015625, -0.249267578125, -0.109375, 0.030517578125, 0.17041015625, 0.310302734375, 0.4501953125, 0.590087890625, 0.72998046875, 0.869873046875, 1.009765625, 1.149658203125, 1.28955078125, 1.429443359375, 1.5693359375, 1.709228515625, 1.84912109375, 1.989013671875, 2.12890625, 2.268798828125, 2.40869140625, 2.548583984375, 2.6884765625, 2.828369140625, 2.96826171875, 3.108154296875, 3.248046875, 3.387939453125, 3.52783203125, 3.667724609375, 3.8076171875, 3.947509765625, 4.08740234375, 4.227294921875, 4.3671875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 7.0, 5.0, 6.0, 11.0, 18.0, 25.0, 58.0, 110.0, 347.0, 1729.0, 1267.0, 257.0, 116.0, 46.0, 28.0, 22.0, 9.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.25, -1.208221435546875, -1.16644287109375, -1.124664306640625, -1.0828857421875, -1.041107177734375, -0.99932861328125, -0.957550048828125, -0.915771484375, -0.873992919921875, -0.83221435546875, -0.790435791015625, -0.7486572265625, -0.706878662109375, -0.66510009765625, -0.623321533203125, -0.58154296875, -0.539764404296875, -0.49798583984375, -0.456207275390625, -0.4144287109375, -0.372650146484375, -0.33087158203125, -0.289093017578125, -0.247314453125, -0.205535888671875, -0.16375732421875, -0.121978759765625, -0.0802001953125, -0.038421630859375, 0.00335693359375, 0.045135498046875, 0.0869140625, 0.128692626953125, 0.17047119140625, 0.212249755859375, 0.2540283203125, 0.295806884765625, 0.33758544921875, 0.379364013671875, 0.421142578125, 0.462921142578125, 0.50469970703125, 0.546478271484375, 0.5882568359375, 0.630035400390625, 0.67181396484375, 0.713592529296875, 0.75537109375, 0.797149658203125, 0.83892822265625, 0.880706787109375, 0.9224853515625, 0.964263916015625, 1.00604248046875, 1.047821044921875, 1.089599609375, 1.131378173828125, 1.17315673828125, 1.214935302734375, 1.2567138671875, 1.298492431640625, 1.34027099609375, 1.382049560546875, 1.423828125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 9.0, 29.0, 317.0, 570.0, 74.0, 12.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.426021575927734, -25.60384750366211, -24.781675338745117, -23.959501266479492, -23.137327194213867, -22.315155029296875, -21.49298095703125, -20.670806884765625, -19.848634719848633, -19.026460647583008, -18.204288482666016, -17.38211441040039, -16.559940338134766, -15.737768173217773, -14.915594100952148, -14.09342098236084, -13.271246910095215, -12.449073791503906, -11.626899719238281, -10.804726600646973, -9.982553482055664, -9.160379409790039, -8.33820629119873, -7.516033172607422, -6.693859577178955, -5.871685981750488, -5.04951286315918, -4.227339267730713, -3.405165910720825, -2.5829925537109375, -1.7608189582824707, -0.9386458396911621, -0.11647224426269531, 0.7057011723518372, 1.5278745889663696, 2.350048065185547, 3.1722214221954346, 3.9943947792053223, 4.816568374633789, 5.638741493225098, 6.4609150886535645, 7.283088684082031, 8.10526180267334, 8.927434921264648, 9.749608993530273, 10.571782112121582, 11.39395523071289, 12.216129302978516, 13.038302421569824, 13.860475540161133, 14.682649612426758, 15.504822731018066, 16.326995849609375, 17.149169921875, 17.971343994140625, 18.793516159057617, 19.615690231323242, 20.437864303588867, 21.26003646850586, 22.082210540771484, 22.90438461303711, 23.7265567779541, 24.548730850219727, 25.37090301513672, 26.193077087402344]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 2.0, 8.0, 5.0, 11.0, 15.0, 14.0, 19.0, 26.0, 17.0, 31.0, 30.0, 40.0, 36.0, 41.0, 49.0, 43.0, 64.0, 64.0, 52.0, 47.0, 55.0, 54.0, 46.0, 36.0, 29.0, 38.0, 20.0, 24.0, 23.0, 18.0, 12.0, 5.0, 8.0, 3.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.61120343208313, -2.509795665740967, -2.4083878993988037, -2.3069801330566406, -2.2055721282958984, -2.1041643619537354, -2.0027565956115723, -1.9013488292694092, -1.7999409437179565, -1.6985331773757935, -1.5971252918243408, -1.4957175254821777, -1.3943097591400146, -1.292901873588562, -1.191494107246399, -1.0900862216949463, -0.9886784553527832, -0.8872706294059753, -0.7858628034591675, -0.6844550371170044, -0.5830472111701965, -0.48163938522338867, -0.3802316188812256, -0.2788237929344177, -0.17741596698760986, -0.0760081559419632, 0.02539965510368347, 0.12680745124816895, 0.2282152771949768, 0.32962310314178467, 0.43103086948394775, 0.5324386954307556, 0.6338467597961426, 0.7352545857429504, 0.8366624116897583, 0.9380701780319214, 1.039478063583374, 1.140885829925537, 1.2422935962677002, 1.3437013626098633, 1.445109248161316, 1.546517014503479, 1.6479249000549316, 1.7493326663970947, 1.8507404327392578, 1.9521483182907104, 2.053555965423584, 2.154963970184326, 2.2563717365264893, 2.3577795028686523, 2.4591872692108154, 2.5605950355529785, 2.6620030403137207, 2.763410806655884, 2.864818572998047, 2.96622633934021, 3.067634105682373, 3.169041872024536, 3.270449638366699, 3.3718576431274414, 3.4732654094696045, 3.5746731758117676, 3.6760809421539307, 3.7774887084960938, 3.878896713256836]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 5.0, 9.0, 12.0, 18.0, 27.0, 31.0, 70.0, 94.0, 171.0, 320.0, 730.0, 2331.0, 14955.0, 235345.0, 729603.0, 56983.0, 5447.0, 1350.0, 490.0, 241.0, 138.0, 71.0, 41.0, 28.0, 23.0, 10.0, 8.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.79296875, -7.57806396484375, -7.3631591796875, -7.14825439453125, -6.933349609375, -6.71844482421875, -6.5035400390625, -6.28863525390625, -6.07373046875, -5.85882568359375, -5.6439208984375, -5.42901611328125, -5.214111328125, -4.99920654296875, -4.7843017578125, -4.56939697265625, -4.3544921875, -4.13958740234375, -3.9246826171875, -3.70977783203125, -3.494873046875, -3.27996826171875, -3.0650634765625, -2.85015869140625, -2.63525390625, -2.42034912109375, -2.2054443359375, -1.99053955078125, -1.775634765625, -1.56072998046875, -1.3458251953125, -1.13092041015625, -0.916015625, -0.70111083984375, -0.4862060546875, -0.27130126953125, -0.056396484375, 0.15850830078125, 0.3734130859375, 0.58831787109375, 0.80322265625, 1.01812744140625, 1.2330322265625, 1.44793701171875, 1.662841796875, 1.87774658203125, 2.0926513671875, 2.30755615234375, 2.5224609375, 2.73736572265625, 2.9522705078125, 3.16717529296875, 3.382080078125, 3.59698486328125, 3.8118896484375, 4.02679443359375, 4.24169921875, 4.45660400390625, 4.6715087890625, 4.88641357421875, 5.101318359375, 5.31622314453125, 5.5311279296875, 5.74603271484375, 5.9609375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 14.0, 14.0, 30.0, 27.0, 51.0, 68.0, 74.0, 98.0, 108.0, 90.0, 87.0, 77.0, 71.0, 56.0, 44.0, 29.0, 23.0, 16.0, 11.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3154296875, -1.2801895141601562, -1.2449493408203125, -1.2097091674804688, -1.174468994140625, -1.1392288208007812, -1.1039886474609375, -1.0687484741210938, -1.03350830078125, -0.9982681274414062, -0.9630279541015625, -0.9277877807617188, -0.892547607421875, -0.8573074340820312, -0.8220672607421875, -0.7868270874023438, -0.7515869140625, -0.7163467407226562, -0.6811065673828125, -0.6458663940429688, -0.610626220703125, -0.5753860473632812, -0.5401458740234375, -0.5049057006835938, -0.46966552734375, -0.43442535400390625, -0.3991851806640625, -0.36394500732421875, -0.328704833984375, -0.29346466064453125, -0.2582244873046875, -0.22298431396484375, -0.187744140625, -0.15250396728515625, -0.1172637939453125, -0.08202362060546875, -0.046783447265625, -0.01154327392578125, 0.0236968994140625, 0.05893707275390625, 0.09417724609375, 0.12941741943359375, 0.1646575927734375, 0.19989776611328125, 0.235137939453125, 0.27037811279296875, 0.3056182861328125, 0.34085845947265625, 0.3760986328125, 0.41133880615234375, 0.4465789794921875, 0.48181915283203125, 0.517059326171875, 0.5522994995117188, 0.5875396728515625, 0.6227798461914062, 0.65802001953125, 0.6932601928710938, 0.7285003662109375, 0.7637405395507812, 0.798980712890625, 0.8342208862304688, 0.8694610595703125, 0.9047012329101562, 0.93994140625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 9.0, 5.0, 4.0, 2.0, 11.0, 11.0, 20.0, 18.0, 33.0, 37.0, 60.0, 82.0, 128.0, 223.0, 307.0, 542.0, 914.0, 1705.0, 3750.0, 10359.0, 37008.0, 181721.0, 555988.0, 197078.0, 39695.0, 10727.0, 3886.0, 1749.0, 914.0, 539.0, 320.0, 203.0, 172.0, 85.0, 62.0, 46.0, 39.0, 21.0, 22.0, 14.0, 8.0, 8.0, 11.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.40234375, -3.2977294921875, -3.193115234375, -3.0885009765625, -2.98388671875, -2.8792724609375, -2.774658203125, -2.6700439453125, -2.5654296875, -2.4608154296875, -2.356201171875, -2.2515869140625, -2.14697265625, -2.0423583984375, -1.937744140625, -1.8331298828125, -1.728515625, -1.6239013671875, -1.519287109375, -1.4146728515625, -1.31005859375, -1.2054443359375, -1.100830078125, -0.9962158203125, -0.8916015625, -0.7869873046875, -0.682373046875, -0.5777587890625, -0.47314453125, -0.3685302734375, -0.263916015625, -0.1593017578125, -0.0546875, 0.0499267578125, 0.154541015625, 0.2591552734375, 0.36376953125, 0.4683837890625, 0.572998046875, 0.6776123046875, 0.7822265625, 0.8868408203125, 0.991455078125, 1.0960693359375, 1.20068359375, 1.3052978515625, 1.409912109375, 1.5145263671875, 1.619140625, 1.7237548828125, 1.828369140625, 1.9329833984375, 2.03759765625, 2.1422119140625, 2.246826171875, 2.3514404296875, 2.4560546875, 2.5606689453125, 2.665283203125, 2.7698974609375, 2.87451171875, 2.9791259765625, 3.083740234375, 3.1883544921875, 3.29296875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 5.0, 8.0, 7.0, 12.0, 9.0, 19.0, 28.0, 38.0, 26.0, 49.0, 49.0, 50.0, 79.0, 74.0, 73.0, 68.0, 60.0, 56.0, 71.0, 51.0, 45.0, 21.0, 31.0, 18.0, 9.0, 16.0, 10.0, 4.0, 8.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3515625, -4.2293701171875, -4.107177734375, -3.9849853515625, -3.86279296875, -3.7406005859375, -3.618408203125, -3.4962158203125, -3.3740234375, -3.2518310546875, -3.129638671875, -3.0074462890625, -2.88525390625, -2.7630615234375, -2.640869140625, -2.5186767578125, -2.396484375, -2.2742919921875, -2.152099609375, -2.0299072265625, -1.90771484375, -1.7855224609375, -1.663330078125, -1.5411376953125, -1.4189453125, -1.2967529296875, -1.174560546875, -1.0523681640625, -0.93017578125, -0.8079833984375, -0.685791015625, -0.5635986328125, -0.44140625, -0.3192138671875, -0.197021484375, -0.0748291015625, 0.04736328125, 0.1695556640625, 0.291748046875, 0.4139404296875, 0.5361328125, 0.6583251953125, 0.780517578125, 0.9027099609375, 1.02490234375, 1.1470947265625, 1.269287109375, 1.3914794921875, 1.513671875, 1.6358642578125, 1.758056640625, 1.8802490234375, 2.00244140625, 2.1246337890625, 2.246826171875, 2.3690185546875, 2.4912109375, 2.6134033203125, 2.735595703125, 2.8577880859375, 2.97998046875, 3.1021728515625, 3.224365234375, 3.3465576171875, 3.46875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 6.0, 10.0, 10.0, 16.0, 21.0, 23.0, 49.0, 68.0, 124.0, 207.0, 328.0, 575.0, 984.0, 2031.0, 4397.0, 12800.0, 52207.0, 300094.0, 525911.0, 113093.0, 22806.0, 6862.0, 2739.0, 1380.0, 731.0, 379.0, 257.0, 152.0, 107.0, 53.0, 43.0, 29.0, 17.0, 11.0, 8.0, 10.0, 9.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.65234375, -1.59942626953125, -1.5465087890625, -1.49359130859375, -1.440673828125, -1.38775634765625, -1.3348388671875, -1.28192138671875, -1.22900390625, -1.17608642578125, -1.1231689453125, -1.07025146484375, -1.017333984375, -0.96441650390625, -0.9114990234375, -0.85858154296875, -0.8056640625, -0.75274658203125, -0.6998291015625, -0.64691162109375, -0.593994140625, -0.54107666015625, -0.4881591796875, -0.43524169921875, -0.38232421875, -0.32940673828125, -0.2764892578125, -0.22357177734375, -0.170654296875, -0.11773681640625, -0.0648193359375, -0.01190185546875, 0.041015625, 0.09393310546875, 0.1468505859375, 0.19976806640625, 0.252685546875, 0.30560302734375, 0.3585205078125, 0.41143798828125, 0.46435546875, 0.51727294921875, 0.5701904296875, 0.62310791015625, 0.676025390625, 0.72894287109375, 0.7818603515625, 0.83477783203125, 0.8876953125, 0.94061279296875, 0.9935302734375, 1.04644775390625, 1.099365234375, 1.15228271484375, 1.2052001953125, 1.25811767578125, 1.31103515625, 1.36395263671875, 1.4168701171875, 1.46978759765625, 1.522705078125, 1.57562255859375, 1.6285400390625, 1.68145751953125, 1.734375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 4.0, 8.0, 13.0, 17.0, 24.0, 27.0, 25.0, 54.0, 47.0, 54.0, 101.0, 126.0, 113.0, 85.0, 76.0, 51.0, 41.0, 25.0, 28.0, 18.0, 15.0, 9.0, 7.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00035834312438964844, -0.00034912116825580597, -0.0003398992121219635, -0.00033067725598812103, -0.00032145529985427856, -0.0003122333437204361, -0.00030301138758659363, -0.00029378943145275116, -0.0002845674753189087, -0.0002753455191850662, -0.00026612356305122375, -0.0002569016069173813, -0.0002476796507835388, -0.00023845769464969635, -0.00022923573851585388, -0.00022001378238201141, -0.00021079182624816895, -0.00020156987011432648, -0.000192347913980484, -0.00018312595784664154, -0.00017390400171279907, -0.0001646820455789566, -0.00015546008944511414, -0.00014623813331127167, -0.0001370161771774292, -0.00012779422104358673, -0.00011857226490974426, -0.0001093503087759018, -0.00010012835264205933, -9.090639650821686e-05, -8.168444037437439e-05, -7.246248424053192e-05, -6.324052810668945e-05, -5.4018571972846985e-05, -4.4796615839004517e-05, -3.557465970516205e-05, -2.635270357131958e-05, -1.7130747437477112e-05, -7.908791303634644e-06, 1.3131648302078247e-06, 1.0535120964050293e-05, 1.975707709789276e-05, 2.897903323173523e-05, 3.82009893655777e-05, 4.7422945499420166e-05, 5.6644901633262634e-05, 6.58668577671051e-05, 7.508881390094757e-05, 8.431077003479004e-05, 9.353272616863251e-05, 0.00010275468230247498, 0.00011197663843631744, 0.00012119859457015991, 0.00013042055070400238, 0.00013964250683784485, 0.00014886446297168732, 0.00015808641910552979, 0.00016730837523937225, 0.00017653033137321472, 0.0001857522875070572, 0.00019497424364089966, 0.00020419619977474213, 0.0002134181559085846, 0.00022264011204242706, 0.00023186206817626953]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 6.0, 6.0, 16.0, 11.0, 12.0, 27.0, 45.0, 60.0, 89.0, 147.0, 273.0, 479.0, 1023.0, 2420.0, 6572.0, 25226.0, 163770.0, 647740.0, 164135.0, 25397.0, 6486.0, 2383.0, 1020.0, 504.0, 276.0, 143.0, 85.0, 64.0, 28.0, 20.0, 27.0, 10.0, 14.0, 8.0, 6.0, 6.0, 8.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.025390625, -1.958984375, -1.892578125, -1.826171875, -1.759765625, -1.693359375, -1.626953125, -1.560546875, -1.494140625, -1.427734375, -1.361328125, -1.294921875, -1.228515625, -1.162109375, -1.095703125, -1.029296875, -0.962890625, -0.896484375, -0.830078125, -0.763671875, -0.697265625, -0.630859375, -0.564453125, -0.498046875, -0.431640625, -0.365234375, -0.298828125, -0.232421875, -0.166015625, -0.099609375, -0.033203125, 0.033203125, 0.099609375, 0.166015625, 0.232421875, 0.298828125, 0.365234375, 0.431640625, 0.498046875, 0.564453125, 0.630859375, 0.697265625, 0.763671875, 0.830078125, 0.896484375, 0.962890625, 1.029296875, 1.095703125, 1.162109375, 1.228515625, 1.294921875, 1.361328125, 1.427734375, 1.494140625, 1.560546875, 1.626953125, 1.693359375, 1.759765625, 1.826171875, 1.892578125, 1.958984375, 2.025390625, 2.091796875, 2.158203125, 2.224609375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 4.0, 7.0, 14.0, 20.0, 20.0, 44.0, 56.0, 63.0, 63.0, 85.0, 102.0, 101.0, 75.0, 77.0, 59.0, 47.0, 44.0, 26.0, 26.0, 17.0, 6.0, 10.0, 2.0, 5.0, 8.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.048828125, -1.001556396484375, -0.95428466796875, -0.907012939453125, -0.8597412109375, -0.812469482421875, -0.76519775390625, -0.717926025390625, -0.670654296875, -0.623382568359375, -0.57611083984375, -0.528839111328125, -0.4815673828125, -0.434295654296875, -0.38702392578125, -0.339752197265625, -0.29248046875, -0.245208740234375, -0.19793701171875, -0.150665283203125, -0.1033935546875, -0.056121826171875, -0.00885009765625, 0.038421630859375, 0.085693359375, 0.132965087890625, 0.18023681640625, 0.227508544921875, 0.2747802734375, 0.322052001953125, 0.36932373046875, 0.416595458984375, 0.4638671875, 0.511138916015625, 0.55841064453125, 0.605682373046875, 0.6529541015625, 0.700225830078125, 0.74749755859375, 0.794769287109375, 0.842041015625, 0.889312744140625, 0.93658447265625, 0.983856201171875, 1.0311279296875, 1.078399658203125, 1.12567138671875, 1.172943115234375, 1.22021484375, 1.267486572265625, 1.31475830078125, 1.362030029296875, 1.4093017578125, 1.456573486328125, 1.50384521484375, 1.551116943359375, 1.598388671875, 1.645660400390625, 1.69293212890625, 1.740203857421875, 1.7874755859375, 1.834747314453125, 1.88201904296875, 1.929290771484375, 1.9765625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 12.0, 13.0, 20.0, 35.0, 68.0, 88.0, 176.0, 189.0, 140.0, 93.0, 71.0, 39.0, 24.0, 13.0, 9.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.253944396972656, -15.522032737731934, -14.790121078491211, -14.058209419250488, -13.326297760009766, -12.594386100769043, -11.86247444152832, -11.130562782287598, -10.398651123046875, -9.666739463806152, -8.93482780456543, -8.202916145324707, -7.471004486083984, -6.739092826843262, -6.007181167602539, -5.275269508361816, -4.543357849121094, -3.811446189880371, -3.0795345306396484, -2.347622871398926, -1.6157112121582031, -0.8837995529174805, -0.1518878936767578, 0.5800237655639648, 1.3119354248046875, 2.04384708404541, 2.775758743286133, 3.5076704025268555, 4.239582061767578, 4.971493721008301, 5.703405380249023, 6.435317039489746, 7.167228698730469, 7.899140357971191, 8.631052017211914, 9.362963676452637, 10.09487533569336, 10.826786994934082, 11.558698654174805, 12.290610313415527, 13.02252197265625, 13.754433631896973, 14.486345291137695, 15.218256950378418, 15.95016860961914, 16.682079315185547, 17.413991928100586, 18.145904541015625, 18.87781524658203, 19.609725952148438, 20.341638565063477, 21.073551177978516, 21.805461883544922, 22.537372589111328, 23.269285202026367, 24.001197814941406, 24.733108520507812, 25.46501922607422, 26.196931838989258, 26.928844451904297, 27.660755157470703, 28.39266586303711, 29.12457847595215, 29.856491088867188, 30.588401794433594]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 9.0, 1.0, 9.0, 12.0, 19.0, 24.0, 19.0, 19.0, 21.0, 22.0, 27.0, 27.0, 45.0, 35.0, 38.0, 53.0, 45.0, 46.0, 51.0, 52.0, 43.0, 56.0, 53.0, 40.0, 38.0, 41.0, 26.0, 16.0, 17.0, 18.0, 16.0, 10.0, 15.0, 7.0, 3.0, 6.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.216127395629883, -14.708358764648438, -14.200590133666992, -13.692821502685547, -13.185052871704102, -12.677284240722656, -12.169516563415527, -11.661747932434082, -11.153979301452637, -10.646210670471191, -10.138442039489746, -9.6306734085083, -9.122905731201172, -8.615137100219727, -8.107368469238281, -7.599599838256836, -7.091831207275391, -6.584062576293945, -6.0762939453125, -5.568525791168213, -5.060757160186768, -4.552988529205322, -4.045220375061035, -3.53745174407959, -3.0296831130981445, -2.521914482116699, -2.014146089553833, -1.5063775777816772, -0.9986090660095215, -0.49084043502807617, 0.01692795753479004, 0.5246963500976562, 1.0324668884277344, 1.5402354001998901, 2.048003911972046, 2.555772304534912, 3.0635409355163574, 3.5713095664978027, 4.07907772064209, 4.586846351623535, 5.0946149826049805, 5.602383613586426, 6.110152244567871, 6.617920398712158, 7.1256890296936035, 7.633457660675049, 8.141225814819336, 8.648994445800781, 9.156763076782227, 9.664531707763672, 10.172300338745117, 10.680068969726562, 11.187837600708008, 11.695606231689453, 12.203373908996582, 12.711142539978027, 13.218911170959473, 13.726679801940918, 14.234448432922363, 14.742217063903809, 15.249984741210938, 15.757753372192383, 16.265522003173828, 16.773290634155273, 17.28105926513672]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 3.0, 8.0, 7.0, 19.0, 18.0, 24.0, 45.0, 61.0, 69.0, 82.0, 129.0, 190.0, 256.0, 447.0, 769.0, 1405.0, 3272.0, 9085.0, 34299.0, 278224.0, 3715121.0, 115824.0, 22307.0, 6870.0, 2753.0, 1205.0, 674.0, 395.0, 230.0, 155.0, 90.0, 61.0, 45.0, 27.0, 26.0, 15.0, 10.0, 10.0, 5.0, 11.0, 4.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-5.69921875, -5.5423583984375, -5.385498046875, -5.2286376953125, -5.07177734375, -4.9149169921875, -4.758056640625, -4.6011962890625, -4.4443359375, -4.2874755859375, -4.130615234375, -3.9737548828125, -3.81689453125, -3.6600341796875, -3.503173828125, -3.3463134765625, -3.189453125, -3.0325927734375, -2.875732421875, -2.7188720703125, -2.56201171875, -2.4051513671875, -2.248291015625, -2.0914306640625, -1.9345703125, -1.7777099609375, -1.620849609375, -1.4639892578125, -1.30712890625, -1.1502685546875, -0.993408203125, -0.8365478515625, -0.6796875, -0.5228271484375, -0.365966796875, -0.2091064453125, -0.05224609375, 0.1046142578125, 0.261474609375, 0.4183349609375, 0.5751953125, 0.7320556640625, 0.888916015625, 1.0457763671875, 1.20263671875, 1.3594970703125, 1.516357421875, 1.6732177734375, 1.830078125, 1.9869384765625, 2.143798828125, 2.3006591796875, 2.45751953125, 2.6143798828125, 2.771240234375, 2.9281005859375, 3.0849609375, 3.2418212890625, 3.398681640625, 3.5555419921875, 3.71240234375, 3.8692626953125, 4.026123046875, 4.1829833984375, 4.33984375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 6.0, 6.0, 9.0, 13.0, 41.0, 39.0, 40.0, 57.0, 72.0, 72.0, 90.0, 92.0, 89.0, 79.0, 55.0, 67.0, 38.0, 34.0, 28.0, 21.0, 20.0, 17.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2822265625, -1.2481002807617188, -1.2139739990234375, -1.1798477172851562, -1.145721435546875, -1.1115951538085938, -1.0774688720703125, -1.0433425903320312, -1.00921630859375, -0.9750900268554688, -0.9409637451171875, -0.9068374633789062, -0.872711181640625, -0.8385848999023438, -0.8044586181640625, -0.7703323364257812, -0.7362060546875, -0.7020797729492188, -0.6679534912109375, -0.6338272094726562, -0.599700927734375, -0.5655746459960938, -0.5314483642578125, -0.49732208251953125, -0.46319580078125, -0.42906951904296875, -0.3949432373046875, -0.36081695556640625, -0.326690673828125, -0.29256439208984375, -0.2584381103515625, -0.22431182861328125, -0.190185546875, -0.15605926513671875, -0.1219329833984375, -0.08780670166015625, -0.053680419921875, -0.01955413818359375, 0.0145721435546875, 0.04869842529296875, 0.08282470703125, 0.11695098876953125, 0.1510772705078125, 0.18520355224609375, 0.219329833984375, 0.25345611572265625, 0.2875823974609375, 0.32170867919921875, 0.3558349609375, 0.38996124267578125, 0.4240875244140625, 0.45821380615234375, 0.492340087890625, 0.5264663696289062, 0.5605926513671875, 0.5947189331054688, 0.62884521484375, 0.6629714965820312, 0.6970977783203125, 0.7312240600585938, 0.765350341796875, 0.7994766235351562, 0.8336029052734375, 0.8677291870117188, 0.90185546875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 13.0, 19.0, 29.0, 35.0, 66.0, 107.0, 188.0, 281.0, 547.0, 1710.0, 9220.0, 1525625.0, 2643726.0, 9511.0, 1754.0, 609.0, 285.0, 195.0, 144.0, 78.0, 55.0, 31.0, 27.0, 10.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-17.984375, -17.45556640625, -16.9267578125, -16.39794921875, -15.869140625, -15.34033203125, -14.8115234375, -14.28271484375, -13.75390625, -13.22509765625, -12.6962890625, -12.16748046875, -11.638671875, -11.10986328125, -10.5810546875, -10.05224609375, -9.5234375, -8.99462890625, -8.4658203125, -7.93701171875, -7.408203125, -6.87939453125, -6.3505859375, -5.82177734375, -5.29296875, -4.76416015625, -4.2353515625, -3.70654296875, -3.177734375, -2.64892578125, -2.1201171875, -1.59130859375, -1.0625, -0.53369140625, -0.0048828125, 0.52392578125, 1.052734375, 1.58154296875, 2.1103515625, 2.63916015625, 3.16796875, 3.69677734375, 4.2255859375, 4.75439453125, 5.283203125, 5.81201171875, 6.3408203125, 6.86962890625, 7.3984375, 7.92724609375, 8.4560546875, 8.98486328125, 9.513671875, 10.04248046875, 10.5712890625, 11.10009765625, 11.62890625, 12.15771484375, 12.6865234375, 13.21533203125, 13.744140625, 14.27294921875, 14.8017578125, 15.33056640625, 15.859375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 11.0, 14.0, 24.0, 68.0, 238.0, 2771.0, 717.0, 137.0, 41.0, 11.0, 16.0, 4.0, 2.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.390625, -5.23974609375, -5.0888671875, -4.93798828125, -4.787109375, -4.63623046875, -4.4853515625, -4.33447265625, -4.18359375, -4.03271484375, -3.8818359375, -3.73095703125, -3.580078125, -3.42919921875, -3.2783203125, -3.12744140625, -2.9765625, -2.82568359375, -2.6748046875, -2.52392578125, -2.373046875, -2.22216796875, -2.0712890625, -1.92041015625, -1.76953125, -1.61865234375, -1.4677734375, -1.31689453125, -1.166015625, -1.01513671875, -0.8642578125, -0.71337890625, -0.5625, -0.41162109375, -0.2607421875, -0.10986328125, 0.041015625, 0.19189453125, 0.3427734375, 0.49365234375, 0.64453125, 0.79541015625, 0.9462890625, 1.09716796875, 1.248046875, 1.39892578125, 1.5498046875, 1.70068359375, 1.8515625, 2.00244140625, 2.1533203125, 2.30419921875, 2.455078125, 2.60595703125, 2.7568359375, 2.90771484375, 3.05859375, 3.20947265625, 3.3603515625, 3.51123046875, 3.662109375, 3.81298828125, 3.9638671875, 4.11474609375, 4.265625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 17.0, 261.0, 670.0, 47.0, 5.0, 5.0, 7.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.80937194824219, -51.00291442871094, -48.19645690917969, -45.38999938964844, -42.58354187011719, -39.77708435058594, -36.97062301635742, -34.16416549682617, -31.357707977294922, -28.551250457763672, -25.744792938232422, -22.93833351135254, -20.13187599182129, -17.32541847229004, -14.518959045410156, -11.712501525878906, -8.906044006347656, -6.099586009979248, -3.29312801361084, -0.48666954040527344, 2.3197879791259766, 5.126245498657227, 7.932704925537109, 10.73916244506836, 13.54561996459961, 16.35207748413086, 19.15853500366211, 21.964994430541992, 24.771451950073242, 27.577909469604492, 30.384368896484375, 33.190826416015625, 35.997283935546875, 38.803741455078125, 41.610198974609375, 44.416656494140625, 47.223114013671875, 50.029571533203125, 52.83603286743164, 55.64249038696289, 58.44894790649414, 61.25540542602539, 64.0618667602539, 66.86832427978516, 69.6747817993164, 72.48123931884766, 75.2876968383789, 78.09415435791016, 80.9006118774414, 83.70706939697266, 86.5135269165039, 89.31998443603516, 92.1264419555664, 94.93289947509766, 97.73936462402344, 100.54582214355469, 103.35227966308594, 106.15873718261719, 108.96519470214844, 111.77165222167969, 114.57810974121094, 117.38456726074219, 120.19102478027344, 122.99748229980469, 125.80393981933594]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 9.0, 10.0, 14.0, 19.0, 29.0, 41.0, 50.0, 66.0, 80.0, 77.0, 88.0, 87.0, 83.0, 66.0, 73.0, 51.0, 47.0, 36.0, 31.0, 14.0, 12.0, 9.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.01355266571045, -11.603650093078613, -11.193747520446777, -10.783844947814941, -10.373942375183105, -9.96403980255127, -9.554136276245117, -9.144233703613281, -8.734331130981445, -8.32442855834961, -7.914525985717773, -7.5046234130859375, -7.094720840454102, -6.684818267822266, -6.2749152183532715, -5.8650126457214355, -5.455110549926758, -5.045207977294922, -4.635305404663086, -4.22540283203125, -3.815500020980835, -3.405597448348999, -2.995694637298584, -2.585792064666748, -2.175889492034912, -1.7659869194030762, -1.3560842275619507, -0.9461815357208252, -0.5362789630889893, -0.12637639045715332, 0.2835264205932617, 0.6934289932250977, 1.1033306121826172, 1.5132331848144531, 1.9231358766555786, 2.333038568496704, 2.74294114112854, 3.152843713760376, 3.562746524810791, 3.972649097442627, 4.382551670074463, 4.792454242706299, 5.202356815338135, 5.612259864807129, 6.022162437438965, 6.432065010070801, 6.841967582702637, 7.251870155334473, 7.661772727966309, 8.071675300598145, 8.48157787322998, 8.891480445861816, 9.301383018493652, 9.711285591125488, 10.12118911743164, 10.531091690063477, 10.940994262695312, 11.350896835327148, 11.760799407958984, 12.17070198059082, 12.580604553222656, 12.990507125854492, 13.400409698486328, 13.810312271118164, 14.22021484375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 7.0, 12.0, 3.0, 16.0, 21.0, 32.0, 49.0, 49.0, 97.0, 150.0, 241.0, 375.0, 615.0, 1053.0, 2051.0, 5070.0, 16665.0, 76878.0, 458946.0, 396646.0, 65724.0, 14794.0, 4544.0, 1993.0, 1001.0, 559.0, 322.0, 190.0, 146.0, 99.0, 66.0, 40.0, 36.0, 27.0, 9.0, 8.0, 9.0, 4.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.8984375, -5.734375, -5.5703125, -5.40625, -5.2421875, -5.078125, -4.9140625, -4.75, -4.5859375, -4.421875, -4.2578125, -4.09375, -3.9296875, -3.765625, -3.6015625, -3.4375, -3.2734375, -3.109375, -2.9453125, -2.78125, -2.6171875, -2.453125, -2.2890625, -2.125, -1.9609375, -1.796875, -1.6328125, -1.46875, -1.3046875, -1.140625, -0.9765625, -0.8125, -0.6484375, -0.484375, -0.3203125, -0.15625, 0.0078125, 0.171875, 0.3359375, 0.5, 0.6640625, 0.828125, 0.9921875, 1.15625, 1.3203125, 1.484375, 1.6484375, 1.8125, 1.9765625, 2.140625, 2.3046875, 2.46875, 2.6328125, 2.796875, 2.9609375, 3.125, 3.2890625, 3.453125, 3.6171875, 3.78125, 3.9453125, 4.109375, 4.2734375, 4.4375, 4.6015625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0, 3.0, 10.0, 14.0, 26.0, 51.0, 46.0, 71.0, 99.0, 104.0, 111.0, 105.0, 101.0, 71.0, 52.0, 46.0, 38.0, 26.0, 10.0, 4.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7578125, -1.7099761962890625, -1.662139892578125, -1.6143035888671875, -1.56646728515625, -1.5186309814453125, -1.470794677734375, -1.4229583740234375, -1.3751220703125, -1.3272857666015625, -1.279449462890625, -1.2316131591796875, -1.18377685546875, -1.1359405517578125, -1.088104248046875, -1.0402679443359375, -0.992431640625, -0.9445953369140625, -0.896759033203125, -0.8489227294921875, -0.80108642578125, -0.7532501220703125, -0.705413818359375, -0.6575775146484375, -0.6097412109375, -0.5619049072265625, -0.514068603515625, -0.4662322998046875, -0.41839599609375, -0.3705596923828125, -0.322723388671875, -0.2748870849609375, -0.22705078125, -0.1792144775390625, -0.131378173828125, -0.0835418701171875, -0.03570556640625, 0.0121307373046875, 0.059967041015625, 0.1078033447265625, 0.1556396484375, 0.2034759521484375, 0.251312255859375, 0.2991485595703125, 0.34698486328125, 0.3948211669921875, 0.442657470703125, 0.4904937744140625, 0.538330078125, 0.5861663818359375, 0.634002685546875, 0.6818389892578125, 0.72967529296875, 0.7775115966796875, 0.825347900390625, 0.8731842041015625, 0.9210205078125, 0.9688568115234375, 1.016693115234375, 1.0645294189453125, 1.11236572265625, 1.1602020263671875, 1.208038330078125, 1.2558746337890625, 1.3037109375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 10.0, 9.0, 19.0, 22.0, 27.0, 33.0, 40.0, 84.0, 135.0, 227.0, 374.0, 687.0, 1247.0, 2353.0, 4930.0, 11227.0, 28452.0, 80749.0, 246075.0, 403249.0, 174071.0, 56960.0, 20718.0, 8597.0, 3925.0, 1898.0, 969.0, 569.0, 311.0, 194.0, 114.0, 87.0, 60.0, 36.0, 18.0, 22.0, 7.0, 14.0, 11.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.494140625, -2.417022705078125, -2.33990478515625, -2.262786865234375, -2.1856689453125, -2.108551025390625, -2.03143310546875, -1.954315185546875, -1.877197265625, -1.800079345703125, -1.72296142578125, -1.645843505859375, -1.5687255859375, -1.491607666015625, -1.41448974609375, -1.337371826171875, -1.26025390625, -1.183135986328125, -1.10601806640625, -1.028900146484375, -0.9517822265625, -0.874664306640625, -0.79754638671875, -0.720428466796875, -0.643310546875, -0.566192626953125, -0.48907470703125, -0.411956787109375, -0.3348388671875, -0.257720947265625, -0.18060302734375, -0.103485107421875, -0.0263671875, 0.050750732421875, 0.12786865234375, 0.204986572265625, 0.2821044921875, 0.359222412109375, 0.43634033203125, 0.513458251953125, 0.590576171875, 0.667694091796875, 0.74481201171875, 0.821929931640625, 0.8990478515625, 0.976165771484375, 1.05328369140625, 1.130401611328125, 1.20751953125, 1.284637451171875, 1.36175537109375, 1.438873291015625, 1.5159912109375, 1.593109130859375, 1.67022705078125, 1.747344970703125, 1.824462890625, 1.901580810546875, 1.97869873046875, 2.055816650390625, 2.1329345703125, 2.210052490234375, 2.28717041015625, 2.364288330078125, 2.44140625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 2.0, 6.0, 11.0, 11.0, 10.0, 7.0, 15.0, 30.0, 18.0, 28.0, 29.0, 37.0, 35.0, 48.0, 38.0, 47.0, 38.0, 47.0, 39.0, 47.0, 47.0, 45.0, 35.0, 52.0, 36.0, 31.0, 36.0, 37.0, 21.0, 14.0, 23.0, 16.0, 8.0, 13.0, 6.0, 3.0, 5.0, 4.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.69921875, -2.6129150390625, -2.526611328125, -2.4403076171875, -2.35400390625, -2.2677001953125, -2.181396484375, -2.0950927734375, -2.0087890625, -1.9224853515625, -1.836181640625, -1.7498779296875, -1.66357421875, -1.5772705078125, -1.490966796875, -1.4046630859375, -1.318359375, -1.2320556640625, -1.145751953125, -1.0594482421875, -0.97314453125, -0.8868408203125, -0.800537109375, -0.7142333984375, -0.6279296875, -0.5416259765625, -0.455322265625, -0.3690185546875, -0.28271484375, -0.1964111328125, -0.110107421875, -0.0238037109375, 0.0625, 0.1488037109375, 0.235107421875, 0.3214111328125, 0.40771484375, 0.4940185546875, 0.580322265625, 0.6666259765625, 0.7529296875, 0.8392333984375, 0.925537109375, 1.0118408203125, 1.09814453125, 1.1844482421875, 1.270751953125, 1.3570556640625, 1.443359375, 1.5296630859375, 1.615966796875, 1.7022705078125, 1.78857421875, 1.8748779296875, 1.961181640625, 2.0474853515625, 2.1337890625, 2.2200927734375, 2.306396484375, 2.3927001953125, 2.47900390625, 2.5653076171875, 2.651611328125, 2.7379150390625, 2.82421875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 7.0, 4.0, 9.0, 11.0, 18.0, 17.0, 29.0, 47.0, 59.0, 105.0, 158.0, 302.0, 516.0, 1091.0, 2203.0, 5365.0, 15650.0, 60733.0, 448302.0, 430330.0, 59039.0, 14719.0, 5234.0, 2148.0, 1180.0, 498.0, 279.0, 190.0, 108.0, 54.0, 34.0, 24.0, 13.0, 12.0, 15.0, 9.0, 12.0, 4.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.365234375, -2.288909912109375, -2.21258544921875, -2.136260986328125, -2.0599365234375, -1.983612060546875, -1.90728759765625, -1.830963134765625, -1.754638671875, -1.678314208984375, -1.60198974609375, -1.525665283203125, -1.4493408203125, -1.373016357421875, -1.29669189453125, -1.220367431640625, -1.14404296875, -1.067718505859375, -0.99139404296875, -0.915069580078125, -0.8387451171875, -0.762420654296875, -0.68609619140625, -0.609771728515625, -0.533447265625, -0.457122802734375, -0.38079833984375, -0.304473876953125, -0.2281494140625, -0.151824951171875, -0.07550048828125, 0.000823974609375, 0.0771484375, 0.153472900390625, 0.22979736328125, 0.306121826171875, 0.3824462890625, 0.458770751953125, 0.53509521484375, 0.611419677734375, 0.687744140625, 0.764068603515625, 0.84039306640625, 0.916717529296875, 0.9930419921875, 1.069366455078125, 1.14569091796875, 1.222015380859375, 1.29833984375, 1.374664306640625, 1.45098876953125, 1.527313232421875, 1.6036376953125, 1.679962158203125, 1.75628662109375, 1.832611083984375, 1.908935546875, 1.985260009765625, 2.06158447265625, 2.137908935546875, 2.2142333984375, 2.290557861328125, 2.36688232421875, 2.443206787109375, 2.51953125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 7.0, 5.0, 8.0, 11.0, 15.0, 17.0, 30.0, 44.0, 56.0, 81.0, 114.0, 138.0, 152.0, 100.0, 73.0, 50.0, 17.0, 22.0, 13.0, 7.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0003113746643066406, -0.0003026500344276428, -0.000293925404548645, -0.0002852007746696472, -0.0002764761447906494, -0.0002677515149116516, -0.0002590268850326538, -0.000250302255153656, -0.0002415776252746582, -0.0002328529953956604, -0.0002241283655166626, -0.0002154037356376648, -0.000206679105758667, -0.0001979544758796692, -0.0001892298460006714, -0.00018050521612167358, -0.00017178058624267578, -0.00016305595636367798, -0.00015433132648468018, -0.00014560669660568237, -0.00013688206672668457, -0.00012815743684768677, -0.00011943280696868896, -0.00011070817708969116, -0.00010198354721069336, -9.325891733169556e-05, -8.453428745269775e-05, -7.580965757369995e-05, -6.708502769470215e-05, -5.8360397815704346e-05, -4.963576793670654e-05, -4.091113805770874e-05, -3.218650817871094e-05, -2.3461878299713135e-05, -1.4737248420715332e-05, -6.012618541717529e-06, 2.7120113372802734e-06, 1.1436641216278076e-05, 2.016127109527588e-05, 2.888590097427368e-05, 3.7610530853271484e-05, 4.633516073226929e-05, 5.505979061126709e-05, 6.378442049026489e-05, 7.25090503692627e-05, 8.12336802482605e-05, 8.99583101272583e-05, 9.86829400062561e-05, 0.0001074075698852539, 0.00011613219976425171, 0.0001248568296432495, 0.00013358145952224731, 0.00014230608940124512, 0.00015103071928024292, 0.00015975534915924072, 0.00016847997903823853, 0.00017720460891723633, 0.00018592923879623413, 0.00019465386867523193, 0.00020337849855422974, 0.00021210312843322754, 0.00022082775831222534, 0.00022955238819122314, 0.00023827701807022095, 0.00024700164794921875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 8.0, 8.0, 12.0, 17.0, 25.0, 39.0, 65.0, 114.0, 183.0, 316.0, 589.0, 1463.0, 3716.0, 12176.0, 55734.0, 561979.0, 356670.0, 40028.0, 9856.0, 3124.0, 1176.0, 556.0, 260.0, 164.0, 107.0, 65.0, 41.0, 20.0, 13.0, 9.0, 4.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.298828125, -3.1954345703125, -3.092041015625, -2.9886474609375, -2.88525390625, -2.7818603515625, -2.678466796875, -2.5750732421875, -2.4716796875, -2.3682861328125, -2.264892578125, -2.1614990234375, -2.05810546875, -1.9547119140625, -1.851318359375, -1.7479248046875, -1.64453125, -1.5411376953125, -1.437744140625, -1.3343505859375, -1.23095703125, -1.1275634765625, -1.024169921875, -0.9207763671875, -0.8173828125, -0.7139892578125, -0.610595703125, -0.5072021484375, -0.40380859375, -0.3004150390625, -0.197021484375, -0.0936279296875, 0.009765625, 0.1131591796875, 0.216552734375, 0.3199462890625, 0.42333984375, 0.5267333984375, 0.630126953125, 0.7335205078125, 0.8369140625, 0.9403076171875, 1.043701171875, 1.1470947265625, 1.25048828125, 1.3538818359375, 1.457275390625, 1.5606689453125, 1.6640625, 1.7674560546875, 1.870849609375, 1.9742431640625, 2.07763671875, 2.1810302734375, 2.284423828125, 2.3878173828125, 2.4912109375, 2.5946044921875, 2.697998046875, 2.8013916015625, 2.90478515625, 3.0081787109375, 3.111572265625, 3.2149658203125, 3.318359375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 12.0, 3.0, 9.0, 10.0, 19.0, 39.0, 31.0, 45.0, 76.0, 116.0, 144.0, 145.0, 112.0, 75.0, 45.0, 40.0, 27.0, 11.0, 13.0, 8.0, 7.0, 3.0, 1.0, 7.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.947265625, -1.862060546875, -1.77685546875, -1.691650390625, -1.6064453125, -1.521240234375, -1.43603515625, -1.350830078125, -1.265625, -1.180419921875, -1.09521484375, -1.010009765625, -0.9248046875, -0.839599609375, -0.75439453125, -0.669189453125, -0.583984375, -0.498779296875, -0.41357421875, -0.328369140625, -0.2431640625, -0.157958984375, -0.07275390625, 0.012451171875, 0.09765625, 0.182861328125, 0.26806640625, 0.353271484375, 0.4384765625, 0.523681640625, 0.60888671875, 0.694091796875, 0.779296875, 0.864501953125, 0.94970703125, 1.034912109375, 1.1201171875, 1.205322265625, 1.29052734375, 1.375732421875, 1.4609375, 1.546142578125, 1.63134765625, 1.716552734375, 1.8017578125, 1.886962890625, 1.97216796875, 2.057373046875, 2.142578125, 2.227783203125, 2.31298828125, 2.398193359375, 2.4833984375, 2.568603515625, 2.65380859375, 2.739013671875, 2.82421875, 2.909423828125, 2.99462890625, 3.079833984375, 3.1650390625, 3.250244140625, 3.33544921875, 3.420654296875, 3.505859375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 11.0, 27.0, 75.0, 187.0, 304.0, 233.0, 93.0, 52.0, 14.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-73.95397186279297, -72.4579849243164, -70.96199035644531, -69.46600341796875, -67.97001647949219, -66.4740219116211, -64.97803497314453, -63.4820442199707, -61.986053466796875, -60.49006271362305, -58.994075775146484, -57.498085021972656, -56.00209426879883, -54.506103515625, -53.01011657714844, -51.51412582397461, -50.01813507080078, -48.52214431762695, -47.02615737915039, -45.53016662597656, -44.034175872802734, -42.538185119628906, -41.042198181152344, -39.546207427978516, -38.05022048950195, -36.554229736328125, -35.05824279785156, -33.562252044677734, -32.066261291503906, -30.57027244567871, -29.074283599853516, -27.578292846679688, -26.082300186157227, -24.58631134033203, -23.090320587158203, -21.594331741333008, -20.09834098815918, -18.602352142333984, -17.106361389160156, -15.610372543334961, -14.11438274383545, -12.618392944335938, -11.122403144836426, -9.626413345336914, -8.130424499511719, -6.634434223175049, -5.138444900512695, -3.6424551010131836, -2.146465301513672, -0.6504756212234497, 0.8455140590667725, 2.341503620147705, 3.837493419647217, 5.3334832191467285, 6.829472541809082, 8.325462341308594, 9.821452140808105, 11.317441940307617, 12.813431739807129, 14.30942153930664, 15.805410385131836, 17.301401138305664, 18.79738998413086, 20.293380737304688, 21.789369583129883]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 7.0, 5.0, 10.0, 11.0, 14.0, 11.0, 26.0, 18.0, 25.0, 21.0, 21.0, 35.0, 40.0, 32.0, 53.0, 36.0, 39.0, 44.0, 42.0, 40.0, 57.0, 45.0, 40.0, 55.0, 36.0, 39.0, 30.0, 37.0, 20.0, 20.0, 17.0, 17.0, 5.0, 12.0, 10.0, 6.0, 7.0, 3.0, 5.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-17.680103302001953, -17.176015853881836, -16.67193031311035, -16.167842864990234, -15.66375732421875, -15.159669876098633, -14.655583381652832, -14.151496887207031, -13.64741039276123, -13.14332389831543, -12.639237403869629, -12.135150909423828, -11.631063461303711, -11.126977920532227, -10.62289047241211, -10.118803977966309, -9.614717483520508, -9.110630989074707, -8.606544494628906, -8.102458000183105, -7.5983710289001465, -7.094284534454346, -6.590197563171387, -6.086111068725586, -5.582024574279785, -5.077938079833984, -4.573851585388184, -4.069764614105225, -3.565678119659424, -3.061591625213623, -2.557504892349243, -2.0534181594848633, -1.5493316650390625, -1.0452450513839722, -0.5411584377288818, -0.037071824073791504, 0.46701478958129883, 0.9711012840270996, 1.4751880168914795, 1.9792747497558594, 2.48336124420166, 2.987447738647461, 3.491534471511841, 3.9956212043762207, 4.4997076988220215, 5.003794193267822, 5.507881164550781, 6.011967658996582, 6.516054153442383, 7.020140647888184, 7.524227142333984, 8.028313636779785, 8.532400131225586, 9.036487579345703, 9.540574073791504, 10.044660568237305, 10.548747062683105, 11.052833557128906, 11.556920051574707, 12.061006546020508, 12.565093994140625, 13.06917953491211, 13.573266983032227, 14.077353477478027, 14.581439971923828]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 6.0, 7.0, 20.0, 17.0, 18.0, 36.0, 47.0, 83.0, 126.0, 240.0, 386.0, 771.0, 1685.0, 5558.0, 27628.0, 3618056.0, 512126.0, 19827.0, 4505.0, 1616.0, 663.0, 361.0, 233.0, 100.0, 56.0, 40.0, 21.0, 13.0, 13.0, 5.0, 5.0, 5.0, 5.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.87890625, -7.65948486328125, -7.4400634765625, -7.22064208984375, -7.001220703125, -6.78179931640625, -6.5623779296875, -6.34295654296875, -6.12353515625, -5.90411376953125, -5.6846923828125, -5.46527099609375, -5.245849609375, -5.02642822265625, -4.8070068359375, -4.58758544921875, -4.3681640625, -4.14874267578125, -3.9293212890625, -3.70989990234375, -3.490478515625, -3.27105712890625, -3.0516357421875, -2.83221435546875, -2.61279296875, -2.39337158203125, -2.1739501953125, -1.95452880859375, -1.735107421875, -1.51568603515625, -1.2962646484375, -1.07684326171875, -0.857421875, -0.63800048828125, -0.4185791015625, -0.19915771484375, 0.020263671875, 0.23968505859375, 0.4591064453125, 0.67852783203125, 0.89794921875, 1.11737060546875, 1.3367919921875, 1.55621337890625, 1.775634765625, 1.99505615234375, 2.2144775390625, 2.43389892578125, 2.6533203125, 2.87274169921875, 3.0921630859375, 3.31158447265625, 3.531005859375, 3.75042724609375, 3.9698486328125, 4.18927001953125, 4.40869140625, 4.62811279296875, 4.8475341796875, 5.06695556640625, 5.286376953125, 5.50579833984375, 5.7252197265625, 5.94464111328125, 6.1640625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 8.0, 11.0, 25.0, 33.0, 26.0, 55.0, 66.0, 77.0, 89.0, 109.0, 101.0, 90.0, 66.0, 63.0, 61.0, 45.0, 24.0, 22.0, 8.0, 4.0, 2.0, 6.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7861328125, -1.7391357421875, -1.692138671875, -1.6451416015625, -1.59814453125, -1.5511474609375, -1.504150390625, -1.4571533203125, -1.41015625, -1.3631591796875, -1.316162109375, -1.2691650390625, -1.22216796875, -1.1751708984375, -1.128173828125, -1.0811767578125, -1.0341796875, -0.9871826171875, -0.940185546875, -0.8931884765625, -0.84619140625, -0.7991943359375, -0.752197265625, -0.7052001953125, -0.658203125, -0.6112060546875, -0.564208984375, -0.5172119140625, -0.47021484375, -0.4232177734375, -0.376220703125, -0.3292236328125, -0.2822265625, -0.2352294921875, -0.188232421875, -0.1412353515625, -0.09423828125, -0.0472412109375, -0.000244140625, 0.0467529296875, 0.09375, 0.1407470703125, 0.187744140625, 0.2347412109375, 0.28173828125, 0.3287353515625, 0.375732421875, 0.4227294921875, 0.4697265625, 0.5167236328125, 0.563720703125, 0.6107177734375, 0.65771484375, 0.7047119140625, 0.751708984375, 0.7987060546875, 0.845703125, 0.8927001953125, 0.939697265625, 0.9866943359375, 1.03369140625, 1.0806884765625, 1.127685546875, 1.1746826171875, 1.2216796875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 13.0, 14.0, 29.0, 23.0, 38.0, 51.0, 92.0, 145.0, 259.0, 506.0, 1186.0, 5378.0, 134168.0, 4027768.0, 20470.0, 2348.0, 734.0, 390.0, 231.0, 138.0, 95.0, 48.0, 47.0, 26.0, 27.0, 15.0, 16.0, 15.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.25, -8.9227294921875, -8.595458984375, -8.2681884765625, -7.94091796875, -7.6136474609375, -7.286376953125, -6.9591064453125, -6.6318359375, -6.3045654296875, -5.977294921875, -5.6500244140625, -5.32275390625, -4.9954833984375, -4.668212890625, -4.3409423828125, -4.013671875, -3.6864013671875, -3.359130859375, -3.0318603515625, -2.70458984375, -2.3773193359375, -2.050048828125, -1.7227783203125, -1.3955078125, -1.0682373046875, -0.740966796875, -0.4136962890625, -0.08642578125, 0.2408447265625, 0.568115234375, 0.8953857421875, 1.22265625, 1.5499267578125, 1.877197265625, 2.2044677734375, 2.53173828125, 2.8590087890625, 3.186279296875, 3.5135498046875, 3.8408203125, 4.1680908203125, 4.495361328125, 4.8226318359375, 5.14990234375, 5.4771728515625, 5.804443359375, 6.1317138671875, 6.458984375, 6.7862548828125, 7.113525390625, 7.4407958984375, 7.76806640625, 8.0953369140625, 8.422607421875, 8.7498779296875, 9.0771484375, 9.4044189453125, 9.731689453125, 10.0589599609375, 10.38623046875, 10.7135009765625, 11.040771484375, 11.3680419921875, 11.6953125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 5.0, 10.0, 20.0, 27.0, 54.0, 115.0, 379.0, 2676.0, 534.0, 130.0, 54.0, 26.0, 18.0, 10.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.576171875, -1.503021240234375, -1.42987060546875, -1.356719970703125, -1.2835693359375, -1.210418701171875, -1.13726806640625, -1.064117431640625, -0.990966796875, -0.917816162109375, -0.84466552734375, -0.771514892578125, -0.6983642578125, -0.625213623046875, -0.55206298828125, -0.478912353515625, -0.40576171875, -0.332611083984375, -0.25946044921875, -0.186309814453125, -0.1131591796875, -0.040008544921875, 0.03314208984375, 0.106292724609375, 0.179443359375, 0.252593994140625, 0.32574462890625, 0.398895263671875, 0.4720458984375, 0.545196533203125, 0.61834716796875, 0.691497802734375, 0.7646484375, 0.837799072265625, 0.91094970703125, 0.984100341796875, 1.0572509765625, 1.130401611328125, 1.20355224609375, 1.276702880859375, 1.349853515625, 1.423004150390625, 1.49615478515625, 1.569305419921875, 1.6424560546875, 1.715606689453125, 1.78875732421875, 1.861907958984375, 1.93505859375, 2.008209228515625, 2.08135986328125, 2.154510498046875, 2.2276611328125, 2.300811767578125, 2.37396240234375, 2.447113037109375, 2.520263671875, 2.593414306640625, 2.66656494140625, 2.739715576171875, 2.8128662109375, 2.886016845703125, 2.95916748046875, 3.032318115234375, 3.10546875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 10.0, 10.0, 46.0, 58.0, 181.0, 282.0, 221.0, 111.0, 41.0, 27.0, 9.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.538350582122803, -6.056714057922363, -5.575078010559082, -5.093441963195801, -4.611805438995361, -4.130168914794922, -3.6485328674316406, -3.1668965816497803, -2.68526029586792, -2.2036240100860596, -1.7219877243041992, -1.2403514385223389, -0.7587151527404785, -0.27707886695861816, 0.2045574188232422, 0.6861937046051025, 1.167829990386963, 1.6494662761688232, 2.1311025619506836, 2.612738847732544, 3.0943751335144043, 3.5760114192962646, 4.057647705078125, 4.539283752441406, 5.020920276641846, 5.502556800842285, 5.984192848205566, 6.465828895568848, 6.947465419769287, 7.429101943969727, 7.910737991333008, 8.392374038696289, 8.87401008605957, 9.355646133422852, 9.837282180786133, 10.31891918182373, 10.800555229187012, 11.282191276550293, 11.76382827758789, 12.245464324951172, 12.727100372314453, 13.208736419677734, 13.690372467041016, 14.172009468078613, 14.653645515441895, 15.135281562805176, 15.616918563842773, 16.098554611206055, 16.580190658569336, 17.061826705932617, 17.5434627532959, 18.02509880065918, 18.506736755371094, 18.988372802734375, 19.470008850097656, 19.951644897460938, 20.43328094482422, 20.9149169921875, 21.39655303955078, 21.878189086914062, 22.359825134277344, 22.841463088989258, 23.32309913635254, 23.80473518371582, 24.2863712310791]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 36.0, 45.0, 76.0, 114.0, 140.0, 144.0, 155.0, 110.0, 75.0, 48.0, 34.0, 11.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.032001495361328, -10.602417945861816, -10.172834396362305, -9.743250846862793, -9.313667297363281, -8.884084701538086, -8.454500198364258, -8.024917602539062, -7.595334053039551, -7.165750503540039, -6.736166954040527, -6.306583404541016, -5.877000331878662, -5.44741678237915, -5.017833232879639, -4.588250160217285, -4.158666133880615, -3.7290825843811035, -3.299499273300171, -2.869915723800659, -2.4403324127197266, -2.010748863220215, -1.5811653137207031, -1.1515820026397705, -0.7219984531402588, -0.29241499304771423, 0.13716846704483032, 0.5667519569396973, 0.9963353872299194, 1.4259188175201416, 1.8555023670196533, 2.285085678100586, 2.7146692276000977, 3.1442527770996094, 3.573836088180542, 4.003419876098633, 4.433002948760986, 4.862586498260498, 5.29217004776001, 5.721753120422363, 6.151336669921875, 6.580920219421387, 7.010503768920898, 7.44008731842041, 7.869670391082764, 8.299253463745117, 8.728837966918945, 9.15842056274414, 9.588005065917969, 10.01758861541748, 10.447172164916992, 10.876755714416504, 11.306339263916016, 11.735921859741211, 12.165506362915039, 12.595088958740234, 13.024672508239746, 13.454256057739258, 13.88383960723877, 14.313423156738281, 14.743006706237793, 15.172590255737305, 15.6021728515625, 16.031757354736328, 16.461339950561523]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 9.0, 4.0, 7.0, 11.0, 31.0, 27.0, 42.0, 67.0, 148.0, 239.0, 423.0, 855.0, 2102.0, 6375.0, 28174.0, 231759.0, 662352.0, 94280.0, 14754.0, 3965.0, 1431.0, 674.0, 331.0, 190.0, 113.0, 64.0, 47.0, 25.0, 16.0, 10.0, 14.0, 8.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8828125, -7.6387939453125, -7.394775390625, -7.1507568359375, -6.90673828125, -6.6627197265625, -6.418701171875, -6.1746826171875, -5.9306640625, -5.6866455078125, -5.442626953125, -5.1986083984375, -4.95458984375, -4.7105712890625, -4.466552734375, -4.2225341796875, -3.978515625, -3.7344970703125, -3.490478515625, -3.2464599609375, -3.00244140625, -2.7584228515625, -2.514404296875, -2.2703857421875, -2.0263671875, -1.7823486328125, -1.538330078125, -1.2943115234375, -1.05029296875, -0.8062744140625, -0.562255859375, -0.3182373046875, -0.07421875, 0.1697998046875, 0.413818359375, 0.6578369140625, 0.90185546875, 1.1458740234375, 1.389892578125, 1.6339111328125, 1.8779296875, 2.1219482421875, 2.365966796875, 2.6099853515625, 2.85400390625, 3.0980224609375, 3.342041015625, 3.5860595703125, 3.830078125, 4.0740966796875, 4.318115234375, 4.5621337890625, 4.80615234375, 5.0501708984375, 5.294189453125, 5.5382080078125, 5.7822265625, 6.0262451171875, 6.270263671875, 6.5142822265625, 6.75830078125, 7.0023193359375, 7.246337890625, 7.4903564453125, 7.734375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 13.0, 23.0, 22.0, 47.0, 56.0, 80.0, 83.0, 88.0, 100.0, 111.0, 82.0, 71.0, 66.0, 55.0, 28.0, 26.0, 16.0, 9.0, 7.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.998046875, -1.947845458984375, -1.89764404296875, -1.847442626953125, -1.7972412109375, -1.747039794921875, -1.69683837890625, -1.646636962890625, -1.596435546875, -1.546234130859375, -1.49603271484375, -1.445831298828125, -1.3956298828125, -1.345428466796875, -1.29522705078125, -1.245025634765625, -1.19482421875, -1.144622802734375, -1.09442138671875, -1.044219970703125, -0.9940185546875, -0.943817138671875, -0.89361572265625, -0.843414306640625, -0.793212890625, -0.743011474609375, -0.69281005859375, -0.642608642578125, -0.5924072265625, -0.542205810546875, -0.49200439453125, -0.441802978515625, -0.3916015625, -0.341400146484375, -0.29119873046875, -0.240997314453125, -0.1907958984375, -0.140594482421875, -0.09039306640625, -0.040191650390625, 0.010009765625, 0.060211181640625, 0.11041259765625, 0.160614013671875, 0.2108154296875, 0.261016845703125, 0.31121826171875, 0.361419677734375, 0.41162109375, 0.461822509765625, 0.51202392578125, 0.562225341796875, 0.6124267578125, 0.662628173828125, 0.71282958984375, 0.763031005859375, 0.813232421875, 0.863433837890625, 0.91363525390625, 0.963836669921875, 1.0140380859375, 1.064239501953125, 1.11444091796875, 1.164642333984375, 1.21484375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 4.0, 7.0, 11.0, 13.0, 21.0, 33.0, 27.0, 43.0, 50.0, 58.0, 86.0, 140.0, 185.0, 290.0, 412.0, 657.0, 1208.0, 2410.0, 5181.0, 12974.0, 37085.0, 122948.0, 400535.0, 323543.0, 92169.0, 28746.0, 10474.0, 4391.0, 2025.0, 1060.0, 590.0, 350.0, 220.0, 152.0, 114.0, 83.0, 64.0, 35.0, 29.0, 40.0, 27.0, 17.0, 10.0, 10.0, 7.0, 10.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.232421875, -3.13104248046875, -3.0296630859375, -2.92828369140625, -2.826904296875, -2.72552490234375, -2.6241455078125, -2.52276611328125, -2.42138671875, -2.32000732421875, -2.2186279296875, -2.11724853515625, -2.015869140625, -1.91448974609375, -1.8131103515625, -1.71173095703125, -1.6103515625, -1.50897216796875, -1.4075927734375, -1.30621337890625, -1.204833984375, -1.10345458984375, -1.0020751953125, -0.90069580078125, -0.79931640625, -0.69793701171875, -0.5965576171875, -0.49517822265625, -0.393798828125, -0.29241943359375, -0.1910400390625, -0.08966064453125, 0.01171875, 0.11309814453125, 0.2144775390625, 0.31585693359375, 0.417236328125, 0.51861572265625, 0.6199951171875, 0.72137451171875, 0.82275390625, 0.92413330078125, 1.0255126953125, 1.12689208984375, 1.228271484375, 1.32965087890625, 1.4310302734375, 1.53240966796875, 1.6337890625, 1.73516845703125, 1.8365478515625, 1.93792724609375, 2.039306640625, 2.14068603515625, 2.2420654296875, 2.34344482421875, 2.44482421875, 2.54620361328125, 2.6475830078125, 2.74896240234375, 2.850341796875, 2.95172119140625, 3.0531005859375, 3.15447998046875, 3.255859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 5.0, 5.0, 4.0, 8.0, 8.0, 12.0, 14.0, 18.0, 18.0, 22.0, 26.0, 29.0, 42.0, 34.0, 50.0, 38.0, 52.0, 54.0, 42.0, 45.0, 38.0, 51.0, 59.0, 45.0, 42.0, 30.0, 31.0, 35.0, 17.0, 18.0, 24.0, 20.0, 13.0, 11.0, 11.0, 10.0, 11.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.583984375, -3.474853515625, -3.36572265625, -3.256591796875, -3.1474609375, -3.038330078125, -2.92919921875, -2.820068359375, -2.7109375, -2.601806640625, -2.49267578125, -2.383544921875, -2.2744140625, -2.165283203125, -2.05615234375, -1.947021484375, -1.837890625, -1.728759765625, -1.61962890625, -1.510498046875, -1.4013671875, -1.292236328125, -1.18310546875, -1.073974609375, -0.96484375, -0.855712890625, -0.74658203125, -0.637451171875, -0.5283203125, -0.419189453125, -0.31005859375, -0.200927734375, -0.091796875, 0.017333984375, 0.12646484375, 0.235595703125, 0.3447265625, 0.453857421875, 0.56298828125, 0.672119140625, 0.78125, 0.890380859375, 0.99951171875, 1.108642578125, 1.2177734375, 1.326904296875, 1.43603515625, 1.545166015625, 1.654296875, 1.763427734375, 1.87255859375, 1.981689453125, 2.0908203125, 2.199951171875, 2.30908203125, 2.418212890625, 2.52734375, 2.636474609375, 2.74560546875, 2.854736328125, 2.9638671875, 3.072998046875, 3.18212890625, 3.291259765625, 3.400390625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 4.0, 19.0, 14.0, 16.0, 29.0, 38.0, 56.0, 103.0, 146.0, 278.0, 461.0, 847.0, 1582.0, 3195.0, 8189.0, 34847.0, 534973.0, 419692.0, 30041.0, 7513.0, 3031.0, 1531.0, 803.0, 476.0, 245.0, 156.0, 98.0, 56.0, 44.0, 20.0, 16.0, 10.0, 5.0, 8.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.79296875, -4.64300537109375, -4.4930419921875, -4.34307861328125, -4.193115234375, -4.04315185546875, -3.8931884765625, -3.74322509765625, -3.59326171875, -3.44329833984375, -3.2933349609375, -3.14337158203125, -2.993408203125, -2.84344482421875, -2.6934814453125, -2.54351806640625, -2.3935546875, -2.24359130859375, -2.0936279296875, -1.94366455078125, -1.793701171875, -1.64373779296875, -1.4937744140625, -1.34381103515625, -1.19384765625, -1.04388427734375, -0.8939208984375, -0.74395751953125, -0.593994140625, -0.44403076171875, -0.2940673828125, -0.14410400390625, 0.005859375, 0.15582275390625, 0.3057861328125, 0.45574951171875, 0.605712890625, 0.75567626953125, 0.9056396484375, 1.05560302734375, 1.20556640625, 1.35552978515625, 1.5054931640625, 1.65545654296875, 1.805419921875, 1.95538330078125, 2.1053466796875, 2.25531005859375, 2.4052734375, 2.55523681640625, 2.7052001953125, 2.85516357421875, 3.005126953125, 3.15509033203125, 3.3050537109375, 3.45501708984375, 3.60498046875, 3.75494384765625, 3.9049072265625, 4.05487060546875, 4.204833984375, 4.35479736328125, 4.5047607421875, 4.65472412109375, 4.8046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 7.0, 2.0, 6.0, 3.0, 6.0, 9.0, 8.0, 18.0, 41.0, 72.0, 156.0, 258.0, 174.0, 87.0, 50.0, 39.0, 19.0, 14.0, 9.0, 12.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008745193481445312, -0.0008492916822433472, -0.0008240640163421631, -0.000798836350440979, -0.0007736086845397949, -0.0007483810186386108, -0.0007231533527374268, -0.0006979256868362427, -0.0006726980209350586, -0.0006474703550338745, -0.0006222426891326904, -0.0005970150232315063, -0.0005717873573303223, -0.0005465596914291382, -0.0005213320255279541, -0.00049610435962677, -0.00047087669372558594, -0.00044564902782440186, -0.0004204213619232178, -0.0003951936960220337, -0.0003699660301208496, -0.00034473836421966553, -0.00031951069831848145, -0.00029428303241729736, -0.0002690553665161133, -0.0002438277006149292, -0.00021860003471374512, -0.00019337236881256104, -0.00016814470291137695, -0.00014291703701019287, -0.00011768937110900879, -9.246170520782471e-05, -6.723403930664062e-05, -4.200637340545654e-05, -1.677870750427246e-05, 8.448958396911621e-06, 3.36766242980957e-05, 5.8904290199279785e-05, 8.413195610046387e-05, 0.00010935962200164795, 0.00013458728790283203, 0.0001598149538040161, 0.0001850426197052002, 0.00021027028560638428, 0.00023549795150756836, 0.00026072561740875244, 0.0002859532833099365, 0.0003111809492111206, 0.0003364086151123047, 0.00036163628101348877, 0.00038686394691467285, 0.00041209161281585693, 0.000437319278717041, 0.0004625469446182251, 0.0004877746105194092, 0.0005130022764205933, 0.0005382299423217773, 0.0005634576082229614, 0.0005886852741241455, 0.0006139129400253296, 0.0006391406059265137, 0.0006643682718276978, 0.0006895959377288818, 0.0007148236036300659, 0.00074005126953125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 7.0, 14.0, 13.0, 18.0, 24.0, 42.0, 70.0, 125.0, 239.0, 427.0, 783.0, 1627.0, 3915.0, 12018.0, 90671.0, 862385.0, 59844.0, 9806.0, 3441.0, 1460.0, 709.0, 362.0, 208.0, 126.0, 64.0, 47.0, 36.0, 22.0, 10.0, 10.0, 7.0, 4.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5390625, -6.32415771484375, -6.1092529296875, -5.89434814453125, -5.679443359375, -5.46453857421875, -5.2496337890625, -5.03472900390625, -4.81982421875, -4.60491943359375, -4.3900146484375, -4.17510986328125, -3.960205078125, -3.74530029296875, -3.5303955078125, -3.31549072265625, -3.1005859375, -2.88568115234375, -2.6707763671875, -2.45587158203125, -2.240966796875, -2.02606201171875, -1.8111572265625, -1.59625244140625, -1.38134765625, -1.16644287109375, -0.9515380859375, -0.73663330078125, -0.521728515625, -0.30682373046875, -0.0919189453125, 0.12298583984375, 0.337890625, 0.55279541015625, 0.7677001953125, 0.98260498046875, 1.197509765625, 1.41241455078125, 1.6273193359375, 1.84222412109375, 2.05712890625, 2.27203369140625, 2.4869384765625, 2.70184326171875, 2.916748046875, 3.13165283203125, 3.3465576171875, 3.56146240234375, 3.7763671875, 3.99127197265625, 4.2061767578125, 4.42108154296875, 4.635986328125, 4.85089111328125, 5.0657958984375, 5.28070068359375, 5.49560546875, 5.71051025390625, 5.9254150390625, 6.14031982421875, 6.355224609375, 6.57012939453125, 6.7850341796875, 6.99993896484375, 7.21484375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 7.0, 3.0, 4.0, 3.0, 3.0, 6.0, 7.0, 11.0, 17.0, 36.0, 58.0, 88.0, 159.0, 220.0, 151.0, 79.0, 59.0, 29.0, 18.0, 8.0, 10.0, 8.0, 4.0, 4.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.6953125, -4.55877685546875, -4.4222412109375, -4.28570556640625, -4.149169921875, -4.01263427734375, -3.8760986328125, -3.73956298828125, -3.60302734375, -3.46649169921875, -3.3299560546875, -3.19342041015625, -3.056884765625, -2.92034912109375, -2.7838134765625, -2.64727783203125, -2.5107421875, -2.37420654296875, -2.2376708984375, -2.10113525390625, -1.964599609375, -1.82806396484375, -1.6915283203125, -1.55499267578125, -1.41845703125, -1.28192138671875, -1.1453857421875, -1.00885009765625, -0.872314453125, -0.73577880859375, -0.5992431640625, -0.46270751953125, -0.326171875, -0.18963623046875, -0.0531005859375, 0.08343505859375, 0.219970703125, 0.35650634765625, 0.4930419921875, 0.62957763671875, 0.76611328125, 0.90264892578125, 1.0391845703125, 1.17572021484375, 1.312255859375, 1.44879150390625, 1.5853271484375, 1.72186279296875, 1.8583984375, 1.99493408203125, 2.1314697265625, 2.26800537109375, 2.404541015625, 2.54107666015625, 2.6776123046875, 2.81414794921875, 2.95068359375, 3.08721923828125, 3.2237548828125, 3.36029052734375, 3.496826171875, 3.63336181640625, 3.7698974609375, 3.90643310546875, 4.04296875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 13.0, 26.0, 96.0, 326.0, 374.0, 127.0, 33.0, 12.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-141.1402587890625, -138.00645446777344, -134.87265014648438, -131.73883056640625, -128.6050262451172, -125.47122192382812, -122.33741760253906, -119.20361328125, -116.06980895996094, -112.93600463867188, -109.80219268798828, -106.66838836669922, -103.53458404541016, -100.40077209472656, -97.2669677734375, -94.13316345214844, -90.99935150146484, -87.86554718017578, -84.73173522949219, -81.59793090820312, -78.46412658691406, -75.330322265625, -72.1965103149414, -69.06270599365234, -65.92889404296875, -62.79508590698242, -59.66128158569336, -56.52747344970703, -53.39366912841797, -50.25986099243164, -47.12605285644531, -43.99224853515625, -40.85844421386719, -37.72463607788086, -34.5908317565918, -31.45702362060547, -28.323217391967773, -25.189411163330078, -22.05560302734375, -18.921796798706055, -15.78799057006836, -12.654184341430664, -9.520377159118652, -6.386569976806641, -3.2527637481689453, -0.11895751953125, 3.014850616455078, 6.148656845092773, 9.282463073730469, 12.416269302368164, 15.550076484680176, 18.683883666992188, 21.817689895629883, 24.951496124267578, 28.085304260253906, 31.2191104888916, 34.3529167175293, 37.486724853515625, 40.62052917480469, 43.754337310791016, 46.888145446777344, 50.021949768066406, 53.155757904052734, 56.28956604003906, 59.423370361328125]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 6.0, 12.0, 11.0, 18.0, 15.0, 17.0, 24.0, 23.0, 33.0, 44.0, 40.0, 53.0, 54.0, 51.0, 50.0, 59.0, 58.0, 53.0, 62.0, 46.0, 37.0, 49.0, 41.0, 26.0, 26.0, 22.0, 12.0, 14.0, 7.0, 9.0, 12.0, 7.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.86016273498535, -28.06566619873047, -27.271167755126953, -26.476669311523438, -25.682172775268555, -24.887676239013672, -24.093177795410156, -23.29867935180664, -22.504182815551758, -21.709686279296875, -20.91518783569336, -20.120689392089844, -19.32619285583496, -18.531696319580078, -17.737197875976562, -16.942699432373047, -16.148202896118164, -15.353705406188965, -14.559207916259766, -13.764710426330566, -12.970212936401367, -12.175715446472168, -11.381217956542969, -10.58672046661377, -9.79222297668457, -8.997725486755371, -8.203227996826172, -7.408730506896973, -6.614233016967773, -5.819735527038574, -5.025238037109375, -4.230740547180176, -3.4362449645996094, -2.64174747467041, -1.847249984741211, -1.0527524948120117, -0.2582550048828125, 0.5362424850463867, 1.330739974975586, 2.125237464904785, 2.9197349548339844, 3.7142324447631836, 4.508729934692383, 5.303227424621582, 6.097724914550781, 6.8922224044799805, 7.68671989440918, 8.481217384338379, 9.275714874267578, 10.070212364196777, 10.864709854125977, 11.659207344055176, 12.453704833984375, 13.248202323913574, 14.042699813842773, 14.837197303771973, 15.631694793701172, 16.426193237304688, 17.22068977355957, 18.015186309814453, 18.80968475341797, 19.604183197021484, 20.398679733276367, 21.19317626953125, 21.987674713134766]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 10.0, 15.0, 14.0, 20.0, 36.0, 69.0, 73.0, 161.0, 206.0, 397.0, 767.0, 1482.0, 3547.0, 10920.0, 58260.0, 3824822.0, 257939.0, 24047.0, 6463.0, 2541.0, 1115.0, 578.0, 322.0, 162.0, 100.0, 78.0, 45.0, 32.0, 16.0, 12.0, 12.0, 0.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.7578125, -8.51287841796875, -8.2679443359375, -8.02301025390625, -7.778076171875, -7.53314208984375, -7.2882080078125, -7.04327392578125, -6.79833984375, -6.55340576171875, -6.3084716796875, -6.06353759765625, -5.818603515625, -5.57366943359375, -5.3287353515625, -5.08380126953125, -4.8388671875, -4.59393310546875, -4.3489990234375, -4.10406494140625, -3.859130859375, -3.61419677734375, -3.3692626953125, -3.12432861328125, -2.87939453125, -2.63446044921875, -2.3895263671875, -2.14459228515625, -1.899658203125, -1.65472412109375, -1.4097900390625, -1.16485595703125, -0.919921875, -0.67498779296875, -0.4300537109375, -0.18511962890625, 0.059814453125, 0.30474853515625, 0.5496826171875, 0.79461669921875, 1.03955078125, 1.28448486328125, 1.5294189453125, 1.77435302734375, 2.019287109375, 2.26422119140625, 2.5091552734375, 2.75408935546875, 2.9990234375, 3.24395751953125, 3.4888916015625, 3.73382568359375, 3.978759765625, 4.22369384765625, 4.4686279296875, 4.71356201171875, 4.95849609375, 5.20343017578125, 5.4483642578125, 5.69329833984375, 5.938232421875, 6.18316650390625, 6.4281005859375, 6.67303466796875, 6.91796875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 10.0, 21.0, 31.0, 21.0, 23.0, 43.0, 64.0, 74.0, 78.0, 68.0, 86.0, 87.0, 64.0, 63.0, 61.0, 49.0, 40.0, 27.0, 21.0, 22.0, 10.0, 8.0, 9.0, 9.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8427734375, -1.7952880859375, -1.747802734375, -1.7003173828125, -1.65283203125, -1.6053466796875, -1.557861328125, -1.5103759765625, -1.462890625, -1.4154052734375, -1.367919921875, -1.3204345703125, -1.27294921875, -1.2254638671875, -1.177978515625, -1.1304931640625, -1.0830078125, -1.0355224609375, -0.988037109375, -0.9405517578125, -0.89306640625, -0.8455810546875, -0.798095703125, -0.7506103515625, -0.703125, -0.6556396484375, -0.608154296875, -0.5606689453125, -0.51318359375, -0.4656982421875, -0.418212890625, -0.3707275390625, -0.3232421875, -0.2757568359375, -0.228271484375, -0.1807861328125, -0.13330078125, -0.0858154296875, -0.038330078125, 0.0091552734375, 0.056640625, 0.1041259765625, 0.151611328125, 0.1990966796875, 0.24658203125, 0.2940673828125, 0.341552734375, 0.3890380859375, 0.4365234375, 0.4840087890625, 0.531494140625, 0.5789794921875, 0.62646484375, 0.6739501953125, 0.721435546875, 0.7689208984375, 0.81640625, 0.8638916015625, 0.911376953125, 0.9588623046875, 1.00634765625, 1.0538330078125, 1.101318359375, 1.1488037109375, 1.1962890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 8.0, 13.0, 11.0, 18.0, 25.0, 23.0, 34.0, 55.0, 75.0, 102.0, 129.0, 179.0, 335.0, 523.0, 805.0, 1446.0, 2757.0, 5336.0, 12337.0, 37859.0, 237045.0, 3653659.0, 185250.0, 33811.0, 11434.0, 4915.0, 2486.0, 1357.0, 799.0, 475.0, 309.0, 218.0, 129.0, 77.0, 58.0, 44.0, 36.0, 26.0, 22.0, 14.0, 8.0, 6.0, 10.0, 5.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.49609375, -4.34844970703125, -4.2008056640625, -4.05316162109375, -3.905517578125, -3.75787353515625, -3.6102294921875, -3.46258544921875, -3.31494140625, -3.16729736328125, -3.0196533203125, -2.87200927734375, -2.724365234375, -2.57672119140625, -2.4290771484375, -2.28143310546875, -2.1337890625, -1.98614501953125, -1.8385009765625, -1.69085693359375, -1.543212890625, -1.39556884765625, -1.2479248046875, -1.10028076171875, -0.95263671875, -0.80499267578125, -0.6573486328125, -0.50970458984375, -0.362060546875, -0.21441650390625, -0.0667724609375, 0.08087158203125, 0.228515625, 0.37615966796875, 0.5238037109375, 0.67144775390625, 0.819091796875, 0.96673583984375, 1.1143798828125, 1.26202392578125, 1.40966796875, 1.55731201171875, 1.7049560546875, 1.85260009765625, 2.000244140625, 2.14788818359375, 2.2955322265625, 2.44317626953125, 2.5908203125, 2.73846435546875, 2.8861083984375, 3.03375244140625, 3.181396484375, 3.32904052734375, 3.4766845703125, 3.62432861328125, 3.77197265625, 3.91961669921875, 4.0672607421875, 4.21490478515625, 4.362548828125, 4.51019287109375, 4.6578369140625, 4.80548095703125, 4.953125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 8.0, 12.0, 17.0, 30.0, 38.0, 78.0, 158.0, 458.0, 2265.0, 587.0, 175.0, 88.0, 38.0, 30.0, 21.0, 11.0, 15.0, 4.0, 4.0, 10.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.794921875, -2.714019775390625, -2.63311767578125, -2.552215576171875, -2.4713134765625, -2.390411376953125, -2.30950927734375, -2.228607177734375, -2.147705078125, -2.066802978515625, -1.98590087890625, -1.904998779296875, -1.8240966796875, -1.743194580078125, -1.66229248046875, -1.581390380859375, -1.50048828125, -1.419586181640625, -1.33868408203125, -1.257781982421875, -1.1768798828125, -1.095977783203125, -1.01507568359375, -0.934173583984375, -0.853271484375, -0.772369384765625, -0.69146728515625, -0.610565185546875, -0.5296630859375, -0.448760986328125, -0.36785888671875, -0.286956787109375, -0.2060546875, -0.125152587890625, -0.04425048828125, 0.036651611328125, 0.1175537109375, 0.198455810546875, 0.27935791015625, 0.360260009765625, 0.441162109375, 0.522064208984375, 0.60296630859375, 0.683868408203125, 0.7647705078125, 0.845672607421875, 0.92657470703125, 1.007476806640625, 1.08837890625, 1.169281005859375, 1.25018310546875, 1.331085205078125, 1.4119873046875, 1.492889404296875, 1.57379150390625, 1.654693603515625, 1.735595703125, 1.816497802734375, 1.89739990234375, 1.978302001953125, 2.0592041015625, 2.140106201171875, 2.22100830078125, 2.301910400390625, 2.3828125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 10.0, 26.0, 57.0, 147.0, 292.0, 246.0, 134.0, 56.0, 28.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.293342590332031, -12.452301025390625, -11.611259460449219, -10.770217895507812, -9.929176330566406, -9.088134765625, -8.247093200683594, -7.406052112579346, -6.5650105476379395, -5.723968982696533, -4.882927417755127, -4.041886329650879, -3.2008445262908936, -2.3598031997680664, -1.5187616348266602, -0.6777200698852539, 0.16332149505615234, 1.0043630599975586, 1.8454045057296753, 2.686445951461792, 3.5274875164031982, 4.368528842926025, 5.209570407867432, 6.050611972808838, 6.891653537750244, 7.73269510269165, 8.573736190795898, 9.414777755737305, 10.255819320678711, 11.096860885620117, 11.937902450561523, 12.77894401550293, 13.619985580444336, 14.461027145385742, 15.302068710327148, 16.143110275268555, 16.98415184020996, 17.825193405151367, 18.666234970092773, 19.50727653503418, 20.348318099975586, 21.189359664916992, 22.0304012298584, 22.871442794799805, 23.71248435974121, 24.553525924682617, 25.394567489624023, 26.23560905456543, 27.076648712158203, 27.91769027709961, 28.758731842041016, 29.599773406982422, 30.440814971923828, 31.281856536865234, 32.12289810180664, 32.96393966674805, 33.80498123168945, 34.64602279663086, 35.487064361572266, 36.32810592651367, 37.16914749145508, 38.010189056396484, 38.85123062133789, 39.6922721862793, 40.5333137512207]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 6.0, 9.0, 9.0, 9.0, 13.0, 11.0, 23.0, 25.0, 29.0, 28.0, 23.0, 37.0, 39.0, 28.0, 54.0, 39.0, 60.0, 40.0, 48.0, 47.0, 45.0, 41.0, 43.0, 45.0, 40.0, 39.0, 32.0, 19.0, 20.0, 18.0, 12.0, 13.0, 12.0, 9.0, 3.0, 4.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.926694869995117, -5.73092794418335, -5.535161018371582, -5.3393940925598145, -5.143627166748047, -4.947860240936279, -4.752093315124512, -4.556326389312744, -4.360559463500977, -4.164792537689209, -3.9690256118774414, -3.773258686065674, -3.5774917602539062, -3.3817248344421387, -3.185957908630371, -2.9901909828186035, -2.794424057006836, -2.5986571311950684, -2.402890205383301, -2.207123279571533, -2.0113563537597656, -1.815589427947998, -1.6198225021362305, -1.424055576324463, -1.2282886505126953, -1.0325217247009277, -0.8367547988891602, -0.6409878730773926, -0.445220947265625, -0.24945402145385742, -0.053687095642089844, 0.14207983016967773, 0.3378462791442871, 0.5336132049560547, 0.7293801307678223, 0.9251470565795898, 1.1209139823913574, 1.316680908203125, 1.5124478340148926, 1.7082147598266602, 1.9039816856384277, 2.0997486114501953, 2.295515537261963, 2.4912824630737305, 2.687049388885498, 2.8828163146972656, 3.078583240509033, 3.274350166320801, 3.4701170921325684, 3.665884017944336, 3.8616509437561035, 4.057417869567871, 4.253184795379639, 4.448951721191406, 4.644718647003174, 4.840485572814941, 5.036252498626709, 5.232019424438477, 5.427786350250244, 5.623553276062012, 5.819320201873779, 6.015087127685547, 6.2108540534973145, 6.406620979309082, 6.60238790512085]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 1.0, 4.0, 3.0, 9.0, 17.0, 22.0, 29.0, 36.0, 44.0, 78.0, 100.0, 162.0, 253.0, 400.0, 593.0, 1071.0, 2123.0, 4285.0, 9727.0, 26448.0, 88279.0, 398623.0, 385630.0, 86114.0, 25816.0, 9637.0, 4172.0, 1987.0, 1131.0, 644.0, 378.0, 223.0, 152.0, 101.0, 64.0, 54.0, 41.0, 25.0, 25.0, 18.0, 9.0, 6.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.91015625, -4.751708984375, -4.59326171875, -4.434814453125, -4.2763671875, -4.117919921875, -3.95947265625, -3.801025390625, -3.642578125, -3.484130859375, -3.32568359375, -3.167236328125, -3.0087890625, -2.850341796875, -2.69189453125, -2.533447265625, -2.375, -2.216552734375, -2.05810546875, -1.899658203125, -1.7412109375, -1.582763671875, -1.42431640625, -1.265869140625, -1.107421875, -0.948974609375, -0.79052734375, -0.632080078125, -0.4736328125, -0.315185546875, -0.15673828125, 0.001708984375, 0.16015625, 0.318603515625, 0.47705078125, 0.635498046875, 0.7939453125, 0.952392578125, 1.11083984375, 1.269287109375, 1.427734375, 1.586181640625, 1.74462890625, 1.903076171875, 2.0615234375, 2.219970703125, 2.37841796875, 2.536865234375, 2.6953125, 2.853759765625, 3.01220703125, 3.170654296875, 3.3291015625, 3.487548828125, 3.64599609375, 3.804443359375, 3.962890625, 4.121337890625, 4.27978515625, 4.438232421875, 4.5966796875, 4.755126953125, 4.91357421875, 5.072021484375, 5.23046875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 9.0, 21.0, 25.0, 30.0, 36.0, 65.0, 53.0, 69.0, 69.0, 71.0, 74.0, 69.0, 72.0, 56.0, 64.0, 53.0, 40.0, 22.0, 26.0, 19.0, 13.0, 9.0, 12.0, 4.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.90625, -1.8582000732421875, -1.810150146484375, -1.7621002197265625, -1.71405029296875, -1.6660003662109375, -1.617950439453125, -1.5699005126953125, -1.5218505859375, -1.4738006591796875, -1.425750732421875, -1.3777008056640625, -1.32965087890625, -1.2816009521484375, -1.233551025390625, -1.1855010986328125, -1.137451171875, -1.0894012451171875, -1.041351318359375, -0.9933013916015625, -0.94525146484375, -0.8972015380859375, -0.849151611328125, -0.8011016845703125, -0.7530517578125, -0.7050018310546875, -0.656951904296875, -0.6089019775390625, -0.56085205078125, -0.5128021240234375, -0.464752197265625, -0.4167022705078125, -0.36865234375, -0.3206024169921875, -0.272552490234375, -0.2245025634765625, -0.17645263671875, -0.1284027099609375, -0.080352783203125, -0.0323028564453125, 0.0157470703125, 0.0637969970703125, 0.111846923828125, 0.1598968505859375, 0.20794677734375, 0.2559967041015625, 0.304046630859375, 0.3520965576171875, 0.400146484375, 0.4481964111328125, 0.496246337890625, 0.5442962646484375, 0.59234619140625, 0.6403961181640625, 0.688446044921875, 0.7364959716796875, 0.7845458984375, 0.8325958251953125, 0.880645751953125, 0.9286956787109375, 0.97674560546875, 1.0247955322265625, 1.072845458984375, 1.1208953857421875, 1.1689453125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 8.0, 13.0, 14.0, 7.0, 25.0, 31.0, 48.0, 74.0, 83.0, 108.0, 169.0, 243.0, 392.0, 685.0, 1189.0, 2337.0, 5040.0, 11089.0, 29166.0, 94085.0, 451873.0, 334977.0, 73934.0, 23982.0, 9713.0, 4302.0, 2070.0, 1030.0, 622.0, 403.0, 263.0, 187.0, 104.0, 74.0, 56.0, 33.0, 27.0, 28.0, 17.0, 15.0, 6.0, 7.0, 6.0, 4.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.6796875, -4.5374755859375, -4.395263671875, -4.2530517578125, -4.11083984375, -3.9686279296875, -3.826416015625, -3.6842041015625, -3.5419921875, -3.3997802734375, -3.257568359375, -3.1153564453125, -2.97314453125, -2.8309326171875, -2.688720703125, -2.5465087890625, -2.404296875, -2.2620849609375, -2.119873046875, -1.9776611328125, -1.83544921875, -1.6932373046875, -1.551025390625, -1.4088134765625, -1.2666015625, -1.1243896484375, -0.982177734375, -0.8399658203125, -0.69775390625, -0.5555419921875, -0.413330078125, -0.2711181640625, -0.12890625, 0.0133056640625, 0.155517578125, 0.2977294921875, 0.43994140625, 0.5821533203125, 0.724365234375, 0.8665771484375, 1.0087890625, 1.1510009765625, 1.293212890625, 1.4354248046875, 1.57763671875, 1.7198486328125, 1.862060546875, 2.0042724609375, 2.146484375, 2.2886962890625, 2.430908203125, 2.5731201171875, 2.71533203125, 2.8575439453125, 2.999755859375, 3.1419677734375, 3.2841796875, 3.4263916015625, 3.568603515625, 3.7108154296875, 3.85302734375, 3.9952392578125, 4.137451171875, 4.2796630859375, 4.421875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 11.0, 7.0, 12.0, 10.0, 24.0, 21.0, 27.0, 40.0, 38.0, 54.0, 52.0, 58.0, 55.0, 64.0, 58.0, 55.0, 62.0, 60.0, 55.0, 53.0, 33.0, 26.0, 32.0, 17.0, 10.0, 12.0, 6.0, 14.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6875, -4.51385498046875, -4.3402099609375, -4.16656494140625, -3.992919921875, -3.81927490234375, -3.6456298828125, -3.47198486328125, -3.29833984375, -3.12469482421875, -2.9510498046875, -2.77740478515625, -2.603759765625, -2.43011474609375, -2.2564697265625, -2.08282470703125, -1.9091796875, -1.73553466796875, -1.5618896484375, -1.38824462890625, -1.214599609375, -1.04095458984375, -0.8673095703125, -0.69366455078125, -0.52001953125, -0.34637451171875, -0.1727294921875, 0.00091552734375, 0.174560546875, 0.34820556640625, 0.5218505859375, 0.69549560546875, 0.869140625, 1.04278564453125, 1.2164306640625, 1.39007568359375, 1.563720703125, 1.73736572265625, 1.9110107421875, 2.08465576171875, 2.25830078125, 2.43194580078125, 2.6055908203125, 2.77923583984375, 2.952880859375, 3.12652587890625, 3.3001708984375, 3.47381591796875, 3.6474609375, 3.82110595703125, 3.9947509765625, 4.16839599609375, 4.342041015625, 4.51568603515625, 4.6893310546875, 4.86297607421875, 5.03662109375, 5.21026611328125, 5.3839111328125, 5.55755615234375, 5.731201171875, 5.90484619140625, 6.0784912109375, 6.25213623046875, 6.42578125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 5.0, 8.0, 6.0, 13.0, 22.0, 33.0, 55.0, 97.0, 223.0, 422.0, 977.0, 2612.0, 8495.0, 44711.0, 931543.0, 46313.0, 8657.0, 2518.0, 925.0, 417.0, 219.0, 115.0, 63.0, 47.0, 26.0, 14.0, 8.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8359375, -8.489501953125, -8.14306640625, -7.796630859375, -7.4501953125, -7.103759765625, -6.75732421875, -6.410888671875, -6.064453125, -5.718017578125, -5.37158203125, -5.025146484375, -4.6787109375, -4.332275390625, -3.98583984375, -3.639404296875, -3.29296875, -2.946533203125, -2.60009765625, -2.253662109375, -1.9072265625, -1.560791015625, -1.21435546875, -0.867919921875, -0.521484375, -0.175048828125, 0.17138671875, 0.517822265625, 0.8642578125, 1.210693359375, 1.55712890625, 1.903564453125, 2.25, 2.596435546875, 2.94287109375, 3.289306640625, 3.6357421875, 3.982177734375, 4.32861328125, 4.675048828125, 5.021484375, 5.367919921875, 5.71435546875, 6.060791015625, 6.4072265625, 6.753662109375, 7.10009765625, 7.446533203125, 7.79296875, 8.139404296875, 8.48583984375, 8.832275390625, 9.1787109375, 9.525146484375, 9.87158203125, 10.218017578125, 10.564453125, 10.910888671875, 11.25732421875, 11.603759765625, 11.9501953125, 12.296630859375, 12.64306640625, 12.989501953125, 13.3359375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 4.0, 9.0, 16.0, 36.0, 77.0, 454.0, 227.0, 57.0, 30.0, 19.0, 14.0, 8.0, 6.0, 5.0, 5.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0012416839599609375, -0.0012088567018508911, -0.0011760294437408447, -0.0011432021856307983, -0.001110374927520752, -0.0010775476694107056, -0.0010447204113006592, -0.0010118931531906128, -0.0009790658950805664, -0.00094623863697052, -0.0009134113788604736, -0.0008805841207504272, -0.0008477568626403809, -0.0008149296045303345, -0.0007821023464202881, -0.0007492750883102417, -0.0007164478302001953, -0.0006836205720901489, -0.0006507933139801025, -0.0006179660558700562, -0.0005851387977600098, -0.0005523115396499634, -0.000519484281539917, -0.0004866570234298706, -0.0004538297653198242, -0.00042100250720977783, -0.00038817524909973145, -0.00035534799098968506, -0.00032252073287963867, -0.0002896934747695923, -0.0002568662166595459, -0.0002240389585494995, -0.00019121170043945312, -0.00015838444232940674, -0.00012555718421936035, -9.272992610931396e-05, -5.990266799926758e-05, -2.707540988922119e-05, 5.751848220825195e-06, 3.857910633087158e-05, 7.140636444091797e-05, 0.00010423362255096436, 0.00013706088066101074, 0.00016988813877105713, 0.00020271539688110352, 0.0002355426549911499, 0.0002683699131011963, 0.0003011971712112427, 0.00033402442932128906, 0.00036685168743133545, 0.00039967894554138184, 0.0004325062036514282, 0.0004653334617614746, 0.000498160719871521, 0.0005309879779815674, 0.0005638152360916138, 0.0005966424942016602, 0.0006294697523117065, 0.0006622970104217529, 0.0006951242685317993, 0.0007279515266418457, 0.0007607787847518921, 0.0007936060428619385, 0.0008264333009719849, 0.0008592605590820312]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 7.0, 3.0, 12.0, 9.0, 19.0, 25.0, 43.0, 54.0, 68.0, 92.0, 203.0, 284.0, 500.0, 832.0, 1375.0, 2791.0, 5670.0, 14240.0, 56102.0, 887628.0, 52873.0, 13918.0, 5615.0, 2602.0, 1441.0, 843.0, 456.0, 292.0, 188.0, 122.0, 87.0, 40.0, 34.0, 16.0, 17.0, 8.0, 9.0, 12.0, 6.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.78125, -10.4686279296875, -10.156005859375, -9.8433837890625, -9.53076171875, -9.2181396484375, -8.905517578125, -8.5928955078125, -8.2802734375, -7.9676513671875, -7.655029296875, -7.3424072265625, -7.02978515625, -6.7171630859375, -6.404541015625, -6.0919189453125, -5.779296875, -5.4666748046875, -5.154052734375, -4.8414306640625, -4.52880859375, -4.2161865234375, -3.903564453125, -3.5909423828125, -3.2783203125, -2.9656982421875, -2.653076171875, -2.3404541015625, -2.02783203125, -1.7152099609375, -1.402587890625, -1.0899658203125, -0.77734375, -0.4647216796875, -0.152099609375, 0.1605224609375, 0.47314453125, 0.7857666015625, 1.098388671875, 1.4110107421875, 1.7236328125, 2.0362548828125, 2.348876953125, 2.6614990234375, 2.97412109375, 3.2867431640625, 3.599365234375, 3.9119873046875, 4.224609375, 4.5372314453125, 4.849853515625, 5.1624755859375, 5.47509765625, 5.7877197265625, 6.100341796875, 6.4129638671875, 6.7255859375, 7.0382080078125, 7.350830078125, 7.6634521484375, 7.97607421875, 8.2886962890625, 8.601318359375, 8.9139404296875, 9.2265625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 5.0, 4.0, 10.0, 12.0, 7.0, 10.0, 27.0, 41.0, 115.0, 431.0, 181.0, 46.0, 30.0, 16.0, 14.0, 7.0, 5.0, 4.0, 5.0, 5.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2421875, -6.9798583984375, -6.717529296875, -6.4552001953125, -6.19287109375, -5.9305419921875, -5.668212890625, -5.4058837890625, -5.1435546875, -4.8812255859375, -4.618896484375, -4.3565673828125, -4.09423828125, -3.8319091796875, -3.569580078125, -3.3072509765625, -3.044921875, -2.7825927734375, -2.520263671875, -2.2579345703125, -1.99560546875, -1.7332763671875, -1.470947265625, -1.2086181640625, -0.9462890625, -0.6839599609375, -0.421630859375, -0.1593017578125, 0.10302734375, 0.3653564453125, 0.627685546875, 0.8900146484375, 1.15234375, 1.4146728515625, 1.677001953125, 1.9393310546875, 2.20166015625, 2.4639892578125, 2.726318359375, 2.9886474609375, 3.2509765625, 3.5133056640625, 3.775634765625, 4.0379638671875, 4.30029296875, 4.5626220703125, 4.824951171875, 5.0872802734375, 5.349609375, 5.6119384765625, 5.874267578125, 6.1365966796875, 6.39892578125, 6.6612548828125, 6.923583984375, 7.1859130859375, 7.4482421875, 7.7105712890625, 7.972900390625, 8.2352294921875, 8.49755859375, 8.7598876953125, 9.022216796875, 9.2845458984375, 9.546875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 5.0, 23.0, 34.0, 70.0, 198.0, 287.0, 197.0, 88.0, 49.0, 25.0, 8.0, 10.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.56669616699219, -114.6602783203125, -111.75385284423828, -108.8474349975586, -105.94100952148438, -103.03459167480469, -100.128173828125, -97.22174835205078, -94.31532287597656, -91.40890502929688, -88.50247955322266, -85.59606170654297, -82.68963623046875, -79.78321838378906, -76.87680053710938, -73.97037506103516, -71.06395721435547, -68.15753936767578, -65.25111389160156, -62.344696044921875, -59.438270568847656, -56.53185272216797, -53.625431060791016, -50.71900939941406, -47.81258773803711, -44.906166076660156, -41.9997444152832, -39.09332275390625, -36.18690490722656, -33.280479431152344, -30.374061584472656, -27.467639923095703, -24.56121826171875, -21.654796600341797, -18.748374938964844, -15.841955184936523, -12.93553352355957, -10.029111862182617, -7.122692108154297, -4.216270446777344, -1.3098487854003906, 1.5965723991394043, 4.502993583679199, 7.409414291381836, 10.315835952758789, 13.222257614135742, 16.128677368164062, 19.035099029541016, 21.94152069091797, 24.847942352294922, 27.754364013671875, 30.660783767700195, 33.56720733642578, 36.47362518310547, 39.38004684448242, 42.286468505859375, 45.19289016723633, 48.09931182861328, 51.005733489990234, 53.91215515136719, 56.818572998046875, 59.724998474121094, 62.63141632080078, 65.537841796875, 68.44425964355469]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 7.0, 8.0, 6.0, 6.0, 7.0, 8.0, 10.0, 12.0, 13.0, 22.0, 14.0, 20.0, 25.0, 37.0, 27.0, 34.0, 37.0, 37.0, 57.0, 46.0, 66.0, 53.0, 36.0, 42.0, 41.0, 48.0, 47.0, 35.0, 40.0, 26.0, 18.0, 28.0, 19.0, 11.0, 14.0, 13.0, 9.0, 10.0, 4.0, 7.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.00039291381836, -26.122529983520508, -25.244667053222656, -24.366804122924805, -23.488941192626953, -22.6110782623291, -21.73321533203125, -20.855350494384766, -19.977489471435547, -19.099626541137695, -18.221763610839844, -17.343900680541992, -16.46603775024414, -15.588174819946289, -14.710310935974121, -13.83244800567627, -12.954584121704102, -12.07672119140625, -11.198858261108398, -10.320995330810547, -9.443132400512695, -8.565269470214844, -7.687405586242676, -6.809542655944824, -5.931679725646973, -5.053816795349121, -4.1759538650512695, -3.2980904579162598, -2.420227527618408, -1.5423645973205566, -0.6645011901855469, 0.2133617401123047, 1.091226577758789, 1.9690896272659302, 2.8469526767730713, 3.724815845489502, 4.6026787757873535, 5.480541706085205, 6.358405113220215, 7.236268043518066, 8.114130973815918, 8.99199390411377, 9.869856834411621, 10.747720718383789, 11.62558364868164, 12.503446578979492, 13.381309509277344, 14.259172439575195, 15.137035369873047, 16.0148983001709, 16.89276123046875, 17.7706241607666, 18.648487091064453, 19.526350021362305, 20.404212951660156, 21.28207778930664, 22.15993881225586, 23.03780174255371, 23.915664672851562, 24.793527603149414, 25.671390533447266, 26.549253463745117, 27.42711639404297, 28.304981231689453, 29.182844161987305]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 7.0, 20.0, 24.0, 30.0, 48.0, 71.0, 118.0, 194.0, 340.0, 609.0, 1221.0, 2648.0, 6720.0, 25723.0, 427981.0, 3671749.0, 41293.0, 8949.0, 3358.0, 1442.0, 721.0, 394.0, 242.0, 129.0, 70.0, 66.0, 39.0, 17.0, 22.0, 7.0, 9.0, 2.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-11.171875, -10.8709716796875, -10.570068359375, -10.2691650390625, -9.96826171875, -9.6673583984375, -9.366455078125, -9.0655517578125, -8.7646484375, -8.4637451171875, -8.162841796875, -7.8619384765625, -7.56103515625, -7.2601318359375, -6.959228515625, -6.6583251953125, -6.357421875, -6.0565185546875, -5.755615234375, -5.4547119140625, -5.15380859375, -4.8529052734375, -4.552001953125, -4.2510986328125, -3.9501953125, -3.6492919921875, -3.348388671875, -3.0474853515625, -2.74658203125, -2.4456787109375, -2.144775390625, -1.8438720703125, -1.54296875, -1.2420654296875, -0.941162109375, -0.6402587890625, -0.33935546875, -0.0384521484375, 0.262451171875, 0.5633544921875, 0.8642578125, 1.1651611328125, 1.466064453125, 1.7669677734375, 2.06787109375, 2.3687744140625, 2.669677734375, 2.9705810546875, 3.271484375, 3.5723876953125, 3.873291015625, 4.1741943359375, 4.47509765625, 4.7760009765625, 5.076904296875, 5.3778076171875, 5.6787109375, 5.9796142578125, 6.280517578125, 6.5814208984375, 6.88232421875, 7.1832275390625, 7.484130859375, 7.7850341796875, 8.0859375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 6.0, 5.0, 5.0, 8.0, 12.0, 15.0, 20.0, 26.0, 39.0, 36.0, 50.0, 52.0, 61.0, 71.0, 69.0, 80.0, 72.0, 71.0, 59.0, 44.0, 42.0, 44.0, 28.0, 26.0, 16.0, 15.0, 16.0, 9.0, 3.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.048828125, -1.989105224609375, -1.92938232421875, -1.869659423828125, -1.8099365234375, -1.750213623046875, -1.69049072265625, -1.630767822265625, -1.571044921875, -1.511322021484375, -1.45159912109375, -1.391876220703125, -1.3321533203125, -1.272430419921875, -1.21270751953125, -1.152984619140625, -1.09326171875, -1.033538818359375, -0.97381591796875, -0.914093017578125, -0.8543701171875, -0.794647216796875, -0.73492431640625, -0.675201416015625, -0.615478515625, -0.555755615234375, -0.49603271484375, -0.436309814453125, -0.3765869140625, -0.316864013671875, -0.25714111328125, -0.197418212890625, -0.1376953125, -0.077972412109375, -0.01824951171875, 0.041473388671875, 0.1011962890625, 0.160919189453125, 0.22064208984375, 0.280364990234375, 0.340087890625, 0.399810791015625, 0.45953369140625, 0.519256591796875, 0.5789794921875, 0.638702392578125, 0.69842529296875, 0.758148193359375, 0.81787109375, 0.877593994140625, 0.93731689453125, 0.997039794921875, 1.0567626953125, 1.116485595703125, 1.17620849609375, 1.235931396484375, 1.295654296875, 1.355377197265625, 1.41510009765625, 1.474822998046875, 1.5345458984375, 1.594268798828125, 1.65399169921875, 1.713714599609375, 1.7734375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 2.0, 2.0, 10.0, 6.0, 10.0, 18.0, 17.0, 21.0, 28.0, 33.0, 48.0, 71.0, 112.0, 143.0, 258.0, 336.0, 555.0, 1000.0, 1705.0, 3323.0, 7516.0, 25075.0, 325198.0, 3759357.0, 48480.0, 11111.0, 4409.0, 2179.0, 1195.0, 715.0, 442.0, 271.0, 201.0, 138.0, 90.0, 58.0, 36.0, 29.0, 26.0, 21.0, 15.0, 5.0, 6.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.2421875, -9.9029541015625, -9.563720703125, -9.2244873046875, -8.88525390625, -8.5460205078125, -8.206787109375, -7.8675537109375, -7.5283203125, -7.1890869140625, -6.849853515625, -6.5106201171875, -6.17138671875, -5.8321533203125, -5.492919921875, -5.1536865234375, -4.814453125, -4.4752197265625, -4.135986328125, -3.7967529296875, -3.45751953125, -3.1182861328125, -2.779052734375, -2.4398193359375, -2.1005859375, -1.7613525390625, -1.422119140625, -1.0828857421875, -0.74365234375, -0.4044189453125, -0.065185546875, 0.2740478515625, 0.61328125, 0.9525146484375, 1.291748046875, 1.6309814453125, 1.97021484375, 2.3094482421875, 2.648681640625, 2.9879150390625, 3.3271484375, 3.6663818359375, 4.005615234375, 4.3448486328125, 4.68408203125, 5.0233154296875, 5.362548828125, 5.7017822265625, 6.041015625, 6.3802490234375, 6.719482421875, 7.0587158203125, 7.39794921875, 7.7371826171875, 8.076416015625, 8.4156494140625, 8.7548828125, 9.0941162109375, 9.433349609375, 9.7725830078125, 10.11181640625, 10.4510498046875, 10.790283203125, 11.1295166015625, 11.46875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 13.0, 12.0, 14.0, 35.0, 60.0, 131.0, 403.0, 2807.0, 358.0, 111.0, 43.0, 20.0, 11.0, 13.0, 10.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.453125, -5.318328857421875, -5.18353271484375, -5.048736572265625, -4.9139404296875, -4.779144287109375, -4.64434814453125, -4.509552001953125, -4.374755859375, -4.239959716796875, -4.10516357421875, -3.970367431640625, -3.8355712890625, -3.700775146484375, -3.56597900390625, -3.431182861328125, -3.29638671875, -3.161590576171875, -3.02679443359375, -2.891998291015625, -2.7572021484375, -2.622406005859375, -2.48760986328125, -2.352813720703125, -2.218017578125, -2.083221435546875, -1.94842529296875, -1.813629150390625, -1.6788330078125, -1.544036865234375, -1.40924072265625, -1.274444580078125, -1.1396484375, -1.004852294921875, -0.87005615234375, -0.735260009765625, -0.6004638671875, -0.465667724609375, -0.33087158203125, -0.196075439453125, -0.061279296875, 0.073516845703125, 0.20831298828125, 0.343109130859375, 0.4779052734375, 0.612701416015625, 0.74749755859375, 0.882293701171875, 1.01708984375, 1.151885986328125, 1.28668212890625, 1.421478271484375, 1.5562744140625, 1.691070556640625, 1.82586669921875, 1.960662841796875, 2.095458984375, 2.230255126953125, 2.36505126953125, 2.499847412109375, 2.6346435546875, 2.769439697265625, 2.90423583984375, 3.039031982421875, 3.173828125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 8.0, 4.0, 5.0, 12.0, 13.0, 12.0, 23.0, 38.0, 45.0, 76.0, 111.0, 146.0, 148.0, 124.0, 71.0, 62.0, 33.0, 25.0, 11.0, 11.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.377222061157227, -21.76167869567871, -21.146135330200195, -20.530590057373047, -19.91504669189453, -19.299503326416016, -18.6839599609375, -18.068416595458984, -17.45287322998047, -16.837329864501953, -16.221786499023438, -15.606242179870605, -14.990697860717773, -14.375154495239258, -13.759611129760742, -13.144067764282227, -12.528522491455078, -11.912979125976562, -11.29743480682373, -10.681891441345215, -10.066347122192383, -9.450803756713867, -8.835260391235352, -8.219717025756836, -7.604172706604004, -6.98862886428833, -6.373085021972656, -5.757541656494141, -5.141997814178467, -4.526453971862793, -3.9109103679656982, -3.2953667640686035, -2.6798248291015625, -2.0642809867858887, -1.448737382888794, -0.8331936597824097, -0.2176499366760254, 0.39789390563964844, 1.0134375095367432, 1.628981113433838, 2.2445249557495117, 2.8600687980651855, 3.4756124019622803, 4.091156005859375, 4.706699848175049, 5.322243690490723, 5.937787055969238, 6.553330898284912, 7.168874740600586, 7.78441858291626, 8.399962425231934, 9.01550579071045, 9.631050109863281, 10.246593475341797, 10.862136840820312, 11.477680206298828, 12.09322452545166, 12.708767890930176, 13.324312210083008, 13.939855575561523, 14.555398941040039, 15.170943260192871, 15.786486625671387, 16.40203094482422, 17.017574310302734]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 9.0, 15.0, 9.0, 17.0, 18.0, 34.0, 29.0, 28.0, 38.0, 42.0, 43.0, 57.0, 42.0, 54.0, 45.0, 51.0, 44.0, 62.0, 55.0, 42.0, 38.0, 40.0, 38.0, 28.0, 21.0, 18.0, 18.0, 6.0, 15.0, 8.0, 11.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.711044311523438, -10.362683296203613, -10.014322280883789, -9.665961265563965, -9.31760025024414, -8.969240188598633, -8.620879173278809, -8.272518157958984, -7.92415714263916, -7.575796127319336, -7.227435111999512, -6.879074573516846, -6.5307135581970215, -6.182352542877197, -5.833992004394531, -5.485630989074707, -5.137269973754883, -4.788908958435059, -4.440547943115234, -4.092187404632568, -3.743826389312744, -3.39546537399292, -3.047104597091675, -2.6987438201904297, -2.3503828048706055, -2.0020217895507812, -1.6536610126495361, -1.3053001165390015, -0.9569392204284668, -0.6085783243179321, -0.26021742820739746, 0.08814334869384766, 0.4365043640136719, 0.7848652601242065, 1.1332261562347412, 1.4815870523452759, 1.8299479484558105, 2.1783089637756348, 2.52666974067688, 2.875030517578125, 3.223391532897949, 3.5717525482177734, 3.9201133251190186, 4.268474102020264, 4.616835117340088, 4.965196132659912, 5.313556671142578, 5.661917686462402, 6.010278701782227, 6.358639717102051, 6.707000732421875, 7.055361270904541, 7.403722286224365, 7.7520833015441895, 8.100443840026855, 8.44880485534668, 8.797165870666504, 9.145526885986328, 9.493887901306152, 9.842248916625977, 10.190608978271484, 10.538969993591309, 10.887331008911133, 11.235692024230957, 11.584053039550781]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 4.0, 11.0, 18.0, 43.0, 32.0, 66.0, 83.0, 161.0, 232.0, 435.0, 737.0, 1409.0, 2724.0, 5754.0, 11995.0, 27969.0, 73339.0, 238540.0, 454703.0, 143439.0, 49164.0, 20040.0, 8723.0, 4176.0, 2119.0, 1138.0, 612.0, 352.0, 194.0, 103.0, 87.0, 43.0, 42.0, 19.0, 9.0, 9.0, 6.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0390625, -5.84613037109375, -5.6531982421875, -5.46026611328125, -5.267333984375, -5.07440185546875, -4.8814697265625, -4.68853759765625, -4.49560546875, -4.30267333984375, -4.1097412109375, -3.91680908203125, -3.723876953125, -3.53094482421875, -3.3380126953125, -3.14508056640625, -2.9521484375, -2.75921630859375, -2.5662841796875, -2.37335205078125, -2.180419921875, -1.98748779296875, -1.7945556640625, -1.60162353515625, -1.40869140625, -1.21575927734375, -1.0228271484375, -0.82989501953125, -0.636962890625, -0.44403076171875, -0.2510986328125, -0.05816650390625, 0.134765625, 0.32769775390625, 0.5206298828125, 0.71356201171875, 0.906494140625, 1.09942626953125, 1.2923583984375, 1.48529052734375, 1.67822265625, 1.87115478515625, 2.0640869140625, 2.25701904296875, 2.449951171875, 2.64288330078125, 2.8358154296875, 3.02874755859375, 3.2216796875, 3.41461181640625, 3.6075439453125, 3.80047607421875, 3.993408203125, 4.18634033203125, 4.3792724609375, 4.57220458984375, 4.76513671875, 4.95806884765625, 5.1510009765625, 5.34393310546875, 5.536865234375, 5.72979736328125, 5.9227294921875, 6.11566162109375, 6.30859375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 6.0, 9.0, 13.0, 16.0, 17.0, 34.0, 31.0, 41.0, 46.0, 45.0, 57.0, 70.0, 70.0, 70.0, 71.0, 61.0, 55.0, 57.0, 47.0, 35.0, 29.0, 35.0, 29.0, 19.0, 10.0, 13.0, 3.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.484375, -2.41455078125, -2.3447265625, -2.27490234375, -2.205078125, -2.13525390625, -2.0654296875, -1.99560546875, -1.92578125, -1.85595703125, -1.7861328125, -1.71630859375, -1.646484375, -1.57666015625, -1.5068359375, -1.43701171875, -1.3671875, -1.29736328125, -1.2275390625, -1.15771484375, -1.087890625, -1.01806640625, -0.9482421875, -0.87841796875, -0.80859375, -0.73876953125, -0.6689453125, -0.59912109375, -0.529296875, -0.45947265625, -0.3896484375, -0.31982421875, -0.25, -0.18017578125, -0.1103515625, -0.04052734375, 0.029296875, 0.09912109375, 0.1689453125, 0.23876953125, 0.30859375, 0.37841796875, 0.4482421875, 0.51806640625, 0.587890625, 0.65771484375, 0.7275390625, 0.79736328125, 0.8671875, 0.93701171875, 1.0068359375, 1.07666015625, 1.146484375, 1.21630859375, 1.2861328125, 1.35595703125, 1.42578125, 1.49560546875, 1.5654296875, 1.63525390625, 1.705078125, 1.77490234375, 1.8447265625, 1.91455078125, 1.984375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 8.0, 5.0, 5.0, 6.0, 16.0, 14.0, 23.0, 36.0, 55.0, 71.0, 95.0, 207.0, 297.0, 404.0, 788.0, 1264.0, 2286.0, 4508.0, 10267.0, 28630.0, 130657.0, 678748.0, 139579.0, 29653.0, 10454.0, 4745.0, 2323.0, 1347.0, 776.0, 450.0, 293.0, 174.0, 135.0, 84.0, 44.0, 27.0, 18.0, 18.0, 11.0, 6.0, 10.0, 8.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7734375, -8.4761962890625, -8.178955078125, -7.8817138671875, -7.58447265625, -7.2872314453125, -6.989990234375, -6.6927490234375, -6.3955078125, -6.0982666015625, -5.801025390625, -5.5037841796875, -5.20654296875, -4.9093017578125, -4.612060546875, -4.3148193359375, -4.017578125, -3.7203369140625, -3.423095703125, -3.1258544921875, -2.82861328125, -2.5313720703125, -2.234130859375, -1.9368896484375, -1.6396484375, -1.3424072265625, -1.045166015625, -0.7479248046875, -0.45068359375, -0.1534423828125, 0.143798828125, 0.4410400390625, 0.73828125, 1.0355224609375, 1.332763671875, 1.6300048828125, 1.92724609375, 2.2244873046875, 2.521728515625, 2.8189697265625, 3.1162109375, 3.4134521484375, 3.710693359375, 4.0079345703125, 4.30517578125, 4.6024169921875, 4.899658203125, 5.1968994140625, 5.494140625, 5.7913818359375, 6.088623046875, 6.3858642578125, 6.68310546875, 6.9803466796875, 7.277587890625, 7.5748291015625, 7.8720703125, 8.1693115234375, 8.466552734375, 8.7637939453125, 9.06103515625, 9.3582763671875, 9.655517578125, 9.9527587890625, 10.25]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 9.0, 15.0, 14.0, 35.0, 53.0, 42.0, 59.0, 73.0, 72.0, 123.0, 92.0, 81.0, 78.0, 69.0, 48.0, 31.0, 19.0, 10.0, 13.0, 13.0, 14.0, 5.0, 6.0, 1.0, 4.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.328125, -12.943603515625, -12.55908203125, -12.174560546875, -11.7900390625, -11.405517578125, -11.02099609375, -10.636474609375, -10.251953125, -9.867431640625, -9.48291015625, -9.098388671875, -8.7138671875, -8.329345703125, -7.94482421875, -7.560302734375, -7.17578125, -6.791259765625, -6.40673828125, -6.022216796875, -5.6376953125, -5.253173828125, -4.86865234375, -4.484130859375, -4.099609375, -3.715087890625, -3.33056640625, -2.946044921875, -2.5615234375, -2.177001953125, -1.79248046875, -1.407958984375, -1.0234375, -0.638916015625, -0.25439453125, 0.130126953125, 0.5146484375, 0.899169921875, 1.28369140625, 1.668212890625, 2.052734375, 2.437255859375, 2.82177734375, 3.206298828125, 3.5908203125, 3.975341796875, 4.35986328125, 4.744384765625, 5.12890625, 5.513427734375, 5.89794921875, 6.282470703125, 6.6669921875, 7.051513671875, 7.43603515625, 7.820556640625, 8.205078125, 8.589599609375, 8.97412109375, 9.358642578125, 9.7431640625, 10.127685546875, 10.51220703125, 10.896728515625, 11.28125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 3.0, 5.0, 12.0, 11.0, 20.0, 22.0, 31.0, 47.0, 64.0, 99.0, 154.0, 239.0, 343.0, 563.0, 1034.0, 2030.0, 3858.0, 8549.0, 27919.0, 919432.0, 60171.0, 12805.0, 5276.0, 2565.0, 1336.0, 712.0, 424.0, 284.0, 168.0, 120.0, 90.0, 57.0, 31.0, 21.0, 20.0, 15.0, 6.0, 2.0, 5.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.96875, -18.350830078125, -17.73291015625, -17.114990234375, -16.4970703125, -15.879150390625, -15.26123046875, -14.643310546875, -14.025390625, -13.407470703125, -12.78955078125, -12.171630859375, -11.5537109375, -10.935791015625, -10.31787109375, -9.699951171875, -9.08203125, -8.464111328125, -7.84619140625, -7.228271484375, -6.6103515625, -5.992431640625, -5.37451171875, -4.756591796875, -4.138671875, -3.520751953125, -2.90283203125, -2.284912109375, -1.6669921875, -1.049072265625, -0.43115234375, 0.186767578125, 0.8046875, 1.422607421875, 2.04052734375, 2.658447265625, 3.2763671875, 3.894287109375, 4.51220703125, 5.130126953125, 5.748046875, 6.365966796875, 6.98388671875, 7.601806640625, 8.2197265625, 8.837646484375, 9.45556640625, 10.073486328125, 10.69140625, 11.309326171875, 11.92724609375, 12.545166015625, 13.1630859375, 13.781005859375, 14.39892578125, 15.016845703125, 15.634765625, 16.252685546875, 16.87060546875, 17.488525390625, 18.1064453125, 18.724365234375, 19.34228515625, 19.960205078125, 20.578125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 4.0, 5.0, 10.0, 12.0, 18.0, 30.0, 142.0, 669.0, 45.0, 21.0, 15.0, 12.0, 9.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022563934326171875, -0.0021591484546661377, -0.002061903476715088, -0.001964658498764038, -0.0018674135208129883, -0.0017701685428619385, -0.0016729235649108887, -0.0015756785869598389, -0.001478433609008789, -0.0013811886310577393, -0.0012839436531066895, -0.0011866986751556396, -0.0010894536972045898, -0.00099220871925354, -0.0008949637413024902, -0.0007977187633514404, -0.0007004737854003906, -0.0006032288074493408, -0.000505983829498291, -0.0004087388515472412, -0.0003114938735961914, -0.0002142488956451416, -0.0001170039176940918, -1.9758939743041992e-05, 7.748603820800781e-05, 0.00017473101615905762, 0.0002719759941101074, 0.0003692209720611572, 0.00046646595001220703, 0.0005637109279632568, 0.0006609559059143066, 0.0007582008838653564, 0.0008554458618164062, 0.0009526908397674561, 0.0010499358177185059, 0.0011471807956695557, 0.0012444257736206055, 0.0013416707515716553, 0.001438915729522705, 0.0015361607074737549, 0.0016334056854248047, 0.0017306506633758545, 0.0018278956413269043, 0.001925140619277954, 0.002022385597229004, 0.0021196305751800537, 0.0022168755531311035, 0.0023141205310821533, 0.002411365509033203, 0.002508610486984253, 0.0026058554649353027, 0.0027031004428863525, 0.0028003454208374023, 0.002897590398788452, 0.002994835376739502, 0.0030920803546905518, 0.0031893253326416016, 0.0032865703105926514, 0.003383815288543701, 0.003481060266494751, 0.0035783052444458008, 0.0036755502223968506, 0.0037727952003479004, 0.00387004017829895, 0.00396728515625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 13.0, 12.0, 25.0, 32.0, 22.0, 57.0, 82.0, 112.0, 170.0, 290.0, 410.0, 619.0, 941.0, 1433.0, 2488.0, 4159.0, 7008.0, 14414.0, 116902.0, 861144.0, 18330.0, 7949.0, 4513.0, 2719.0, 1704.0, 1077.0, 636.0, 423.0, 269.0, 168.0, 119.0, 106.0, 57.0, 40.0, 33.0, 19.0, 9.0, 12.0, 11.0, 8.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-26.328125, -25.481689453125, -24.63525390625, -23.788818359375, -22.9423828125, -22.095947265625, -21.24951171875, -20.403076171875, -19.556640625, -18.710205078125, -17.86376953125, -17.017333984375, -16.1708984375, -15.324462890625, -14.47802734375, -13.631591796875, -12.78515625, -11.938720703125, -11.09228515625, -10.245849609375, -9.3994140625, -8.552978515625, -7.70654296875, -6.860107421875, -6.013671875, -5.167236328125, -4.32080078125, -3.474365234375, -2.6279296875, -1.781494140625, -0.93505859375, -0.088623046875, 0.7578125, 1.604248046875, 2.45068359375, 3.297119140625, 4.1435546875, 4.989990234375, 5.83642578125, 6.682861328125, 7.529296875, 8.375732421875, 9.22216796875, 10.068603515625, 10.9150390625, 11.761474609375, 12.60791015625, 13.454345703125, 14.30078125, 15.147216796875, 15.99365234375, 16.840087890625, 17.6865234375, 18.532958984375, 19.37939453125, 20.225830078125, 21.072265625, 21.918701171875, 22.76513671875, 23.611572265625, 24.4580078125, 25.304443359375, 26.15087890625, 26.997314453125, 27.84375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 1.0, 5.0, 10.0, 14.0, 36.0, 99.0, 638.0, 76.0, 36.0, 17.0, 3.0, 6.0, 3.0, 3.0, 4.0, 1.0, 5.0, 6.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.546875, -26.790283203125, -26.03369140625, -25.277099609375, -24.5205078125, -23.763916015625, -23.00732421875, -22.250732421875, -21.494140625, -20.737548828125, -19.98095703125, -19.224365234375, -18.4677734375, -17.711181640625, -16.95458984375, -16.197998046875, -15.44140625, -14.684814453125, -13.92822265625, -13.171630859375, -12.4150390625, -11.658447265625, -10.90185546875, -10.145263671875, -9.388671875, -8.632080078125, -7.87548828125, -7.118896484375, -6.3623046875, -5.605712890625, -4.84912109375, -4.092529296875, -3.3359375, -2.579345703125, -1.82275390625, -1.066162109375, -0.3095703125, 0.447021484375, 1.20361328125, 1.960205078125, 2.716796875, 3.473388671875, 4.22998046875, 4.986572265625, 5.7431640625, 6.499755859375, 7.25634765625, 8.012939453125, 8.76953125, 9.526123046875, 10.28271484375, 11.039306640625, 11.7958984375, 12.552490234375, 13.30908203125, 14.065673828125, 14.822265625, 15.578857421875, 16.33544921875, 17.092041015625, 17.8486328125, 18.605224609375, 19.36181640625, 20.118408203125, 20.875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 6.0, 12.0, 4.0, 18.0, 17.0, 26.0, 64.0, 67.0, 130.0, 135.0, 165.0, 120.0, 73.0, 56.0, 34.0, 13.0, 20.0, 11.0, 3.0, 4.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.67933654785156, -137.57054138183594, -132.4617462158203, -127.35295104980469, -122.24415588378906, -117.13536071777344, -112.02655792236328, -106.91776275634766, -101.80896759033203, -96.7001724243164, -91.59137725830078, -86.48258209228516, -81.373779296875, -76.26498413085938, -71.15618896484375, -66.04739379882812, -60.9385986328125, -55.829803466796875, -50.72100830078125, -45.61220932006836, -40.503414154052734, -35.39461898803711, -30.28582191467285, -25.177024841308594, -20.06822967529297, -14.959433555603027, -9.850637435913086, -4.7418413162231445, 0.3669548034667969, 5.475749969482422, 10.58454704284668, 15.693344116210938, 20.8021240234375, 25.910919189453125, 31.019716262817383, 36.12851333618164, 41.237308502197266, 46.34610366821289, 51.45490264892578, 56.563697814941406, 61.67249298095703, 66.78128814697266, 71.89008331298828, 76.9988784790039, 82.10768127441406, 87.21647644042969, 92.32527160644531, 97.43406677246094, 102.54286193847656, 107.65165710449219, 112.76045227050781, 117.86924743652344, 122.97804260253906, 128.0868377685547, 133.1956329345703, 138.304443359375, 143.41323852539062, 148.52203369140625, 153.63082885742188, 158.7396240234375, 163.84841918945312, 168.95721435546875, 174.06600952148438, 179.1748046875, 184.28359985351562]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 3.0, 7.0, 2.0, 6.0, 9.0, 11.0, 15.0, 11.0, 19.0, 20.0, 20.0, 19.0, 22.0, 31.0, 28.0, 36.0, 38.0, 29.0, 39.0, 22.0, 51.0, 41.0, 42.0, 38.0, 44.0, 39.0, 46.0, 45.0, 33.0, 29.0, 18.0, 22.0, 31.0, 15.0, 18.0, 17.0, 14.0, 7.0, 11.0, 5.0, 13.0, 6.0, 10.0, 3.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-59.1793212890625, -57.31219482421875, -55.445068359375, -53.57794189453125, -51.710811614990234, -49.843685150146484, -47.976558685302734, -46.109432220458984, -44.24230194091797, -42.37517547607422, -40.50804901123047, -38.64092254638672, -36.7737922668457, -34.90666580200195, -33.0395393371582, -31.172412872314453, -29.305286407470703, -27.438159942626953, -25.57103157043457, -23.70390510559082, -21.836776733398438, -19.969650268554688, -18.102523803710938, -16.235397338867188, -14.368268966674805, -12.501141548156738, -10.634014129638672, -8.766887664794922, -6.8997602462768555, -5.032632827758789, -3.165506362915039, -1.2983789443969727, 0.5687446594238281, 2.4358718395233154, 4.302999019622803, 6.170125961303711, 8.037253379821777, 9.904380798339844, 11.771507263183594, 13.63863468170166, 15.505762100219727, 17.372888565063477, 19.24001693725586, 21.10714340209961, 22.97426986694336, 24.841398239135742, 26.708524703979492, 28.575653076171875, 30.442779541015625, 32.309906005859375, 34.177032470703125, 36.044158935546875, 37.91128921508789, 39.77841567993164, 41.64554214477539, 43.51266860961914, 45.379798889160156, 47.246925354003906, 49.114051818847656, 50.981178283691406, 52.84830856323242, 54.71543502807617, 56.58256149291992, 58.44968795776367, 60.31681442260742]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 10.0, 10.0, 12.0, 18.0, 27.0, 22.0, 39.0, 48.0, 51.0, 73.0, 106.0, 163.0, 290.0, 530.0, 1175.0, 2797.0, 9872.0, 134703.0, 4018917.0, 18030.0, 3947.0, 1588.0, 694.0, 387.0, 191.0, 150.0, 112.0, 60.0, 59.0, 28.0, 35.0, 32.0, 15.0, 16.0, 12.0, 5.0, 5.0, 7.0, 8.0, 4.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-34.5625, -33.3359375, -32.109375, -30.8828125, -29.65625, -28.4296875, -27.203125, -25.9765625, -24.75, -23.5234375, -22.296875, -21.0703125, -19.84375, -18.6171875, -17.390625, -16.1640625, -14.9375, -13.7109375, -12.484375, -11.2578125, -10.03125, -8.8046875, -7.578125, -6.3515625, -5.125, -3.8984375, -2.671875, -1.4453125, -0.21875, 1.0078125, 2.234375, 3.4609375, 4.6875, 5.9140625, 7.140625, 8.3671875, 9.59375, 10.8203125, 12.046875, 13.2734375, 14.5, 15.7265625, 16.953125, 18.1796875, 19.40625, 20.6328125, 21.859375, 23.0859375, 24.3125, 25.5390625, 26.765625, 27.9921875, 29.21875, 30.4453125, 31.671875, 32.8984375, 34.125, 35.3515625, 36.578125, 37.8046875, 39.03125, 40.2578125, 41.484375, 42.7109375, 43.9375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 6.0, 5.0, 0.0, 6.0, 4.0, 6.0, 7.0, 6.0, 16.0, 15.0, 16.0, 28.0, 25.0, 34.0, 23.0, 25.0, 35.0, 39.0, 46.0, 42.0, 33.0, 49.0, 56.0, 51.0, 44.0, 42.0, 43.0, 43.0, 35.0, 23.0, 27.0, 23.0, 26.0, 23.0, 27.0, 13.0, 13.0, 8.0, 8.0, 5.0, 6.0, 6.0, 6.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62890625, -2.534393310546875, -2.43988037109375, -2.345367431640625, -2.2508544921875, -2.156341552734375, -2.06182861328125, -1.967315673828125, -1.872802734375, -1.778289794921875, -1.68377685546875, -1.589263916015625, -1.4947509765625, -1.400238037109375, -1.30572509765625, -1.211212158203125, -1.11669921875, -1.022186279296875, -0.92767333984375, -0.833160400390625, -0.7386474609375, -0.644134521484375, -0.54962158203125, -0.455108642578125, -0.360595703125, -0.266082763671875, -0.17156982421875, -0.077056884765625, 0.0174560546875, 0.111968994140625, 0.20648193359375, 0.300994873046875, 0.3955078125, 0.490020751953125, 0.58453369140625, 0.679046630859375, 0.7735595703125, 0.868072509765625, 0.96258544921875, 1.057098388671875, 1.151611328125, 1.246124267578125, 1.34063720703125, 1.435150146484375, 1.5296630859375, 1.624176025390625, 1.71868896484375, 1.813201904296875, 1.90771484375, 2.002227783203125, 2.09674072265625, 2.191253662109375, 2.2857666015625, 2.380279541015625, 2.47479248046875, 2.569305419921875, 2.663818359375, 2.758331298828125, 2.85284423828125, 2.947357177734375, 3.0418701171875, 3.136383056640625, 3.23089599609375, 3.325408935546875, 3.419921875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 5.0, 11.0, 12.0, 21.0, 17.0, 23.0, 11.0, 34.0, 42.0, 36.0, 63.0, 100.0, 215.0, 572.0, 1578.0, 5258.0, 39895.0, 4116362.0, 23623.0, 4086.0, 1268.0, 443.0, 200.0, 94.0, 60.0, 39.0, 29.0, 26.0, 14.0, 20.0, 20.0, 11.0, 13.0, 12.0, 9.0, 9.0, 6.0, 3.0, 8.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-67.0625, -64.9931640625, -62.923828125, -60.8544921875, -58.78515625, -56.7158203125, -54.646484375, -52.5771484375, -50.5078125, -48.4384765625, -46.369140625, -44.2998046875, -42.23046875, -40.1611328125, -38.091796875, -36.0224609375, -33.953125, -31.8837890625, -29.814453125, -27.7451171875, -25.67578125, -23.6064453125, -21.537109375, -19.4677734375, -17.3984375, -15.3291015625, -13.259765625, -11.1904296875, -9.12109375, -7.0517578125, -4.982421875, -2.9130859375, -0.84375, 1.2255859375, 3.294921875, 5.3642578125, 7.43359375, 9.5029296875, 11.572265625, 13.6416015625, 15.7109375, 17.7802734375, 19.849609375, 21.9189453125, 23.98828125, 26.0576171875, 28.126953125, 30.1962890625, 32.265625, 34.3349609375, 36.404296875, 38.4736328125, 40.54296875, 42.6123046875, 44.681640625, 46.7509765625, 48.8203125, 50.8896484375, 52.958984375, 55.0283203125, 57.09765625, 59.1669921875, 61.236328125, 63.3056640625, 65.375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 10.0, 10.0, 20.0, 26.0, 149.0, 3539.0, 228.0, 40.0, 27.0, 10.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.125, -8.49951171875, -7.8740234375, -7.24853515625, -6.623046875, -5.99755859375, -5.3720703125, -4.74658203125, -4.12109375, -3.49560546875, -2.8701171875, -2.24462890625, -1.619140625, -0.99365234375, -0.3681640625, 0.25732421875, 0.8828125, 1.50830078125, 2.1337890625, 2.75927734375, 3.384765625, 4.01025390625, 4.6357421875, 5.26123046875, 5.88671875, 6.51220703125, 7.1376953125, 7.76318359375, 8.388671875, 9.01416015625, 9.6396484375, 10.26513671875, 10.890625, 11.51611328125, 12.1416015625, 12.76708984375, 13.392578125, 14.01806640625, 14.6435546875, 15.26904296875, 15.89453125, 16.52001953125, 17.1455078125, 17.77099609375, 18.396484375, 19.02197265625, 19.6474609375, 20.27294921875, 20.8984375, 21.52392578125, 22.1494140625, 22.77490234375, 23.400390625, 24.02587890625, 24.6513671875, 25.27685546875, 25.90234375, 26.52783203125, 27.1533203125, 27.77880859375, 28.404296875, 29.02978515625, 29.6552734375, 30.28076171875, 30.90625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 9.0, 6.0, 13.0, 12.0, 17.0, 25.0, 55.0, 88.0, 122.0, 198.0, 161.0, 112.0, 49.0, 50.0, 32.0, 20.0, 9.0, 5.0, 4.0, 8.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.61977005004883, -39.86016845703125, -38.100563049316406, -36.34096145629883, -34.58135986328125, -32.821754455566406, -31.062152862548828, -29.30255126953125, -27.54294776916504, -25.783344268798828, -24.02374267578125, -22.26413917541504, -20.504535675048828, -18.74493408203125, -16.98533058166504, -15.225728034973145, -13.46612548828125, -11.706522941589355, -9.946920394897461, -8.18731689453125, -6.4277143478393555, -4.668111801147461, -2.90850830078125, -1.1489057540893555, 0.6106967926025391, 2.3702995777130127, 4.129902362823486, 5.889505386352539, 7.649107933044434, 9.408710479736328, 11.168313980102539, 12.927916526794434, 14.687522888183594, 16.447126388549805, 18.206727981567383, 19.966331481933594, 21.725933074951172, 23.485536575317383, 25.245140075683594, 27.004741668701172, 28.764345169067383, 30.523948669433594, 32.28355026245117, 34.04315185546875, 35.802757263183594, 37.56235885620117, 39.32196044921875, 41.081565856933594, 42.84116744995117, 44.60076904296875, 46.360374450683594, 48.11997604370117, 49.87957763671875, 51.639183044433594, 53.39878463745117, 55.15838623046875, 56.917991638183594, 58.67759323120117, 60.437198638916016, 62.196800231933594, 63.95640182495117, 65.71600341796875, 67.4756088256836, 69.23521423339844, 70.99481201171875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 9.0, 6.0, 9.0, 6.0, 20.0, 15.0, 23.0, 22.0, 25.0, 29.0, 32.0, 29.0, 40.0, 47.0, 51.0, 39.0, 40.0, 46.0, 42.0, 47.0, 39.0, 33.0, 40.0, 35.0, 41.0, 31.0, 18.0, 27.0, 19.0, 19.0, 22.0, 25.0, 17.0, 19.0, 7.0, 11.0, 5.0, 9.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.131103515625, -25.36793327331543, -24.60476303100586, -23.841590881347656, -23.078420639038086, -22.315250396728516, -21.552078247070312, -20.788908004760742, -20.025737762451172, -19.2625675201416, -18.49939727783203, -17.736225128173828, -16.973054885864258, -16.209884643554688, -15.4467134475708, -14.683542251586914, -13.920372009277344, -13.157201766967773, -12.394030570983887, -11.630859375, -10.86768913269043, -10.10451889038086, -9.341347694396973, -8.578176498413086, -7.815006256103516, -7.051835536956787, -6.288664817810059, -5.52549409866333, -4.762323379516602, -3.999152660369873, -3.2359819412231445, -2.472811222076416, -1.7096405029296875, -0.946469783782959, -0.18329906463623047, 0.579871654510498, 1.3430423736572266, 2.106213092803955, 2.8693838119506836, 3.632554531097412, 4.395725250244141, 5.158895969390869, 5.922066688537598, 6.685237407684326, 7.448408126831055, 8.211578369140625, 8.974749565124512, 9.737920761108398, 10.501091003417969, 11.264261245727539, 12.027432441711426, 12.790603637695312, 13.553773880004883, 14.316944122314453, 15.08011531829834, 15.843286514282227, 16.606456756591797, 17.369626998901367, 18.132797241210938, 18.89596939086914, 19.65913963317871, 20.42230987548828, 21.185482025146484, 21.948652267456055, 22.711822509765625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 6.0, 7.0, 12.0, 20.0, 12.0, 32.0, 38.0, 49.0, 66.0, 100.0, 143.0, 190.0, 286.0, 366.0, 590.0, 901.0, 1335.0, 2035.0, 3203.0, 5347.0, 9106.0, 15875.0, 28793.0, 58771.0, 136651.0, 356165.0, 240448.0, 91842.0, 42320.0, 22029.0, 12296.0, 7207.0, 4257.0, 2707.0, 1749.0, 1131.0, 758.0, 533.0, 355.0, 259.0, 155.0, 115.0, 81.0, 69.0, 33.0, 33.0, 28.0, 15.0, 13.0, 4.0, 10.0, 5.0, 4.0, 2.0, 2.0, 0.0, 3.0], "bins": [-13.1171875, -12.717041015625, -12.31689453125, -11.916748046875, -11.5166015625, -11.116455078125, -10.71630859375, -10.316162109375, -9.916015625, -9.515869140625, -9.11572265625, -8.715576171875, -8.3154296875, -7.915283203125, -7.51513671875, -7.114990234375, -6.71484375, -6.314697265625, -5.91455078125, -5.514404296875, -5.1142578125, -4.714111328125, -4.31396484375, -3.913818359375, -3.513671875, -3.113525390625, -2.71337890625, -2.313232421875, -1.9130859375, -1.512939453125, -1.11279296875, -0.712646484375, -0.3125, 0.087646484375, 0.48779296875, 0.887939453125, 1.2880859375, 1.688232421875, 2.08837890625, 2.488525390625, 2.888671875, 3.288818359375, 3.68896484375, 4.089111328125, 4.4892578125, 4.889404296875, 5.28955078125, 5.689697265625, 6.08984375, 6.489990234375, 6.89013671875, 7.290283203125, 7.6904296875, 8.090576171875, 8.49072265625, 8.890869140625, 9.291015625, 9.691162109375, 10.09130859375, 10.491455078125, 10.8916015625, 11.291748046875, 11.69189453125, 12.092041015625, 12.4921875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 7.0, 5.0, 11.0, 10.0, 19.0, 15.0, 20.0, 22.0, 30.0, 26.0, 32.0, 30.0, 42.0, 45.0, 56.0, 45.0, 46.0, 40.0, 38.0, 57.0, 42.0, 42.0, 37.0, 43.0, 35.0, 19.0, 19.0, 31.0, 20.0, 22.0, 17.0, 10.0, 10.0, 9.0, 7.0, 9.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.830078125, -3.7099609375, -3.58984375, -3.4697265625, -3.349609375, -3.2294921875, -3.109375, -2.9892578125, -2.869140625, -2.7490234375, -2.62890625, -2.5087890625, -2.388671875, -2.2685546875, -2.1484375, -2.0283203125, -1.908203125, -1.7880859375, -1.66796875, -1.5478515625, -1.427734375, -1.3076171875, -1.1875, -1.0673828125, -0.947265625, -0.8271484375, -0.70703125, -0.5869140625, -0.466796875, -0.3466796875, -0.2265625, -0.1064453125, 0.013671875, 0.1337890625, 0.25390625, 0.3740234375, 0.494140625, 0.6142578125, 0.734375, 0.8544921875, 0.974609375, 1.0947265625, 1.21484375, 1.3349609375, 1.455078125, 1.5751953125, 1.6953125, 1.8154296875, 1.935546875, 2.0556640625, 2.17578125, 2.2958984375, 2.416015625, 2.5361328125, 2.65625, 2.7763671875, 2.896484375, 3.0166015625, 3.13671875, 3.2568359375, 3.376953125, 3.4970703125, 3.6171875, 3.7373046875, 3.857421875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 3.0, 10.0, 12.0, 10.0, 13.0, 29.0, 46.0, 55.0, 89.0, 161.0, 293.0, 447.0, 966.0, 1980.0, 4481.0, 12482.0, 52407.0, 642690.0, 282131.0, 33873.0, 9418.0, 3498.0, 1606.0, 763.0, 411.0, 245.0, 166.0, 82.0, 62.0, 40.0, 23.0, 11.0, 11.0, 11.0, 5.0, 8.0, 5.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-50.65625, -49.2822265625, -47.908203125, -46.5341796875, -45.16015625, -43.7861328125, -42.412109375, -41.0380859375, -39.6640625, -38.2900390625, -36.916015625, -35.5419921875, -34.16796875, -32.7939453125, -31.419921875, -30.0458984375, -28.671875, -27.2978515625, -25.923828125, -24.5498046875, -23.17578125, -21.8017578125, -20.427734375, -19.0537109375, -17.6796875, -16.3056640625, -14.931640625, -13.5576171875, -12.18359375, -10.8095703125, -9.435546875, -8.0615234375, -6.6875, -5.3134765625, -3.939453125, -2.5654296875, -1.19140625, 0.1826171875, 1.556640625, 2.9306640625, 4.3046875, 5.6787109375, 7.052734375, 8.4267578125, 9.80078125, 11.1748046875, 12.548828125, 13.9228515625, 15.296875, 16.6708984375, 18.044921875, 19.4189453125, 20.79296875, 22.1669921875, 23.541015625, 24.9150390625, 26.2890625, 27.6630859375, 29.037109375, 30.4111328125, 31.78515625, 33.1591796875, 34.533203125, 35.9072265625, 37.28125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 9.0, 7.0, 3.0, 13.0, 12.0, 21.0, 22.0, 18.0, 41.0, 58.0, 43.0, 73.0, 100.0, 96.0, 81.0, 81.0, 80.0, 57.0, 42.0, 32.0, 32.0, 21.0, 9.0, 11.0, 7.0, 5.0, 6.0, 5.0, 3.0, 0.0, 4.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.53125, -48.14990234375, -46.7685546875, -45.38720703125, -44.005859375, -42.62451171875, -41.2431640625, -39.86181640625, -38.48046875, -37.09912109375, -35.7177734375, -34.33642578125, -32.955078125, -31.57373046875, -30.1923828125, -28.81103515625, -27.4296875, -26.04833984375, -24.6669921875, -23.28564453125, -21.904296875, -20.52294921875, -19.1416015625, -17.76025390625, -16.37890625, -14.99755859375, -13.6162109375, -12.23486328125, -10.853515625, -9.47216796875, -8.0908203125, -6.70947265625, -5.328125, -3.94677734375, -2.5654296875, -1.18408203125, 0.197265625, 1.57861328125, 2.9599609375, 4.34130859375, 5.72265625, 7.10400390625, 8.4853515625, 9.86669921875, 11.248046875, 12.62939453125, 14.0107421875, 15.39208984375, 16.7734375, 18.15478515625, 19.5361328125, 20.91748046875, 22.298828125, 23.68017578125, 25.0615234375, 26.44287109375, 27.82421875, 29.20556640625, 30.5869140625, 31.96826171875, 33.349609375, 34.73095703125, 36.1123046875, 37.49365234375, 38.875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 5.0, 3.0, 7.0, 4.0, 19.0, 27.0, 26.0, 42.0, 46.0, 90.0, 138.0, 214.0, 390.0, 654.0, 1213.0, 2542.0, 5736.0, 18116.0, 212219.0, 771474.0, 22856.0, 6760.0, 2759.0, 1384.0, 710.0, 398.0, 227.0, 162.0, 105.0, 64.0, 48.0, 30.0, 20.0, 24.0, 14.0, 7.0, 8.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.0, -94.3837890625, -91.767578125, -89.1513671875, -86.53515625, -83.9189453125, -81.302734375, -78.6865234375, -76.0703125, -73.4541015625, -70.837890625, -68.2216796875, -65.60546875, -62.9892578125, -60.373046875, -57.7568359375, -55.140625, -52.5244140625, -49.908203125, -47.2919921875, -44.67578125, -42.0595703125, -39.443359375, -36.8271484375, -34.2109375, -31.5947265625, -28.978515625, -26.3623046875, -23.74609375, -21.1298828125, -18.513671875, -15.8974609375, -13.28125, -10.6650390625, -8.048828125, -5.4326171875, -2.81640625, -0.2001953125, 2.416015625, 5.0322265625, 7.6484375, 10.2646484375, 12.880859375, 15.4970703125, 18.11328125, 20.7294921875, 23.345703125, 25.9619140625, 28.578125, 31.1943359375, 33.810546875, 36.4267578125, 39.04296875, 41.6591796875, 44.275390625, 46.8916015625, 49.5078125, 52.1240234375, 54.740234375, 57.3564453125, 59.97265625, 62.5888671875, 65.205078125, 67.8212890625, 70.4375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 11.0, 12.0, 28.0, 44.0, 147.0, 606.0, 77.0, 30.0, 11.0, 10.0, 8.0, 4.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.01824951171875, -0.017837882041931152, -0.017426252365112305, -0.017014622688293457, -0.01660299301147461, -0.01619136333465576, -0.015779733657836914, -0.015368103981018066, -0.014956474304199219, -0.014544844627380371, -0.014133214950561523, -0.013721585273742676, -0.013309955596923828, -0.01289832592010498, -0.012486696243286133, -0.012075066566467285, -0.011663436889648438, -0.01125180721282959, -0.010840177536010742, -0.010428547859191895, -0.010016918182373047, -0.0096052885055542, -0.009193658828735352, -0.008782029151916504, -0.008370399475097656, -0.007958769798278809, -0.007547140121459961, -0.007135510444641113, -0.006723880767822266, -0.006312251091003418, -0.00590062141418457, -0.005488991737365723, -0.005077362060546875, -0.004665732383728027, -0.00425410270690918, -0.003842473030090332, -0.0034308433532714844, -0.0030192136764526367, -0.002607583999633789, -0.0021959543228149414, -0.0017843246459960938, -0.001372694969177246, -0.0009610652923583984, -0.0005494356155395508, -0.00013780593872070312, 0.00027382373809814453, 0.0006854534149169922, 0.0010970830917358398, 0.0015087127685546875, 0.0019203424453735352, 0.002331972122192383, 0.0027436017990112305, 0.003155231475830078, 0.0035668611526489258, 0.0039784908294677734, 0.004390120506286621, 0.004801750183105469, 0.005213379859924316, 0.005625009536743164, 0.006036639213562012, 0.006448268890380859, 0.006859898567199707, 0.007271528244018555, 0.007683157920837402, 0.00809478759765625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 7.0, 8.0, 5.0, 9.0, 11.0, 16.0, 24.0, 29.0, 51.0, 53.0, 96.0, 129.0, 184.0, 284.0, 436.0, 681.0, 1103.0, 1836.0, 3448.0, 6941.0, 17502.0, 95515.0, 864350.0, 33849.0, 10754.0, 4793.0, 2562.0, 1393.0, 874.0, 525.0, 324.0, 234.0, 166.0, 91.0, 90.0, 50.0, 39.0, 28.0, 30.0, 7.0, 11.0, 8.0, 4.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-103.5625, -100.5390625, -97.515625, -94.4921875, -91.46875, -88.4453125, -85.421875, -82.3984375, -79.375, -76.3515625, -73.328125, -70.3046875, -67.28125, -64.2578125, -61.234375, -58.2109375, -55.1875, -52.1640625, -49.140625, -46.1171875, -43.09375, -40.0703125, -37.046875, -34.0234375, -31.0, -27.9765625, -24.953125, -21.9296875, -18.90625, -15.8828125, -12.859375, -9.8359375, -6.8125, -3.7890625, -0.765625, 2.2578125, 5.28125, 8.3046875, 11.328125, 14.3515625, 17.375, 20.3984375, 23.421875, 26.4453125, 29.46875, 32.4921875, 35.515625, 38.5390625, 41.5625, 44.5859375, 47.609375, 50.6328125, 53.65625, 56.6796875, 59.703125, 62.7265625, 65.75, 68.7734375, 71.796875, 74.8203125, 77.84375, 80.8671875, 83.890625, 86.9140625, 89.9375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 7.0, 6.0, 7.0, 8.0, 14.0, 11.0, 32.0, 34.0, 104.0, 477.0, 155.0, 46.0, 28.0, 16.0, 8.0, 7.0, 7.0, 7.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-98.5, -95.6513671875, -92.802734375, -89.9541015625, -87.10546875, -84.2568359375, -81.408203125, -78.5595703125, -75.7109375, -72.8623046875, -70.013671875, -67.1650390625, -64.31640625, -61.4677734375, -58.619140625, -55.7705078125, -52.921875, -50.0732421875, -47.224609375, -44.3759765625, -41.52734375, -38.6787109375, -35.830078125, -32.9814453125, -30.1328125, -27.2841796875, -24.435546875, -21.5869140625, -18.73828125, -15.8896484375, -13.041015625, -10.1923828125, -7.34375, -4.4951171875, -1.646484375, 1.2021484375, 4.05078125, 6.8994140625, 9.748046875, 12.5966796875, 15.4453125, 18.2939453125, 21.142578125, 23.9912109375, 26.83984375, 29.6884765625, 32.537109375, 35.3857421875, 38.234375, 41.0830078125, 43.931640625, 46.7802734375, 49.62890625, 52.4775390625, 55.326171875, 58.1748046875, 61.0234375, 63.8720703125, 66.720703125, 69.5693359375, 72.41796875, 75.2666015625, 78.115234375, 80.9638671875, 83.8125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 5.0, 9.0, 9.0, 19.0, 23.0, 63.0, 94.0, 159.0, 224.0, 174.0, 110.0, 51.0, 39.0, 20.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-434.08038330078125, -409.52764892578125, -384.97491455078125, -360.42218017578125, -335.86944580078125, -311.31671142578125, -286.76397705078125, -262.21124267578125, -237.65850830078125, -213.10577392578125, -188.55303955078125, -164.00030517578125, -139.44757080078125, -114.89483642578125, -90.34210205078125, -65.78936767578125, -41.23663330078125, -16.68389892578125, 7.86883544921875, 32.42156982421875, 56.97430419921875, 81.52703857421875, 106.07977294921875, 130.63250732421875, 155.18524169921875, 179.73797607421875, 204.29071044921875, 228.84344482421875, 253.39617919921875, 277.94891357421875, 302.50164794921875, 327.05438232421875, 351.607177734375, 376.159912109375, 400.712646484375, 425.265380859375, 449.818115234375, 474.370849609375, 498.923583984375, 523.476318359375, 548.029052734375, 572.581787109375, 597.134521484375, 621.687255859375, 646.239990234375, 670.792724609375, 695.345458984375, 719.898193359375, 744.450927734375, 769.003662109375, 793.556396484375, 818.109130859375, 842.661865234375, 867.214599609375, 891.767333984375, 916.320068359375, 940.872802734375, 965.425537109375, 989.978271484375, 1014.531005859375, 1039.083740234375, 1063.636474609375, 1088.189208984375, 1112.741943359375, 1137.294677734375]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 1.0, 4.0, 7.0, 9.0, 11.0, 11.0, 21.0, 20.0, 23.0, 23.0, 35.0, 33.0, 43.0, 34.0, 48.0, 50.0, 57.0, 52.0, 56.0, 37.0, 59.0, 50.0, 58.0, 49.0, 34.0, 28.0, 22.0, 23.0, 15.0, 21.0, 18.0, 16.0, 11.0, 6.0, 8.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-285.10296630859375, -276.0133056640625, -266.92364501953125, -257.833984375, -248.74432373046875, -239.6546630859375, -230.5650177001953, -221.47535705566406, -212.3856964111328, -203.29603576660156, -194.2063751220703, -185.11671447753906, -176.02706909179688, -166.93740844726562, -157.84774780273438, -148.75808715820312, -139.66842651367188, -130.57876586914062, -121.48910522460938, -112.39945220947266, -103.3097915649414, -94.22013092041016, -85.13047790527344, -76.04081726074219, -66.95115661621094, -57.86149597167969, -48.7718391418457, -39.68218231201172, -30.59252166748047, -21.50286102294922, -12.413204193115234, -3.32354736328125, 5.76611328125, 14.855772018432617, 23.945430755615234, 33.03508758544922, 42.12474822998047, 51.21440887451172, 60.3040657043457, 69.39372253417969, 78.48338317871094, 87.57304382324219, 96.66270446777344, 105.75235748291016, 114.8420181274414, 123.93167877197266, 133.02133178710938, 142.11099243164062, 151.20065307617188, 160.29031372070312, 169.37997436523438, 178.46963500976562, 187.55929565429688, 196.64895629882812, 205.7386016845703, 214.82826232910156, 223.9179229736328, 233.00758361816406, 242.0972442626953, 251.18690490722656, 260.27655029296875, 269.3662109375, 278.45587158203125, 287.5455322265625, 296.63519287109375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 7.0, 5.0, 18.0, 5.0, 11.0, 26.0, 34.0, 38.0, 58.0, 91.0, 125.0, 196.0, 308.0, 629.0, 1213.0, 2989.0, 10415.0, 215480.0, 3941361.0, 14784.0, 3545.0, 1355.0, 658.0, 324.0, 186.0, 135.0, 85.0, 58.0, 44.0, 31.0, 25.0, 17.0, 9.0, 2.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-136.375, -131.84375, -127.3125, -122.78125, -118.25, -113.71875, -109.1875, -104.65625, -100.125, -95.59375, -91.0625, -86.53125, -82.0, -77.46875, -72.9375, -68.40625, -63.875, -59.34375, -54.8125, -50.28125, -45.75, -41.21875, -36.6875, -32.15625, -27.625, -23.09375, -18.5625, -14.03125, -9.5, -4.96875, -0.4375, 4.09375, 8.625, 13.15625, 17.6875, 22.21875, 26.75, 31.28125, 35.8125, 40.34375, 44.875, 49.40625, 53.9375, 58.46875, 63.0, 67.53125, 72.0625, 76.59375, 81.125, 85.65625, 90.1875, 94.71875, 99.25, 103.78125, 108.3125, 112.84375, 117.375, 121.90625, 126.4375, 130.96875, 135.5, 140.03125, 144.5625, 149.09375, 153.625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 1.0, 3.0, 14.0, 17.0, 17.0, 21.0, 24.0, 35.0, 39.0, 52.0, 63.0, 58.0, 66.0, 80.0, 86.0, 85.0, 67.0, 56.0, 52.0, 48.0, 22.0, 21.0, 16.0, 18.0, 11.0, 5.0, 8.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.375, -13.9072265625, -13.439453125, -12.9716796875, -12.50390625, -12.0361328125, -11.568359375, -11.1005859375, -10.6328125, -10.1650390625, -9.697265625, -9.2294921875, -8.76171875, -8.2939453125, -7.826171875, -7.3583984375, -6.890625, -6.4228515625, -5.955078125, -5.4873046875, -5.01953125, -4.5517578125, -4.083984375, -3.6162109375, -3.1484375, -2.6806640625, -2.212890625, -1.7451171875, -1.27734375, -0.8095703125, -0.341796875, 0.1259765625, 0.59375, 1.0615234375, 1.529296875, 1.9970703125, 2.46484375, 2.9326171875, 3.400390625, 3.8681640625, 4.3359375, 4.8037109375, 5.271484375, 5.7392578125, 6.20703125, 6.6748046875, 7.142578125, 7.6103515625, 8.078125, 8.5458984375, 9.013671875, 9.4814453125, 9.94921875, 10.4169921875, 10.884765625, 11.3525390625, 11.8203125, 12.2880859375, 12.755859375, 13.2236328125, 13.69140625, 14.1591796875, 14.626953125, 15.0947265625, 15.5625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 10.0, 5.0, 17.0, 19.0, 24.0, 35.0, 38.0, 62.0, 83.0, 86.0, 119.0, 192.0, 254.0, 370.0, 516.0, 807.0, 1215.0, 2376.0, 4735.0, 12833.0, 69044.0, 4005011.0, 72184.0, 13117.0, 4845.0, 2341.0, 1277.0, 793.0, 519.0, 353.0, 242.0, 219.0, 142.0, 82.0, 85.0, 64.0, 48.0, 29.0, 22.0, 16.0, 14.0, 10.0, 6.0, 8.0, 7.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-140.25, -135.798828125, -131.34765625, -126.896484375, -122.4453125, -117.994140625, -113.54296875, -109.091796875, -104.640625, -100.189453125, -95.73828125, -91.287109375, -86.8359375, -82.384765625, -77.93359375, -73.482421875, -69.03125, -64.580078125, -60.12890625, -55.677734375, -51.2265625, -46.775390625, -42.32421875, -37.873046875, -33.421875, -28.970703125, -24.51953125, -20.068359375, -15.6171875, -11.166015625, -6.71484375, -2.263671875, 2.1875, 6.638671875, 11.08984375, 15.541015625, 19.9921875, 24.443359375, 28.89453125, 33.345703125, 37.796875, 42.248046875, 46.69921875, 51.150390625, 55.6015625, 60.052734375, 64.50390625, 68.955078125, 73.40625, 77.857421875, 82.30859375, 86.759765625, 91.2109375, 95.662109375, 100.11328125, 104.564453125, 109.015625, 113.466796875, 117.91796875, 122.369140625, 126.8203125, 131.271484375, 135.72265625, 140.173828125, 144.625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 4.0, 11.0, 10.0, 21.0, 28.0, 68.0, 283.0, 3315.0, 184.0, 57.0, 36.0, 16.0, 11.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.75, -66.5595703125, -64.369140625, -62.1787109375, -59.98828125, -57.7978515625, -55.607421875, -53.4169921875, -51.2265625, -49.0361328125, -46.845703125, -44.6552734375, -42.46484375, -40.2744140625, -38.083984375, -35.8935546875, -33.703125, -31.5126953125, -29.322265625, -27.1318359375, -24.94140625, -22.7509765625, -20.560546875, -18.3701171875, -16.1796875, -13.9892578125, -11.798828125, -9.6083984375, -7.41796875, -5.2275390625, -3.037109375, -0.8466796875, 1.34375, 3.5341796875, 5.724609375, 7.9150390625, 10.10546875, 12.2958984375, 14.486328125, 16.6767578125, 18.8671875, 21.0576171875, 23.248046875, 25.4384765625, 27.62890625, 29.8193359375, 32.009765625, 34.2001953125, 36.390625, 38.5810546875, 40.771484375, 42.9619140625, 45.15234375, 47.3427734375, 49.533203125, 51.7236328125, 53.9140625, 56.1044921875, 58.294921875, 60.4853515625, 62.67578125, 64.8662109375, 67.056640625, 69.2470703125, 71.4375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 10.0, 2.0, 5.0, 5.0, 8.0, 7.0, 9.0, 20.0, 16.0, 22.0, 35.0, 42.0, 66.0, 67.0, 92.0, 86.0, 93.0, 89.0, 82.0, 48.0, 33.0, 39.0, 36.0, 16.0, 16.0, 14.0, 6.0, 6.0, 3.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-180.0049285888672, -174.7041015625, -169.40325927734375, -164.10243225097656, -158.80160522460938, -153.50076293945312, -148.19993591308594, -142.89910888671875, -137.5982666015625, -132.2974395751953, -126.99659729003906, -121.69577026367188, -116.39493560791016, -111.09410095214844, -105.79327392578125, -100.49243927001953, -95.19160461425781, -89.8907699584961, -84.58993530273438, -79.28910827636719, -73.98827362060547, -68.68743896484375, -63.3866081237793, -58.085777282714844, -52.784942626953125, -47.484107971191406, -42.18327713012695, -36.8824462890625, -31.58161163330078, -26.280778884887695, -20.97994613647461, -15.679115295410156, -10.378280639648438, -5.077447891235352, 0.22338485717773438, 5.52421760559082, 10.825050354003906, 16.125883102416992, 21.426715850830078, 26.72754669189453, 32.02838134765625, 37.32921600341797, 42.63004684448242, 47.930877685546875, 53.231712341308594, 58.53254699707031, 63.833377838134766, 69.13420867919922, 74.43504333496094, 79.73587799072266, 85.03671264648438, 90.33753967285156, 95.63837432861328, 100.939208984375, 106.24003601074219, 111.5408706665039, 116.84170532226562, 122.14253997802734, 127.44337463378906, 132.74420166015625, 138.0450439453125, 143.3458709716797, 148.64669799804688, 153.94754028320312, 159.2483673095703]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 6.0, 4.0, 7.0, 9.0, 14.0, 9.0, 10.0, 15.0, 14.0, 15.0, 13.0, 21.0, 23.0, 37.0, 32.0, 29.0, 44.0, 41.0, 48.0, 33.0, 34.0, 30.0, 34.0, 35.0, 35.0, 36.0, 36.0, 26.0, 29.0, 35.0, 31.0, 26.0, 22.0, 27.0, 18.0, 15.0, 16.0, 19.0, 15.0, 12.0, 9.0, 6.0, 10.0, 2.0, 5.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-104.44767761230469, -101.22380065917969, -97.99993133544922, -94.77605438232422, -91.55218505859375, -88.32830810546875, -85.10443878173828, -81.88056182861328, -78.65669250488281, -75.43281555175781, -72.20894622802734, -68.98506927490234, -65.76119995117188, -62.537322998046875, -59.313453674316406, -56.089576721191406, -52.86570358276367, -49.64183044433594, -46.4179573059082, -43.19408416748047, -39.970211029052734, -36.746337890625, -33.5224609375, -30.2985897064209, -27.074716567993164, -23.85084342956543, -20.626970291137695, -17.403095245361328, -14.17922306060791, -10.95534896850586, -7.731475830078125, -4.507602691650391, -1.2837295532226562, 1.9401438236236572, 5.164017200469971, 8.387890815734863, 11.611763954162598, 14.835638046264648, 18.059511184692383, 21.283384323120117, 24.50725746154785, 27.731130599975586, 30.95500373840332, 34.17887878417969, 37.40275192260742, 40.626625061035156, 43.85049819946289, 47.074371337890625, 50.29824447631836, 53.522117614746094, 56.74599075317383, 59.96986389160156, 63.1937370300293, 66.41761016845703, 69.64148712158203, 72.8653564453125, 76.0892333984375, 79.3131103515625, 82.53697967529297, 85.76085662841797, 88.98472595214844, 92.20860290527344, 95.4324722290039, 98.6563491821289, 101.88021850585938]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 15.0, 13.0, 13.0, 23.0, 33.0, 51.0, 109.0, 141.0, 274.0, 505.0, 1066.0, 2232.0, 5596.0, 15421.0, 52276.0, 274121.0, 558444.0, 98444.0, 25201.0, 8329.0, 3159.0, 1460.0, 702.0, 371.0, 193.0, 120.0, 82.0, 49.0, 40.0, 21.0, 16.0, 14.0, 9.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.9375, -82.30078125, -79.6640625, -77.02734375, -74.390625, -71.75390625, -69.1171875, -66.48046875, -63.84375, -61.20703125, -58.5703125, -55.93359375, -53.296875, -50.66015625, -48.0234375, -45.38671875, -42.75, -40.11328125, -37.4765625, -34.83984375, -32.203125, -29.56640625, -26.9296875, -24.29296875, -21.65625, -19.01953125, -16.3828125, -13.74609375, -11.109375, -8.47265625, -5.8359375, -3.19921875, -0.5625, 2.07421875, 4.7109375, 7.34765625, 9.984375, 12.62109375, 15.2578125, 17.89453125, 20.53125, 23.16796875, 25.8046875, 28.44140625, 31.078125, 33.71484375, 36.3515625, 38.98828125, 41.625, 44.26171875, 46.8984375, 49.53515625, 52.171875, 54.80859375, 57.4453125, 60.08203125, 62.71875, 65.35546875, 67.9921875, 70.62890625, 73.265625, 75.90234375, 78.5390625, 81.17578125, 83.8125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 5.0, 2.0, 6.0, 10.0, 11.0, 17.0, 17.0, 21.0, 26.0, 37.0, 40.0, 39.0, 52.0, 47.0, 58.0, 64.0, 60.0, 56.0, 64.0, 57.0, 62.0, 50.0, 32.0, 40.0, 23.0, 26.0, 24.0, 14.0, 9.0, 7.0, 9.0, 3.0, 6.0, 2.0, 5.0, 1.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -11.8211669921875, -11.306396484375, -10.7916259765625, -10.27685546875, -9.7620849609375, -9.247314453125, -8.7325439453125, -8.2177734375, -7.7030029296875, -7.188232421875, -6.6734619140625, -6.15869140625, -5.6439208984375, -5.129150390625, -4.6143798828125, -4.099609375, -3.5848388671875, -3.070068359375, -2.5552978515625, -2.04052734375, -1.5257568359375, -1.010986328125, -0.4962158203125, 0.0185546875, 0.5333251953125, 1.048095703125, 1.5628662109375, 2.07763671875, 2.5924072265625, 3.107177734375, 3.6219482421875, 4.13671875, 4.6514892578125, 5.166259765625, 5.6810302734375, 6.19580078125, 6.7105712890625, 7.225341796875, 7.7401123046875, 8.2548828125, 8.7696533203125, 9.284423828125, 9.7991943359375, 10.31396484375, 10.8287353515625, 11.343505859375, 11.8582763671875, 12.373046875, 12.8878173828125, 13.402587890625, 13.9173583984375, 14.43212890625, 14.9468994140625, 15.461669921875, 15.9764404296875, 16.4912109375, 17.0059814453125, 17.520751953125, 18.0355224609375, 18.55029296875, 19.0650634765625, 19.579833984375, 20.0946044921875, 20.609375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 7.0, 12.0, 15.0, 28.0, 47.0, 86.0, 110.0, 196.0, 354.0, 720.0, 1688.0, 4233.0, 11813.0, 39872.0, 186049.0, 634852.0, 123694.0, 29361.0, 9383.0, 3288.0, 1330.0, 629.0, 338.0, 193.0, 85.0, 66.0, 35.0, 24.0, 19.0, 10.0, 5.0, 5.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.125, -102.9462890625, -99.767578125, -96.5888671875, -93.41015625, -90.2314453125, -87.052734375, -83.8740234375, -80.6953125, -77.5166015625, -74.337890625, -71.1591796875, -67.98046875, -64.8017578125, -61.623046875, -58.4443359375, -55.265625, -52.0869140625, -48.908203125, -45.7294921875, -42.55078125, -39.3720703125, -36.193359375, -33.0146484375, -29.8359375, -26.6572265625, -23.478515625, -20.2998046875, -17.12109375, -13.9423828125, -10.763671875, -7.5849609375, -4.40625, -1.2275390625, 1.951171875, 5.1298828125, 8.30859375, 11.4873046875, 14.666015625, 17.8447265625, 21.0234375, 24.2021484375, 27.380859375, 30.5595703125, 33.73828125, 36.9169921875, 40.095703125, 43.2744140625, 46.453125, 49.6318359375, 52.810546875, 55.9892578125, 59.16796875, 62.3466796875, 65.525390625, 68.7041015625, 71.8828125, 75.0615234375, 78.240234375, 81.4189453125, 84.59765625, 87.7763671875, 90.955078125, 94.1337890625, 97.3125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 10.0, 6.0, 5.0, 25.0, 13.0, 24.0, 27.0, 28.0, 27.0, 40.0, 39.0, 48.0, 50.0, 51.0, 55.0, 62.0, 55.0, 60.0, 75.0, 52.0, 45.0, 36.0, 38.0, 24.0, 17.0, 18.0, 14.0, 16.0, 16.0, 4.0, 4.0, 5.0, 8.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.75, -89.033203125, -85.31640625, -81.599609375, -77.8828125, -74.166015625, -70.44921875, -66.732421875, -63.015625, -59.298828125, -55.58203125, -51.865234375, -48.1484375, -44.431640625, -40.71484375, -36.998046875, -33.28125, -29.564453125, -25.84765625, -22.130859375, -18.4140625, -14.697265625, -10.98046875, -7.263671875, -3.546875, 0.169921875, 3.88671875, 7.603515625, 11.3203125, 15.037109375, 18.75390625, 22.470703125, 26.1875, 29.904296875, 33.62109375, 37.337890625, 41.0546875, 44.771484375, 48.48828125, 52.205078125, 55.921875, 59.638671875, 63.35546875, 67.072265625, 70.7890625, 74.505859375, 78.22265625, 81.939453125, 85.65625, 89.373046875, 93.08984375, 96.806640625, 100.5234375, 104.240234375, 107.95703125, 111.673828125, 115.390625, 119.107421875, 122.82421875, 126.541015625, 130.2578125, 133.974609375, 137.69140625, 141.408203125, 145.125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 10.0, 16.0, 13.0, 16.0, 39.0, 51.0, 76.0, 125.0, 188.0, 362.0, 548.0, 994.0, 2073.0, 4881.0, 13154.0, 49901.0, 534643.0, 378571.0, 42516.0, 11848.0, 4300.0, 1909.0, 984.0, 528.0, 300.0, 186.0, 113.0, 79.0, 47.0, 37.0, 17.0, 10.0, 9.0, 2.0, 3.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.1875, -70.25390625, -67.3203125, -64.38671875, -61.453125, -58.51953125, -55.5859375, -52.65234375, -49.71875, -46.78515625, -43.8515625, -40.91796875, -37.984375, -35.05078125, -32.1171875, -29.18359375, -26.25, -23.31640625, -20.3828125, -17.44921875, -14.515625, -11.58203125, -8.6484375, -5.71484375, -2.78125, 0.15234375, 3.0859375, 6.01953125, 8.953125, 11.88671875, 14.8203125, 17.75390625, 20.6875, 23.62109375, 26.5546875, 29.48828125, 32.421875, 35.35546875, 38.2890625, 41.22265625, 44.15625, 47.08984375, 50.0234375, 52.95703125, 55.890625, 58.82421875, 61.7578125, 64.69140625, 67.625, 70.55859375, 73.4921875, 76.42578125, 79.359375, 82.29296875, 85.2265625, 88.16015625, 91.09375, 94.02734375, 96.9609375, 99.89453125, 102.828125, 105.76171875, 108.6953125, 111.62890625, 114.5625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 7.0, 18.0, 16.0, 29.0, 47.0, 103.0, 193.0, 295.0, 127.0, 67.0, 40.0, 17.0, 16.0, 9.0, 8.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0165863037109375, -0.01607227325439453, -0.015558242797851562, -0.015044212341308594, -0.014530181884765625, -0.014016151428222656, -0.013502120971679688, -0.012988090515136719, -0.01247406005859375, -0.011960029602050781, -0.011445999145507812, -0.010931968688964844, -0.010417938232421875, -0.009903907775878906, -0.009389877319335938, -0.008875846862792969, -0.00836181640625, -0.007847785949707031, -0.0073337554931640625, -0.006819725036621094, -0.006305694580078125, -0.005791664123535156, -0.0052776336669921875, -0.004763603210449219, -0.00424957275390625, -0.0037355422973632812, -0.0032215118408203125, -0.0027074813842773438, -0.002193450927734375, -0.0016794204711914062, -0.0011653900146484375, -0.0006513595581054688, -0.0001373291015625, 0.00037670135498046875, 0.0008907318115234375, 0.0014047622680664062, 0.001918792724609375, 0.0024328231811523438, 0.0029468536376953125, 0.0034608840942382812, 0.00397491455078125, 0.004488945007324219, 0.0050029754638671875, 0.005517005920410156, 0.006031036376953125, 0.006545066833496094, 0.0070590972900390625, 0.007573127746582031, 0.008087158203125, 0.008601188659667969, 0.009115219116210938, 0.009629249572753906, 0.010143280029296875, 0.010657310485839844, 0.011171340942382812, 0.011685371398925781, 0.01219940185546875, 0.012713432312011719, 0.013227462768554688, 0.013741493225097656, 0.014255523681640625, 0.014769554138183594, 0.015283584594726562, 0.01579761505126953, 0.0163116455078125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 5.0, 7.0, 12.0, 21.0, 24.0, 28.0, 48.0, 67.0, 93.0, 117.0, 164.0, 197.0, 375.0, 510.0, 724.0, 1104.0, 1705.0, 2796.0, 4806.0, 8810.0, 18645.0, 47297.0, 195781.0, 598586.0, 102746.0, 32482.0, 13893.0, 6952.0, 3892.0, 2219.0, 1462.0, 900.0, 620.0, 397.0, 339.0, 166.0, 147.0, 91.0, 89.0, 64.0, 41.0, 35.0, 29.0, 18.0, 14.0, 7.0, 6.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-67.8125, -65.4990234375, -63.185546875, -60.8720703125, -58.55859375, -56.2451171875, -53.931640625, -51.6181640625, -49.3046875, -46.9912109375, -44.677734375, -42.3642578125, -40.05078125, -37.7373046875, -35.423828125, -33.1103515625, -30.796875, -28.4833984375, -26.169921875, -23.8564453125, -21.54296875, -19.2294921875, -16.916015625, -14.6025390625, -12.2890625, -9.9755859375, -7.662109375, -5.3486328125, -3.03515625, -0.7216796875, 1.591796875, 3.9052734375, 6.21875, 8.5322265625, 10.845703125, 13.1591796875, 15.47265625, 17.7861328125, 20.099609375, 22.4130859375, 24.7265625, 27.0400390625, 29.353515625, 31.6669921875, 33.98046875, 36.2939453125, 38.607421875, 40.9208984375, 43.234375, 45.5478515625, 47.861328125, 50.1748046875, 52.48828125, 54.8017578125, 57.115234375, 59.4287109375, 61.7421875, 64.0556640625, 66.369140625, 68.6826171875, 70.99609375, 73.3095703125, 75.623046875, 77.9365234375, 80.25]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 6.0, 3.0, 5.0, 3.0, 4.0, 12.0, 18.0, 7.0, 17.0, 31.0, 31.0, 43.0, 48.0, 87.0, 113.0, 157.0, 128.0, 67.0, 45.0, 31.0, 35.0, 22.0, 25.0, 14.0, 17.0, 3.0, 8.0, 2.0, 2.0, 6.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-94.6875, -92.0087890625, -89.330078125, -86.6513671875, -83.97265625, -81.2939453125, -78.615234375, -75.9365234375, -73.2578125, -70.5791015625, -67.900390625, -65.2216796875, -62.54296875, -59.8642578125, -57.185546875, -54.5068359375, -51.828125, -49.1494140625, -46.470703125, -43.7919921875, -41.11328125, -38.4345703125, -35.755859375, -33.0771484375, -30.3984375, -27.7197265625, -25.041015625, -22.3623046875, -19.68359375, -17.0048828125, -14.326171875, -11.6474609375, -8.96875, -6.2900390625, -3.611328125, -0.9326171875, 1.74609375, 4.4248046875, 7.103515625, 9.7822265625, 12.4609375, 15.1396484375, 17.818359375, 20.4970703125, 23.17578125, 25.8544921875, 28.533203125, 31.2119140625, 33.890625, 36.5693359375, 39.248046875, 41.9267578125, 44.60546875, 47.2841796875, 49.962890625, 52.6416015625, 55.3203125, 57.9990234375, 60.677734375, 63.3564453125, 66.03515625, 68.7138671875, 71.392578125, 74.0712890625, 76.75]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 12.0, 11.0, 23.0, 32.0, 46.0, 85.0, 164.0, 167.0, 164.0, 115.0, 80.0, 47.0, 33.0, 14.0, 7.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-516.238525390625, -481.251708984375, -446.264892578125, -411.278076171875, -376.291259765625, -341.304443359375, -306.317626953125, -271.330810546875, -236.343994140625, -201.357177734375, -166.370361328125, -131.383544921875, -96.396728515625, -61.409912109375, -26.423095703125, 8.563720703125, 43.550537109375, 78.537353515625, 113.524169921875, 148.510986328125, 183.497802734375, 218.484619140625, 253.471435546875, 288.458251953125, 323.445068359375, 358.431884765625, 393.418701171875, 428.405517578125, 463.392333984375, 498.379150390625, 533.365966796875, 568.352783203125, 603.339599609375, 638.326416015625, 673.313232421875, 708.300048828125, 743.286865234375, 778.273681640625, 813.260498046875, 848.247314453125, 883.234130859375, 918.220947265625, 953.207763671875, 988.194580078125, 1023.181396484375, 1058.168212890625, 1093.155029296875, 1128.141845703125, 1163.128662109375, 1198.115478515625, 1233.102294921875, 1268.089111328125, 1303.075927734375, 1338.062744140625, 1373.049560546875, 1408.036376953125, 1443.023193359375, 1478.010009765625, 1512.996826171875, 1547.983642578125, 1582.970458984375, 1617.957275390625, 1652.944091796875, 1687.930908203125, 1722.917724609375]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 2.0, 8.0, 12.0, 11.0, 17.0, 14.0, 18.0, 33.0, 21.0, 27.0, 35.0, 29.0, 38.0, 27.0, 37.0, 46.0, 41.0, 42.0, 42.0, 50.0, 41.0, 33.0, 41.0, 47.0, 34.0, 41.0, 33.0, 22.0, 23.0, 23.0, 18.0, 19.0, 17.0, 11.0, 10.0, 11.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-493.55401611328125, -478.4468994140625, -463.3397521972656, -448.23260498046875, -433.12548828125, -418.01837158203125, -402.9112243652344, -387.8040771484375, -372.69696044921875, -357.58984375, -342.4826965332031, -327.37554931640625, -312.2684326171875, -297.16131591796875, -282.0541687011719, -266.947021484375, -251.83990478515625, -236.73277282714844, -221.62564086914062, -206.5185089111328, -191.411376953125, -176.3042449951172, -161.19711303710938, -146.08998107910156, -130.98284912109375, -115.87571716308594, -100.76858520507812, -85.66145324707031, -70.5543212890625, -55.44718933105469, -40.340057373046875, -25.232925415039062, -10.125823974609375, 4.9813079833984375, 20.08843994140625, 35.19557189941406, 50.302703857421875, 65.40983581542969, 80.5169677734375, 95.62409973144531, 110.73123168945312, 125.83836364746094, 140.94549560546875, 156.05262756347656, 171.15975952148438, 186.2668914794922, 201.3740234375, 216.4811553955078, 231.58828735351562, 246.69541931152344, 261.80255126953125, 276.90966796875, 292.0168151855469, 307.12396240234375, 322.2310791015625, 337.33819580078125, 352.4453430175781, 367.552490234375, 382.65960693359375, 397.7667236328125, 412.8738708496094, 427.98101806640625, 443.088134765625, 458.19525146484375, 473.3023986816406]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 2.0, 3.0, 10.0, 6.0, 15.0, 23.0, 27.0, 42.0, 52.0, 81.0, 132.0, 177.0, 279.0, 416.0, 683.0, 1110.0, 2093.0, 5313.0, 34570.0, 4130373.0, 11645.0, 3270.0, 1571.0, 857.0, 524.0, 321.0, 234.0, 127.0, 104.0, 59.0, 40.0, 36.0, 16.0, 22.0, 15.0, 10.0, 5.0, 2.0, 5.0, 5.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-182.0, -176.689453125, -171.37890625, -166.068359375, -160.7578125, -155.447265625, -150.13671875, -144.826171875, -139.515625, -134.205078125, -128.89453125, -123.583984375, -118.2734375, -112.962890625, -107.65234375, -102.341796875, -97.03125, -91.720703125, -86.41015625, -81.099609375, -75.7890625, -70.478515625, -65.16796875, -59.857421875, -54.546875, -49.236328125, -43.92578125, -38.615234375, -33.3046875, -27.994140625, -22.68359375, -17.373046875, -12.0625, -6.751953125, -1.44140625, 3.869140625, 9.1796875, 14.490234375, 19.80078125, 25.111328125, 30.421875, 35.732421875, 41.04296875, 46.353515625, 51.6640625, 56.974609375, 62.28515625, 67.595703125, 72.90625, 78.216796875, 83.52734375, 88.837890625, 94.1484375, 99.458984375, 104.76953125, 110.080078125, 115.390625, 120.701171875, 126.01171875, 131.322265625, 136.6328125, 141.943359375, 147.25390625, 152.564453125, 157.875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 7.0, 11.0, 7.0, 12.0, 13.0, 12.0, 17.0, 23.0, 18.0, 30.0, 34.0, 40.0, 48.0, 38.0, 48.0, 52.0, 64.0, 48.0, 50.0, 53.0, 52.0, 47.0, 57.0, 41.0, 31.0, 25.0, 25.0, 15.0, 15.0, 15.0, 13.0, 4.0, 10.0, 5.0, 4.0, 3.0, 1.0, 3.0, 7.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.203125, -22.527587890625, -21.85205078125, -21.176513671875, -20.5009765625, -19.825439453125, -19.14990234375, -18.474365234375, -17.798828125, -17.123291015625, -16.44775390625, -15.772216796875, -15.0966796875, -14.421142578125, -13.74560546875, -13.070068359375, -12.39453125, -11.718994140625, -11.04345703125, -10.367919921875, -9.6923828125, -9.016845703125, -8.34130859375, -7.665771484375, -6.990234375, -6.314697265625, -5.63916015625, -4.963623046875, -4.2880859375, -3.612548828125, -2.93701171875, -2.261474609375, -1.5859375, -0.910400390625, -0.23486328125, 0.440673828125, 1.1162109375, 1.791748046875, 2.46728515625, 3.142822265625, 3.818359375, 4.493896484375, 5.16943359375, 5.844970703125, 6.5205078125, 7.196044921875, 7.87158203125, 8.547119140625, 9.22265625, 9.898193359375, 10.57373046875, 11.249267578125, 11.9248046875, 12.600341796875, 13.27587890625, 13.951416015625, 14.626953125, 15.302490234375, 15.97802734375, 16.653564453125, 17.3291015625, 18.004638671875, 18.68017578125, 19.355712890625, 20.03125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 10.0, 5.0, 6.0, 9.0, 11.0, 15.0, 19.0, 34.0, 39.0, 45.0, 61.0, 70.0, 100.0, 114.0, 159.0, 185.0, 274.0, 375.0, 624.0, 1127.0, 2390.0, 5829.0, 18197.0, 4084116.0, 62453.0, 10013.0, 3685.0, 1646.0, 787.0, 495.0, 335.0, 225.0, 183.0, 138.0, 105.0, 90.0, 63.0, 74.0, 38.0, 48.0, 17.0, 12.0, 14.0, 14.0, 12.0, 10.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-175.25, -170.060546875, -164.87109375, -159.681640625, -154.4921875, -149.302734375, -144.11328125, -138.923828125, -133.734375, -128.544921875, -123.35546875, -118.166015625, -112.9765625, -107.787109375, -102.59765625, -97.408203125, -92.21875, -87.029296875, -81.83984375, -76.650390625, -71.4609375, -66.271484375, -61.08203125, -55.892578125, -50.703125, -45.513671875, -40.32421875, -35.134765625, -29.9453125, -24.755859375, -19.56640625, -14.376953125, -9.1875, -3.998046875, 1.19140625, 6.380859375, 11.5703125, 16.759765625, 21.94921875, 27.138671875, 32.328125, 37.517578125, 42.70703125, 47.896484375, 53.0859375, 58.275390625, 63.46484375, 68.654296875, 73.84375, 79.033203125, 84.22265625, 89.412109375, 94.6015625, 99.791015625, 104.98046875, 110.169921875, 115.359375, 120.548828125, 125.73828125, 130.927734375, 136.1171875, 141.306640625, 146.49609375, 151.685546875, 156.875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 10.0, 4.0, 9.0, 25.0, 49.0, 3775.0, 121.0, 26.0, 14.0, 16.0, 2.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.328125, -22.298583984375, -21.26904296875, -20.239501953125, -19.2099609375, -18.180419921875, -17.15087890625, -16.121337890625, -15.091796875, -14.062255859375, -13.03271484375, -12.003173828125, -10.9736328125, -9.944091796875, -8.91455078125, -7.885009765625, -6.85546875, -5.825927734375, -4.79638671875, -3.766845703125, -2.7373046875, -1.707763671875, -0.67822265625, 0.351318359375, 1.380859375, 2.410400390625, 3.43994140625, 4.469482421875, 5.4990234375, 6.528564453125, 7.55810546875, 8.587646484375, 9.6171875, 10.646728515625, 11.67626953125, 12.705810546875, 13.7353515625, 14.764892578125, 15.79443359375, 16.823974609375, 17.853515625, 18.883056640625, 19.91259765625, 20.942138671875, 21.9716796875, 23.001220703125, 24.03076171875, 25.060302734375, 26.08984375, 27.119384765625, 28.14892578125, 29.178466796875, 30.2080078125, 31.237548828125, 32.26708984375, 33.296630859375, 34.326171875, 35.355712890625, 36.38525390625, 37.414794921875, 38.4443359375, 39.473876953125, 40.50341796875, 41.532958984375, 42.5625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 0.0, 1.0, 5.0, 6.0, 4.0, 9.0, 10.0, 21.0, 29.0, 28.0, 38.0, 28.0, 64.0, 59.0, 77.0, 63.0, 92.0, 87.0, 73.0, 55.0, 54.0, 39.0, 39.0, 27.0, 26.0, 17.0, 13.0, 8.0, 5.0, 5.0, 7.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-74.04110717773438, -72.18450927734375, -70.32791137695312, -68.47130584716797, -66.61470794677734, -64.75811004638672, -62.901512145996094, -61.0449104309082, -59.18831253051758, -57.33171463012695, -55.47511291503906, -53.61851501464844, -51.76191329956055, -49.90531539916992, -48.04871368408203, -46.192115783691406, -44.33551788330078, -42.478919982910156, -40.622318267822266, -38.76572036743164, -36.90911865234375, -35.052520751953125, -33.1959228515625, -31.33932113647461, -29.48271942138672, -27.62611961364746, -25.769519805908203, -23.912921905517578, -22.05632209777832, -20.199722290039062, -18.343122482299805, -16.486522674560547, -14.629924774169922, -12.773324966430664, -10.916726112365723, -9.060126304626465, -7.203526973724365, -5.346927642822266, -3.490327835083008, -1.6337289810180664, 0.2228708267211914, 2.079470157623291, 3.9360697269439697, 5.792669296264648, 7.649268627166748, 9.505867958068848, 11.362467765808105, 13.219066619873047, 15.075666427612305, 16.932266235351562, 18.78886604309082, 20.645465850830078, 22.502063751220703, 24.35866355895996, 26.21526336669922, 28.071861267089844, 29.928462982177734, 31.785062789916992, 33.64166259765625, 35.498260498046875, 37.354862213134766, 39.21146011352539, 41.06806182861328, 42.924659729003906, 44.78125762939453]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 5.0, 4.0, 8.0, 10.0, 9.0, 14.0, 15.0, 12.0, 21.0, 24.0, 33.0, 28.0, 21.0, 33.0, 36.0, 44.0, 32.0, 36.0, 32.0, 44.0, 36.0, 50.0, 56.0, 51.0, 44.0, 32.0, 40.0, 31.0, 25.0, 21.0, 24.0, 22.0, 18.0, 12.0, 15.0, 10.0, 12.0, 6.0, 6.0, 2.0, 5.0, 5.0, 7.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-46.47748947143555, -45.142860412597656, -43.8082275390625, -42.47359848022461, -41.13896942138672, -39.80434036254883, -38.46971130371094, -37.13507843017578, -35.80044937133789, -34.4658203125, -33.131187438964844, -31.796558380126953, -30.461929321289062, -29.127300262451172, -27.79266929626465, -26.458038330078125, -25.123409271240234, -23.788780212402344, -22.45414924621582, -21.119518280029297, -19.784889221191406, -18.450260162353516, -17.115629196166992, -15.780999183654785, -14.446369171142578, -13.111739158630371, -11.777109146118164, -10.442479133605957, -9.10784912109375, -7.773219108581543, -6.438589096069336, -5.103959083557129, -3.7693328857421875, -2.4347028732299805, -1.1000728607177734, 0.2345571517944336, 1.5691871643066406, 2.9038171768188477, 4.238447189331055, 5.573077201843262, 6.907707214355469, 8.242337226867676, 9.576967239379883, 10.91159725189209, 12.246227264404297, 13.580857276916504, 14.915487289428711, 16.250118255615234, 17.584747314453125, 18.919376373291016, 20.25400733947754, 21.588638305664062, 22.923267364501953, 24.257896423339844, 25.592527389526367, 26.92715835571289, 28.26178741455078, 29.596416473388672, 30.931047439575195, 32.26567840576172, 33.60030746459961, 34.9349365234375, 36.269569396972656, 37.60419845581055, 38.93882751464844]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 10.0, 11.0, 9.0, 10.0, 25.0, 49.0, 52.0, 90.0, 131.0, 204.0, 342.0, 547.0, 991.0, 1767.0, 3386.0, 6993.0, 14677.0, 34925.0, 91067.0, 269623.0, 391169.0, 141151.0, 51095.0, 20938.0, 9423.0, 4571.0, 2238.0, 1228.0, 728.0, 387.0, 243.0, 169.0, 88.0, 63.0, 42.0, 32.0, 23.0, 19.0, 12.0, 8.0, 8.0, 7.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-78.25, -76.0888671875, -73.927734375, -71.7666015625, -69.60546875, -67.4443359375, -65.283203125, -63.1220703125, -60.9609375, -58.7998046875, -56.638671875, -54.4775390625, -52.31640625, -50.1552734375, -47.994140625, -45.8330078125, -43.671875, -41.5107421875, -39.349609375, -37.1884765625, -35.02734375, -32.8662109375, -30.705078125, -28.5439453125, -26.3828125, -24.2216796875, -22.060546875, -19.8994140625, -17.73828125, -15.5771484375, -13.416015625, -11.2548828125, -9.09375, -6.9326171875, -4.771484375, -2.6103515625, -0.44921875, 1.7119140625, 3.873046875, 6.0341796875, 8.1953125, 10.3564453125, 12.517578125, 14.6787109375, 16.83984375, 19.0009765625, 21.162109375, 23.3232421875, 25.484375, 27.6455078125, 29.806640625, 31.9677734375, 34.12890625, 36.2900390625, 38.451171875, 40.6123046875, 42.7734375, 44.9345703125, 47.095703125, 49.2568359375, 51.41796875, 53.5791015625, 55.740234375, 57.9013671875, 60.0625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 9.0, 8.0, 14.0, 8.0, 11.0, 11.0, 19.0, 29.0, 25.0, 31.0, 35.0, 42.0, 47.0, 37.0, 48.0, 44.0, 56.0, 48.0, 62.0, 49.0, 61.0, 48.0, 53.0, 27.0, 29.0, 35.0, 19.0, 17.0, 15.0, 12.0, 10.0, 8.0, 3.0, 13.0, 4.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-28.5, -27.712646484375, -26.92529296875, -26.137939453125, -25.3505859375, -24.563232421875, -23.77587890625, -22.988525390625, -22.201171875, -21.413818359375, -20.62646484375, -19.839111328125, -19.0517578125, -18.264404296875, -17.47705078125, -16.689697265625, -15.90234375, -15.114990234375, -14.32763671875, -13.540283203125, -12.7529296875, -11.965576171875, -11.17822265625, -10.390869140625, -9.603515625, -8.816162109375, -8.02880859375, -7.241455078125, -6.4541015625, -5.666748046875, -4.87939453125, -4.092041015625, -3.3046875, -2.517333984375, -1.72998046875, -0.942626953125, -0.1552734375, 0.632080078125, 1.41943359375, 2.206787109375, 2.994140625, 3.781494140625, 4.56884765625, 5.356201171875, 6.1435546875, 6.930908203125, 7.71826171875, 8.505615234375, 9.29296875, 10.080322265625, 10.86767578125, 11.655029296875, 12.4423828125, 13.229736328125, 14.01708984375, 14.804443359375, 15.591796875, 16.379150390625, 17.16650390625, 17.953857421875, 18.7412109375, 19.528564453125, 20.31591796875, 21.103271484375, 21.890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 5.0, 1.0, 3.0, 2.0, 8.0, 8.0, 8.0, 20.0, 19.0, 36.0, 50.0, 106.0, 232.0, 452.0, 998.0, 2906.0, 10971.0, 68445.0, 715704.0, 216398.0, 24252.0, 5080.0, 1562.0, 593.0, 301.0, 172.0, 89.0, 48.0, 26.0, 25.0, 7.0, 11.0, 7.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-138.625, -133.626953125, -128.62890625, -123.630859375, -118.6328125, -113.634765625, -108.63671875, -103.638671875, -98.640625, -93.642578125, -88.64453125, -83.646484375, -78.6484375, -73.650390625, -68.65234375, -63.654296875, -58.65625, -53.658203125, -48.66015625, -43.662109375, -38.6640625, -33.666015625, -28.66796875, -23.669921875, -18.671875, -13.673828125, -8.67578125, -3.677734375, 1.3203125, 6.318359375, 11.31640625, 16.314453125, 21.3125, 26.310546875, 31.30859375, 36.306640625, 41.3046875, 46.302734375, 51.30078125, 56.298828125, 61.296875, 66.294921875, 71.29296875, 76.291015625, 81.2890625, 86.287109375, 91.28515625, 96.283203125, 101.28125, 106.279296875, 111.27734375, 116.275390625, 121.2734375, 126.271484375, 131.26953125, 136.267578125, 141.265625, 146.263671875, 151.26171875, 156.259765625, 161.2578125, 166.255859375, 171.25390625, 176.251953125, 181.25]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 7.0, 17.0, 13.0, 20.0, 20.0, 27.0, 17.0, 23.0, 36.0, 46.0, 55.0, 48.0, 57.0, 49.0, 66.0, 39.0, 48.0, 59.0, 44.0, 43.0, 42.0, 37.0, 38.0, 37.0, 24.0, 20.0, 16.0, 13.0, 12.0, 6.0, 6.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-163.875, -159.189453125, -154.50390625, -149.818359375, -145.1328125, -140.447265625, -135.76171875, -131.076171875, -126.390625, -121.705078125, -117.01953125, -112.333984375, -107.6484375, -102.962890625, -98.27734375, -93.591796875, -88.90625, -84.220703125, -79.53515625, -74.849609375, -70.1640625, -65.478515625, -60.79296875, -56.107421875, -51.421875, -46.736328125, -42.05078125, -37.365234375, -32.6796875, -27.994140625, -23.30859375, -18.623046875, -13.9375, -9.251953125, -4.56640625, 0.119140625, 4.8046875, 9.490234375, 14.17578125, 18.861328125, 23.546875, 28.232421875, 32.91796875, 37.603515625, 42.2890625, 46.974609375, 51.66015625, 56.345703125, 61.03125, 65.716796875, 70.40234375, 75.087890625, 79.7734375, 84.458984375, 89.14453125, 93.830078125, 98.515625, 103.201171875, 107.88671875, 112.572265625, 117.2578125, 121.943359375, 126.62890625, 131.314453125, 136.0]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 4.0, 11.0, 21.0, 39.0, 70.0, 137.0, 226.0, 443.0, 1127.0, 3046.0, 12545.0, 250359.0, 752442.0, 21107.0, 4334.0, 1453.0, 628.0, 234.0, 139.0, 73.0, 45.0, 23.0, 19.0, 18.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.125, -123.40234375, -118.6796875, -113.95703125, -109.234375, -104.51171875, -99.7890625, -95.06640625, -90.34375, -85.62109375, -80.8984375, -76.17578125, -71.453125, -66.73046875, -62.0078125, -57.28515625, -52.5625, -47.83984375, -43.1171875, -38.39453125, -33.671875, -28.94921875, -24.2265625, -19.50390625, -14.78125, -10.05859375, -5.3359375, -0.61328125, 4.109375, 8.83203125, 13.5546875, 18.27734375, 23.0, 27.72265625, 32.4453125, 37.16796875, 41.890625, 46.61328125, 51.3359375, 56.05859375, 60.78125, 65.50390625, 70.2265625, 74.94921875, 79.671875, 84.39453125, 89.1171875, 93.83984375, 98.5625, 103.28515625, 108.0078125, 112.73046875, 117.453125, 122.17578125, 126.8984375, 131.62109375, 136.34375, 141.06640625, 145.7890625, 150.51171875, 155.234375, 159.95703125, 164.6796875, 169.40234375, 174.125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 13.0, 18.0, 39.0, 63.0, 169.0, 260.0, 194.0, 110.0, 53.0, 27.0, 19.0, 12.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01540374755859375, -0.014933943748474121, -0.014464139938354492, -0.013994336128234863, -0.013524532318115234, -0.013054728507995605, -0.012584924697875977, -0.012115120887756348, -0.011645317077636719, -0.01117551326751709, -0.010705709457397461, -0.010235905647277832, -0.009766101837158203, -0.009296298027038574, -0.008826494216918945, -0.008356690406799316, -0.007886886596679688, -0.007417082786560059, -0.00694727897644043, -0.006477475166320801, -0.006007671356201172, -0.005537867546081543, -0.005068063735961914, -0.004598259925842285, -0.004128456115722656, -0.0036586523056030273, -0.0031888484954833984, -0.0027190446853637695, -0.0022492408752441406, -0.0017794370651245117, -0.0013096332550048828, -0.0008398294448852539, -0.000370025634765625, 9.97781753540039e-05, 0.0005695819854736328, 0.0010393857955932617, 0.0015091896057128906, 0.0019789934158325195, 0.0024487972259521484, 0.0029186010360717773, 0.0033884048461914062, 0.003858208656311035, 0.004328012466430664, 0.004797816276550293, 0.005267620086669922, 0.005737423896789551, 0.00620722770690918, 0.006677031517028809, 0.0071468353271484375, 0.007616639137268066, 0.008086442947387695, 0.008556246757507324, 0.009026050567626953, 0.009495854377746582, 0.009965658187866211, 0.01043546199798584, 0.010905265808105469, 0.011375069618225098, 0.011844873428344727, 0.012314677238464355, 0.012784481048583984, 0.013254284858703613, 0.013724088668823242, 0.014193892478942871, 0.0146636962890625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 7.0, 5.0, 8.0, 27.0, 27.0, 27.0, 39.0, 69.0, 112.0, 149.0, 225.0, 367.0, 648.0, 1070.0, 1976.0, 3770.0, 8766.0, 34970.0, 640560.0, 316716.0, 24449.0, 7248.0, 3161.0, 1651.0, 938.0, 557.0, 345.0, 216.0, 128.0, 102.0, 66.0, 44.0, 35.0, 15.0, 15.0, 19.0, 8.0, 5.0, 3.0, 4.0, 0.0, 4.0, 1.0, 5.0, 0.0, 1.0], "bins": [-146.5, -142.529296875, -138.55859375, -134.587890625, -130.6171875, -126.646484375, -122.67578125, -118.705078125, -114.734375, -110.763671875, -106.79296875, -102.822265625, -98.8515625, -94.880859375, -90.91015625, -86.939453125, -82.96875, -78.998046875, -75.02734375, -71.056640625, -67.0859375, -63.115234375, -59.14453125, -55.173828125, -51.203125, -47.232421875, -43.26171875, -39.291015625, -35.3203125, -31.349609375, -27.37890625, -23.408203125, -19.4375, -15.466796875, -11.49609375, -7.525390625, -3.5546875, 0.416015625, 4.38671875, 8.357421875, 12.328125, 16.298828125, 20.26953125, 24.240234375, 28.2109375, 32.181640625, 36.15234375, 40.123046875, 44.09375, 48.064453125, 52.03515625, 56.005859375, 59.9765625, 63.947265625, 67.91796875, 71.888671875, 75.859375, 79.830078125, 83.80078125, 87.771484375, 91.7421875, 95.712890625, 99.68359375, 103.654296875, 107.625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 8.0, 16.0, 21.0, 33.0, 48.0, 119.0, 205.0, 211.0, 141.0, 73.0, 34.0, 22.0, 17.0, 9.0, 6.0, 3.0, 10.0, 3.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.8125, -100.6494140625, -96.486328125, -92.3232421875, -88.16015625, -83.9970703125, -79.833984375, -75.6708984375, -71.5078125, -67.3447265625, -63.181640625, -59.0185546875, -54.85546875, -50.6923828125, -46.529296875, -42.3662109375, -38.203125, -34.0400390625, -29.876953125, -25.7138671875, -21.55078125, -17.3876953125, -13.224609375, -9.0615234375, -4.8984375, -0.7353515625, 3.427734375, 7.5908203125, 11.75390625, 15.9169921875, 20.080078125, 24.2431640625, 28.40625, 32.5693359375, 36.732421875, 40.8955078125, 45.05859375, 49.2216796875, 53.384765625, 57.5478515625, 61.7109375, 65.8740234375, 70.037109375, 74.2001953125, 78.36328125, 82.5263671875, 86.689453125, 90.8525390625, 95.015625, 99.1787109375, 103.341796875, 107.5048828125, 111.66796875, 115.8310546875, 119.994140625, 124.1572265625, 128.3203125, 132.4833984375, 136.646484375, 140.8095703125, 144.97265625, 149.1357421875, 153.298828125, 157.4619140625, 161.625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 9.0, 26.0, 62.0, 64.0, 117.0, 150.0, 162.0, 134.0, 103.0, 47.0, 41.0, 28.0, 18.0, 13.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-732.9332275390625, -696.023681640625, -659.1141967773438, -622.2046508789062, -585.2951049804688, -548.3856201171875, -511.47607421875, -474.5665283203125, -437.6570129394531, -400.74749755859375, -363.83795166015625, -326.9284362792969, -290.0189208984375, -253.109375, -216.19985961914062, -179.29031372070312, -142.38079833984375, -105.47126770019531, -68.5617446899414, -31.6522216796875, 5.2573089599609375, 42.166839599609375, 79.07635498046875, 115.98590087890625, 152.89541625976562, 189.80494689941406, 226.7144775390625, 263.6239929199219, 300.53350830078125, 337.44305419921875, 374.3525695800781, 411.2621154785156, 448.171630859375, 485.0811462402344, 521.9906616210938, 558.9002075195312, 595.8097534179688, 632.71923828125, 669.6287841796875, 706.538330078125, 743.4478759765625, 780.357421875, 817.2669067382812, 854.1764526367188, 891.0859985351562, 927.9954833984375, 964.905029296875, 1001.8145751953125, 1038.72412109375, 1075.6336669921875, 1112.543212890625, 1149.45263671875, 1186.3621826171875, 1223.271728515625, 1260.1812744140625, 1297.0908203125, 1334.000244140625, 1370.9097900390625, 1407.8193359375, 1444.728759765625, 1481.6383056640625, 1518.5478515625, 1555.4573974609375, 1592.366943359375, 1629.2764892578125]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 8.0, 9.0, 6.0, 5.0, 5.0, 7.0, 13.0, 15.0, 25.0, 22.0, 28.0, 27.0, 40.0, 32.0, 37.0, 34.0, 46.0, 40.0, 32.0, 47.0, 44.0, 61.0, 42.0, 42.0, 44.0, 35.0, 33.0, 29.0, 36.0, 24.0, 16.0, 25.0, 15.0, 13.0, 18.0, 8.0, 7.0, 9.0, 4.0, 6.0, 2.0, 5.0, 0.0, 5.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-598.069580078125, -578.2907104492188, -558.5118408203125, -538.7329711914062, -518.9541015625, -499.1752014160156, -479.39630126953125, -459.617431640625, -439.83856201171875, -420.0596923828125, -400.28082275390625, -380.5019226074219, -360.7230529785156, -340.9441833496094, -321.165283203125, -301.38641357421875, -281.6075439453125, -261.82867431640625, -242.04978942871094, -222.27090454101562, -202.49203491210938, -182.71316528320312, -162.9342803955078, -143.1553955078125, -123.37652587890625, -103.59764862060547, -83.81877136230469, -64.0398941040039, -44.261016845703125, -24.482139587402344, -4.7032623291015625, 15.07562255859375, 34.85455322265625, 54.63343048095703, 74.41230773925781, 94.1911849975586, 113.97006225585938, 133.74893188476562, 153.52781677246094, 173.30670166015625, 193.0855712890625, 212.86444091796875, 232.64332580566406, 252.42221069335938, 272.2010803222656, 291.9799499511719, 311.75885009765625, 331.5377197265625, 351.31658935546875, 371.095458984375, 390.87432861328125, 410.6532287597656, 430.4320983886719, 450.2109680175781, 469.9898681640625, 489.76873779296875, 509.547607421875, 529.3264770507812, 549.1053466796875, 568.8842163085938, 588.6630859375, 608.4420166015625, 628.2208862304688, 647.999755859375, 667.7786254882812]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 6.0, 5.0, 8.0, 9.0, 5.0, 16.0, 31.0, 47.0, 49.0, 69.0, 125.0, 201.0, 323.0, 594.0, 1281.0, 3415.0, 18817.0, 4138516.0, 24065.0, 3814.0, 1335.0, 627.0, 352.0, 210.0, 116.0, 83.0, 48.0, 33.0, 22.0, 19.0, 14.0, 13.0, 4.0, 6.0, 1.0, 2.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-187.5, -180.16015625, -172.8203125, -165.48046875, -158.140625, -150.80078125, -143.4609375, -136.12109375, -128.78125, -121.44140625, -114.1015625, -106.76171875, -99.421875, -92.08203125, -84.7421875, -77.40234375, -70.0625, -62.72265625, -55.3828125, -48.04296875, -40.703125, -33.36328125, -26.0234375, -18.68359375, -11.34375, -4.00390625, 3.3359375, 10.67578125, 18.015625, 25.35546875, 32.6953125, 40.03515625, 47.375, 54.71484375, 62.0546875, 69.39453125, 76.734375, 84.07421875, 91.4140625, 98.75390625, 106.09375, 113.43359375, 120.7734375, 128.11328125, 135.453125, 142.79296875, 150.1328125, 157.47265625, 164.8125, 172.15234375, 179.4921875, 186.83203125, 194.171875, 201.51171875, 208.8515625, 216.19140625, 223.53125, 230.87109375, 238.2109375, 245.55078125, 252.890625, 260.23046875, 267.5703125, 274.91015625, 282.25]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 11.0, 6.0, 6.0, 12.0, 18.0, 17.0, 13.0, 20.0, 33.0, 35.0, 35.0, 31.0, 52.0, 46.0, 59.0, 62.0, 64.0, 63.0, 66.0, 63.0, 59.0, 53.0, 33.0, 30.0, 19.0, 16.0, 16.0, 18.0, 7.0, 12.0, 8.0, 8.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.765625, -22.865478515625, -21.96533203125, -21.065185546875, -20.1650390625, -19.264892578125, -18.36474609375, -17.464599609375, -16.564453125, -15.664306640625, -14.76416015625, -13.864013671875, -12.9638671875, -12.063720703125, -11.16357421875, -10.263427734375, -9.36328125, -8.463134765625, -7.56298828125, -6.662841796875, -5.7626953125, -4.862548828125, -3.96240234375, -3.062255859375, -2.162109375, -1.261962890625, -0.36181640625, 0.538330078125, 1.4384765625, 2.338623046875, 3.23876953125, 4.138916015625, 5.0390625, 5.939208984375, 6.83935546875, 7.739501953125, 8.6396484375, 9.539794921875, 10.43994140625, 11.340087890625, 12.240234375, 13.140380859375, 14.04052734375, 14.940673828125, 15.8408203125, 16.740966796875, 17.64111328125, 18.541259765625, 19.44140625, 20.341552734375, 21.24169921875, 22.141845703125, 23.0419921875, 23.942138671875, 24.84228515625, 25.742431640625, 26.642578125, 27.542724609375, 28.44287109375, 29.343017578125, 30.2431640625, 31.143310546875, 32.04345703125, 32.943603515625, 33.84375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 9.0, 6.0, 13.0, 16.0, 27.0, 30.0, 43.0, 62.0, 93.0, 151.0, 216.0, 383.0, 577.0, 1568.0, 14662.0, 4164167.0, 9394.0, 1340.0, 559.0, 336.0, 202.0, 132.0, 93.0, 55.0, 37.0, 32.0, 28.0, 16.0, 8.0, 10.0, 8.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-511.25, -494.44921875, -477.6484375, -460.84765625, -444.046875, -427.24609375, -410.4453125, -393.64453125, -376.84375, -360.04296875, -343.2421875, -326.44140625, -309.640625, -292.83984375, -276.0390625, -259.23828125, -242.4375, -225.63671875, -208.8359375, -192.03515625, -175.234375, -158.43359375, -141.6328125, -124.83203125, -108.03125, -91.23046875, -74.4296875, -57.62890625, -40.828125, -24.02734375, -7.2265625, 9.57421875, 26.375, 43.17578125, 59.9765625, 76.77734375, 93.578125, 110.37890625, 127.1796875, 143.98046875, 160.78125, 177.58203125, 194.3828125, 211.18359375, 227.984375, 244.78515625, 261.5859375, 278.38671875, 295.1875, 311.98828125, 328.7890625, 345.58984375, 362.390625, 379.19140625, 395.9921875, 412.79296875, 429.59375, 446.39453125, 463.1953125, 479.99609375, 496.796875, 513.59765625, 530.3984375, 547.19921875, 564.0]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 15.0, 29.0, 359.0, 3594.0, 41.0, 16.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.5, -101.6806640625, -98.861328125, -96.0419921875, -93.22265625, -90.4033203125, -87.583984375, -84.7646484375, -81.9453125, -79.1259765625, -76.306640625, -73.4873046875, -70.66796875, -67.8486328125, -65.029296875, -62.2099609375, -59.390625, -56.5712890625, -53.751953125, -50.9326171875, -48.11328125, -45.2939453125, -42.474609375, -39.6552734375, -36.8359375, -34.0166015625, -31.197265625, -28.3779296875, -25.55859375, -22.7392578125, -19.919921875, -17.1005859375, -14.28125, -11.4619140625, -8.642578125, -5.8232421875, -3.00390625, -0.1845703125, 2.634765625, 5.4541015625, 8.2734375, 11.0927734375, 13.912109375, 16.7314453125, 19.55078125, 22.3701171875, 25.189453125, 28.0087890625, 30.828125, 33.6474609375, 36.466796875, 39.2861328125, 42.10546875, 44.9248046875, 47.744140625, 50.5634765625, 53.3828125, 56.2021484375, 59.021484375, 61.8408203125, 64.66015625, 67.4794921875, 70.298828125, 73.1181640625, 75.9375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 5.0, 6.0, 12.0, 14.0, 11.0, 29.0, 50.0, 75.0, 120.0, 162.0, 171.0, 133.0, 73.0, 46.0, 24.0, 23.0, 14.0, 11.0, 10.0, 5.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.30610656738281, -107.1808090209961, -100.05551147460938, -92.93020629882812, -85.8049087524414, -78.67961120605469, -71.55430603027344, -64.42900848388672, -57.3037109375, -50.17841339111328, -43.0531120300293, -35.92781066894531, -28.802513122558594, -21.677215576171875, -14.55191421508789, -7.426612854003906, -0.3013153076171875, 6.823984146118164, 13.949283599853516, 21.074583053588867, 28.19988250732422, 35.32518005371094, 42.45048141479492, 49.575782775878906, 56.701080322265625, 63.826377868652344, 70.95167541503906, 78.07698059082031, 85.20227813720703, 92.32757568359375, 99.452880859375, 106.57817840576172, 113.7034912109375, 120.82878875732422, 127.95408630371094, 135.0793914794922, 142.20468139648438, 149.32998657226562, 156.45529174804688, 163.58059692382812, 170.7058868408203, 177.83119201660156, 184.95648193359375, 192.081787109375, 199.20709228515625, 206.33238220214844, 213.4576873779297, 220.58297729492188, 227.70828247070312, 234.83358764648438, 241.95887756347656, 249.0841827392578, 256.20947265625, 263.33477783203125, 270.4600830078125, 277.58538818359375, 284.710693359375, 291.83599853515625, 298.9613037109375, 306.0865783691406, 313.2118835449219, 320.3371887207031, 327.4624938964844, 334.5877990722656, 341.71307373046875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 5.0, 9.0, 8.0, 7.0, 17.0, 18.0, 14.0, 15.0, 16.0, 15.0, 18.0, 23.0, 41.0, 30.0, 39.0, 36.0, 42.0, 36.0, 40.0, 40.0, 46.0, 49.0, 43.0, 35.0, 37.0, 34.0, 40.0, 30.0, 30.0, 21.0, 19.0, 23.0, 17.0, 22.0, 14.0, 13.0, 8.0, 5.0, 10.0, 9.0, 7.0, 3.0, 7.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-88.91793823242188, -86.1122817993164, -83.30662536621094, -80.5009765625, -77.69532012939453, -74.88966369628906, -72.0840072631836, -69.27835083007812, -66.47270202636719, -63.66704559326172, -60.861392974853516, -58.05573654174805, -55.250083923339844, -52.444427490234375, -49.638771057128906, -46.83311462402344, -44.02745819091797, -41.2218017578125, -38.4161491394043, -35.61049270629883, -32.804840087890625, -29.999183654785156, -27.193527221679688, -24.38787269592285, -21.582218170166016, -18.77656364440918, -15.970908164978027, -13.165252685546875, -10.359598159790039, -7.553943634033203, -4.748287200927734, -1.9426326751708984, 0.8630142211914062, 3.6686692237854004, 6.4743242263793945, 9.279979705810547, 12.085634231567383, 14.891288757324219, 17.696945190429688, 20.502599716186523, 23.30825424194336, 26.113908767700195, 28.91956329345703, 31.7252197265625, 34.53087615966797, 37.33652877807617, 40.14218521118164, 42.947837829589844, 45.75349426269531, 48.55915069580078, 51.364803314208984, 54.17045974731445, 56.976112365722656, 59.781768798828125, 62.587425231933594, 65.39308166503906, 68.19873046875, 71.00438690185547, 73.81004333496094, 76.61569213867188, 79.42134857177734, 82.22700500488281, 85.03266143798828, 87.83831787109375, 90.64397430419922]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 10.0, 4.0, 10.0, 11.0, 12.0, 13.0, 26.0, 33.0, 51.0, 93.0, 134.0, 181.0, 291.0, 483.0, 943.0, 1774.0, 3293.0, 6744.0, 14673.0, 34647.0, 93509.0, 300452.0, 388980.0, 123703.0, 43555.0, 18232.0, 8059.0, 3961.0, 1992.0, 1132.0, 605.0, 311.0, 192.0, 124.0, 111.0, 54.0, 46.0, 26.0, 25.0, 18.0, 22.0, 10.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-71.1875, -68.900390625, -66.61328125, -64.326171875, -62.0390625, -59.751953125, -57.46484375, -55.177734375, -52.890625, -50.603515625, -48.31640625, -46.029296875, -43.7421875, -41.455078125, -39.16796875, -36.880859375, -34.59375, -32.306640625, -30.01953125, -27.732421875, -25.4453125, -23.158203125, -20.87109375, -18.583984375, -16.296875, -14.009765625, -11.72265625, -9.435546875, -7.1484375, -4.861328125, -2.57421875, -0.287109375, 2.0, 4.287109375, 6.57421875, 8.861328125, 11.1484375, 13.435546875, 15.72265625, 18.009765625, 20.296875, 22.583984375, 24.87109375, 27.158203125, 29.4453125, 31.732421875, 34.01953125, 36.306640625, 38.59375, 40.880859375, 43.16796875, 45.455078125, 47.7421875, 50.029296875, 52.31640625, 54.603515625, 56.890625, 59.177734375, 61.46484375, 63.751953125, 66.0390625, 68.326171875, 70.61328125, 72.900390625, 75.1875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 7.0, 8.0, 11.0, 5.0, 6.0, 13.0, 20.0, 10.0, 18.0, 24.0, 20.0, 27.0, 31.0, 34.0, 45.0, 39.0, 44.0, 56.0, 43.0, 56.0, 58.0, 49.0, 45.0, 48.0, 29.0, 36.0, 33.0, 26.0, 24.0, 25.0, 22.0, 18.0, 11.0, 6.0, 7.0, 9.0, 9.0, 11.0, 4.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-32.1875, -31.134765625, -30.08203125, -29.029296875, -27.9765625, -26.923828125, -25.87109375, -24.818359375, -23.765625, -22.712890625, -21.66015625, -20.607421875, -19.5546875, -18.501953125, -17.44921875, -16.396484375, -15.34375, -14.291015625, -13.23828125, -12.185546875, -11.1328125, -10.080078125, -9.02734375, -7.974609375, -6.921875, -5.869140625, -4.81640625, -3.763671875, -2.7109375, -1.658203125, -0.60546875, 0.447265625, 1.5, 2.552734375, 3.60546875, 4.658203125, 5.7109375, 6.763671875, 7.81640625, 8.869140625, 9.921875, 10.974609375, 12.02734375, 13.080078125, 14.1328125, 15.185546875, 16.23828125, 17.291015625, 18.34375, 19.396484375, 20.44921875, 21.501953125, 22.5546875, 23.607421875, 24.66015625, 25.712890625, 26.765625, 27.818359375, 28.87109375, 29.923828125, 30.9765625, 32.029296875, 33.08203125, 34.134765625, 35.1875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 7.0, 6.0, 4.0, 13.0, 8.0, 13.0, 20.0, 18.0, 22.0, 52.0, 78.0, 145.0, 267.0, 734.0, 1935.0, 7295.0, 42182.0, 520325.0, 429347.0, 36277.0, 6710.0, 1819.0, 651.0, 251.0, 139.0, 77.0, 51.0, 36.0, 20.0, 14.0, 9.0, 13.0, 5.0, 6.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.125, -152.470703125, -146.81640625, -141.162109375, -135.5078125, -129.853515625, -124.19921875, -118.544921875, -112.890625, -107.236328125, -101.58203125, -95.927734375, -90.2734375, -84.619140625, -78.96484375, -73.310546875, -67.65625, -62.001953125, -56.34765625, -50.693359375, -45.0390625, -39.384765625, -33.73046875, -28.076171875, -22.421875, -16.767578125, -11.11328125, -5.458984375, 0.1953125, 5.849609375, 11.50390625, 17.158203125, 22.8125, 28.466796875, 34.12109375, 39.775390625, 45.4296875, 51.083984375, 56.73828125, 62.392578125, 68.046875, 73.701171875, 79.35546875, 85.009765625, 90.6640625, 96.318359375, 101.97265625, 107.626953125, 113.28125, 118.935546875, 124.58984375, 130.244140625, 135.8984375, 141.552734375, 147.20703125, 152.861328125, 158.515625, 164.169921875, 169.82421875, 175.478515625, 181.1328125, 186.787109375, 192.44140625, 198.095703125, 203.75]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 1.0, 1.0, 4.0, 3.0, 9.0, 8.0, 5.0, 15.0, 16.0, 24.0, 13.0, 23.0, 26.0, 33.0, 41.0, 45.0, 42.0, 39.0, 53.0, 40.0, 39.0, 53.0, 25.0, 48.0, 35.0, 30.0, 35.0, 41.0, 36.0, 20.0, 37.0, 34.0, 15.0, 20.0, 18.0, 17.0, 21.0, 4.0, 7.0, 3.0, 3.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-200.25, -194.654296875, -189.05859375, -183.462890625, -177.8671875, -172.271484375, -166.67578125, -161.080078125, -155.484375, -149.888671875, -144.29296875, -138.697265625, -133.1015625, -127.505859375, -121.91015625, -116.314453125, -110.71875, -105.123046875, -99.52734375, -93.931640625, -88.3359375, -82.740234375, -77.14453125, -71.548828125, -65.953125, -60.357421875, -54.76171875, -49.166015625, -43.5703125, -37.974609375, -32.37890625, -26.783203125, -21.1875, -15.591796875, -9.99609375, -4.400390625, 1.1953125, 6.791015625, 12.38671875, 17.982421875, 23.578125, 29.173828125, 34.76953125, 40.365234375, 45.9609375, 51.556640625, 57.15234375, 62.748046875, 68.34375, 73.939453125, 79.53515625, 85.130859375, 90.7265625, 96.322265625, 101.91796875, 107.513671875, 113.109375, 118.705078125, 124.30078125, 129.896484375, 135.4921875, 141.087890625, 146.68359375, 152.279296875, 157.875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 1.0, 3.0, 4.0, 8.0, 10.0, 11.0, 7.0, 17.0, 20.0, 22.0, 52.0, 63.0, 79.0, 144.0, 273.0, 582.0, 1443.0, 4376.0, 19057.0, 178855.0, 758326.0, 69901.0, 10507.0, 2782.0, 975.0, 452.0, 214.0, 129.0, 66.0, 55.0, 31.0, 33.0, 19.0, 14.0, 10.0, 10.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-75.5, -73.1640625, -70.828125, -68.4921875, -66.15625, -63.8203125, -61.484375, -59.1484375, -56.8125, -54.4765625, -52.140625, -49.8046875, -47.46875, -45.1328125, -42.796875, -40.4609375, -38.125, -35.7890625, -33.453125, -31.1171875, -28.78125, -26.4453125, -24.109375, -21.7734375, -19.4375, -17.1015625, -14.765625, -12.4296875, -10.09375, -7.7578125, -5.421875, -3.0859375, -0.75, 1.5859375, 3.921875, 6.2578125, 8.59375, 10.9296875, 13.265625, 15.6015625, 17.9375, 20.2734375, 22.609375, 24.9453125, 27.28125, 29.6171875, 31.953125, 34.2890625, 36.625, 38.9609375, 41.296875, 43.6328125, 45.96875, 48.3046875, 50.640625, 52.9765625, 55.3125, 57.6484375, 59.984375, 62.3203125, 64.65625, 66.9921875, 69.328125, 71.6640625, 74.0]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 2.0, 3.0, 13.0, 8.0, 9.0, 16.0, 18.0, 21.0, 32.0, 34.0, 54.0, 61.0, 86.0, 103.0, 87.0, 107.0, 62.0, 61.0, 52.0, 37.0, 28.0, 15.0, 8.0, 13.0, 12.0, 9.0, 6.0, 8.0, 5.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00539398193359375, -0.005216777324676514, -0.005039572715759277, -0.004862368106842041, -0.004685163497924805, -0.004507958889007568, -0.004330754280090332, -0.004153549671173096, -0.003976345062255859, -0.003799140453338623, -0.0036219358444213867, -0.0034447312355041504, -0.003267526626586914, -0.0030903220176696777, -0.0029131174087524414, -0.002735912799835205, -0.0025587081909179688, -0.0023815035820007324, -0.002204298973083496, -0.0020270943641662598, -0.0018498897552490234, -0.0016726851463317871, -0.0014954805374145508, -0.0013182759284973145, -0.0011410713195800781, -0.0009638667106628418, -0.0007866621017456055, -0.0006094574928283691, -0.0004322528839111328, -0.0002550482749938965, -7.784366607666016e-05, 9.936094284057617e-05, 0.0002765655517578125, 0.00045377016067504883, 0.0006309747695922852, 0.0008081793785095215, 0.0009853839874267578, 0.0011625885963439941, 0.0013397932052612305, 0.0015169978141784668, 0.0016942024230957031, 0.0018714070320129395, 0.0020486116409301758, 0.002225816249847412, 0.0024030208587646484, 0.0025802254676818848, 0.002757430076599121, 0.0029346346855163574, 0.0031118392944335938, 0.00328904390335083, 0.0034662485122680664, 0.0036434531211853027, 0.003820657730102539, 0.003997862339019775, 0.004175066947937012, 0.004352271556854248, 0.004529476165771484, 0.004706680774688721, 0.004883885383605957, 0.005061089992523193, 0.00523829460144043, 0.005415499210357666, 0.005592703819274902, 0.005769908428192139, 0.005947113037109375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 7.0, 14.0, 18.0, 37.0, 41.0, 93.0, 149.0, 258.0, 440.0, 763.0, 1577.0, 3343.0, 8140.0, 24970.0, 119441.0, 658168.0, 180508.0, 32663.0, 10105.0, 3988.0, 1813.0, 903.0, 456.0, 262.0, 150.0, 90.0, 48.0, 35.0, 26.0, 12.0, 14.0, 6.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.0, -46.923828125, -44.84765625, -42.771484375, -40.6953125, -38.619140625, -36.54296875, -34.466796875, -32.390625, -30.314453125, -28.23828125, -26.162109375, -24.0859375, -22.009765625, -19.93359375, -17.857421875, -15.78125, -13.705078125, -11.62890625, -9.552734375, -7.4765625, -5.400390625, -3.32421875, -1.248046875, 0.828125, 2.904296875, 4.98046875, 7.056640625, 9.1328125, 11.208984375, 13.28515625, 15.361328125, 17.4375, 19.513671875, 21.58984375, 23.666015625, 25.7421875, 27.818359375, 29.89453125, 31.970703125, 34.046875, 36.123046875, 38.19921875, 40.275390625, 42.3515625, 44.427734375, 46.50390625, 48.580078125, 50.65625, 52.732421875, 54.80859375, 56.884765625, 58.9609375, 61.037109375, 63.11328125, 65.189453125, 67.265625, 69.341796875, 71.41796875, 73.494140625, 75.5703125, 77.646484375, 79.72265625, 81.798828125, 83.875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 6.0, 8.0, 16.0, 22.0, 20.0, 24.0, 40.0, 63.0, 73.0, 87.0, 105.0, 110.0, 117.0, 78.0, 62.0, 50.0, 29.0, 17.0, 19.0, 13.0, 12.0, 12.0, 7.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.84375, -60.60205078125, -58.3603515625, -56.11865234375, -53.876953125, -51.63525390625, -49.3935546875, -47.15185546875, -44.91015625, -42.66845703125, -40.4267578125, -38.18505859375, -35.943359375, -33.70166015625, -31.4599609375, -29.21826171875, -26.9765625, -24.73486328125, -22.4931640625, -20.25146484375, -18.009765625, -15.76806640625, -13.5263671875, -11.28466796875, -9.04296875, -6.80126953125, -4.5595703125, -2.31787109375, -0.076171875, 2.16552734375, 4.4072265625, 6.64892578125, 8.890625, 11.13232421875, 13.3740234375, 15.61572265625, 17.857421875, 20.09912109375, 22.3408203125, 24.58251953125, 26.82421875, 29.06591796875, 31.3076171875, 33.54931640625, 35.791015625, 38.03271484375, 40.2744140625, 42.51611328125, 44.7578125, 46.99951171875, 49.2412109375, 51.48291015625, 53.724609375, 55.96630859375, 58.2080078125, 60.44970703125, 62.69140625, 64.93310546875, 67.1748046875, 69.41650390625, 71.658203125, 73.89990234375, 76.1416015625, 78.38330078125, 80.625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 13.0, 65.0, 346.0, 457.0, 107.0, 21.0, 4.0, 4.0, 0.0, 1.0], "bins": [-7298.294921875, -7170.47119140625, -7042.64794921875, -6914.82421875, -6787.00048828125, -6659.17724609375, -6531.353515625, -6403.52978515625, -6275.70654296875, -6147.8828125, -6020.0595703125, -5892.23583984375, -5764.412109375, -5636.5888671875, -5508.76513671875, -5380.94140625, -5253.1181640625, -5125.29443359375, -4997.47119140625, -4869.6474609375, -4741.82373046875, -4614.00048828125, -4486.1767578125, -4358.35302734375, -4230.529296875, -4102.70556640625, -3974.882080078125, -3847.05859375, -3719.235107421875, -3591.41162109375, -3463.587890625, -3335.764404296875, -3207.94091796875, -3080.117431640625, -2952.293701171875, -2824.47021484375, -2696.646728515625, -2568.8232421875, -2440.99951171875, -2313.176025390625, -2185.3525390625, -2057.529052734375, -1929.7054443359375, -1801.8818359375, -1674.058349609375, -1546.2347412109375, -1418.4111328125, -1290.587646484375, -1162.763916015625, -1034.9403076171875, -907.1168212890625, -779.293212890625, -651.4696655273438, -523.6461181640625, -395.822509765625, -267.99896240234375, -140.1754150390625, -12.351852416992188, 115.47171020507812, 243.2952880859375, 371.11883544921875, 498.9423828125, 626.7659912109375, 754.5895385742188, 882.4130859375]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 9.0, 11.0, 11.0, 17.0, 20.0, 30.0, 24.0, 42.0, 56.0, 49.0, 60.0, 73.0, 64.0, 80.0, 83.0, 66.0, 55.0, 48.0, 34.0, 38.0, 31.0, 21.0, 21.0, 15.0, 12.0, 3.0, 5.0, 8.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1207.50634765625, -1167.396484375, -1127.28662109375, -1087.1766357421875, -1047.0667724609375, -1006.9569091796875, -966.8470458984375, -926.7371215820312, -886.627197265625, -846.517333984375, -806.4074096679688, -766.2975463867188, -726.1876220703125, -686.0777587890625, -645.9678955078125, -605.8579711914062, -565.7481079101562, -525.6382446289062, -485.5283203125, -445.41845703125, -405.30853271484375, -365.19866943359375, -325.0887756347656, -284.9788818359375, -244.86898803710938, -204.75909423828125, -164.64920043945312, -124.53932189941406, -84.42942810058594, -44.31953430175781, -4.20965576171875, 35.900238037109375, 76.0101318359375, 116.12002563476562, 156.22991943359375, 196.3397979736328, 236.44969177246094, 276.5595703125, 316.6694641113281, 356.77935791015625, 396.8892517089844, 436.9991455078125, 477.1090393066406, 517.2189331054688, 557.3287963867188, 597.438720703125, 637.548583984375, 677.658447265625, 717.7683715820312, 757.8782348632812, 797.9881591796875, 838.0980224609375, 878.2079467773438, 918.3178100585938, 958.427734375, 998.53759765625, 1038.6474609375, 1078.75732421875, 1118.8671875, 1158.9771728515625, 1199.0870361328125, 1239.1968994140625, 1279.3067626953125, 1319.416748046875, 1359.526611328125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 4.0, 5.0, 8.0, 8.0, 8.0, 12.0, 28.0, 29.0, 27.0, 42.0, 88.0, 106.0, 130.0, 227.0, 400.0, 663.0, 1268.0, 2707.0, 8324.0, 4036006.0, 131385.0, 7371.0, 2449.0, 1214.0, 667.0, 396.0, 199.0, 149.0, 101.0, 64.0, 55.0, 35.0, 27.0, 25.0, 15.0, 6.0, 13.0, 4.0, 5.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-116.75, -113.09765625, -109.4453125, -105.79296875, -102.140625, -98.48828125, -94.8359375, -91.18359375, -87.53125, -83.87890625, -80.2265625, -76.57421875, -72.921875, -69.26953125, -65.6171875, -61.96484375, -58.3125, -54.66015625, -51.0078125, -47.35546875, -43.703125, -40.05078125, -36.3984375, -32.74609375, -29.09375, -25.44140625, -21.7890625, -18.13671875, -14.484375, -10.83203125, -7.1796875, -3.52734375, 0.125, 3.77734375, 7.4296875, 11.08203125, 14.734375, 18.38671875, 22.0390625, 25.69140625, 29.34375, 32.99609375, 36.6484375, 40.30078125, 43.953125, 47.60546875, 51.2578125, 54.91015625, 58.5625, 62.21484375, 65.8671875, 69.51953125, 73.171875, 76.82421875, 80.4765625, 84.12890625, 87.78125, 91.43359375, 95.0859375, 98.73828125, 102.390625, 106.04296875, 109.6953125, 113.34765625, 117.0]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 8.0, 3.0, 6.0, 10.0, 5.0, 9.0, 19.0, 19.0, 26.0, 39.0, 45.0, 45.0, 71.0, 70.0, 95.0, 80.0, 104.0, 72.0, 62.0, 49.0, 38.0, 32.0, 23.0, 26.0, 16.0, 14.0, 9.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.1875, -46.365234375, -44.54296875, -42.720703125, -40.8984375, -39.076171875, -37.25390625, -35.431640625, -33.609375, -31.787109375, -29.96484375, -28.142578125, -26.3203125, -24.498046875, -22.67578125, -20.853515625, -19.03125, -17.208984375, -15.38671875, -13.564453125, -11.7421875, -9.919921875, -8.09765625, -6.275390625, -4.453125, -2.630859375, -0.80859375, 1.013671875, 2.8359375, 4.658203125, 6.48046875, 8.302734375, 10.125, 11.947265625, 13.76953125, 15.591796875, 17.4140625, 19.236328125, 21.05859375, 22.880859375, 24.703125, 26.525390625, 28.34765625, 30.169921875, 31.9921875, 33.814453125, 35.63671875, 37.458984375, 39.28125, 41.103515625, 42.92578125, 44.748046875, 46.5703125, 48.392578125, 50.21484375, 52.037109375, 53.859375, 55.681640625, 57.50390625, 59.326171875, 61.1484375, 62.970703125, 64.79296875, 66.615234375, 68.4375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 5.0, 7.0, 8.0, 11.0, 12.0, 16.0, 26.0, 42.0, 34.0, 43.0, 66.0, 76.0, 127.0, 211.0, 356.0, 912.0, 3479.0, 72077.0, 4109899.0, 4679.0, 1050.0, 405.0, 227.0, 132.0, 92.0, 77.0, 42.0, 38.0, 30.0, 21.0, 13.0, 19.0, 12.0, 6.0, 10.0, 6.0, 3.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-225.875, -218.107421875, -210.33984375, -202.572265625, -194.8046875, -187.037109375, -179.26953125, -171.501953125, -163.734375, -155.966796875, -148.19921875, -140.431640625, -132.6640625, -124.896484375, -117.12890625, -109.361328125, -101.59375, -93.826171875, -86.05859375, -78.291015625, -70.5234375, -62.755859375, -54.98828125, -47.220703125, -39.453125, -31.685546875, -23.91796875, -16.150390625, -8.3828125, -0.615234375, 7.15234375, 14.919921875, 22.6875, 30.455078125, 38.22265625, 45.990234375, 53.7578125, 61.525390625, 69.29296875, 77.060546875, 84.828125, 92.595703125, 100.36328125, 108.130859375, 115.8984375, 123.666015625, 131.43359375, 139.201171875, 146.96875, 154.736328125, 162.50390625, 170.271484375, 178.0390625, 185.806640625, 193.57421875, 201.341796875, 209.109375, 216.876953125, 224.64453125, 232.412109375, 240.1796875, 247.947265625, 255.71484375, 263.482421875, 271.25]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 4.0, 9.0, 28.0, 3801.0, 178.0, 26.0, 9.0, 9.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-55.28125, -53.929443359375, -52.57763671875, -51.225830078125, -49.8740234375, -48.522216796875, -47.17041015625, -45.818603515625, -44.466796875, -43.114990234375, -41.76318359375, -40.411376953125, -39.0595703125, -37.707763671875, -36.35595703125, -35.004150390625, -33.65234375, -32.300537109375, -30.94873046875, -29.596923828125, -28.2451171875, -26.893310546875, -25.54150390625, -24.189697265625, -22.837890625, -21.486083984375, -20.13427734375, -18.782470703125, -17.4306640625, -16.078857421875, -14.72705078125, -13.375244140625, -12.0234375, -10.671630859375, -9.31982421875, -7.968017578125, -6.6162109375, -5.264404296875, -3.91259765625, -2.560791015625, -1.208984375, 0.142822265625, 1.49462890625, 2.846435546875, 4.1982421875, 5.550048828125, 6.90185546875, 8.253662109375, 9.60546875, 10.957275390625, 12.30908203125, 13.660888671875, 15.0126953125, 16.364501953125, 17.71630859375, 19.068115234375, 20.419921875, 21.771728515625, 23.12353515625, 24.475341796875, 25.8271484375, 27.178955078125, 28.53076171875, 29.882568359375, 31.234375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 7.0, 6.0, 5.0, 17.0, 37.0, 59.0, 148.0, 242.0, 245.0, 120.0, 67.0, 28.0, 18.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.51009368896484, -114.68014526367188, -109.85018920898438, -105.0202407836914, -100.19029235839844, -95.36033630371094, -90.53038787841797, -85.700439453125, -80.8704833984375, -76.04053497314453, -71.21057891845703, -66.38063049316406, -61.55067825317383, -56.720726013183594, -51.890777587890625, -47.06082534790039, -42.230873107910156, -37.40092086791992, -32.57096862792969, -27.74102020263672, -22.911067962646484, -18.08111572265625, -13.251165390014648, -8.421215057373047, -3.5912628173828125, 1.2386884689331055, 6.068639755249023, 10.898591041564941, 15.72854232788086, 20.558494567871094, 25.388444900512695, 30.218395233154297, 35.04833984375, 39.878292083740234, 44.70824432373047, 49.53819274902344, 54.36814498901367, 59.198097229003906, 64.02804565429688, 68.85800170898438, 73.68795013427734, 78.51789855957031, 83.34785461425781, 88.17780303955078, 93.00775146484375, 97.83770751953125, 102.66765594482422, 107.49760437011719, 112.32756042480469, 117.15750885009766, 121.98746490478516, 126.81741333007812, 131.64736938476562, 136.47732543945312, 141.30726623535156, 146.13722229003906, 150.9671630859375, 155.797119140625, 160.62705993652344, 165.45701599121094, 170.28697204589844, 175.11691284179688, 179.94686889648438, 184.77682495117188, 189.60678100585938]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 5.0, 3.0, 3.0, 6.0, 6.0, 7.0, 9.0, 12.0, 8.0, 7.0, 13.0, 18.0, 14.0, 25.0, 26.0, 33.0, 28.0, 42.0, 23.0, 28.0, 37.0, 41.0, 48.0, 46.0, 48.0, 45.0, 58.0, 33.0, 42.0, 32.0, 18.0, 46.0, 28.0, 25.0, 22.0, 22.0, 22.0, 11.0, 14.0, 14.0, 5.0, 8.0, 7.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-34.15808868408203, -32.95467758178711, -31.751264572143555, -30.547853469848633, -29.344440460205078, -28.141029357910156, -26.937618255615234, -25.734207153320312, -24.530794143676758, -23.327383041381836, -22.12397003173828, -20.92055892944336, -19.717147827148438, -18.513734817504883, -17.31032371520996, -16.106910705566406, -14.903499603271484, -13.700087547302246, -12.496675491333008, -11.293264389038086, -10.089852333068848, -8.88644027709961, -7.683028697967529, -6.479617118835449, -5.276205062866211, -4.072793006896973, -2.8693814277648926, -1.6659696102142334, -0.4625577926635742, 0.7408542633056641, 1.9442658424377441, 3.147677421569824, 4.3510894775390625, 5.554501533508301, 6.757913112640381, 7.961324691772461, 9.1647367477417, 10.368148803710938, 11.57155990600586, 12.774971961975098, 13.978384017944336, 15.181796073913574, 16.385208129882812, 17.588619232177734, 18.792030334472656, 19.99544334411621, 21.198854446411133, 22.402267456054688, 23.60567855834961, 24.80908966064453, 26.012502670288086, 27.215913772583008, 28.419326782226562, 29.622737884521484, 30.826148986816406, 32.02956008911133, 33.23297119140625, 34.43638229370117, 35.639793395996094, 36.84320831298828, 38.0466194152832, 39.250030517578125, 40.45344161987305, 41.65685272216797, 42.860267639160156]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 7.0, 4.0, 15.0, 13.0, 20.0, 21.0, 21.0, 57.0, 64.0, 97.0, 134.0, 199.0, 282.0, 419.0, 727.0, 1140.0, 2001.0, 3451.0, 6917.0, 14613.0, 35151.0, 104925.0, 426868.0, 316143.0, 80659.0, 28677.0, 12236.0, 5813.0, 3154.0, 1768.0, 1066.0, 650.0, 398.0, 232.0, 197.0, 112.0, 81.0, 66.0, 49.0, 37.0, 15.0, 21.0, 12.0, 15.0, 8.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-85.6875, -82.7216796875, -79.755859375, -76.7900390625, -73.82421875, -70.8583984375, -67.892578125, -64.9267578125, -61.9609375, -58.9951171875, -56.029296875, -53.0634765625, -50.09765625, -47.1318359375, -44.166015625, -41.2001953125, -38.234375, -35.2685546875, -32.302734375, -29.3369140625, -26.37109375, -23.4052734375, -20.439453125, -17.4736328125, -14.5078125, -11.5419921875, -8.576171875, -5.6103515625, -2.64453125, 0.3212890625, 3.287109375, 6.2529296875, 9.21875, 12.1845703125, 15.150390625, 18.1162109375, 21.08203125, 24.0478515625, 27.013671875, 29.9794921875, 32.9453125, 35.9111328125, 38.876953125, 41.8427734375, 44.80859375, 47.7744140625, 50.740234375, 53.7060546875, 56.671875, 59.6376953125, 62.603515625, 65.5693359375, 68.53515625, 71.5009765625, 74.466796875, 77.4326171875, 80.3984375, 83.3642578125, 86.330078125, 89.2958984375, 92.26171875, 95.2275390625, 98.193359375, 101.1591796875, 104.125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 6.0, 5.0, 4.0, 8.0, 5.0, 11.0, 18.0, 17.0, 29.0, 31.0, 38.0, 38.0, 45.0, 74.0, 72.0, 86.0, 71.0, 85.0, 71.0, 53.0, 54.0, 42.0, 32.0, 16.0, 28.0, 23.0, 12.0, 8.0, 8.0, 2.0, 8.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.78125, -41.08642578125, -39.3916015625, -37.69677734375, -36.001953125, -34.30712890625, -32.6123046875, -30.91748046875, -29.22265625, -27.52783203125, -25.8330078125, -24.13818359375, -22.443359375, -20.74853515625, -19.0537109375, -17.35888671875, -15.6640625, -13.96923828125, -12.2744140625, -10.57958984375, -8.884765625, -7.18994140625, -5.4951171875, -3.80029296875, -2.10546875, -0.41064453125, 1.2841796875, 2.97900390625, 4.673828125, 6.36865234375, 8.0634765625, 9.75830078125, 11.453125, 13.14794921875, 14.8427734375, 16.53759765625, 18.232421875, 19.92724609375, 21.6220703125, 23.31689453125, 25.01171875, 26.70654296875, 28.4013671875, 30.09619140625, 31.791015625, 33.48583984375, 35.1806640625, 36.87548828125, 38.5703125, 40.26513671875, 41.9599609375, 43.65478515625, 45.349609375, 47.04443359375, 48.7392578125, 50.43408203125, 52.12890625, 53.82373046875, 55.5185546875, 57.21337890625, 58.908203125, 60.60302734375, 62.2978515625, 63.99267578125, 65.6875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 9.0, 9.0, 13.0, 16.0, 29.0, 41.0, 50.0, 59.0, 104.0, 173.0, 261.0, 446.0, 922.0, 1887.0, 4382.0, 12278.0, 50694.0, 504362.0, 407534.0, 45841.0, 11563.0, 4080.0, 1752.0, 860.0, 439.0, 264.0, 149.0, 100.0, 57.0, 40.0, 24.0, 20.0, 18.0, 24.0, 5.0, 10.0, 8.0, 4.0, 6.0, 2.0, 2.0, 6.0, 2.0, 3.0, 2.0, 1.0, 3.0], "bins": [-168.75, -163.923828125, -159.09765625, -154.271484375, -149.4453125, -144.619140625, -139.79296875, -134.966796875, -130.140625, -125.314453125, -120.48828125, -115.662109375, -110.8359375, -106.009765625, -101.18359375, -96.357421875, -91.53125, -86.705078125, -81.87890625, -77.052734375, -72.2265625, -67.400390625, -62.57421875, -57.748046875, -52.921875, -48.095703125, -43.26953125, -38.443359375, -33.6171875, -28.791015625, -23.96484375, -19.138671875, -14.3125, -9.486328125, -4.66015625, 0.166015625, 4.9921875, 9.818359375, 14.64453125, 19.470703125, 24.296875, 29.123046875, 33.94921875, 38.775390625, 43.6015625, 48.427734375, 53.25390625, 58.080078125, 62.90625, 67.732421875, 72.55859375, 77.384765625, 82.2109375, 87.037109375, 91.86328125, 96.689453125, 101.515625, 106.341796875, 111.16796875, 115.994140625, 120.8203125, 125.646484375, 130.47265625, 135.298828125, 140.125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 10.0, 4.0, 9.0, 13.0, 10.0, 14.0, 18.0, 18.0, 27.0, 23.0, 28.0, 29.0, 35.0, 36.0, 33.0, 33.0, 43.0, 38.0, 32.0, 46.0, 41.0, 39.0, 40.0, 39.0, 38.0, 33.0, 37.0, 32.0, 28.0, 27.0, 17.0, 13.0, 18.0, 9.0, 11.0, 13.0, 11.0, 6.0, 8.0, 5.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-151.375, -146.646484375, -141.91796875, -137.189453125, -132.4609375, -127.732421875, -123.00390625, -118.275390625, -113.546875, -108.818359375, -104.08984375, -99.361328125, -94.6328125, -89.904296875, -85.17578125, -80.447265625, -75.71875, -70.990234375, -66.26171875, -61.533203125, -56.8046875, -52.076171875, -47.34765625, -42.619140625, -37.890625, -33.162109375, -28.43359375, -23.705078125, -18.9765625, -14.248046875, -9.51953125, -4.791015625, -0.0625, 4.666015625, 9.39453125, 14.123046875, 18.8515625, 23.580078125, 28.30859375, 33.037109375, 37.765625, 42.494140625, 47.22265625, 51.951171875, 56.6796875, 61.408203125, 66.13671875, 70.865234375, 75.59375, 80.322265625, 85.05078125, 89.779296875, 94.5078125, 99.236328125, 103.96484375, 108.693359375, 113.421875, 118.150390625, 122.87890625, 127.607421875, 132.3359375, 137.064453125, 141.79296875, 146.521484375, 151.25]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 4.0, 18.0, 17.0, 25.0, 31.0, 52.0, 74.0, 154.0, 319.0, 633.0, 1737.0, 5511.0, 28594.0, 720857.0, 266098.0, 17854.0, 4023.0, 1373.0, 551.0, 274.0, 130.0, 72.0, 44.0, 26.0, 22.0, 15.0, 8.0, 6.0, 5.0, 5.0, 1.0, 3.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-78.9375, -75.6318359375, -72.326171875, -69.0205078125, -65.71484375, -62.4091796875, -59.103515625, -55.7978515625, -52.4921875, -49.1865234375, -45.880859375, -42.5751953125, -39.26953125, -35.9638671875, -32.658203125, -29.3525390625, -26.046875, -22.7412109375, -19.435546875, -16.1298828125, -12.82421875, -9.5185546875, -6.212890625, -2.9072265625, 0.3984375, 3.7041015625, 7.009765625, 10.3154296875, 13.62109375, 16.9267578125, 20.232421875, 23.5380859375, 26.84375, 30.1494140625, 33.455078125, 36.7607421875, 40.06640625, 43.3720703125, 46.677734375, 49.9833984375, 53.2890625, 56.5947265625, 59.900390625, 63.2060546875, 66.51171875, 69.8173828125, 73.123046875, 76.4287109375, 79.734375, 83.0400390625, 86.345703125, 89.6513671875, 92.95703125, 96.2626953125, 99.568359375, 102.8740234375, 106.1796875, 109.4853515625, 112.791015625, 116.0966796875, 119.40234375, 122.7080078125, 126.013671875, 129.3193359375, 132.625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0, 6.0, 9.0, 9.0, 7.0, 8.0, 15.0, 21.0, 21.0, 37.0, 39.0, 58.0, 99.0, 191.0, 162.0, 87.0, 57.0, 36.0, 25.0, 18.0, 17.0, 11.0, 14.0, 5.0, 7.0, 7.0, 6.0, 1.0, 4.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0111236572265625, -0.010764241218566895, -0.010404825210571289, -0.010045409202575684, -0.009685993194580078, -0.009326577186584473, -0.008967161178588867, -0.008607745170593262, -0.008248329162597656, -0.00788891315460205, -0.007529497146606445, -0.00717008113861084, -0.006810665130615234, -0.006451249122619629, -0.0060918331146240234, -0.005732417106628418, -0.0053730010986328125, -0.005013585090637207, -0.0046541690826416016, -0.004294753074645996, -0.003935337066650391, -0.003575921058654785, -0.0032165050506591797, -0.0028570890426635742, -0.0024976730346679688, -0.0021382570266723633, -0.0017788410186767578, -0.0014194250106811523, -0.0010600090026855469, -0.0007005929946899414, -0.00034117698669433594, 1.823902130126953e-05, 0.000377655029296875, 0.0007370710372924805, 0.001096487045288086, 0.0014559030532836914, 0.0018153190612792969, 0.0021747350692749023, 0.002534151077270508, 0.0028935670852661133, 0.0032529830932617188, 0.0036123991012573242, 0.00397181510925293, 0.004331231117248535, 0.004690647125244141, 0.005050063133239746, 0.0054094791412353516, 0.005768895149230957, 0.0061283111572265625, 0.006487727165222168, 0.0068471431732177734, 0.007206559181213379, 0.007565975189208984, 0.00792539119720459, 0.008284807205200195, 0.0086442232131958, 0.009003639221191406, 0.009363055229187012, 0.009722471237182617, 0.010081887245178223, 0.010441303253173828, 0.010800719261169434, 0.011160135269165039, 0.011519551277160645, 0.01187896728515625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 9.0, 9.0, 7.0, 15.0, 21.0, 41.0, 51.0, 78.0, 149.0, 258.0, 513.0, 1105.0, 2258.0, 6135.0, 21569.0, 214086.0, 746465.0, 40301.0, 9297.0, 3328.0, 1403.0, 679.0, 312.0, 194.0, 89.0, 63.0, 32.0, 23.0, 23.0, 14.0, 7.0, 6.0, 2.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-136.875, -133.46875, -130.0625, -126.65625, -123.25, -119.84375, -116.4375, -113.03125, -109.625, -106.21875, -102.8125, -99.40625, -96.0, -92.59375, -89.1875, -85.78125, -82.375, -78.96875, -75.5625, -72.15625, -68.75, -65.34375, -61.9375, -58.53125, -55.125, -51.71875, -48.3125, -44.90625, -41.5, -38.09375, -34.6875, -31.28125, -27.875, -24.46875, -21.0625, -17.65625, -14.25, -10.84375, -7.4375, -4.03125, -0.625, 2.78125, 6.1875, 9.59375, 13.0, 16.40625, 19.8125, 23.21875, 26.625, 30.03125, 33.4375, 36.84375, 40.25, 43.65625, 47.0625, 50.46875, 53.875, 57.28125, 60.6875, 64.09375, 67.5, 70.90625, 74.3125, 77.71875, 81.125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 12.0, 9.0, 7.0, 9.0, 13.0, 11.0, 28.0, 25.0, 41.0, 79.0, 95.0, 127.0, 151.0, 118.0, 72.0, 59.0, 41.0, 28.0, 13.0, 16.0, 17.0, 6.0, 4.0, 10.0, 5.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.5, -55.0263671875, -52.552734375, -50.0791015625, -47.60546875, -45.1318359375, -42.658203125, -40.1845703125, -37.7109375, -35.2373046875, -32.763671875, -30.2900390625, -27.81640625, -25.3427734375, -22.869140625, -20.3955078125, -17.921875, -15.4482421875, -12.974609375, -10.5009765625, -8.02734375, -5.5537109375, -3.080078125, -0.6064453125, 1.8671875, 4.3408203125, 6.814453125, 9.2880859375, 11.76171875, 14.2353515625, 16.708984375, 19.1826171875, 21.65625, 24.1298828125, 26.603515625, 29.0771484375, 31.55078125, 34.0244140625, 36.498046875, 38.9716796875, 41.4453125, 43.9189453125, 46.392578125, 48.8662109375, 51.33984375, 53.8134765625, 56.287109375, 58.7607421875, 61.234375, 63.7080078125, 66.181640625, 68.6552734375, 71.12890625, 73.6025390625, 76.076171875, 78.5498046875, 81.0234375, 83.4970703125, 85.970703125, 88.4443359375, 90.91796875, 93.3916015625, 95.865234375, 98.3388671875, 100.8125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 38.0, 162.0, 450.0, 257.0, 66.0, 23.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-952.281005859375, -842.4746704101562, -732.6683349609375, -622.862060546875, -513.0557250976562, -403.2493896484375, -293.443115234375, -183.63677978515625, -73.8304443359375, 35.97587585449219, 145.78219604492188, 255.5885009765625, 365.39483642578125, 475.201171875, 585.0074462890625, 694.8137817382812, 804.6201171875, 914.4264526367188, 1024.2327880859375, 1134.0390625, 1243.845458984375, 1353.6517333984375, 1463.4580078125, 1573.264404296875, 1683.0706787109375, 1792.876953125, 1902.683349609375, 2012.4896240234375, 2122.2958984375, 2232.102294921875, 2341.90869140625, 2451.71484375, 2561.52099609375, 2671.327392578125, 2781.133544921875, 2890.93994140625, 3000.746337890625, 3110.552734375, 3220.35888671875, 3330.165283203125, 3439.9716796875, 3549.778076171875, 3659.584228515625, 3769.390625, 3879.197021484375, 3989.00341796875, 4098.8095703125, 4208.61572265625, 4318.421875, 4428.22802734375, 4538.03466796875, 4647.8408203125, 4757.64697265625, 4867.45361328125, 4977.259765625, 5087.06591796875, 5196.87255859375, 5306.6787109375, 5416.4853515625, 5526.29150390625, 5636.09765625, 5745.904296875, 5855.71044921875, 5965.5166015625, 6075.3232421875]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 5.0, 6.0, 5.0, 7.0, 15.0, 10.0, 15.0, 20.0, 22.0, 24.0, 28.0, 37.0, 31.0, 39.0, 48.0, 38.0, 47.0, 45.0, 53.0, 52.0, 53.0, 40.0, 35.0, 46.0, 30.0, 38.0, 31.0, 38.0, 37.0, 16.0, 23.0, 14.0, 12.0, 12.0, 7.0, 7.0, 9.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-953.2337036132812, -927.6359252929688, -902.0381469726562, -876.4404296875, -850.8426513671875, -825.244873046875, -799.6470947265625, -774.04931640625, -748.4515380859375, -722.853759765625, -697.2559814453125, -671.658203125, -646.0604858398438, -620.4627075195312, -594.8649291992188, -569.2671508789062, -543.66943359375, -518.0716552734375, -492.4739074707031, -466.8761291503906, -441.27838134765625, -415.68060302734375, -390.08282470703125, -364.48504638671875, -338.8872985839844, -313.2895202636719, -287.6917724609375, -262.093994140625, -236.49623107910156, -210.89846801757812, -185.30068969726562, -159.7029266357422, -134.1051025390625, -108.50733947753906, -82.9095687866211, -57.311798095703125, -31.714035034179688, -6.11627197265625, 19.48150634765625, 45.07926940917969, 70.67703247070312, 96.27479553222656, 121.87256622314453, 147.4703369140625, 173.06809997558594, 198.66586303710938, 224.26364135742188, 249.8614044189453, 275.45916748046875, 301.05694580078125, 326.6546936035156, 352.2524719238281, 377.8502197265625, 403.447998046875, 429.0457763671875, 454.6435546875, 480.2413024902344, 505.8390808105469, 531.4368286132812, 557.0346069335938, 582.6323852539062, 608.2301025390625, 633.827880859375, 659.4256591796875, 685.0234375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 12.0, 5.0, 15.0, 14.0, 32.0, 35.0, 53.0, 76.0, 119.0, 158.0, 294.0, 419.0, 702.0, 1224.0, 2250.0, 5096.0, 23200.0, 4109658.0, 38750.0, 6067.0, 2555.0, 1376.0, 785.0, 458.0, 313.0, 218.0, 117.0, 86.0, 52.0, 39.0, 28.0, 20.0, 18.0, 9.0, 6.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-213.625, -206.154296875, -198.68359375, -191.212890625, -183.7421875, -176.271484375, -168.80078125, -161.330078125, -153.859375, -146.388671875, -138.91796875, -131.447265625, -123.9765625, -116.505859375, -109.03515625, -101.564453125, -94.09375, -86.623046875, -79.15234375, -71.681640625, -64.2109375, -56.740234375, -49.26953125, -41.798828125, -34.328125, -26.857421875, -19.38671875, -11.916015625, -4.4453125, 3.025390625, 10.49609375, 17.966796875, 25.4375, 32.908203125, 40.37890625, 47.849609375, 55.3203125, 62.791015625, 70.26171875, 77.732421875, 85.203125, 92.673828125, 100.14453125, 107.615234375, 115.0859375, 122.556640625, 130.02734375, 137.498046875, 144.96875, 152.439453125, 159.91015625, 167.380859375, 174.8515625, 182.322265625, 189.79296875, 197.263671875, 204.734375, 212.205078125, 219.67578125, 227.146484375, 234.6171875, 242.087890625, 249.55859375, 257.029296875, 264.5]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 2.0, 3.0, 5.0, 10.0, 18.0, 11.0, 17.0, 26.0, 25.0, 28.0, 30.0, 50.0, 55.0, 47.0, 86.0, 75.0, 69.0, 75.0, 68.0, 54.0, 48.0, 35.0, 33.0, 25.0, 25.0, 20.0, 11.0, 12.0, 8.0, 4.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.625, -41.25537109375, -39.8857421875, -38.51611328125, -37.146484375, -35.77685546875, -34.4072265625, -33.03759765625, -31.66796875, -30.29833984375, -28.9287109375, -27.55908203125, -26.189453125, -24.81982421875, -23.4501953125, -22.08056640625, -20.7109375, -19.34130859375, -17.9716796875, -16.60205078125, -15.232421875, -13.86279296875, -12.4931640625, -11.12353515625, -9.75390625, -8.38427734375, -7.0146484375, -5.64501953125, -4.275390625, -2.90576171875, -1.5361328125, -0.16650390625, 1.203125, 2.57275390625, 3.9423828125, 5.31201171875, 6.681640625, 8.05126953125, 9.4208984375, 10.79052734375, 12.16015625, 13.52978515625, 14.8994140625, 16.26904296875, 17.638671875, 19.00830078125, 20.3779296875, 21.74755859375, 23.1171875, 24.48681640625, 25.8564453125, 27.22607421875, 28.595703125, 29.96533203125, 31.3349609375, 32.70458984375, 34.07421875, 35.44384765625, 36.8134765625, 38.18310546875, 39.552734375, 40.92236328125, 42.2919921875, 43.66162109375, 45.03125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 3.0, 7.0, 16.0, 16.0, 22.0, 23.0, 46.0, 53.0, 82.0, 117.0, 152.0, 224.0, 310.0, 474.0, 638.0, 885.0, 1391.0, 2199.0, 3243.0, 5737.0, 12759.0, 74661.0, 4031954.0, 36263.0, 9558.0, 4797.0, 2825.0, 1824.0, 1204.0, 832.0, 554.0, 397.0, 305.0, 186.0, 139.0, 103.0, 75.0, 61.0, 41.0, 24.0, 25.0, 16.0, 8.0, 9.0, 4.0, 7.0, 4.0, 5.0, 1.0, 2.0, 2.0], "bins": [-192.875, -187.419921875, -181.96484375, -176.509765625, -171.0546875, -165.599609375, -160.14453125, -154.689453125, -149.234375, -143.779296875, -138.32421875, -132.869140625, -127.4140625, -121.958984375, -116.50390625, -111.048828125, -105.59375, -100.138671875, -94.68359375, -89.228515625, -83.7734375, -78.318359375, -72.86328125, -67.408203125, -61.953125, -56.498046875, -51.04296875, -45.587890625, -40.1328125, -34.677734375, -29.22265625, -23.767578125, -18.3125, -12.857421875, -7.40234375, -1.947265625, 3.5078125, 8.962890625, 14.41796875, 19.873046875, 25.328125, 30.783203125, 36.23828125, 41.693359375, 47.1484375, 52.603515625, 58.05859375, 63.513671875, 68.96875, 74.423828125, 79.87890625, 85.333984375, 90.7890625, 96.244140625, 101.69921875, 107.154296875, 112.609375, 118.064453125, 123.51953125, 128.974609375, 134.4296875, 139.884765625, 145.33984375, 150.794921875, 156.25]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 9.0, 14.0, 17.0, 56.0, 146.0, 3525.0, 177.0, 34.0, 26.0, 9.0, 11.0, 5.0, 3.0, 4.0, 1.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.8125, -74.2119140625, -71.611328125, -69.0107421875, -66.41015625, -63.8095703125, -61.208984375, -58.6083984375, -56.0078125, -53.4072265625, -50.806640625, -48.2060546875, -45.60546875, -43.0048828125, -40.404296875, -37.8037109375, -35.203125, -32.6025390625, -30.001953125, -27.4013671875, -24.80078125, -22.2001953125, -19.599609375, -16.9990234375, -14.3984375, -11.7978515625, -9.197265625, -6.5966796875, -3.99609375, -1.3955078125, 1.205078125, 3.8056640625, 6.40625, 9.0068359375, 11.607421875, 14.2080078125, 16.80859375, 19.4091796875, 22.009765625, 24.6103515625, 27.2109375, 29.8115234375, 32.412109375, 35.0126953125, 37.61328125, 40.2138671875, 42.814453125, 45.4150390625, 48.015625, 50.6162109375, 53.216796875, 55.8173828125, 58.41796875, 61.0185546875, 63.619140625, 66.2197265625, 68.8203125, 71.4208984375, 74.021484375, 76.6220703125, 79.22265625, 81.8232421875, 84.423828125, 87.0244140625, 89.625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 9.0, 7.0, 18.0, 23.0, 31.0, 51.0, 96.0, 154.0, 195.0, 162.0, 94.0, 70.0, 30.0, 26.0, 11.0, 10.0, 9.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0], "bins": [-646.0114135742188, -633.0687255859375, -620.1260375976562, -607.183349609375, -594.2406616210938, -581.2979736328125, -568.3552856445312, -555.41259765625, -542.4699096679688, -529.5272216796875, -516.5845336914062, -503.641845703125, -490.69915771484375, -477.7564697265625, -464.81378173828125, -451.87109375, -438.9284362792969, -425.9857482910156, -413.0430603027344, -400.1003723144531, -387.1576843261719, -374.2149963378906, -361.2723388671875, -348.32965087890625, -335.386962890625, -322.44427490234375, -309.5015869140625, -296.55889892578125, -283.6162109375, -270.67352294921875, -257.7308349609375, -244.7881622314453, -231.84547424316406, -218.9027862548828, -205.96009826660156, -193.01742553710938, -180.07473754882812, -167.13204956054688, -154.18936157226562, -141.24667358398438, -128.30398559570312, -115.36129760742188, -102.41860961914062, -89.4759292602539, -76.53324127197266, -63.590553283691406, -50.64787292480469, -37.70518493652344, -24.762496948242188, -11.81981086730957, 1.1228752136230469, 14.065559387207031, 27.00824737548828, 39.95093536376953, 52.89361572265625, 65.8363037109375, 78.77899169921875, 91.7216796875, 104.66436767578125, 117.60704803466797, 130.54974365234375, 143.492431640625, 156.4351043701172, 169.37779235839844, 182.3204803466797]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 1.0, 4.0, 2.0, 9.0, 8.0, 7.0, 9.0, 11.0, 13.0, 13.0, 20.0, 11.0, 18.0, 28.0, 27.0, 25.0, 34.0, 31.0, 41.0, 37.0, 47.0, 41.0, 40.0, 29.0, 45.0, 41.0, 39.0, 37.0, 35.0, 37.0, 38.0, 27.0, 25.0, 30.0, 22.0, 19.0, 13.0, 19.0, 11.0, 10.0, 8.0, 5.0, 5.0, 8.0, 8.0, 6.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-150.04367065429688, -145.26568603515625, -140.48770141601562, -135.70970153808594, -130.9317169189453, -126.15373229980469, -121.37574005126953, -116.59774780273438, -111.81976318359375, -107.04177856445312, -102.26378631591797, -97.48579406738281, -92.70780944824219, -87.92982482910156, -83.1518325805664, -78.37384033203125, -73.59585571289062, -68.81787109375, -64.03987884521484, -59.26189041137695, -54.48390197753906, -49.70591354370117, -44.92792510986328, -40.14993667602539, -35.3719482421875, -30.59395980834961, -25.81597137451172, -21.037982940673828, -16.259994506835938, -11.482006072998047, -6.704017639160156, -1.9260292053222656, 2.851959228515625, 7.629947662353516, 12.407936096191406, 17.185924530029297, 21.963912963867188, 26.741901397705078, 31.51988983154297, 36.29787826538086, 41.07586669921875, 45.85385513305664, 50.63184356689453, 55.40983200073242, 60.18782043457031, 64.96580505371094, 69.7437973022461, 74.52178955078125, 79.29977416992188, 84.0777587890625, 88.85575103759766, 93.63374328613281, 98.41172790527344, 103.18971252441406, 107.96770477294922, 112.74569702148438, 117.523681640625, 122.30166625976562, 127.07965850830078, 131.85765075683594, 136.63563537597656, 141.4136199951172, 146.19161987304688, 150.9696044921875, 155.74758911132812]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 9.0, 15.0, 17.0, 21.0, 47.0, 80.0, 95.0, 133.0, 232.0, 427.0, 722.0, 1269.0, 2560.0, 5356.0, 12326.0, 32207.0, 104174.0, 442736.0, 323718.0, 77489.0, 25447.0, 10033.0, 4583.0, 2216.0, 1114.0, 591.0, 326.0, 195.0, 134.0, 73.0, 64.0, 45.0, 23.0, 20.0, 14.0, 11.0, 7.0, 9.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-98.625, -95.951171875, -93.27734375, -90.603515625, -87.9296875, -85.255859375, -82.58203125, -79.908203125, -77.234375, -74.560546875, -71.88671875, -69.212890625, -66.5390625, -63.865234375, -61.19140625, -58.517578125, -55.84375, -53.169921875, -50.49609375, -47.822265625, -45.1484375, -42.474609375, -39.80078125, -37.126953125, -34.453125, -31.779296875, -29.10546875, -26.431640625, -23.7578125, -21.083984375, -18.41015625, -15.736328125, -13.0625, -10.388671875, -7.71484375, -5.041015625, -2.3671875, 0.306640625, 2.98046875, 5.654296875, 8.328125, 11.001953125, 13.67578125, 16.349609375, 19.0234375, 21.697265625, 24.37109375, 27.044921875, 29.71875, 32.392578125, 35.06640625, 37.740234375, 40.4140625, 43.087890625, 45.76171875, 48.435546875, 51.109375, 53.783203125, 56.45703125, 59.130859375, 61.8046875, 64.478515625, 67.15234375, 69.826171875, 72.5]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 3.0, 9.0, 7.0, 14.0, 24.0, 28.0, 24.0, 44.0, 63.0, 50.0, 62.0, 73.0, 100.0, 97.0, 71.0, 60.0, 51.0, 50.0, 39.0, 30.0, 31.0, 15.0, 17.0, 7.0, 9.0, 6.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-70.8125, -68.8974609375, -66.982421875, -65.0673828125, -63.15234375, -61.2373046875, -59.322265625, -57.4072265625, -55.4921875, -53.5771484375, -51.662109375, -49.7470703125, -47.83203125, -45.9169921875, -44.001953125, -42.0869140625, -40.171875, -38.2568359375, -36.341796875, -34.4267578125, -32.51171875, -30.5966796875, -28.681640625, -26.7666015625, -24.8515625, -22.9365234375, -21.021484375, -19.1064453125, -17.19140625, -15.2763671875, -13.361328125, -11.4462890625, -9.53125, -7.6162109375, -5.701171875, -3.7861328125, -1.87109375, 0.0439453125, 1.958984375, 3.8740234375, 5.7890625, 7.7041015625, 9.619140625, 11.5341796875, 13.44921875, 15.3642578125, 17.279296875, 19.1943359375, 21.109375, 23.0244140625, 24.939453125, 26.8544921875, 28.76953125, 30.6845703125, 32.599609375, 34.5146484375, 36.4296875, 38.3447265625, 40.259765625, 42.1748046875, 44.08984375, 46.0048828125, 47.919921875, 49.8349609375, 51.75]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 3.0, 6.0, 13.0, 5.0, 14.0, 25.0, 23.0, 54.0, 93.0, 164.0, 332.0, 835.0, 2436.0, 10280.0, 82869.0, 811831.0, 121733.0, 13189.0, 2891.0, 970.0, 360.0, 180.0, 81.0, 57.0, 33.0, 16.0, 16.0, 12.0, 6.0, 6.0, 2.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-228.5, -222.076171875, -215.65234375, -209.228515625, -202.8046875, -196.380859375, -189.95703125, -183.533203125, -177.109375, -170.685546875, -164.26171875, -157.837890625, -151.4140625, -144.990234375, -138.56640625, -132.142578125, -125.71875, -119.294921875, -112.87109375, -106.447265625, -100.0234375, -93.599609375, -87.17578125, -80.751953125, -74.328125, -67.904296875, -61.48046875, -55.056640625, -48.6328125, -42.208984375, -35.78515625, -29.361328125, -22.9375, -16.513671875, -10.08984375, -3.666015625, 2.7578125, 9.181640625, 15.60546875, 22.029296875, 28.453125, 34.876953125, 41.30078125, 47.724609375, 54.1484375, 60.572265625, 66.99609375, 73.419921875, 79.84375, 86.267578125, 92.69140625, 99.115234375, 105.5390625, 111.962890625, 118.38671875, 124.810546875, 131.234375, 137.658203125, 144.08203125, 150.505859375, 156.9296875, 163.353515625, 169.77734375, 176.201171875, 182.625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 4.0, 8.0, 4.0, 4.0, 2.0, 11.0, 10.0, 16.0, 18.0, 11.0, 13.0, 16.0, 23.0, 22.0, 28.0, 39.0, 35.0, 42.0, 39.0, 46.0, 48.0, 36.0, 48.0, 41.0, 41.0, 37.0, 29.0, 49.0, 38.0, 36.0, 25.0, 20.0, 34.0, 24.0, 13.0, 19.0, 11.0, 14.0, 7.0, 7.0, 7.0, 6.0, 5.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-153.125, -147.455078125, -141.78515625, -136.115234375, -130.4453125, -124.775390625, -119.10546875, -113.435546875, -107.765625, -102.095703125, -96.42578125, -90.755859375, -85.0859375, -79.416015625, -73.74609375, -68.076171875, -62.40625, -56.736328125, -51.06640625, -45.396484375, -39.7265625, -34.056640625, -28.38671875, -22.716796875, -17.046875, -11.376953125, -5.70703125, -0.037109375, 5.6328125, 11.302734375, 16.97265625, 22.642578125, 28.3125, 33.982421875, 39.65234375, 45.322265625, 50.9921875, 56.662109375, 62.33203125, 68.001953125, 73.671875, 79.341796875, 85.01171875, 90.681640625, 96.3515625, 102.021484375, 107.69140625, 113.361328125, 119.03125, 124.701171875, 130.37109375, 136.041015625, 141.7109375, 147.380859375, 153.05078125, 158.720703125, 164.390625, 170.060546875, 175.73046875, 181.400390625, 187.0703125, 192.740234375, 198.41015625, 204.080078125, 209.75]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 5.0, 9.0, 14.0, 17.0, 21.0, 33.0, 55.0, 96.0, 182.0, 368.0, 1045.0, 4449.0, 39057.0, 826643.0, 163474.0, 10253.0, 1753.0, 513.0, 233.0, 124.0, 57.0, 46.0, 44.0, 22.0, 11.0, 6.0, 5.0, 4.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-69.0, -67.068359375, -65.13671875, -63.205078125, -61.2734375, -59.341796875, -57.41015625, -55.478515625, -53.546875, -51.615234375, -49.68359375, -47.751953125, -45.8203125, -43.888671875, -41.95703125, -40.025390625, -38.09375, -36.162109375, -34.23046875, -32.298828125, -30.3671875, -28.435546875, -26.50390625, -24.572265625, -22.640625, -20.708984375, -18.77734375, -16.845703125, -14.9140625, -12.982421875, -11.05078125, -9.119140625, -7.1875, -5.255859375, -3.32421875, -1.392578125, 0.5390625, 2.470703125, 4.40234375, 6.333984375, 8.265625, 10.197265625, 12.12890625, 14.060546875, 15.9921875, 17.923828125, 19.85546875, 21.787109375, 23.71875, 25.650390625, 27.58203125, 29.513671875, 31.4453125, 33.376953125, 35.30859375, 37.240234375, 39.171875, 41.103515625, 43.03515625, 44.966796875, 46.8984375, 48.830078125, 50.76171875, 52.693359375, 54.625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 8.0, 9.0, 13.0, 24.0, 17.0, 25.0, 35.0, 32.0, 44.0, 60.0, 62.0, 81.0, 91.0, 87.0, 73.0, 55.0, 36.0, 46.0, 32.0, 30.0, 26.0, 21.0, 14.0, 19.0, 9.0, 12.0, 3.0, 3.0, 4.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.005313873291015625, -0.005173027515411377, -0.005032181739807129, -0.004891335964202881, -0.004750490188598633, -0.004609644412994385, -0.004468798637390137, -0.004327952861785889, -0.004187107086181641, -0.004046261310577393, -0.0039054155349731445, -0.0037645697593688965, -0.0036237239837646484, -0.0034828782081604004, -0.0033420324325561523, -0.0032011866569519043, -0.0030603408813476562, -0.002919495105743408, -0.00277864933013916, -0.002637803554534912, -0.002496957778930664, -0.002356112003326416, -0.002215266227722168, -0.00207442045211792, -0.0019335746765136719, -0.0017927289009094238, -0.0016518831253051758, -0.0015110373497009277, -0.0013701915740966797, -0.0012293457984924316, -0.0010885000228881836, -0.0009476542472839355, -0.0008068084716796875, -0.0006659626960754395, -0.0005251169204711914, -0.00038427114486694336, -0.0002434253692626953, -0.00010257959365844727, 3.826618194580078e-05, 0.00017911195755004883, 0.0003199577331542969, 0.0004608035087585449, 0.000601649284362793, 0.000742495059967041, 0.0008833408355712891, 0.0010241866111755371, 0.0011650323867797852, 0.0013058781623840332, 0.0014467239379882812, 0.0015875697135925293, 0.0017284154891967773, 0.0018692612648010254, 0.0020101070404052734, 0.0021509528160095215, 0.0022917985916137695, 0.0024326443672180176, 0.0025734901428222656, 0.0027143359184265137, 0.0028551816940307617, 0.0029960274696350098, 0.003136873245239258, 0.003277719020843506, 0.003418564796447754, 0.003559410572052002, 0.00370025634765625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 3.0, 7.0, 5.0, 8.0, 16.0, 16.0, 35.0, 63.0, 85.0, 175.0, 299.0, 745.0, 2369.0, 10621.0, 104700.0, 844747.0, 72817.0, 8406.0, 2077.0, 686.0, 305.0, 135.0, 71.0, 59.0, 31.0, 23.0, 12.0, 10.0, 8.0, 2.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-68.1875, -65.6083984375, -63.029296875, -60.4501953125, -57.87109375, -55.2919921875, -52.712890625, -50.1337890625, -47.5546875, -44.9755859375, -42.396484375, -39.8173828125, -37.23828125, -34.6591796875, -32.080078125, -29.5009765625, -26.921875, -24.3427734375, -21.763671875, -19.1845703125, -16.60546875, -14.0263671875, -11.447265625, -8.8681640625, -6.2890625, -3.7099609375, -1.130859375, 1.4482421875, 4.02734375, 6.6064453125, 9.185546875, 11.7646484375, 14.34375, 16.9228515625, 19.501953125, 22.0810546875, 24.66015625, 27.2392578125, 29.818359375, 32.3974609375, 34.9765625, 37.5556640625, 40.134765625, 42.7138671875, 45.29296875, 47.8720703125, 50.451171875, 53.0302734375, 55.609375, 58.1884765625, 60.767578125, 63.3466796875, 65.92578125, 68.5048828125, 71.083984375, 73.6630859375, 76.2421875, 78.8212890625, 81.400390625, 83.9794921875, 86.55859375, 89.1376953125, 91.716796875, 94.2958984375, 96.875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 8.0, 5.0, 9.0, 9.0, 19.0, 21.0, 45.0, 43.0, 71.0, 72.0, 83.0, 106.0, 106.0, 84.0, 87.0, 64.0, 46.0, 27.0, 25.0, 27.0, 11.0, 11.0, 4.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.34375, -59.599609375, -57.85546875, -56.111328125, -54.3671875, -52.623046875, -50.87890625, -49.134765625, -47.390625, -45.646484375, -43.90234375, -42.158203125, -40.4140625, -38.669921875, -36.92578125, -35.181640625, -33.4375, -31.693359375, -29.94921875, -28.205078125, -26.4609375, -24.716796875, -22.97265625, -21.228515625, -19.484375, -17.740234375, -15.99609375, -14.251953125, -12.5078125, -10.763671875, -9.01953125, -7.275390625, -5.53125, -3.787109375, -2.04296875, -0.298828125, 1.4453125, 3.189453125, 4.93359375, 6.677734375, 8.421875, 10.166015625, 11.91015625, 13.654296875, 15.3984375, 17.142578125, 18.88671875, 20.630859375, 22.375, 24.119140625, 25.86328125, 27.607421875, 29.3515625, 31.095703125, 32.83984375, 34.583984375, 36.328125, 38.072265625, 39.81640625, 41.560546875, 43.3046875, 45.048828125, 46.79296875, 48.537109375, 50.28125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 3.0, 12.0, 12.0, 25.0, 50.0, 93.0, 112.0, 162.0, 197.0, 151.0, 84.0, 43.0, 22.0, 12.0, 9.0, 4.0, 4.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1214.714111328125, -1176.0416259765625, -1137.369140625, -1098.6966552734375, -1060.024169921875, -1021.3516845703125, -982.67919921875, -944.0067138671875, -905.334228515625, -866.6617431640625, -827.9892578125, -789.3167724609375, -750.644287109375, -711.9718017578125, -673.29931640625, -634.6268310546875, -595.9544067382812, -557.2819213867188, -518.6094360351562, -479.93695068359375, -441.26446533203125, -402.59197998046875, -363.9195251464844, -325.2470397949219, -286.5745544433594, -247.90206909179688, -209.22958374023438, -170.55711364746094, -131.88462829589844, -93.21214294433594, -54.5396728515625, -15.8671875, 22.8052978515625, 61.477779388427734, 100.15026092529297, 138.82273864746094, 177.49522399902344, 216.16770935058594, 254.84017944335938, 293.5126647949219, 332.1851501464844, 370.8576354980469, 409.5301208496094, 448.20257568359375, 486.87506103515625, 525.5475463867188, 564.2200317382812, 602.8925170898438, 641.5650024414062, 680.2374877929688, 718.9099731445312, 757.5824584960938, 796.2549438476562, 834.9274291992188, 873.599853515625, 912.2723388671875, 950.94482421875, 989.6173095703125, 1028.289794921875, 1066.9622802734375, 1105.634765625, 1144.3072509765625, 1182.979736328125, 1221.6522216796875, 1260.32470703125]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 8.0, 3.0, 14.0, 9.0, 26.0, 24.0, 33.0, 40.0, 42.0, 56.0, 58.0, 80.0, 79.0, 98.0, 81.0, 64.0, 57.0, 59.0, 48.0, 38.0, 18.0, 22.0, 14.0, 11.0, 12.0, 2.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1035.1513671875, -990.2135009765625, -945.275634765625, -900.3377685546875, -855.39990234375, -810.4620361328125, -765.5242309570312, -720.5863647460938, -675.6484985351562, -630.7106323242188, -585.7727661132812, -540.8349609375, -495.8970642089844, -450.9591979980469, -406.0213623046875, -361.08349609375, -316.1456298828125, -271.207763671875, -226.26991271972656, -181.33206176757812, -136.39419555664062, -91.45632934570312, -46.51849365234375, -1.58062744140625, 43.35723876953125, 88.29509735107422, 133.2329559326172, 178.17080688476562, 223.10867309570312, 268.0465393066406, 312.984375, 357.9222412109375, 402.8599853515625, 447.7978515625, 492.7357177734375, 537.673583984375, 582.6114501953125, 627.54931640625, 672.4871215820312, 717.4249877929688, 762.3628540039062, 807.3007202148438, 852.2385864257812, 897.1763916015625, 942.1142578125, 987.0521240234375, 1031.989990234375, 1076.9278564453125, 1121.86572265625, 1166.8035888671875, 1211.741455078125, 1256.6793212890625, 1301.6171875, 1346.5550537109375, 1391.492919921875, 1436.4306640625, 1481.36865234375, 1526.3065185546875, 1571.244384765625, 1616.1822509765625, 1661.1201171875, 1706.0579833984375, 1750.995849609375, 1795.93359375, 1840.8714599609375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 3.0, 7.0, 14.0, 25.0, 37.0, 80.0, 175.0, 454.0, 1618.0, 6955.0, 89497.0, 4036521.0, 51388.0, 5169.0, 1336.0, 515.0, 182.0, 112.0, 53.0, 33.0, 36.0, 16.0, 17.0, 10.0, 5.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.1875, -99.7783203125, -94.369140625, -88.9599609375, -83.55078125, -78.1416015625, -72.732421875, -67.3232421875, -61.9140625, -56.5048828125, -51.095703125, -45.6865234375, -40.27734375, -34.8681640625, -29.458984375, -24.0498046875, -18.640625, -13.2314453125, -7.822265625, -2.4130859375, 2.99609375, 8.4052734375, 13.814453125, 19.2236328125, 24.6328125, 30.0419921875, 35.451171875, 40.8603515625, 46.26953125, 51.6787109375, 57.087890625, 62.4970703125, 67.90625, 73.3154296875, 78.724609375, 84.1337890625, 89.54296875, 94.9521484375, 100.361328125, 105.7705078125, 111.1796875, 116.5888671875, 121.998046875, 127.4072265625, 132.81640625, 138.2255859375, 143.634765625, 149.0439453125, 154.453125, 159.8623046875, 165.271484375, 170.6806640625, 176.08984375, 181.4990234375, 186.908203125, 192.3173828125, 197.7265625, 203.1357421875, 208.544921875, 213.9541015625, 219.36328125, 224.7724609375, 230.181640625, 235.5908203125, 241.0]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 10.0, 15.0, 33.0, 61.0, 91.0, 110.0, 166.0, 150.0, 122.0, 99.0, 75.0, 34.0, 18.0, 17.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.0, -66.369140625, -62.73828125, -59.107421875, -55.4765625, -51.845703125, -48.21484375, -44.583984375, -40.953125, -37.322265625, -33.69140625, -30.060546875, -26.4296875, -22.798828125, -19.16796875, -15.537109375, -11.90625, -8.275390625, -4.64453125, -1.013671875, 2.6171875, 6.248046875, 9.87890625, 13.509765625, 17.140625, 20.771484375, 24.40234375, 28.033203125, 31.6640625, 35.294921875, 38.92578125, 42.556640625, 46.1875, 49.818359375, 53.44921875, 57.080078125, 60.7109375, 64.341796875, 67.97265625, 71.603515625, 75.234375, 78.865234375, 82.49609375, 86.126953125, 89.7578125, 93.388671875, 97.01953125, 100.650390625, 104.28125, 107.912109375, 111.54296875, 115.173828125, 118.8046875, 122.435546875, 126.06640625, 129.697265625, 133.328125, 136.958984375, 140.58984375, 144.220703125, 147.8515625, 151.482421875, 155.11328125, 158.744140625, 162.375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 4.0, 2.0, 8.0, 16.0, 18.0, 32.0, 63.0, 160.0, 291.0, 696.0, 1719.0, 4889.0, 24889.0, 3607866.0, 530671.0, 16467.0, 4017.0, 1362.0, 571.0, 266.0, 135.0, 64.0, 26.0, 13.0, 5.0, 5.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-191.25, -185.251953125, -179.25390625, -173.255859375, -167.2578125, -161.259765625, -155.26171875, -149.263671875, -143.265625, -137.267578125, -131.26953125, -125.271484375, -119.2734375, -113.275390625, -107.27734375, -101.279296875, -95.28125, -89.283203125, -83.28515625, -77.287109375, -71.2890625, -65.291015625, -59.29296875, -53.294921875, -47.296875, -41.298828125, -35.30078125, -29.302734375, -23.3046875, -17.306640625, -11.30859375, -5.310546875, 0.6875, 6.685546875, 12.68359375, 18.681640625, 24.6796875, 30.677734375, 36.67578125, 42.673828125, 48.671875, 54.669921875, 60.66796875, 66.666015625, 72.6640625, 78.662109375, 84.66015625, 90.658203125, 96.65625, 102.654296875, 108.65234375, 114.650390625, 120.6484375, 126.646484375, 132.64453125, 138.642578125, 144.640625, 150.638671875, 156.63671875, 162.634765625, 168.6328125, 174.630859375, 180.62890625, 186.626953125, 192.625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 5.0, 4.0, 11.0, 18.0, 28.0, 39.0, 107.0, 317.0, 1386.0, 1531.0, 349.0, 109.0, 44.0, 39.0, 23.0, 10.0, 16.0, 10.0, 7.0, 7.0, 4.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.625, -122.10546875, -117.5859375, -113.06640625, -108.546875, -104.02734375, -99.5078125, -94.98828125, -90.46875, -85.94921875, -81.4296875, -76.91015625, -72.390625, -67.87109375, -63.3515625, -58.83203125, -54.3125, -49.79296875, -45.2734375, -40.75390625, -36.234375, -31.71484375, -27.1953125, -22.67578125, -18.15625, -13.63671875, -9.1171875, -4.59765625, -0.078125, 4.44140625, 8.9609375, 13.48046875, 18.0, 22.51953125, 27.0390625, 31.55859375, 36.078125, 40.59765625, 45.1171875, 49.63671875, 54.15625, 58.67578125, 63.1953125, 67.71484375, 72.234375, 76.75390625, 81.2734375, 85.79296875, 90.3125, 94.83203125, 99.3515625, 103.87109375, 108.390625, 112.91015625, 117.4296875, 121.94921875, 126.46875, 130.98828125, 135.5078125, 140.02734375, 144.546875, 149.06640625, 153.5859375, 158.10546875, 162.625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 10.0, 2.0, 10.0, 31.0, 53.0, 82.0, 123.0, 167.0, 165.0, 122.0, 73.0, 58.0, 38.0, 24.0, 11.0, 10.0, 8.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-519.5640869140625, -497.08245849609375, -474.600830078125, -452.11920166015625, -429.6375732421875, -407.15594482421875, -384.6743469238281, -362.1927185058594, -339.7110900878906, -317.2294616699219, -294.7478332519531, -272.2662353515625, -249.7845916748047, -227.30296325683594, -204.82135009765625, -182.3397216796875, -159.85809326171875, -137.37646484375, -114.89484405517578, -92.41322326660156, -69.93159484863281, -47.44996643066406, -24.968353271484375, -2.486724853515625, 19.994903564453125, 42.47652816772461, 64.9581527709961, 87.43977355957031, 109.92140197753906, 132.4030303955078, 154.8846435546875, 177.36627197265625, 199.84783935546875, 222.3294677734375, 244.81109619140625, 267.292724609375, 289.77435302734375, 312.2559814453125, 334.7375793457031, 357.2192077636719, 379.7008361816406, 402.1824645996094, 424.6640930175781, 447.14569091796875, 469.6273193359375, 492.10894775390625, 514.590576171875, 537.0722045898438, 559.5538330078125, 582.0354614257812, 604.51708984375, 626.9987182617188, 649.4803466796875, 671.9619750976562, 694.443603515625, 716.9251708984375, 739.4068603515625, 761.8884887695312, 784.3701171875, 806.8517456054688, 829.3333740234375, 851.8150024414062, 874.296630859375, 896.7781982421875, 919.2598266601562]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 8.0, 10.0, 15.0, 18.0, 25.0, 29.0, 33.0, 54.0, 76.0, 86.0, 100.0, 93.0, 83.0, 78.0, 61.0, 60.0, 46.0, 43.0, 29.0, 18.0, 13.0, 5.0, 10.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-867.1318969726562, -842.2020874023438, -817.2722778320312, -792.3424682617188, -767.4127197265625, -742.48291015625, -717.5531005859375, -692.623291015625, -667.6934814453125, -642.763671875, -617.8338623046875, -592.904052734375, -567.9742431640625, -543.0444946289062, -518.1146850585938, -493.18487548828125, -468.25506591796875, -443.32525634765625, -418.39544677734375, -393.4656677246094, -368.5358581542969, -343.6060485839844, -318.67626953125, -293.7464599609375, -268.816650390625, -243.8868408203125, -218.95704650878906, -194.02725219726562, -169.09744262695312, -144.16763305664062, -119.23783874511719, -94.30804443359375, -69.378173828125, -44.44837188720703, -19.518569946289062, 5.411231994628906, 30.341033935546875, 55.270835876464844, 80.20063781738281, 105.13043212890625, 130.06024169921875, 154.99005126953125, 179.9198455810547, 204.84963989257812, 229.77944946289062, 254.70925903320312, 279.6390380859375, 304.56884765625, 329.4986572265625, 354.428466796875, 379.3582763671875, 404.2880554199219, 429.2178649902344, 454.1476745605469, 479.07745361328125, 504.00726318359375, 528.9370727539062, 553.8668823242188, 578.7966918945312, 603.7265014648438, 628.65625, 653.5860595703125, 678.515869140625, 703.4456787109375, 728.37548828125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 7.0, 12.0, 13.0, 23.0, 39.0, 53.0, 74.0, 148.0, 306.0, 603.0, 1415.0, 3667.0, 11035.0, 40784.0, 197185.0, 583550.0, 160518.0, 33900.0, 9433.0, 3288.0, 1344.0, 543.0, 271.0, 134.0, 87.0, 41.0, 28.0, 16.0, 10.0, 9.0, 8.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.625, -84.6484375, -81.671875, -78.6953125, -75.71875, -72.7421875, -69.765625, -66.7890625, -63.8125, -60.8359375, -57.859375, -54.8828125, -51.90625, -48.9296875, -45.953125, -42.9765625, -40.0, -37.0234375, -34.046875, -31.0703125, -28.09375, -25.1171875, -22.140625, -19.1640625, -16.1875, -13.2109375, -10.234375, -7.2578125, -4.28125, -1.3046875, 1.671875, 4.6484375, 7.625, 10.6015625, 13.578125, 16.5546875, 19.53125, 22.5078125, 25.484375, 28.4609375, 31.4375, 34.4140625, 37.390625, 40.3671875, 43.34375, 46.3203125, 49.296875, 52.2734375, 55.25, 58.2265625, 61.203125, 64.1796875, 67.15625, 70.1328125, 73.109375, 76.0859375, 79.0625, 82.0390625, 85.015625, 87.9921875, 90.96875, 93.9453125, 96.921875, 99.8984375, 102.875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 6.0, 9.0, 24.0, 19.0, 26.0, 43.0, 47.0, 67.0, 72.0, 90.0, 105.0, 84.0, 93.0, 64.0, 59.0, 53.0, 35.0, 33.0, 27.0, 25.0, 9.0, 6.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.5625, -36.5478515625, -34.533203125, -32.5185546875, -30.50390625, -28.4892578125, -26.474609375, -24.4599609375, -22.4453125, -20.4306640625, -18.416015625, -16.4013671875, -14.38671875, -12.3720703125, -10.357421875, -8.3427734375, -6.328125, -4.3134765625, -2.298828125, -0.2841796875, 1.73046875, 3.7451171875, 5.759765625, 7.7744140625, 9.7890625, 11.8037109375, 13.818359375, 15.8330078125, 17.84765625, 19.8623046875, 21.876953125, 23.8916015625, 25.90625, 27.9208984375, 29.935546875, 31.9501953125, 33.96484375, 35.9794921875, 37.994140625, 40.0087890625, 42.0234375, 44.0380859375, 46.052734375, 48.0673828125, 50.08203125, 52.0966796875, 54.111328125, 56.1259765625, 58.140625, 60.1552734375, 62.169921875, 64.1845703125, 66.19921875, 68.2138671875, 70.228515625, 72.2431640625, 74.2578125, 76.2724609375, 78.287109375, 80.3017578125, 82.31640625, 84.3310546875, 86.345703125, 88.3603515625, 90.375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 2.0, 3.0, 5.0, 11.0, 21.0, 20.0, 31.0, 38.0, 92.0, 216.0, 702.0, 3574.0, 187220.0, 848215.0, 6997.0, 886.0, 250.0, 113.0, 58.0, 34.0, 19.0, 12.0, 5.0, 8.0, 5.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-434.0, -421.98828125, -409.9765625, -397.96484375, -385.953125, -373.94140625, -361.9296875, -349.91796875, -337.90625, -325.89453125, -313.8828125, -301.87109375, -289.859375, -277.84765625, -265.8359375, -253.82421875, -241.8125, -229.80078125, -217.7890625, -205.77734375, -193.765625, -181.75390625, -169.7421875, -157.73046875, -145.71875, -133.70703125, -121.6953125, -109.68359375, -97.671875, -85.66015625, -73.6484375, -61.63671875, -49.625, -37.61328125, -25.6015625, -13.58984375, -1.578125, 10.43359375, 22.4453125, 34.45703125, 46.46875, 58.48046875, 70.4921875, 82.50390625, 94.515625, 106.52734375, 118.5390625, 130.55078125, 142.5625, 154.57421875, 166.5859375, 178.59765625, 190.609375, 202.62109375, 214.6328125, 226.64453125, 238.65625, 250.66796875, 262.6796875, 274.69140625, 286.703125, 298.71484375, 310.7265625, 322.73828125, 334.75]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 9.0, 3.0, 4.0, 12.0, 11.0, 10.0, 8.0, 14.0, 19.0, 17.0, 14.0, 16.0, 20.0, 26.0, 27.0, 34.0, 45.0, 49.0, 51.0, 51.0, 51.0, 48.0, 40.0, 44.0, 45.0, 45.0, 36.0, 36.0, 32.0, 34.0, 30.0, 20.0, 14.0, 23.0, 16.0, 16.0, 8.0, 7.0, 7.0, 6.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-150.0, -145.10546875, -140.2109375, -135.31640625, -130.421875, -125.52734375, -120.6328125, -115.73828125, -110.84375, -105.94921875, -101.0546875, -96.16015625, -91.265625, -86.37109375, -81.4765625, -76.58203125, -71.6875, -66.79296875, -61.8984375, -57.00390625, -52.109375, -47.21484375, -42.3203125, -37.42578125, -32.53125, -27.63671875, -22.7421875, -17.84765625, -12.953125, -8.05859375, -3.1640625, 1.73046875, 6.625, 11.51953125, 16.4140625, 21.30859375, 26.203125, 31.09765625, 35.9921875, 40.88671875, 45.78125, 50.67578125, 55.5703125, 60.46484375, 65.359375, 70.25390625, 75.1484375, 80.04296875, 84.9375, 89.83203125, 94.7265625, 99.62109375, 104.515625, 109.41015625, 114.3046875, 119.19921875, 124.09375, 128.98828125, 133.8828125, 138.77734375, 143.671875, 148.56640625, 153.4609375, 158.35546875, 163.25]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 7.0, 10.0, 10.0, 21.0, 16.0, 23.0, 44.0, 57.0, 77.0, 148.0, 253.0, 471.0, 1020.0, 2958.0, 14637.0, 223544.0, 766902.0, 30705.0, 4805.0, 1437.0, 634.0, 301.0, 157.0, 110.0, 64.0, 42.0, 28.0, 24.0, 13.0, 5.0, 12.0, 5.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.59375, -54.65380859375, -52.7138671875, -50.77392578125, -48.833984375, -46.89404296875, -44.9541015625, -43.01416015625, -41.07421875, -39.13427734375, -37.1943359375, -35.25439453125, -33.314453125, -31.37451171875, -29.4345703125, -27.49462890625, -25.5546875, -23.61474609375, -21.6748046875, -19.73486328125, -17.794921875, -15.85498046875, -13.9150390625, -11.97509765625, -10.03515625, -8.09521484375, -6.1552734375, -4.21533203125, -2.275390625, -0.33544921875, 1.6044921875, 3.54443359375, 5.484375, 7.42431640625, 9.3642578125, 11.30419921875, 13.244140625, 15.18408203125, 17.1240234375, 19.06396484375, 21.00390625, 22.94384765625, 24.8837890625, 26.82373046875, 28.763671875, 30.70361328125, 32.6435546875, 34.58349609375, 36.5234375, 38.46337890625, 40.4033203125, 42.34326171875, 44.283203125, 46.22314453125, 48.1630859375, 50.10302734375, 52.04296875, 53.98291015625, 55.9228515625, 57.86279296875, 59.802734375, 61.74267578125, 63.6826171875, 65.62255859375, 67.5625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 6.0, 6.0, 8.0, 12.0, 10.0, 11.0, 22.0, 18.0, 31.0, 47.0, 50.0, 74.0, 118.0, 143.0, 104.0, 87.0, 62.0, 53.0, 24.0, 29.0, 17.0, 14.0, 16.0, 6.0, 8.0, 2.0, 4.0, 6.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.006267547607421875, -0.006069183349609375, -0.005870819091796875, -0.005672454833984375, -0.005474090576171875, -0.005275726318359375, -0.005077362060546875, -0.004878997802734375, -0.004680633544921875, -0.004482269287109375, -0.004283905029296875, -0.004085540771484375, -0.003887176513671875, -0.003688812255859375, -0.003490447998046875, -0.003292083740234375, -0.003093719482421875, -0.002895355224609375, -0.002696990966796875, -0.002498626708984375, -0.002300262451171875, -0.002101898193359375, -0.001903533935546875, -0.001705169677734375, -0.001506805419921875, -0.001308441162109375, -0.001110076904296875, -0.000911712646484375, -0.000713348388671875, -0.000514984130859375, -0.000316619873046875, -0.000118255615234375, 8.0108642578125e-05, 0.000278472900390625, 0.000476837158203125, 0.000675201416015625, 0.000873565673828125, 0.001071929931640625, 0.001270294189453125, 0.001468658447265625, 0.001667022705078125, 0.001865386962890625, 0.002063751220703125, 0.002262115478515625, 0.002460479736328125, 0.002658843994140625, 0.002857208251953125, 0.003055572509765625, 0.003253936767578125, 0.003452301025390625, 0.003650665283203125, 0.003849029541015625, 0.004047393798828125, 0.004245758056640625, 0.004444122314453125, 0.004642486572265625, 0.004840850830078125, 0.005039215087890625, 0.005237579345703125, 0.005435943603515625, 0.005634307861328125, 0.005832672119140625, 0.006031036376953125, 0.006229400634765625, 0.006427764892578125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 9.0, 9.0, 14.0, 35.0, 61.0, 92.0, 202.0, 464.0, 1274.0, 4825.0, 37580.0, 853482.0, 136825.0, 10361.0, 2034.0, 695.0, 271.0, 133.0, 67.0, 40.0, 33.0, 17.0, 10.0, 7.0, 2.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.75, -81.0224609375, -78.294921875, -75.5673828125, -72.83984375, -70.1123046875, -67.384765625, -64.6572265625, -61.9296875, -59.2021484375, -56.474609375, -53.7470703125, -51.01953125, -48.2919921875, -45.564453125, -42.8369140625, -40.109375, -37.3818359375, -34.654296875, -31.9267578125, -29.19921875, -26.4716796875, -23.744140625, -21.0166015625, -18.2890625, -15.5615234375, -12.833984375, -10.1064453125, -7.37890625, -4.6513671875, -1.923828125, 0.8037109375, 3.53125, 6.2587890625, 8.986328125, 11.7138671875, 14.44140625, 17.1689453125, 19.896484375, 22.6240234375, 25.3515625, 28.0791015625, 30.806640625, 33.5341796875, 36.26171875, 38.9892578125, 41.716796875, 44.4443359375, 47.171875, 49.8994140625, 52.626953125, 55.3544921875, 58.08203125, 60.8095703125, 63.537109375, 66.2646484375, 68.9921875, 71.7197265625, 74.447265625, 77.1748046875, 79.90234375, 82.6298828125, 85.357421875, 88.0849609375, 90.8125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 2.0, 8.0, 11.0, 6.0, 21.0, 16.0, 29.0, 37.0, 58.0, 91.0, 115.0, 154.0, 139.0, 86.0, 63.0, 48.0, 36.0, 24.0, 22.0, 15.0, 10.0, 3.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.875, -35.95703125, -34.0390625, -32.12109375, -30.203125, -28.28515625, -26.3671875, -24.44921875, -22.53125, -20.61328125, -18.6953125, -16.77734375, -14.859375, -12.94140625, -11.0234375, -9.10546875, -7.1875, -5.26953125, -3.3515625, -1.43359375, 0.484375, 2.40234375, 4.3203125, 6.23828125, 8.15625, 10.07421875, 11.9921875, 13.91015625, 15.828125, 17.74609375, 19.6640625, 21.58203125, 23.5, 25.41796875, 27.3359375, 29.25390625, 31.171875, 33.08984375, 35.0078125, 36.92578125, 38.84375, 40.76171875, 42.6796875, 44.59765625, 46.515625, 48.43359375, 50.3515625, 52.26953125, 54.1875, 56.10546875, 58.0234375, 59.94140625, 61.859375, 63.77734375, 65.6953125, 67.61328125, 69.53125, 71.44921875, 73.3671875, 75.28515625, 77.203125, 79.12109375, 81.0390625, 82.95703125, 84.875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 8.0, 13.0, 16.0, 29.0, 51.0, 91.0, 179.0, 243.0, 167.0, 90.0, 49.0, 26.0, 16.0, 8.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1365.573974609375, -1333.446044921875, -1301.318115234375, -1269.190185546875, -1237.062255859375, -1204.934326171875, -1172.806396484375, -1140.6785888671875, -1108.5506591796875, -1076.4227294921875, -1044.2947998046875, -1012.1668701171875, -980.0390014648438, -947.9110717773438, -915.7831420898438, -883.6552124023438, -851.5272827148438, -819.3993530273438, -787.2714233398438, -755.1435546875, -723.015625, -690.8876953125, -658.759765625, -626.6318359375, -594.50390625, -562.3759765625, -530.248046875, -498.1201477050781, -465.99224853515625, -433.86431884765625, -401.73638916015625, -369.60845947265625, -337.48052978515625, -305.35260009765625, -273.2247009277344, -241.09677124023438, -208.96885681152344, -176.8409423828125, -144.7130126953125, -112.58509826660156, -80.45718383789062, -48.32926559448242, -16.20134735107422, 15.92657470703125, 48.05448913574219, 80.18240356445312, 112.31033325195312, 144.43824768066406, 176.566162109375, 208.69407653808594, 240.82199096679688, 272.9499206542969, 305.07781982421875, 337.20574951171875, 369.33367919921875, 401.46160888671875, 433.5895080566406, 465.7174377441406, 497.8453369140625, 529.9732666015625, 562.1011962890625, 594.2291259765625, 626.3570556640625, 658.4849243164062, 690.6128540039062]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 3.0, 15.0, 9.0, 19.0, 24.0, 26.0, 48.0, 35.0, 46.0, 50.0, 75.0, 67.0, 105.0, 78.0, 72.0, 67.0, 66.0, 48.0, 46.0, 36.0, 26.0, 12.0, 15.0, 9.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-880.3641967773438, -848.6144409179688, -816.8646850585938, -785.1149291992188, -753.3651123046875, -721.6153564453125, -689.8656005859375, -658.1158447265625, -626.3660888671875, -594.6163330078125, -562.8665771484375, -531.1168212890625, -499.3670349121094, -467.6172790527344, -435.86749267578125, -404.11773681640625, -372.36798095703125, -340.61822509765625, -308.86846923828125, -277.1186828613281, -245.36892700195312, -213.61917114257812, -181.86940002441406, -150.11962890625, -118.369873046875, -86.62010955810547, -54.87034606933594, -23.120582580566406, 8.629180908203125, 40.378936767578125, 72.12870788574219, 103.87847900390625, 135.6282958984375, 167.3780517578125, 199.12782287597656, 230.87759399414062, 262.6273498535156, 294.3771057128906, 326.12689208984375, 357.87664794921875, 389.62640380859375, 421.37615966796875, 453.12591552734375, 484.8757019042969, 516.62548828125, 548.375244140625, 580.125, 611.874755859375, 643.62451171875, 675.374267578125, 707.1240234375, 738.873779296875, 770.62353515625, 802.373291015625, 834.1231079101562, 865.8728637695312, 897.6226196289062, 929.3723754882812, 961.1221313476562, 992.8718872070312, 1024.6217041015625, 1056.3714599609375, 1088.1212158203125, 1119.8709716796875, 1151.6207275390625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 12.0, 16.0, 30.0, 41.0, 73.0, 133.0, 322.0, 921.0, 13987.0, 4170436.0, 7007.0, 758.0, 256.0, 111.0, 59.0, 36.0, 25.0, 13.0, 5.0, 8.0, 6.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-322.75, -310.53515625, -298.3203125, -286.10546875, -273.890625, -261.67578125, -249.4609375, -237.24609375, -225.03125, -212.81640625, -200.6015625, -188.38671875, -176.171875, -163.95703125, -151.7421875, -139.52734375, -127.3125, -115.09765625, -102.8828125, -90.66796875, -78.453125, -66.23828125, -54.0234375, -41.80859375, -29.59375, -17.37890625, -5.1640625, 7.05078125, 19.265625, 31.48046875, 43.6953125, 55.91015625, 68.125, 80.33984375, 92.5546875, 104.76953125, 116.984375, 129.19921875, 141.4140625, 153.62890625, 165.84375, 178.05859375, 190.2734375, 202.48828125, 214.703125, 226.91796875, 239.1328125, 251.34765625, 263.5625, 275.77734375, 287.9921875, 300.20703125, 312.421875, 324.63671875, 336.8515625, 349.06640625, 361.28125, 373.49609375, 385.7109375, 397.92578125, 410.140625, 422.35546875, 434.5703125, 446.78515625, 459.0]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 14.0, 12.0, 14.0, 35.0, 40.0, 58.0, 67.0, 69.0, 98.0, 87.0, 100.0, 95.0, 75.0, 63.0, 48.0, 43.0, 21.0, 24.0, 21.0, 9.0, 8.0, 5.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.90625, -49.02490234375, -47.1435546875, -45.26220703125, -43.380859375, -41.49951171875, -39.6181640625, -37.73681640625, -35.85546875, -33.97412109375, -32.0927734375, -30.21142578125, -28.330078125, -26.44873046875, -24.5673828125, -22.68603515625, -20.8046875, -18.92333984375, -17.0419921875, -15.16064453125, -13.279296875, -11.39794921875, -9.5166015625, -7.63525390625, -5.75390625, -3.87255859375, -1.9912109375, -0.10986328125, 1.771484375, 3.65283203125, 5.5341796875, 7.41552734375, 9.296875, 11.17822265625, 13.0595703125, 14.94091796875, 16.822265625, 18.70361328125, 20.5849609375, 22.46630859375, 24.34765625, 26.22900390625, 28.1103515625, 29.99169921875, 31.873046875, 33.75439453125, 35.6357421875, 37.51708984375, 39.3984375, 41.27978515625, 43.1611328125, 45.04248046875, 46.923828125, 48.80517578125, 50.6865234375, 52.56787109375, 54.44921875, 56.33056640625, 58.2119140625, 60.09326171875, 61.974609375, 63.85595703125, 65.7373046875, 67.61865234375, 69.5]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 13.0, 15.0, 17.0, 28.0, 38.0, 73.0, 113.0, 176.0, 293.0, 505.0, 1029.0, 2416.0, 6752.0, 33432.0, 3603581.0, 518111.0, 19338.0, 4716.0, 1789.0, 765.0, 415.0, 196.0, 129.0, 96.0, 69.0, 46.0, 33.0, 27.0, 22.0, 10.0, 11.0, 4.0, 7.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-146.625, -142.162109375, -137.69921875, -133.236328125, -128.7734375, -124.310546875, -119.84765625, -115.384765625, -110.921875, -106.458984375, -101.99609375, -97.533203125, -93.0703125, -88.607421875, -84.14453125, -79.681640625, -75.21875, -70.755859375, -66.29296875, -61.830078125, -57.3671875, -52.904296875, -48.44140625, -43.978515625, -39.515625, -35.052734375, -30.58984375, -26.126953125, -21.6640625, -17.201171875, -12.73828125, -8.275390625, -3.8125, 0.650390625, 5.11328125, 9.576171875, 14.0390625, 18.501953125, 22.96484375, 27.427734375, 31.890625, 36.353515625, 40.81640625, 45.279296875, 49.7421875, 54.205078125, 58.66796875, 63.130859375, 67.59375, 72.056640625, 76.51953125, 80.982421875, 85.4453125, 89.908203125, 94.37109375, 98.833984375, 103.296875, 107.759765625, 112.22265625, 116.685546875, 121.1484375, 125.611328125, 130.07421875, 134.537109375, 139.0]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 1.0, 5.0, 5.0, 3.0, 3.0, 16.0, 15.0, 30.0, 59.0, 172.0, 693.0, 2030.0, 670.0, 207.0, 57.0, 49.0, 12.0, 13.0, 13.0, 8.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-119.125, -115.4609375, -111.796875, -108.1328125, -104.46875, -100.8046875, -97.140625, -93.4765625, -89.8125, -86.1484375, -82.484375, -78.8203125, -75.15625, -71.4921875, -67.828125, -64.1640625, -60.5, -56.8359375, -53.171875, -49.5078125, -45.84375, -42.1796875, -38.515625, -34.8515625, -31.1875, -27.5234375, -23.859375, -20.1953125, -16.53125, -12.8671875, -9.203125, -5.5390625, -1.875, 1.7890625, 5.453125, 9.1171875, 12.78125, 16.4453125, 20.109375, 23.7734375, 27.4375, 31.1015625, 34.765625, 38.4296875, 42.09375, 45.7578125, 49.421875, 53.0859375, 56.75, 60.4140625, 64.078125, 67.7421875, 71.40625, 75.0703125, 78.734375, 82.3984375, 86.0625, 89.7265625, 93.390625, 97.0546875, 100.71875, 104.3828125, 108.046875, 111.7109375, 115.375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 5.0, 4.0, 8.0, 9.0, 15.0, 23.0, 33.0, 44.0, 72.0, 120.0, 124.0, 146.0, 133.0, 90.0, 49.0, 45.0, 24.0, 15.0, 12.0, 15.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-580.38818359375, -564.8668823242188, -549.3455810546875, -533.8242797851562, -518.302978515625, -502.7817077636719, -487.2604064941406, -471.7391052246094, -456.21783447265625, -440.696533203125, -425.17523193359375, -409.6539306640625, -394.1326599121094, -378.6113586425781, -363.0900573730469, -347.5687561035156, -332.0474548339844, -316.5261535644531, -301.0048522949219, -285.48358154296875, -269.9622802734375, -254.44097900390625, -238.919677734375, -223.39837646484375, -207.87709045410156, -192.3557891845703, -176.83450317382812, -161.31320190429688, -145.79190063476562, -130.27061462402344, -114.74931335449219, -99.22801971435547, -83.70672607421875, -68.18543243408203, -52.66413497924805, -37.14283752441406, -21.621543884277344, -6.100250244140625, 9.421051025390625, 24.942344665527344, 40.46363830566406, 55.98493194580078, 71.5062255859375, 87.02752685546875, 102.54882049560547, 118.07011413574219, 133.59141540527344, 149.11270141601562, 164.63400268554688, 180.15530395507812, 195.6765899658203, 211.19789123535156, 226.71917724609375, 242.240478515625, 257.76177978515625, 273.2830810546875, 288.80438232421875, 304.32568359375, 319.84698486328125, 335.3682861328125, 350.8895568847656, 366.4108581542969, 381.9321594238281, 397.4534606933594, 412.9747314453125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 6.0, 3.0, 2.0, 4.0, 2.0, 10.0, 14.0, 15.0, 11.0, 18.0, 21.0, 16.0, 29.0, 30.0, 35.0, 35.0, 39.0, 40.0, 46.0, 56.0, 53.0, 51.0, 42.0, 44.0, 40.0, 41.0, 36.0, 30.0, 31.0, 22.0, 26.0, 27.0, 27.0, 14.0, 19.0, 13.0, 11.0, 11.0, 7.0, 3.0, 5.0, 4.0, 5.0, 8.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-267.47802734375, -258.94537353515625, -250.41275024414062, -241.88009643554688, -233.3474578857422, -224.8148193359375, -216.2821807861328, -207.74954223632812, -199.21688842773438, -190.6842498779297, -182.151611328125, -173.61895751953125, -165.08631896972656, -156.55368041992188, -148.0210418701172, -139.4884033203125, -130.9557647705078, -122.42312622070312, -113.8904800415039, -105.35784149169922, -96.8251953125, -88.29255676269531, -79.75991821289062, -71.22727966308594, -62.69463348388672, -54.161991119384766, -45.62934875488281, -37.096710205078125, -28.564067840576172, -20.03142547607422, -11.498786926269531, -2.966144561767578, 5.566497802734375, 14.099139213562012, 22.63178062438965, 31.16442108154297, 39.69706344604492, 48.229705810546875, 56.76234436035156, 65.29498291015625, 73.82762908935547, 82.36026763916016, 90.89291381835938, 99.42555236816406, 107.95819091796875, 116.49083709716797, 125.02347564697266, 133.55612182617188, 142.08876037597656, 150.62139892578125, 159.15403747558594, 167.68667602539062, 176.21932983398438, 184.75196838378906, 193.28460693359375, 201.81724548339844, 210.34988403320312, 218.8825225830078, 227.4151611328125, 235.94781494140625, 244.48045349121094, 253.01309204101562, 261.54571533203125, 270.078369140625, 278.61102294921875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 8.0, 13.0, 8.0, 17.0, 34.0, 49.0, 64.0, 95.0, 159.0, 327.0, 592.0, 1115.0, 2360.0, 5178.0, 12053.0, 30889.0, 81522.0, 238462.0, 413609.0, 164756.0, 58023.0, 22205.0, 9136.0, 3981.0, 1855.0, 884.0, 466.0, 238.0, 166.0, 109.0, 50.0, 38.0, 24.0, 24.0, 12.0, 17.0, 8.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.4375, -60.50634765625, -58.5751953125, -56.64404296875, -54.712890625, -52.78173828125, -50.8505859375, -48.91943359375, -46.98828125, -45.05712890625, -43.1259765625, -41.19482421875, -39.263671875, -37.33251953125, -35.4013671875, -33.47021484375, -31.5390625, -29.60791015625, -27.6767578125, -25.74560546875, -23.814453125, -21.88330078125, -19.9521484375, -18.02099609375, -16.08984375, -14.15869140625, -12.2275390625, -10.29638671875, -8.365234375, -6.43408203125, -4.5029296875, -2.57177734375, -0.640625, 1.29052734375, 3.2216796875, 5.15283203125, 7.083984375, 9.01513671875, 10.9462890625, 12.87744140625, 14.80859375, 16.73974609375, 18.6708984375, 20.60205078125, 22.533203125, 24.46435546875, 26.3955078125, 28.32666015625, 30.2578125, 32.18896484375, 34.1201171875, 36.05126953125, 37.982421875, 39.91357421875, 41.8447265625, 43.77587890625, 45.70703125, 47.63818359375, 49.5693359375, 51.50048828125, 53.431640625, 55.36279296875, 57.2939453125, 59.22509765625, 61.15625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 10.0, 5.0, 8.0, 5.0, 28.0, 14.0, 34.0, 45.0, 41.0, 46.0, 49.0, 70.0, 64.0, 62.0, 63.0, 74.0, 61.0, 69.0, 47.0, 41.0, 47.0, 32.0, 24.0, 21.0, 17.0, 9.0, 6.0, 7.0, 4.0, 5.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.0, -33.55810546875, -32.1162109375, -30.67431640625, -29.232421875, -27.79052734375, -26.3486328125, -24.90673828125, -23.46484375, -22.02294921875, -20.5810546875, -19.13916015625, -17.697265625, -16.25537109375, -14.8134765625, -13.37158203125, -11.9296875, -10.48779296875, -9.0458984375, -7.60400390625, -6.162109375, -4.72021484375, -3.2783203125, -1.83642578125, -0.39453125, 1.04736328125, 2.4892578125, 3.93115234375, 5.373046875, 6.81494140625, 8.2568359375, 9.69873046875, 11.140625, 12.58251953125, 14.0244140625, 15.46630859375, 16.908203125, 18.35009765625, 19.7919921875, 21.23388671875, 22.67578125, 24.11767578125, 25.5595703125, 27.00146484375, 28.443359375, 29.88525390625, 31.3271484375, 32.76904296875, 34.2109375, 35.65283203125, 37.0947265625, 38.53662109375, 39.978515625, 41.42041015625, 42.8623046875, 44.30419921875, 45.74609375, 47.18798828125, 48.6298828125, 50.07177734375, 51.513671875, 52.95556640625, 54.3974609375, 55.83935546875, 57.28125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 9.0, 8.0, 7.0, 26.0, 25.0, 47.0, 87.0, 144.0, 280.0, 577.0, 1455.0, 4144.0, 17406.0, 115107.0, 739433.0, 142070.0, 20086.0, 4687.0, 1535.0, 647.0, 341.0, 162.0, 91.0, 56.0, 44.0, 19.0, 19.0, 17.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.125, -122.126953125, -118.12890625, -114.130859375, -110.1328125, -106.134765625, -102.13671875, -98.138671875, -94.140625, -90.142578125, -86.14453125, -82.146484375, -78.1484375, -74.150390625, -70.15234375, -66.154296875, -62.15625, -58.158203125, -54.16015625, -50.162109375, -46.1640625, -42.166015625, -38.16796875, -34.169921875, -30.171875, -26.173828125, -22.17578125, -18.177734375, -14.1796875, -10.181640625, -6.18359375, -2.185546875, 1.8125, 5.810546875, 9.80859375, 13.806640625, 17.8046875, 21.802734375, 25.80078125, 29.798828125, 33.796875, 37.794921875, 41.79296875, 45.791015625, 49.7890625, 53.787109375, 57.78515625, 61.783203125, 65.78125, 69.779296875, 73.77734375, 77.775390625, 81.7734375, 85.771484375, 89.76953125, 93.767578125, 97.765625, 101.763671875, 105.76171875, 109.759765625, 113.7578125, 117.755859375, 121.75390625, 125.751953125, 129.75]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 5.0, 5.0, 6.0, 18.0, 5.0, 17.0, 23.0, 25.0, 29.0, 25.0, 50.0, 41.0, 40.0, 37.0, 40.0, 47.0, 43.0, 40.0, 47.0, 60.0, 54.0, 47.0, 35.0, 38.0, 28.0, 32.0, 27.0, 36.0, 11.0, 15.0, 12.0, 11.0, 6.0, 10.0, 5.0, 9.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-139.75, -135.7255859375, -131.701171875, -127.6767578125, -123.65234375, -119.6279296875, -115.603515625, -111.5791015625, -107.5546875, -103.5302734375, -99.505859375, -95.4814453125, -91.45703125, -87.4326171875, -83.408203125, -79.3837890625, -75.359375, -71.3349609375, -67.310546875, -63.2861328125, -59.26171875, -55.2373046875, -51.212890625, -47.1884765625, -43.1640625, -39.1396484375, -35.115234375, -31.0908203125, -27.06640625, -23.0419921875, -19.017578125, -14.9931640625, -10.96875, -6.9443359375, -2.919921875, 1.1044921875, 5.12890625, 9.1533203125, 13.177734375, 17.2021484375, 21.2265625, 25.2509765625, 29.275390625, 33.2998046875, 37.32421875, 41.3486328125, 45.373046875, 49.3974609375, 53.421875, 57.4462890625, 61.470703125, 65.4951171875, 69.51953125, 73.5439453125, 77.568359375, 81.5927734375, 85.6171875, 89.6416015625, 93.666015625, 97.6904296875, 101.71484375, 105.7392578125, 109.763671875, 113.7880859375, 117.8125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 10.0, 1.0, 12.0, 16.0, 20.0, 38.0, 69.0, 127.0, 273.0, 871.0, 4185.0, 60504.0, 953561.0, 25124.0, 2670.0, 600.0, 221.0, 103.0, 67.0, 21.0, 20.0, 11.0, 13.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.875, -95.7236328125, -92.572265625, -89.4208984375, -86.26953125, -83.1181640625, -79.966796875, -76.8154296875, -73.6640625, -70.5126953125, -67.361328125, -64.2099609375, -61.05859375, -57.9072265625, -54.755859375, -51.6044921875, -48.453125, -45.3017578125, -42.150390625, -38.9990234375, -35.84765625, -32.6962890625, -29.544921875, -26.3935546875, -23.2421875, -20.0908203125, -16.939453125, -13.7880859375, -10.63671875, -7.4853515625, -4.333984375, -1.1826171875, 1.96875, 5.1201171875, 8.271484375, 11.4228515625, 14.57421875, 17.7255859375, 20.876953125, 24.0283203125, 27.1796875, 30.3310546875, 33.482421875, 36.6337890625, 39.78515625, 42.9365234375, 46.087890625, 49.2392578125, 52.390625, 55.5419921875, 58.693359375, 61.8447265625, 64.99609375, 68.1474609375, 71.298828125, 74.4501953125, 77.6015625, 80.7529296875, 83.904296875, 87.0556640625, 90.20703125, 93.3583984375, 96.509765625, 99.6611328125, 102.8125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 4.0, 11.0, 10.0, 16.0, 31.0, 21.0, 34.0, 34.0, 61.0, 85.0, 130.0, 126.0, 116.0, 96.0, 61.0, 51.0, 28.0, 22.0, 17.0, 14.0, 9.0, 1.0, 4.0, 2.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004779815673828125, -0.004592418670654297, -0.004405021667480469, -0.004217624664306641, -0.0040302276611328125, -0.0038428306579589844, -0.0036554336547851562, -0.003468036651611328, -0.0032806396484375, -0.003093242645263672, -0.0029058456420898438, -0.0027184486389160156, -0.0025310516357421875, -0.0023436546325683594, -0.0021562576293945312, -0.001968860626220703, -0.001781463623046875, -0.0015940666198730469, -0.0014066696166992188, -0.0012192726135253906, -0.0010318756103515625, -0.0008444786071777344, -0.0006570816040039062, -0.0004696846008300781, -0.00028228759765625, -9.489059448242188e-05, 9.250640869140625e-05, 0.0002799034118652344, 0.0004673004150390625, 0.0006546974182128906, 0.0008420944213867188, 0.0010294914245605469, 0.001216888427734375, 0.0014042854309082031, 0.0015916824340820312, 0.0017790794372558594, 0.0019664764404296875, 0.0021538734436035156, 0.0023412704467773438, 0.002528667449951172, 0.002716064453125, 0.002903461456298828, 0.0030908584594726562, 0.0032782554626464844, 0.0034656524658203125, 0.0036530494689941406, 0.0038404464721679688, 0.004027843475341797, 0.004215240478515625, 0.004402637481689453, 0.004590034484863281, 0.004777431488037109, 0.0049648284912109375, 0.005152225494384766, 0.005339622497558594, 0.005527019500732422, 0.00571441650390625, 0.005901813507080078, 0.006089210510253906, 0.006276607513427734, 0.0064640045166015625, 0.006651401519775391, 0.006838798522949219, 0.007026195526123047, 0.007213592529296875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 8.0, 4.0, 5.0, 17.0, 11.0, 27.0, 34.0, 74.0, 104.0, 183.0, 289.0, 537.0, 1066.0, 2083.0, 4998.0, 13404.0, 50723.0, 389636.0, 504601.0, 56355.0, 14427.0, 5298.0, 2249.0, 1054.0, 563.0, 312.0, 197.0, 108.0, 55.0, 38.0, 28.0, 19.0, 15.0, 8.0, 1.0, 5.0, 8.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.78125, -32.431640625, -31.08203125, -29.732421875, -28.3828125, -27.033203125, -25.68359375, -24.333984375, -22.984375, -21.634765625, -20.28515625, -18.935546875, -17.5859375, -16.236328125, -14.88671875, -13.537109375, -12.1875, -10.837890625, -9.48828125, -8.138671875, -6.7890625, -5.439453125, -4.08984375, -2.740234375, -1.390625, -0.041015625, 1.30859375, 2.658203125, 4.0078125, 5.357421875, 6.70703125, 8.056640625, 9.40625, 10.755859375, 12.10546875, 13.455078125, 14.8046875, 16.154296875, 17.50390625, 18.853515625, 20.203125, 21.552734375, 22.90234375, 24.251953125, 25.6015625, 26.951171875, 28.30078125, 29.650390625, 31.0, 32.349609375, 33.69921875, 35.048828125, 36.3984375, 37.748046875, 39.09765625, 40.447265625, 41.796875, 43.146484375, 44.49609375, 45.845703125, 47.1953125, 48.544921875, 49.89453125, 51.244140625, 52.59375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 3.0, 3.0, 7.0, 13.0, 16.0, 7.0, 27.0, 30.0, 50.0, 64.0, 70.0, 77.0, 103.0, 130.0, 93.0, 60.0, 55.0, 37.0, 28.0, 29.0, 20.0, 13.0, 9.0, 10.0, 9.0, 8.0, 8.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.71875, -35.36181640625, -34.0048828125, -32.64794921875, -31.291015625, -29.93408203125, -28.5771484375, -27.22021484375, -25.86328125, -24.50634765625, -23.1494140625, -21.79248046875, -20.435546875, -19.07861328125, -17.7216796875, -16.36474609375, -15.0078125, -13.65087890625, -12.2939453125, -10.93701171875, -9.580078125, -8.22314453125, -6.8662109375, -5.50927734375, -4.15234375, -2.79541015625, -1.4384765625, -0.08154296875, 1.275390625, 2.63232421875, 3.9892578125, 5.34619140625, 6.703125, 8.06005859375, 9.4169921875, 10.77392578125, 12.130859375, 13.48779296875, 14.8447265625, 16.20166015625, 17.55859375, 18.91552734375, 20.2724609375, 21.62939453125, 22.986328125, 24.34326171875, 25.7001953125, 27.05712890625, 28.4140625, 29.77099609375, 31.1279296875, 32.48486328125, 33.841796875, 35.19873046875, 36.5556640625, 37.91259765625, 39.26953125, 40.62646484375, 41.9833984375, 43.34033203125, 44.697265625, 46.05419921875, 47.4111328125, 48.76806640625, 50.125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 5.0, 6.0, 11.0, 20.0, 50.0, 74.0, 140.0, 235.0, 208.0, 115.0, 58.0, 37.0, 19.0, 10.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1132.560791015625, -1101.088134765625, -1069.6153564453125, -1038.1427001953125, -1006.6699829101562, -975.197265625, -943.7245483398438, -912.2518310546875, -880.7791748046875, -849.3064575195312, -817.833740234375, -786.361083984375, -754.8883666992188, -723.4156494140625, -691.9429321289062, -660.47021484375, -628.9974975585938, -597.5247802734375, -566.0520629882812, -534.579345703125, -503.106689453125, -471.63397216796875, -440.1612548828125, -408.68853759765625, -377.2158508300781, -345.7431335449219, -314.27044677734375, -282.7977294921875, -251.3250274658203, -219.85232543945312, -188.37960815429688, -156.9069061279297, -125.4342041015625, -93.96150207519531, -62.488792419433594, -31.016082763671875, 0.4566192626953125, 31.9293212890625, 63.40203857421875, 94.87474060058594, 126.34744262695312, 157.8201446533203, 189.2928466796875, 220.76556396484375, 252.23826599121094, 283.7109680175781, 315.1836853027344, 346.6563720703125, 378.12908935546875, 409.601806640625, 441.0744934082031, 472.5472106933594, 504.0198974609375, 535.4926147460938, 566.96533203125, 598.4380493164062, 629.9107666015625, 661.3834838867188, 692.856201171875, 724.328857421875, 755.8015747070312, 787.2742919921875, 818.7470092773438, 850.2197265625, 881.6923828125]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 8.0, 2.0, 12.0, 12.0, 6.0, 11.0, 11.0, 15.0, 24.0, 27.0, 32.0, 30.0, 42.0, 34.0, 24.0, 39.0, 53.0, 55.0, 64.0, 54.0, 61.0, 47.0, 37.0, 25.0, 46.0, 34.0, 32.0, 22.0, 30.0, 22.0, 11.0, 10.0, 15.0, 13.0, 5.0, 6.0, 9.0, 4.0, 2.0, 0.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-562.947998046875, -545.3240966796875, -527.7001953125, -510.0763244628906, -492.4524230957031, -474.8285217285156, -457.20465087890625, -439.58074951171875, -421.95684814453125, -404.33294677734375, -386.70904541015625, -369.0851745605469, -351.4612731933594, -333.8373718261719, -316.2135009765625, -298.589599609375, -280.9656982421875, -263.341796875, -245.71791076660156, -228.09402465820312, -210.47012329101562, -192.84622192382812, -175.2223358154297, -157.59844970703125, -139.97454833984375, -122.35065460205078, -104.72676086425781, -87.10286712646484, -69.47897338867188, -51.855079650878906, -34.23118591308594, -16.60729217529297, 1.01666259765625, 18.64055633544922, 36.26445007324219, 53.888343811035156, 71.51223754882812, 89.1361312866211, 106.76002502441406, 124.38391876220703, 142.0078125, 159.6317138671875, 177.25559997558594, 194.87948608398438, 212.50338745117188, 230.12728881835938, 247.7511749267578, 265.37506103515625, 282.99896240234375, 300.62286376953125, 318.24676513671875, 335.8706359863281, 353.4945373535156, 371.1184387207031, 388.7423095703125, 406.3662109375, 423.9901123046875, 441.614013671875, 459.2379150390625, 476.8617858886719, 494.4856872558594, 512.1095581054688, 529.7334594726562, 547.3573608398438, 564.9812622070312]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 6.0, 5.0, 12.0, 11.0, 20.0, 32.0, 42.0, 56.0, 86.0, 116.0, 174.0, 256.0, 347.0, 555.0, 897.0, 1374.0, 2575.0, 5270.0, 13257.0, 58151.0, 1085053.0, 2892872.0, 101551.0, 17461.0, 6436.0, 2975.0, 1693.0, 941.0, 661.0, 445.0, 270.0, 184.0, 133.0, 88.0, 78.0, 52.0, 32.0, 25.0, 34.0, 16.0, 19.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.5, -63.171875, -60.84375, -58.515625, -56.1875, -53.859375, -51.53125, -49.203125, -46.875, -44.546875, -42.21875, -39.890625, -37.5625, -35.234375, -32.90625, -30.578125, -28.25, -25.921875, -23.59375, -21.265625, -18.9375, -16.609375, -14.28125, -11.953125, -9.625, -7.296875, -4.96875, -2.640625, -0.3125, 2.015625, 4.34375, 6.671875, 9.0, 11.328125, 13.65625, 15.984375, 18.3125, 20.640625, 22.96875, 25.296875, 27.625, 29.953125, 32.28125, 34.609375, 36.9375, 39.265625, 41.59375, 43.921875, 46.25, 48.578125, 50.90625, 53.234375, 55.5625, 57.890625, 60.21875, 62.546875, 64.875, 67.203125, 69.53125, 71.859375, 74.1875, 76.515625, 78.84375, 81.171875, 83.5]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 3.0, 7.0, 4.0, 6.0, 12.0, 13.0, 14.0, 21.0, 28.0, 23.0, 24.0, 27.0, 34.0, 31.0, 35.0, 48.0, 48.0, 44.0, 55.0, 50.0, 71.0, 48.0, 58.0, 35.0, 43.0, 33.0, 36.0, 28.0, 25.0, 20.0, 20.0, 13.0, 15.0, 10.0, 8.0, 4.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.78125, -21.79736328125, -20.8134765625, -19.82958984375, -18.845703125, -17.86181640625, -16.8779296875, -15.89404296875, -14.91015625, -13.92626953125, -12.9423828125, -11.95849609375, -10.974609375, -9.99072265625, -9.0068359375, -8.02294921875, -7.0390625, -6.05517578125, -5.0712890625, -4.08740234375, -3.103515625, -2.11962890625, -1.1357421875, -0.15185546875, 0.83203125, 1.81591796875, 2.7998046875, 3.78369140625, 4.767578125, 5.75146484375, 6.7353515625, 7.71923828125, 8.703125, 9.68701171875, 10.6708984375, 11.65478515625, 12.638671875, 13.62255859375, 14.6064453125, 15.59033203125, 16.57421875, 17.55810546875, 18.5419921875, 19.52587890625, 20.509765625, 21.49365234375, 22.4775390625, 23.46142578125, 24.4453125, 25.42919921875, 26.4130859375, 27.39697265625, 28.380859375, 29.36474609375, 30.3486328125, 31.33251953125, 32.31640625, 33.30029296875, 34.2841796875, 35.26806640625, 36.251953125, 37.23583984375, 38.2197265625, 39.20361328125, 40.1875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 2.0, 2.0, 11.0, 4.0, 7.0, 7.0, 15.0, 36.0, 36.0, 61.0, 108.0, 146.0, 240.0, 413.0, 781.0, 1586.0, 3477.0, 8957.0, 29673.0, 289206.0, 3723167.0, 103311.0, 19353.0, 6902.0, 3078.0, 1518.0, 880.0, 466.0, 326.0, 171.0, 92.0, 69.0, 51.0, 38.0, 22.0, 12.0, 15.0, 13.0, 12.0, 8.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-105.0625, -101.7099609375, -98.357421875, -95.0048828125, -91.65234375, -88.2998046875, -84.947265625, -81.5947265625, -78.2421875, -74.8896484375, -71.537109375, -68.1845703125, -64.83203125, -61.4794921875, -58.126953125, -54.7744140625, -51.421875, -48.0693359375, -44.716796875, -41.3642578125, -38.01171875, -34.6591796875, -31.306640625, -27.9541015625, -24.6015625, -21.2490234375, -17.896484375, -14.5439453125, -11.19140625, -7.8388671875, -4.486328125, -1.1337890625, 2.21875, 5.5712890625, 8.923828125, 12.2763671875, 15.62890625, 18.9814453125, 22.333984375, 25.6865234375, 29.0390625, 32.3916015625, 35.744140625, 39.0966796875, 42.44921875, 45.8017578125, 49.154296875, 52.5068359375, 55.859375, 59.2119140625, 62.564453125, 65.9169921875, 69.26953125, 72.6220703125, 75.974609375, 79.3271484375, 82.6796875, 86.0322265625, 89.384765625, 92.7373046875, 96.08984375, 99.4423828125, 102.794921875, 106.1474609375, 109.5]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 6.0, 6.0, 8.0, 9.0, 18.0, 20.0, 31.0, 44.0, 83.0, 159.0, 342.0, 841.0, 1221.0, 659.0, 253.0, 121.0, 67.0, 45.0, 28.0, 22.0, 9.0, 10.0, 14.0, 8.0, 4.0, 5.0, 5.0, 2.0, 2.0, 4.0, 5.0, 1.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.4375, -70.5400390625, -67.642578125, -64.7451171875, -61.84765625, -58.9501953125, -56.052734375, -53.1552734375, -50.2578125, -47.3603515625, -44.462890625, -41.5654296875, -38.66796875, -35.7705078125, -32.873046875, -29.9755859375, -27.078125, -24.1806640625, -21.283203125, -18.3857421875, -15.48828125, -12.5908203125, -9.693359375, -6.7958984375, -3.8984375, -1.0009765625, 1.896484375, 4.7939453125, 7.69140625, 10.5888671875, 13.486328125, 16.3837890625, 19.28125, 22.1787109375, 25.076171875, 27.9736328125, 30.87109375, 33.7685546875, 36.666015625, 39.5634765625, 42.4609375, 45.3583984375, 48.255859375, 51.1533203125, 54.05078125, 56.9482421875, 59.845703125, 62.7431640625, 65.640625, 68.5380859375, 71.435546875, 74.3330078125, 77.23046875, 80.1279296875, 83.025390625, 85.9228515625, 88.8203125, 91.7177734375, 94.615234375, 97.5126953125, 100.41015625, 103.3076171875, 106.205078125, 109.1025390625, 112.0]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 9.0, 18.0, 32.0, 79.0, 165.0, 257.0, 243.0, 84.0, 47.0, 27.0, 15.0, 10.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-639.6728515625, -603.2737426757812, -566.8746337890625, -530.4755859375, -494.07647705078125, -457.6773681640625, -421.2782897949219, -384.87921142578125, -348.4801025390625, -312.08099365234375, -275.6819152832031, -239.28282165527344, -202.88372802734375, -166.48463439941406, -130.08554077148438, -93.68644714355469, -57.287353515625, -20.888259887695312, 15.510833740234375, 51.90992736816406, 88.30902099609375, 124.70811462402344, 161.10720825195312, 197.5063018798828, 233.9053955078125, 270.30450439453125, 306.7035827636719, 343.1026611328125, 379.50177001953125, 415.90087890625, 452.2999572753906, 488.69903564453125, 525.0980224609375, 561.4971313476562, 597.896240234375, 634.2952880859375, 670.6943969726562, 707.093505859375, 743.4925537109375, 779.8916625976562, 816.290771484375, 852.6898803710938, 889.0889892578125, 925.488037109375, 961.8871459960938, 998.2862548828125, 1034.685302734375, 1071.08447265625, 1107.4835205078125, 1143.882568359375, 1180.28173828125, 1216.6807861328125, 1253.079833984375, 1289.47900390625, 1325.8780517578125, 1362.2772216796875, 1398.67626953125, 1435.0753173828125, 1471.4744873046875, 1507.87353515625, 1544.272705078125, 1580.6717529296875, 1617.07080078125, 1653.469970703125, 1689.8690185546875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 4.0, 7.0, 14.0, 6.0, 11.0, 13.0, 12.0, 22.0, 28.0, 18.0, 32.0, 28.0, 23.0, 34.0, 37.0, 50.0, 47.0, 53.0, 43.0, 58.0, 55.0, 42.0, 45.0, 47.0, 33.0, 39.0, 36.0, 26.0, 26.0, 23.0, 15.0, 17.0, 14.0, 9.0, 13.0, 3.0, 6.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-446.34442138671875, -434.5840148925781, -422.8236083984375, -411.0632019042969, -399.30279541015625, -387.5423889160156, -375.781982421875, -364.0215759277344, -352.26116943359375, -340.5007629394531, -328.7403564453125, -316.9799499511719, -305.21954345703125, -293.4591369628906, -281.69873046875, -269.9383239746094, -258.17791748046875, -246.41751098632812, -234.6571044921875, -222.89669799804688, -211.13629150390625, -199.37588500976562, -187.615478515625, -175.85507202148438, -164.09466552734375, -152.33425903320312, -140.5738525390625, -128.81344604492188, -117.05303955078125, -105.29263305664062, -93.5322265625, -81.77182006835938, -70.01138305664062, -58.2509765625, -46.490570068359375, -34.73016357421875, -22.969757080078125, -11.2093505859375, 0.551055908203125, 12.31146240234375, 24.071868896484375, 35.832275390625, 47.592681884765625, 59.35308837890625, 71.11349487304688, 82.8739013671875, 94.63430786132812, 106.39471435546875, 118.15512084960938, 129.91552734375, 141.67593383789062, 153.43634033203125, 165.19674682617188, 176.9571533203125, 188.71755981445312, 200.47796630859375, 212.23837280273438, 223.998779296875, 235.75918579101562, 247.51959228515625, 259.2799987792969, 271.0404052734375, 282.8008117675781, 294.56121826171875, 306.3216247558594]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 14.0, 35.0, 43.0, 38.0, 96.0, 117.0, 199.0, 286.0, 408.0, 648.0, 1053.0, 1492.0, 2299.0, 3639.0, 5891.0, 9314.0, 15588.0, 25892.0, 44546.0, 77623.0, 137745.0, 224707.0, 206937.0, 121366.0, 68879.0, 39436.0, 23199.0, 13975.0, 8468.0, 5315.0, 3295.0, 2027.0, 1339.0, 867.0, 621.0, 369.0, 268.0, 176.0, 104.0, 74.0, 52.0, 29.0, 23.0, 20.0, 13.0, 10.0, 2.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-29.59375, -28.665771484375, -27.73779296875, -26.809814453125, -25.8818359375, -24.953857421875, -24.02587890625, -23.097900390625, -22.169921875, -21.241943359375, -20.31396484375, -19.385986328125, -18.4580078125, -17.530029296875, -16.60205078125, -15.674072265625, -14.74609375, -13.818115234375, -12.89013671875, -11.962158203125, -11.0341796875, -10.106201171875, -9.17822265625, -8.250244140625, -7.322265625, -6.394287109375, -5.46630859375, -4.538330078125, -3.6103515625, -2.682373046875, -1.75439453125, -0.826416015625, 0.1015625, 1.029541015625, 1.95751953125, 2.885498046875, 3.8134765625, 4.741455078125, 5.66943359375, 6.597412109375, 7.525390625, 8.453369140625, 9.38134765625, 10.309326171875, 11.2373046875, 12.165283203125, 13.09326171875, 14.021240234375, 14.94921875, 15.877197265625, 16.80517578125, 17.733154296875, 18.6611328125, 19.589111328125, 20.51708984375, 21.445068359375, 22.373046875, 23.301025390625, 24.22900390625, 25.156982421875, 26.0849609375, 27.012939453125, 27.94091796875, 28.868896484375, 29.796875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 4.0, 5.0, 5.0, 4.0, 6.0, 5.0, 5.0, 9.0, 13.0, 22.0, 18.0, 15.0, 16.0, 21.0, 16.0, 25.0, 27.0, 25.0, 31.0, 34.0, 32.0, 41.0, 38.0, 32.0, 46.0, 49.0, 28.0, 41.0, 44.0, 34.0, 35.0, 23.0, 32.0, 28.0, 39.0, 27.0, 19.0, 13.0, 17.0, 11.0, 11.0, 11.0, 11.0, 7.0, 5.0, 4.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-23.390625, -22.658203125, -21.92578125, -21.193359375, -20.4609375, -19.728515625, -18.99609375, -18.263671875, -17.53125, -16.798828125, -16.06640625, -15.333984375, -14.6015625, -13.869140625, -13.13671875, -12.404296875, -11.671875, -10.939453125, -10.20703125, -9.474609375, -8.7421875, -8.009765625, -7.27734375, -6.544921875, -5.8125, -5.080078125, -4.34765625, -3.615234375, -2.8828125, -2.150390625, -1.41796875, -0.685546875, 0.046875, 0.779296875, 1.51171875, 2.244140625, 2.9765625, 3.708984375, 4.44140625, 5.173828125, 5.90625, 6.638671875, 7.37109375, 8.103515625, 8.8359375, 9.568359375, 10.30078125, 11.033203125, 11.765625, 12.498046875, 13.23046875, 13.962890625, 14.6953125, 15.427734375, 16.16015625, 16.892578125, 17.625, 18.357421875, 19.08984375, 19.822265625, 20.5546875, 21.287109375, 22.01953125, 22.751953125, 23.484375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 15.0, 20.0, 24.0, 37.0, 45.0, 82.0, 117.0, 174.0, 281.0, 439.0, 816.0, 1648.0, 4004.0, 15071.0, 105223.0, 786578.0, 110573.0, 15667.0, 4029.0, 1583.0, 819.0, 481.0, 276.0, 178.0, 135.0, 76.0, 50.0, 29.0, 28.0, 16.0, 16.0, 7.0, 1.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.625, -123.69921875, -119.7734375, -115.84765625, -111.921875, -107.99609375, -104.0703125, -100.14453125, -96.21875, -92.29296875, -88.3671875, -84.44140625, -80.515625, -76.58984375, -72.6640625, -68.73828125, -64.8125, -60.88671875, -56.9609375, -53.03515625, -49.109375, -45.18359375, -41.2578125, -37.33203125, -33.40625, -29.48046875, -25.5546875, -21.62890625, -17.703125, -13.77734375, -9.8515625, -5.92578125, -2.0, 1.92578125, 5.8515625, 9.77734375, 13.703125, 17.62890625, 21.5546875, 25.48046875, 29.40625, 33.33203125, 37.2578125, 41.18359375, 45.109375, 49.03515625, 52.9609375, 56.88671875, 60.8125, 64.73828125, 68.6640625, 72.58984375, 76.515625, 80.44140625, 84.3671875, 88.29296875, 92.21875, 96.14453125, 100.0703125, 103.99609375, 107.921875, 111.84765625, 115.7734375, 119.69921875, 123.625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 5.0, 13.0, 5.0, 9.0, 9.0, 12.0, 16.0, 9.0, 22.0, 22.0, 12.0, 34.0, 30.0, 30.0, 43.0, 42.0, 49.0, 41.0, 45.0, 48.0, 40.0, 47.0, 45.0, 46.0, 45.0, 34.0, 33.0, 29.0, 20.0, 26.0, 19.0, 18.0, 22.0, 19.0, 14.0, 13.0, 6.0, 5.0, 6.0, 4.0, 6.0, 0.0, 0.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-114.4375, -110.763671875, -107.08984375, -103.416015625, -99.7421875, -96.068359375, -92.39453125, -88.720703125, -85.046875, -81.373046875, -77.69921875, -74.025390625, -70.3515625, -66.677734375, -63.00390625, -59.330078125, -55.65625, -51.982421875, -48.30859375, -44.634765625, -40.9609375, -37.287109375, -33.61328125, -29.939453125, -26.265625, -22.591796875, -18.91796875, -15.244140625, -11.5703125, -7.896484375, -4.22265625, -0.548828125, 3.125, 6.798828125, 10.47265625, 14.146484375, 17.8203125, 21.494140625, 25.16796875, 28.841796875, 32.515625, 36.189453125, 39.86328125, 43.537109375, 47.2109375, 50.884765625, 54.55859375, 58.232421875, 61.90625, 65.580078125, 69.25390625, 72.927734375, 76.6015625, 80.275390625, 83.94921875, 87.623046875, 91.296875, 94.970703125, 98.64453125, 102.318359375, 105.9921875, 109.666015625, 113.33984375, 117.013671875, 120.6875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 5.0, 13.0, 15.0, 17.0, 16.0, 32.0, 26.0, 40.0, 33.0, 71.0, 88.0, 139.0, 171.0, 275.0, 465.0, 800.0, 1523.0, 3404.0, 10577.0, 53150.0, 577252.0, 342667.0, 42225.0, 8834.0, 3151.0, 1470.0, 780.0, 433.0, 251.0, 173.0, 110.0, 85.0, 65.0, 44.0, 28.0, 13.0, 33.0, 16.0, 18.0, 11.0, 6.0, 8.0, 5.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-27.40625, -26.548095703125, -25.68994140625, -24.831787109375, -23.9736328125, -23.115478515625, -22.25732421875, -21.399169921875, -20.541015625, -19.682861328125, -18.82470703125, -17.966552734375, -17.1083984375, -16.250244140625, -15.39208984375, -14.533935546875, -13.67578125, -12.817626953125, -11.95947265625, -11.101318359375, -10.2431640625, -9.385009765625, -8.52685546875, -7.668701171875, -6.810546875, -5.952392578125, -5.09423828125, -4.236083984375, -3.3779296875, -2.519775390625, -1.66162109375, -0.803466796875, 0.0546875, 0.912841796875, 1.77099609375, 2.629150390625, 3.4873046875, 4.345458984375, 5.20361328125, 6.061767578125, 6.919921875, 7.778076171875, 8.63623046875, 9.494384765625, 10.3525390625, 11.210693359375, 12.06884765625, 12.927001953125, 13.78515625, 14.643310546875, 15.50146484375, 16.359619140625, 17.2177734375, 18.075927734375, 18.93408203125, 19.792236328125, 20.650390625, 21.508544921875, 22.36669921875, 23.224853515625, 24.0830078125, 24.941162109375, 25.79931640625, 26.657470703125, 27.515625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 8.0, 6.0, 4.0, 4.0, 11.0, 9.0, 7.0, 16.0, 21.0, 29.0, 41.0, 47.0, 49.0, 67.0, 68.0, 114.0, 102.0, 97.0, 74.0, 43.0, 37.0, 31.0, 21.0, 22.0, 16.0, 12.0, 12.0, 11.0, 3.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004245758056640625, -0.0041165947914123535, -0.003987431526184082, -0.0038582682609558105, -0.003729104995727539, -0.0035999417304992676, -0.003470778465270996, -0.0033416152000427246, -0.003212451934814453, -0.0030832886695861816, -0.00295412540435791, -0.0028249621391296387, -0.002695798873901367, -0.0025666356086730957, -0.0024374723434448242, -0.0023083090782165527, -0.0021791458129882812, -0.0020499825477600098, -0.0019208192825317383, -0.0017916560173034668, -0.0016624927520751953, -0.0015333294868469238, -0.0014041662216186523, -0.0012750029563903809, -0.0011458396911621094, -0.0010166764259338379, -0.0008875131607055664, -0.0007583498954772949, -0.0006291866302490234, -0.000500023365020752, -0.00037086009979248047, -0.00024169683456420898, -0.0001125335693359375, 1.6629695892333984e-05, 0.00014579296112060547, 0.00027495622634887695, 0.00040411949157714844, 0.0005332827568054199, 0.0006624460220336914, 0.0007916092872619629, 0.0009207725524902344, 0.0010499358177185059, 0.0011790990829467773, 0.0013082623481750488, 0.0014374256134033203, 0.0015665888786315918, 0.0016957521438598633, 0.0018249154090881348, 0.0019540786743164062, 0.0020832419395446777, 0.0022124052047729492, 0.0023415684700012207, 0.002470731735229492, 0.0025998950004577637, 0.002729058265686035, 0.0028582215309143066, 0.002987384796142578, 0.0031165480613708496, 0.003245711326599121, 0.0033748745918273926, 0.003504037857055664, 0.0036332011222839355, 0.003762364387512207, 0.0038915276527404785, 0.00402069091796875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 9.0, 12.0, 18.0, 12.0, 27.0, 30.0, 58.0, 69.0, 115.0, 143.0, 246.0, 436.0, 671.0, 1296.0, 2528.0, 5851.0, 15299.0, 55037.0, 386637.0, 494849.0, 57591.0, 15701.0, 6030.0, 2610.0, 1349.0, 773.0, 391.0, 246.0, 153.0, 106.0, 64.0, 42.0, 43.0, 16.0, 18.0, 11.0, 17.0, 11.0, 5.0, 7.0, 9.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-33.34375, -32.30224609375, -31.2607421875, -30.21923828125, -29.177734375, -28.13623046875, -27.0947265625, -26.05322265625, -25.01171875, -23.97021484375, -22.9287109375, -21.88720703125, -20.845703125, -19.80419921875, -18.7626953125, -17.72119140625, -16.6796875, -15.63818359375, -14.5966796875, -13.55517578125, -12.513671875, -11.47216796875, -10.4306640625, -9.38916015625, -8.34765625, -7.30615234375, -6.2646484375, -5.22314453125, -4.181640625, -3.14013671875, -2.0986328125, -1.05712890625, -0.015625, 1.02587890625, 2.0673828125, 3.10888671875, 4.150390625, 5.19189453125, 6.2333984375, 7.27490234375, 8.31640625, 9.35791015625, 10.3994140625, 11.44091796875, 12.482421875, 13.52392578125, 14.5654296875, 15.60693359375, 16.6484375, 17.68994140625, 18.7314453125, 19.77294921875, 20.814453125, 21.85595703125, 22.8974609375, 23.93896484375, 24.98046875, 26.02197265625, 27.0634765625, 28.10498046875, 29.146484375, 30.18798828125, 31.2294921875, 32.27099609375, 33.3125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 7.0, 6.0, 8.0, 6.0, 10.0, 9.0, 8.0, 19.0, 27.0, 35.0, 38.0, 39.0, 57.0, 63.0, 88.0, 75.0, 76.0, 93.0, 57.0, 57.0, 33.0, 34.0, 36.0, 22.0, 22.0, 14.0, 12.0, 13.0, 6.0, 9.0, 3.0, 6.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-34.84375, -33.919677734375, -32.99560546875, -32.071533203125, -31.1474609375, -30.223388671875, -29.29931640625, -28.375244140625, -27.451171875, -26.527099609375, -25.60302734375, -24.678955078125, -23.7548828125, -22.830810546875, -21.90673828125, -20.982666015625, -20.05859375, -19.134521484375, -18.21044921875, -17.286376953125, -16.3623046875, -15.438232421875, -14.51416015625, -13.590087890625, -12.666015625, -11.741943359375, -10.81787109375, -9.893798828125, -8.9697265625, -8.045654296875, -7.12158203125, -6.197509765625, -5.2734375, -4.349365234375, -3.42529296875, -2.501220703125, -1.5771484375, -0.653076171875, 0.27099609375, 1.195068359375, 2.119140625, 3.043212890625, 3.96728515625, 4.891357421875, 5.8154296875, 6.739501953125, 7.66357421875, 8.587646484375, 9.51171875, 10.435791015625, 11.35986328125, 12.283935546875, 13.2080078125, 14.132080078125, 15.05615234375, 15.980224609375, 16.904296875, 17.828369140625, 18.75244140625, 19.676513671875, 20.6005859375, 21.524658203125, 22.44873046875, 23.372802734375, 24.296875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 7.0, 6.0, 12.0, 26.0, 36.0, 87.0, 163.0, 265.0, 183.0, 100.0, 50.0, 31.0, 14.0, 10.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-624.7486572265625, -597.037109375, -569.3255615234375, -541.6140747070312, -513.9025268554688, -486.19097900390625, -458.4794616699219, -430.7679443359375, -403.056396484375, -375.3448486328125, -347.6333312988281, -319.92181396484375, -292.21026611328125, -264.49871826171875, -236.78720092773438, -209.07566833496094, -181.3641357421875, -153.65260314941406, -125.94107055664062, -98.22953796386719, -70.51800537109375, -42.80647277832031, -15.094940185546875, 12.616592407226562, 40.328125, 68.03965759277344, 95.75119018554688, 123.46272277832031, 151.17425537109375, 178.8857879638672, 206.59732055664062, 234.30885314941406, 262.0203857421875, 289.73193359375, 317.4434509277344, 345.15496826171875, 372.86651611328125, 400.57806396484375, 428.2895812988281, 456.0010986328125, 483.712646484375, 511.4241943359375, 539.1357421875, 566.8472290039062, 594.5587768554688, 622.2703247070312, 649.9818115234375, 677.693359375, 705.4049072265625, 733.116455078125, 760.8280029296875, 788.5394897460938, 816.2510375976562, 843.9625854492188, 871.674072265625, 899.3856201171875, 927.09716796875, 954.8087158203125, 982.520263671875, 1010.2317504882812, 1037.943359375, 1065.65478515625, 1093.3663330078125, 1121.077880859375, 1148.7894287109375]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 8.0, 14.0, 7.0, 12.0, 12.0, 9.0, 25.0, 17.0, 21.0, 25.0, 24.0, 30.0, 29.0, 31.0, 28.0, 36.0, 57.0, 49.0, 58.0, 61.0, 49.0, 50.0, 44.0, 35.0, 32.0, 20.0, 20.0, 25.0, 23.0, 17.0, 18.0, 18.0, 13.0, 11.0, 17.0, 12.0, 9.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-385.46905517578125, -372.6074523925781, -359.7458190917969, -346.88421630859375, -334.0226135253906, -321.1609802246094, -308.29937744140625, -295.437744140625, -282.5761413574219, -269.71453857421875, -256.8529052734375, -243.99130249023438, -231.1296844482422, -218.26806640625, -205.40646362304688, -192.5448455810547, -179.68324279785156, -166.82162475585938, -153.96002197265625, -141.09840393066406, -128.23678588867188, -115.37517547607422, -102.51356506347656, -89.65194702148438, -76.79033660888672, -63.9287223815918, -51.067108154296875, -38.20549774169922, -25.343883514404297, -12.482269287109375, 0.37934112548828125, 13.240959167480469, 26.102569580078125, 38.96418380737305, 51.82579803466797, 64.68740844726562, 77.54902648925781, 90.41063690185547, 103.27224731445312, 116.13386535644531, 128.9954833984375, 141.8571014404297, 154.7187042236328, 167.580322265625, 180.4419403076172, 193.30355834960938, 206.1651611328125, 219.0267791748047, 231.8883819580078, 244.75, 257.6116027832031, 270.47320556640625, 283.3348388671875, 296.1964416503906, 309.05804443359375, 321.919677734375, 334.7812805175781, 347.64288330078125, 360.5045166015625, 373.3661193847656, 386.22772216796875, 399.08935546875, 411.9509582519531, 424.81256103515625, 437.6741943359375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 5.0, 8.0, 12.0, 11.0, 17.0, 33.0, 57.0, 56.0, 109.0, 123.0, 155.0, 233.0, 298.0, 471.0, 682.0, 1021.0, 1734.0, 2946.0, 5850.0, 13665.0, 41096.0, 220405.0, 2771472.0, 992530.0, 98100.0, 23827.0, 8881.0, 4079.0, 2212.0, 1331.0, 871.0, 577.0, 395.0, 265.0, 190.0, 144.0, 115.0, 74.0, 71.0, 40.0, 29.0, 26.0, 21.0, 9.0, 18.0, 5.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-40.03125, -38.77197265625, -37.5126953125, -36.25341796875, -34.994140625, -33.73486328125, -32.4755859375, -31.21630859375, -29.95703125, -28.69775390625, -27.4384765625, -26.17919921875, -24.919921875, -23.66064453125, -22.4013671875, -21.14208984375, -19.8828125, -18.62353515625, -17.3642578125, -16.10498046875, -14.845703125, -13.58642578125, -12.3271484375, -11.06787109375, -9.80859375, -8.54931640625, -7.2900390625, -6.03076171875, -4.771484375, -3.51220703125, -2.2529296875, -0.99365234375, 0.265625, 1.52490234375, 2.7841796875, 4.04345703125, 5.302734375, 6.56201171875, 7.8212890625, 9.08056640625, 10.33984375, 11.59912109375, 12.8583984375, 14.11767578125, 15.376953125, 16.63623046875, 17.8955078125, 19.15478515625, 20.4140625, 21.67333984375, 22.9326171875, 24.19189453125, 25.451171875, 26.71044921875, 27.9697265625, 29.22900390625, 30.48828125, 31.74755859375, 33.0068359375, 34.26611328125, 35.525390625, 36.78466796875, 38.0439453125, 39.30322265625, 40.5625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 2.0, 8.0, 4.0, 14.0, 5.0, 9.0, 16.0, 20.0, 15.0, 24.0, 32.0, 30.0, 34.0, 32.0, 32.0, 42.0, 43.0, 42.0, 61.0, 49.0, 62.0, 41.0, 50.0, 26.0, 32.0, 43.0, 29.0, 37.0, 30.0, 28.0, 16.0, 18.0, 15.0, 16.0, 11.0, 10.0, 7.0, 5.0, 5.0, 2.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-27.28125, -26.4248046875, -25.568359375, -24.7119140625, -23.85546875, -22.9990234375, -22.142578125, -21.2861328125, -20.4296875, -19.5732421875, -18.716796875, -17.8603515625, -17.00390625, -16.1474609375, -15.291015625, -14.4345703125, -13.578125, -12.7216796875, -11.865234375, -11.0087890625, -10.15234375, -9.2958984375, -8.439453125, -7.5830078125, -6.7265625, -5.8701171875, -5.013671875, -4.1572265625, -3.30078125, -2.4443359375, -1.587890625, -0.7314453125, 0.125, 0.9814453125, 1.837890625, 2.6943359375, 3.55078125, 4.4072265625, 5.263671875, 6.1201171875, 6.9765625, 7.8330078125, 8.689453125, 9.5458984375, 10.40234375, 11.2587890625, 12.115234375, 12.9716796875, 13.828125, 14.6845703125, 15.541015625, 16.3974609375, 17.25390625, 18.1103515625, 18.966796875, 19.8232421875, 20.6796875, 21.5361328125, 22.392578125, 23.2490234375, 24.10546875, 24.9619140625, 25.818359375, 26.6748046875, 27.53125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 6.0, 14.0, 14.0, 17.0, 34.0, 49.0, 78.0, 110.0, 187.0, 340.0, 603.0, 1196.0, 2485.0, 6600.0, 25693.0, 370522.0, 3704087.0, 63269.0, 11418.0, 3758.0, 1652.0, 857.0, 442.0, 268.0, 160.0, 121.0, 65.0, 58.0, 42.0, 31.0, 30.0, 18.0, 17.0, 10.0, 8.0, 1.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.5, -89.3369140625, -86.173828125, -83.0107421875, -79.84765625, -76.6845703125, -73.521484375, -70.3583984375, -67.1953125, -64.0322265625, -60.869140625, -57.7060546875, -54.54296875, -51.3798828125, -48.216796875, -45.0537109375, -41.890625, -38.7275390625, -35.564453125, -32.4013671875, -29.23828125, -26.0751953125, -22.912109375, -19.7490234375, -16.5859375, -13.4228515625, -10.259765625, -7.0966796875, -3.93359375, -0.7705078125, 2.392578125, 5.5556640625, 8.71875, 11.8818359375, 15.044921875, 18.2080078125, 21.37109375, 24.5341796875, 27.697265625, 30.8603515625, 34.0234375, 37.1865234375, 40.349609375, 43.5126953125, 46.67578125, 49.8388671875, 53.001953125, 56.1650390625, 59.328125, 62.4912109375, 65.654296875, 68.8173828125, 71.98046875, 75.1435546875, 78.306640625, 81.4697265625, 84.6328125, 87.7958984375, 90.958984375, 94.1220703125, 97.28515625, 100.4482421875, 103.611328125, 106.7744140625, 109.9375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 7.0, 13.0, 16.0, 18.0, 26.0, 49.0, 75.0, 191.0, 634.0, 1613.0, 913.0, 279.0, 95.0, 54.0, 21.0, 23.0, 17.0, 6.0, 4.0, 3.0, 6.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.875, -62.68359375, -59.4921875, -56.30078125, -53.109375, -49.91796875, -46.7265625, -43.53515625, -40.34375, -37.15234375, -33.9609375, -30.76953125, -27.578125, -24.38671875, -21.1953125, -18.00390625, -14.8125, -11.62109375, -8.4296875, -5.23828125, -2.046875, 1.14453125, 4.3359375, 7.52734375, 10.71875, 13.91015625, 17.1015625, 20.29296875, 23.484375, 26.67578125, 29.8671875, 33.05859375, 36.25, 39.44140625, 42.6328125, 45.82421875, 49.015625, 52.20703125, 55.3984375, 58.58984375, 61.78125, 64.97265625, 68.1640625, 71.35546875, 74.546875, 77.73828125, 80.9296875, 84.12109375, 87.3125, 90.50390625, 93.6953125, 96.88671875, 100.078125, 103.26953125, 106.4609375, 109.65234375, 112.84375, 116.03515625, 119.2265625, 122.41796875, 125.609375, 128.80078125, 131.9921875, 135.18359375, 138.375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 17.0, 30.0, 62.0, 110.0, 179.0, 228.0, 166.0, 108.0, 35.0, 15.0, 12.0, 10.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-683.08544921875, -661.9652099609375, -640.8450317382812, -619.7247924804688, -598.6045532226562, -577.484375, -556.3641357421875, -535.243896484375, -514.1237182617188, -493.0035095214844, -471.8832702636719, -450.7630615234375, -429.6428527832031, -408.52264404296875, -387.40240478515625, -366.2821960449219, -345.1619567871094, -324.041748046875, -302.9215087890625, -281.8013000488281, -260.68109130859375, -239.5608673095703, -218.44064331054688, -197.3204345703125, -176.20021057128906, -155.07998657226562, -133.95977783203125, -112.83955383300781, -91.7193374633789, -70.59912109375, -49.47889709472656, -28.358688354492188, -7.23846435546875, 13.881753921508789, 35.00197219848633, 56.1221923828125, 77.2424087524414, 98.36262512207031, 119.48284912109375, 140.60305786132812, 161.72328186035156, 182.843505859375, 203.96371459960938, 225.0839385986328, 246.20416259765625, 267.3243713378906, 288.444580078125, 309.5648193359375, 330.6850280761719, 351.80523681640625, 372.92547607421875, 394.0456848144531, 415.1658935546875, 436.2861328125, 457.4063415527344, 478.52655029296875, 499.64678955078125, 520.7670288085938, 541.88720703125, 563.0074462890625, 584.127685546875, 605.2478637695312, 626.3681030273438, 647.48828125, 668.6085205078125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 6.0, 9.0, 8.0, 14.0, 12.0, 25.0, 18.0, 21.0, 35.0, 33.0, 36.0, 62.0, 42.0, 60.0, 52.0, 47.0, 58.0, 64.0, 62.0, 55.0, 45.0, 49.0, 25.0, 30.0, 25.0, 19.0, 19.0, 21.0, 9.0, 8.0, 9.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-270.9271545410156, -261.7055358886719, -252.48391723632812, -243.2622833251953, -234.04066467285156, -224.8190460205078, -215.597412109375, -206.37579345703125, -197.1541748046875, -187.93255615234375, -178.7109375, -169.4893035888672, -160.26768493652344, -151.0460662841797, -141.82443237304688, -132.60281372070312, -123.38119506835938, -114.15957641601562, -104.93795013427734, -95.71632385253906, -86.49470520019531, -77.27308654785156, -68.05146026611328, -58.829833984375, -49.60821533203125, -40.386592864990234, -31.16497039794922, -21.943347930908203, -12.721725463867188, -3.500102996826172, 5.721519470214844, 14.943145751953125, 24.164794921875, 33.386417388916016, 42.60803985595703, 51.82966232299805, 61.05128479003906, 70.27290344238281, 79.4945297241211, 88.71615600585938, 97.93777465820312, 107.15939331054688, 116.38101959228516, 125.60264587402344, 134.8242645263672, 144.04588317871094, 153.26751708984375, 162.4891357421875, 171.71075439453125, 180.932373046875, 190.15399169921875, 199.37562561035156, 208.5972442626953, 217.81886291503906, 227.04049682617188, 236.26211547851562, 245.48373413085938, 254.70535278320312, 263.9269714355469, 273.1485900878906, 282.3702392578125, 291.59185791015625, 300.8134765625, 310.03509521484375, 319.2567138671875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 8.0, 5.0, 21.0, 32.0, 38.0, 69.0, 90.0, 154.0, 181.0, 303.0, 481.0, 739.0, 1082.0, 1831.0, 2909.0, 4961.0, 8204.0, 14095.0, 25842.0, 48182.0, 93186.0, 182765.0, 280958.0, 181379.0, 92618.0, 47889.0, 25588.0, 14074.0, 8182.0, 4751.0, 2908.0, 1755.0, 1143.0, 714.0, 507.0, 319.0, 194.0, 126.0, 92.0, 51.0, 36.0, 23.0, 24.0, 19.0, 14.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-37.84375, -36.7138671875, -35.583984375, -34.4541015625, -33.32421875, -32.1943359375, -31.064453125, -29.9345703125, -28.8046875, -27.6748046875, -26.544921875, -25.4150390625, -24.28515625, -23.1552734375, -22.025390625, -20.8955078125, -19.765625, -18.6357421875, -17.505859375, -16.3759765625, -15.24609375, -14.1162109375, -12.986328125, -11.8564453125, -10.7265625, -9.5966796875, -8.466796875, -7.3369140625, -6.20703125, -5.0771484375, -3.947265625, -2.8173828125, -1.6875, -0.5576171875, 0.572265625, 1.7021484375, 2.83203125, 3.9619140625, 5.091796875, 6.2216796875, 7.3515625, 8.4814453125, 9.611328125, 10.7412109375, 11.87109375, 13.0009765625, 14.130859375, 15.2607421875, 16.390625, 17.5205078125, 18.650390625, 19.7802734375, 20.91015625, 22.0400390625, 23.169921875, 24.2998046875, 25.4296875, 26.5595703125, 27.689453125, 28.8193359375, 29.94921875, 31.0791015625, 32.208984375, 33.3388671875, 34.46875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 6.0, 5.0, 10.0, 16.0, 27.0, 26.0, 29.0, 24.0, 32.0, 40.0, 45.0, 55.0, 44.0, 56.0, 47.0, 65.0, 59.0, 69.0, 45.0, 34.0, 43.0, 37.0, 37.0, 20.0, 32.0, 15.0, 19.0, 9.0, 17.0, 12.0, 6.0, 5.0, 8.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.46875, -31.498779296875, -30.52880859375, -29.558837890625, -28.5888671875, -27.618896484375, -26.64892578125, -25.678955078125, -24.708984375, -23.739013671875, -22.76904296875, -21.799072265625, -20.8291015625, -19.859130859375, -18.88916015625, -17.919189453125, -16.94921875, -15.979248046875, -15.00927734375, -14.039306640625, -13.0693359375, -12.099365234375, -11.12939453125, -10.159423828125, -9.189453125, -8.219482421875, -7.24951171875, -6.279541015625, -5.3095703125, -4.339599609375, -3.36962890625, -2.399658203125, -1.4296875, -0.459716796875, 0.51025390625, 1.480224609375, 2.4501953125, 3.420166015625, 4.39013671875, 5.360107421875, 6.330078125, 7.300048828125, 8.27001953125, 9.239990234375, 10.2099609375, 11.179931640625, 12.14990234375, 13.119873046875, 14.08984375, 15.059814453125, 16.02978515625, 16.999755859375, 17.9697265625, 18.939697265625, 19.90966796875, 20.879638671875, 21.849609375, 22.819580078125, 23.78955078125, 24.759521484375, 25.7294921875, 26.699462890625, 27.66943359375, 28.639404296875, 29.609375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 8.0, 5.0, 9.0, 16.0, 16.0, 23.0, 20.0, 48.0, 80.0, 107.0, 197.0, 378.0, 769.0, 1849.0, 6426.0, 39195.0, 695370.0, 275005.0, 21900.0, 4310.0, 1441.0, 613.0, 293.0, 169.0, 97.0, 64.0, 43.0, 31.0, 17.0, 13.0, 11.0, 15.0, 7.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-135.375, -130.841796875, -126.30859375, -121.775390625, -117.2421875, -112.708984375, -108.17578125, -103.642578125, -99.109375, -94.576171875, -90.04296875, -85.509765625, -80.9765625, -76.443359375, -71.91015625, -67.376953125, -62.84375, -58.310546875, -53.77734375, -49.244140625, -44.7109375, -40.177734375, -35.64453125, -31.111328125, -26.578125, -22.044921875, -17.51171875, -12.978515625, -8.4453125, -3.912109375, 0.62109375, 5.154296875, 9.6875, 14.220703125, 18.75390625, 23.287109375, 27.8203125, 32.353515625, 36.88671875, 41.419921875, 45.953125, 50.486328125, 55.01953125, 59.552734375, 64.0859375, 68.619140625, 73.15234375, 77.685546875, 82.21875, 86.751953125, 91.28515625, 95.818359375, 100.3515625, 104.884765625, 109.41796875, 113.951171875, 118.484375, 123.017578125, 127.55078125, 132.083984375, 136.6171875, 141.150390625, 145.68359375, 150.216796875, 154.75]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 5.0, 11.0, 6.0, 9.0, 22.0, 20.0, 24.0, 31.0, 35.0, 42.0, 48.0, 44.0, 53.0, 51.0, 56.0, 58.0, 59.0, 52.0, 39.0, 51.0, 30.0, 36.0, 44.0, 33.0, 27.0, 21.0, 19.0, 14.0, 13.0, 6.0, 6.0, 4.0, 6.0, 2.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-108.5, -104.9970703125, -101.494140625, -97.9912109375, -94.48828125, -90.9853515625, -87.482421875, -83.9794921875, -80.4765625, -76.9736328125, -73.470703125, -69.9677734375, -66.46484375, -62.9619140625, -59.458984375, -55.9560546875, -52.453125, -48.9501953125, -45.447265625, -41.9443359375, -38.44140625, -34.9384765625, -31.435546875, -27.9326171875, -24.4296875, -20.9267578125, -17.423828125, -13.9208984375, -10.41796875, -6.9150390625, -3.412109375, 0.0908203125, 3.59375, 7.0966796875, 10.599609375, 14.1025390625, 17.60546875, 21.1083984375, 24.611328125, 28.1142578125, 31.6171875, 35.1201171875, 38.623046875, 42.1259765625, 45.62890625, 49.1318359375, 52.634765625, 56.1376953125, 59.640625, 63.1435546875, 66.646484375, 70.1494140625, 73.65234375, 77.1552734375, 80.658203125, 84.1611328125, 87.6640625, 91.1669921875, 94.669921875, 98.1728515625, 101.67578125, 105.1787109375, 108.681640625, 112.1845703125, 115.6875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 9.0, 8.0, 20.0, 19.0, 13.0, 24.0, 47.0, 70.0, 104.0, 167.0, 300.0, 605.0, 1181.0, 3389.0, 12539.0, 65256.0, 658028.0, 260331.0, 34409.0, 7578.0, 2429.0, 909.0, 446.0, 240.0, 130.0, 94.0, 52.0, 38.0, 28.0, 27.0, 16.0, 10.0, 6.0, 5.0, 4.0, 2.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-35.34375, -34.357177734375, -33.37060546875, -32.384033203125, -31.3974609375, -30.410888671875, -29.42431640625, -28.437744140625, -27.451171875, -26.464599609375, -25.47802734375, -24.491455078125, -23.5048828125, -22.518310546875, -21.53173828125, -20.545166015625, -19.55859375, -18.572021484375, -17.58544921875, -16.598876953125, -15.6123046875, -14.625732421875, -13.63916015625, -12.652587890625, -11.666015625, -10.679443359375, -9.69287109375, -8.706298828125, -7.7197265625, -6.733154296875, -5.74658203125, -4.760009765625, -3.7734375, -2.786865234375, -1.80029296875, -0.813720703125, 0.1728515625, 1.159423828125, 2.14599609375, 3.132568359375, 4.119140625, 5.105712890625, 6.09228515625, 7.078857421875, 8.0654296875, 9.052001953125, 10.03857421875, 11.025146484375, 12.01171875, 12.998291015625, 13.98486328125, 14.971435546875, 15.9580078125, 16.944580078125, 17.93115234375, 18.917724609375, 19.904296875, 20.890869140625, 21.87744140625, 22.864013671875, 23.8505859375, 24.837158203125, 25.82373046875, 26.810302734375, 27.796875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 0.0, 2.0, 3.0, 6.0, 1.0, 6.0, 7.0, 3.0, 9.0, 19.0, 9.0, 18.0, 23.0, 37.0, 56.0, 61.0, 80.0, 81.0, 102.0, 97.0, 81.0, 52.0, 50.0, 41.0, 32.0, 27.0, 22.0, 12.0, 16.0, 8.0, 14.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0059814453125, -0.005818963050842285, -0.00565648078918457, -0.0054939985275268555, -0.005331516265869141, -0.005169034004211426, -0.005006551742553711, -0.004844069480895996, -0.004681587219238281, -0.004519104957580566, -0.0043566226959228516, -0.004194140434265137, -0.004031658172607422, -0.003869175910949707, -0.003706693649291992, -0.0035442113876342773, -0.0033817291259765625, -0.0032192468643188477, -0.003056764602661133, -0.002894282341003418, -0.002731800079345703, -0.0025693178176879883, -0.0024068355560302734, -0.0022443532943725586, -0.0020818710327148438, -0.001919388771057129, -0.001756906509399414, -0.0015944242477416992, -0.0014319419860839844, -0.0012694597244262695, -0.0011069774627685547, -0.0009444952011108398, -0.000782012939453125, -0.0006195306777954102, -0.0004570484161376953, -0.00029456615447998047, -0.00013208389282226562, 3.039836883544922e-05, 0.00019288063049316406, 0.0003553628921508789, 0.0005178451538085938, 0.0006803274154663086, 0.0008428096771240234, 0.0010052919387817383, 0.0011677742004394531, 0.001330256462097168, 0.0014927387237548828, 0.0016552209854125977, 0.0018177032470703125, 0.0019801855087280273, 0.002142667770385742, 0.002305150032043457, 0.002467632293701172, 0.0026301145553588867, 0.0027925968170166016, 0.0029550790786743164, 0.0031175613403320312, 0.003280043601989746, 0.003442525863647461, 0.0036050081253051758, 0.0037674903869628906, 0.0039299726486206055, 0.00409245491027832, 0.004254937171936035, 0.00441741943359375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 7.0, 20.0, 24.0, 23.0, 28.0, 43.0, 70.0, 128.0, 195.0, 320.0, 584.0, 1044.0, 2103.0, 4769.0, 11743.0, 35609.0, 139943.0, 611165.0, 174188.0, 42512.0, 13570.0, 5350.0, 2396.0, 1159.0, 627.0, 351.0, 211.0, 122.0, 68.0, 47.0, 41.0, 19.0, 24.0, 14.0, 10.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.984375, -24.21728515625, -23.4501953125, -22.68310546875, -21.916015625, -21.14892578125, -20.3818359375, -19.61474609375, -18.84765625, -18.08056640625, -17.3134765625, -16.54638671875, -15.779296875, -15.01220703125, -14.2451171875, -13.47802734375, -12.7109375, -11.94384765625, -11.1767578125, -10.40966796875, -9.642578125, -8.87548828125, -8.1083984375, -7.34130859375, -6.57421875, -5.80712890625, -5.0400390625, -4.27294921875, -3.505859375, -2.73876953125, -1.9716796875, -1.20458984375, -0.4375, 0.32958984375, 1.0966796875, 1.86376953125, 2.630859375, 3.39794921875, 4.1650390625, 4.93212890625, 5.69921875, 6.46630859375, 7.2333984375, 8.00048828125, 8.767578125, 9.53466796875, 10.3017578125, 11.06884765625, 11.8359375, 12.60302734375, 13.3701171875, 14.13720703125, 14.904296875, 15.67138671875, 16.4384765625, 17.20556640625, 17.97265625, 18.73974609375, 19.5068359375, 20.27392578125, 21.041015625, 21.80810546875, 22.5751953125, 23.34228515625, 24.109375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 1.0, 3.0, 2.0, 7.0, 6.0, 4.0, 4.0, 8.0, 13.0, 15.0, 15.0, 19.0, 31.0, 37.0, 46.0, 47.0, 58.0, 86.0, 71.0, 68.0, 76.0, 63.0, 66.0, 57.0, 37.0, 26.0, 44.0, 26.0, 13.0, 13.0, 7.0, 10.0, 7.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.421875, -19.720703125, -19.01953125, -18.318359375, -17.6171875, -16.916015625, -16.21484375, -15.513671875, -14.8125, -14.111328125, -13.41015625, -12.708984375, -12.0078125, -11.306640625, -10.60546875, -9.904296875, -9.203125, -8.501953125, -7.80078125, -7.099609375, -6.3984375, -5.697265625, -4.99609375, -4.294921875, -3.59375, -2.892578125, -2.19140625, -1.490234375, -0.7890625, -0.087890625, 0.61328125, 1.314453125, 2.015625, 2.716796875, 3.41796875, 4.119140625, 4.8203125, 5.521484375, 6.22265625, 6.923828125, 7.625, 8.326171875, 9.02734375, 9.728515625, 10.4296875, 11.130859375, 11.83203125, 12.533203125, 13.234375, 13.935546875, 14.63671875, 15.337890625, 16.0390625, 16.740234375, 17.44140625, 18.142578125, 18.84375, 19.544921875, 20.24609375, 20.947265625, 21.6484375, 22.349609375, 23.05078125, 23.751953125, 24.453125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 13.0, 29.0, 67.0, 185.0, 392.0, 188.0, 74.0, 20.0, 17.0, 2.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1353.007568359375, -1316.8260498046875, -1280.64453125, -1244.4630126953125, -1208.281494140625, -1172.099853515625, -1135.9183349609375, -1099.73681640625, -1063.5552978515625, -1027.373779296875, -991.1922607421875, -955.0106811523438, -918.8291625976562, -882.6476440429688, -846.466064453125, -810.2845458984375, -774.10302734375, -737.9215087890625, -701.739990234375, -665.5584106445312, -629.3768920898438, -593.1953735351562, -557.0137939453125, -520.832275390625, -484.6507568359375, -448.46923828125, -412.2876892089844, -376.10614013671875, -339.92462158203125, -303.74310302734375, -267.5615539550781, -231.38002014160156, -195.1986083984375, -159.01707458496094, -122.83554077148438, -86.65400695800781, -50.47247314453125, -14.290939331054688, 21.890594482421875, 58.07212829589844, 94.253662109375, 130.43519592285156, 166.61672973632812, 202.7982635498047, 238.97979736328125, 275.16131591796875, 311.3428649902344, 347.5244140625, 383.7059326171875, 419.887451171875, 456.0690002441406, 492.25054931640625, 528.4320678710938, 564.6135864257812, 600.795166015625, 636.9766845703125, 673.158203125, 709.3397216796875, 745.521240234375, 781.7028198242188, 817.8843383789062, 854.0658569335938, 890.2474365234375, 926.428955078125, 962.6104736328125]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 3.0, 6.0, 8.0, 9.0, 10.0, 14.0, 13.0, 18.0, 14.0, 19.0, 22.0, 25.0, 30.0, 32.0, 36.0, 29.0, 48.0, 52.0, 64.0, 74.0, 67.0, 57.0, 39.0, 33.0, 41.0, 19.0, 19.0, 35.0, 21.0, 16.0, 23.0, 21.0, 21.0, 15.0, 8.0, 10.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-384.29071044921875, -372.443603515625, -360.59649658203125, -348.7493896484375, -336.90228271484375, -325.0552062988281, -313.2080993652344, -301.3609924316406, -289.5138854980469, -277.6667785644531, -265.8196716308594, -253.9725799560547, -242.12547302246094, -230.2783660888672, -218.4312744140625, -206.58416748046875, -194.737060546875, -182.88995361328125, -171.0428466796875, -159.1957550048828, -147.34864807128906, -135.5015411376953, -123.6544418334961, -111.80734252929688, -99.96023559570312, -88.11312866210938, -76.26602935791016, -64.41893005371094, -52.57182312011719, -40.7247200012207, -28.87761688232422, -17.030517578125, -5.18341064453125, 6.663692474365234, 18.51079559326172, 30.357898712158203, 42.20500183105469, 54.05210494995117, 65.89920806884766, 77.74630737304688, 89.59341430664062, 101.44052124023438, 113.2876205444336, 125.13471984863281, 136.98182678222656, 148.8289337158203, 160.676025390625, 172.52313232421875, 184.3702392578125, 196.21734619140625, 208.064453125, 219.9115447998047, 231.75865173339844, 243.6057586669922, 255.45285034179688, 267.2999572753906, 279.1470642089844, 290.9941711425781, 302.8412780761719, 314.6883850097656, 326.53546142578125, 338.382568359375, 350.22967529296875, 362.0767822265625, 373.92388916015625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 1.0, 2.0, 7.0, 4.0, 2.0, 10.0, 7.0, 11.0, 17.0, 14.0, 25.0, 41.0, 64.0, 86.0, 130.0, 219.0, 283.0, 465.0, 723.0, 1014.0, 1615.0, 2567.0, 4771.0, 12628.0, 85210.0, 3008347.0, 1015908.0, 41289.0, 8706.0, 3809.0, 2172.0, 1402.0, 899.0, 611.0, 367.0, 261.0, 154.0, 123.0, 94.0, 63.0, 47.0, 39.0, 20.0, 14.0, 18.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-64.1875, -62.037109375, -59.88671875, -57.736328125, -55.5859375, -53.435546875, -51.28515625, -49.134765625, -46.984375, -44.833984375, -42.68359375, -40.533203125, -38.3828125, -36.232421875, -34.08203125, -31.931640625, -29.78125, -27.630859375, -25.48046875, -23.330078125, -21.1796875, -19.029296875, -16.87890625, -14.728515625, -12.578125, -10.427734375, -8.27734375, -6.126953125, -3.9765625, -1.826171875, 0.32421875, 2.474609375, 4.625, 6.775390625, 8.92578125, 11.076171875, 13.2265625, 15.376953125, 17.52734375, 19.677734375, 21.828125, 23.978515625, 26.12890625, 28.279296875, 30.4296875, 32.580078125, 34.73046875, 36.880859375, 39.03125, 41.181640625, 43.33203125, 45.482421875, 47.6328125, 49.783203125, 51.93359375, 54.083984375, 56.234375, 58.384765625, 60.53515625, 62.685546875, 64.8359375, 66.986328125, 69.13671875, 71.287109375, 73.4375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 6.0, 5.0, 11.0, 15.0, 13.0, 13.0, 23.0, 18.0, 23.0, 32.0, 28.0, 31.0, 46.0, 35.0, 46.0, 35.0, 37.0, 38.0, 49.0, 47.0, 57.0, 46.0, 52.0, 31.0, 46.0, 28.0, 21.0, 28.0, 21.0, 15.0, 24.0, 11.0, 14.0, 10.0, 8.0, 13.0, 5.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.046875, -22.291748046875, -21.53662109375, -20.781494140625, -20.0263671875, -19.271240234375, -18.51611328125, -17.760986328125, -17.005859375, -16.250732421875, -15.49560546875, -14.740478515625, -13.9853515625, -13.230224609375, -12.47509765625, -11.719970703125, -10.96484375, -10.209716796875, -9.45458984375, -8.699462890625, -7.9443359375, -7.189208984375, -6.43408203125, -5.678955078125, -4.923828125, -4.168701171875, -3.41357421875, -2.658447265625, -1.9033203125, -1.148193359375, -0.39306640625, 0.362060546875, 1.1171875, 1.872314453125, 2.62744140625, 3.382568359375, 4.1376953125, 4.892822265625, 5.64794921875, 6.403076171875, 7.158203125, 7.913330078125, 8.66845703125, 9.423583984375, 10.1787109375, 10.933837890625, 11.68896484375, 12.444091796875, 13.19921875, 13.954345703125, 14.70947265625, 15.464599609375, 16.2197265625, 16.974853515625, 17.72998046875, 18.485107421875, 19.240234375, 19.995361328125, 20.75048828125, 21.505615234375, 22.2607421875, 23.015869140625, 23.77099609375, 24.526123046875, 25.28125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 7.0, 10.0, 22.0, 28.0, 35.0, 49.0, 95.0, 87.0, 158.0, 221.0, 757.0, 11328.0, 4173740.0, 6323.0, 697.0, 243.0, 156.0, 96.0, 73.0, 48.0, 36.0, 26.0, 18.0, 14.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-561.0, -544.21875, -527.4375, -510.65625, -493.875, -477.09375, -460.3125, -443.53125, -426.75, -409.96875, -393.1875, -376.40625, -359.625, -342.84375, -326.0625, -309.28125, -292.5, -275.71875, -258.9375, -242.15625, -225.375, -208.59375, -191.8125, -175.03125, -158.25, -141.46875, -124.6875, -107.90625, -91.125, -74.34375, -57.5625, -40.78125, -24.0, -7.21875, 9.5625, 26.34375, 43.125, 59.90625, 76.6875, 93.46875, 110.25, 127.03125, 143.8125, 160.59375, 177.375, 194.15625, 210.9375, 227.71875, 244.5, 261.28125, 278.0625, 294.84375, 311.625, 328.40625, 345.1875, 361.96875, 378.75, 395.53125, 412.3125, 429.09375, 445.875, 462.65625, 479.4375, 496.21875, 513.0]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 10.0, 27.0, 114.0, 2832.0, 1011.0, 63.0, 17.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-398.5, -386.3671875, -374.234375, -362.1015625, -349.96875, -337.8359375, -325.703125, -313.5703125, -301.4375, -289.3046875, -277.171875, -265.0390625, -252.90625, -240.7734375, -228.640625, -216.5078125, -204.375, -192.2421875, -180.109375, -167.9765625, -155.84375, -143.7109375, -131.578125, -119.4453125, -107.3125, -95.1796875, -83.046875, -70.9140625, -58.78125, -46.6484375, -34.515625, -22.3828125, -10.25, 1.8828125, 14.015625, 26.1484375, 38.28125, 50.4140625, 62.546875, 74.6796875, 86.8125, 98.9453125, 111.078125, 123.2109375, 135.34375, 147.4765625, 159.609375, 171.7421875, 183.875, 196.0078125, 208.140625, 220.2734375, 232.40625, 244.5390625, 256.671875, 268.8046875, 280.9375, 293.0703125, 305.203125, 317.3359375, 329.46875, 341.6015625, 353.734375, 365.8671875, 378.0]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 5.0, 3.0, 17.0, 43.0, 164.0, 487.0, 200.0, 58.0, 19.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3280.80029296875, -3218.465087890625, -3156.130126953125, -3093.794921875, -3031.4599609375, -2969.124755859375, -2906.78955078125, -2844.45458984375, -2782.119384765625, -2719.7841796875, -2657.44921875, -2595.114013671875, -2532.779052734375, -2470.44384765625, -2408.10888671875, -2345.773681640625, -2283.4384765625, -2221.103271484375, -2158.768310546875, -2096.43310546875, -2034.0980224609375, -1971.762939453125, -1909.4278564453125, -1847.0927734375, -1784.7578125, -1722.4227294921875, -1660.087646484375, -1597.75244140625, -1535.4173583984375, -1473.082275390625, -1410.7471923828125, -1348.412109375, -1286.0767822265625, -1223.74169921875, -1161.4066162109375, -1099.071533203125, -1036.736328125, -974.4012451171875, -912.066162109375, -849.7310791015625, -787.3959350585938, -725.0608520507812, -662.7257080078125, -600.390625, -538.0555419921875, -475.72039794921875, -413.38531494140625, -351.0502014160156, -288.715087890625, -226.37997436523438, -164.0448760986328, -101.70977783203125, -39.374664306640625, 22.96044921875, 85.2955322265625, 147.63064575195312, 209.96575927734375, 272.3008728027344, 334.635986328125, 396.9710693359375, 459.3061828613281, 521.6412963867188, 583.9763793945312, 646.3115234375, 708.6466064453125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 11.0, 21.0, 32.0, 55.0, 50.0, 76.0, 81.0, 108.0, 100.0, 109.0, 94.0, 64.0, 49.0, 44.0, 48.0, 14.0, 16.0, 13.0, 11.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-621.919921875, -600.1669311523438, -578.4139404296875, -556.6609497070312, -534.907958984375, -513.1549682617188, -491.4019470214844, -469.6489562988281, -447.8959655761719, -426.1429748535156, -404.3899841308594, -382.636962890625, -360.88397216796875, -339.1309814453125, -317.37799072265625, -295.625, -273.87200927734375, -252.1190185546875, -230.36602783203125, -208.61302185058594, -186.8600311279297, -165.10704040527344, -143.35403442382812, -121.60104370117188, -99.84805297851562, -78.09506225585938, -56.342063903808594, -34.58906555175781, -12.836074829101562, 8.916915893554688, 30.669921875, 52.42291259765625, 74.17584228515625, 95.9288330078125, 117.68183135986328, 139.43482971191406, 161.1878204345703, 182.94081115722656, 204.69381713867188, 226.44680786132812, 248.19979858398438, 269.9527893066406, 291.7057800292969, 313.45880126953125, 335.2117919921875, 356.96478271484375, 378.7177734375, 400.47076416015625, 422.2237548828125, 443.97674560546875, 465.729736328125, 487.48272705078125, 509.2357177734375, 530.9887084960938, 552.74169921875, 574.4947509765625, 596.2476806640625, 618.0006713867188, 639.753662109375, 661.5066528320312, 683.2596435546875, 705.0126342773438, 726.765625, 748.5186767578125, 770.2716674804688]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 8.0, 11.0, 14.0, 11.0, 18.0, 31.0, 40.0, 56.0, 67.0, 102.0, 155.0, 267.0, 376.0, 600.0, 873.0, 1413.0, 2203.0, 3618.0, 6114.0, 10969.0, 20055.0, 38422.0, 80040.0, 179173.0, 320666.0, 200430.0, 89278.0, 42344.0, 22030.0, 12008.0, 6637.0, 3894.0, 2346.0, 1569.0, 876.0, 602.0, 404.0, 265.0, 169.0, 101.0, 98.0, 69.0, 33.0, 22.0, 23.0, 16.0, 14.0, 6.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-48.1875, -46.7080078125, -45.228515625, -43.7490234375, -42.26953125, -40.7900390625, -39.310546875, -37.8310546875, -36.3515625, -34.8720703125, -33.392578125, -31.9130859375, -30.43359375, -28.9541015625, -27.474609375, -25.9951171875, -24.515625, -23.0361328125, -21.556640625, -20.0771484375, -18.59765625, -17.1181640625, -15.638671875, -14.1591796875, -12.6796875, -11.2001953125, -9.720703125, -8.2412109375, -6.76171875, -5.2822265625, -3.802734375, -2.3232421875, -0.84375, 0.6357421875, 2.115234375, 3.5947265625, 5.07421875, 6.5537109375, 8.033203125, 9.5126953125, 10.9921875, 12.4716796875, 13.951171875, 15.4306640625, 16.91015625, 18.3896484375, 19.869140625, 21.3486328125, 22.828125, 24.3076171875, 25.787109375, 27.2666015625, 28.74609375, 30.2255859375, 31.705078125, 33.1845703125, 34.6640625, 36.1435546875, 37.623046875, 39.1025390625, 40.58203125, 42.0615234375, 43.541015625, 45.0205078125, 46.5]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 12.0, 10.0, 12.0, 7.0, 9.0, 14.0, 19.0, 24.0, 27.0, 28.0, 34.0, 25.0, 35.0, 35.0, 40.0, 34.0, 33.0, 38.0, 43.0, 40.0, 42.0, 41.0, 33.0, 43.0, 36.0, 43.0, 36.0, 29.0, 22.0, 23.0, 17.0, 17.0, 15.0, 11.0, 12.0, 8.0, 6.0, 3.0, 14.0, 6.0, 3.0, 3.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-22.921875, -22.158447265625, -21.39501953125, -20.631591796875, -19.8681640625, -19.104736328125, -18.34130859375, -17.577880859375, -16.814453125, -16.051025390625, -15.28759765625, -14.524169921875, -13.7607421875, -12.997314453125, -12.23388671875, -11.470458984375, -10.70703125, -9.943603515625, -9.18017578125, -8.416748046875, -7.6533203125, -6.889892578125, -6.12646484375, -5.363037109375, -4.599609375, -3.836181640625, -3.07275390625, -2.309326171875, -1.5458984375, -0.782470703125, -0.01904296875, 0.744384765625, 1.5078125, 2.271240234375, 3.03466796875, 3.798095703125, 4.5615234375, 5.324951171875, 6.08837890625, 6.851806640625, 7.615234375, 8.378662109375, 9.14208984375, 9.905517578125, 10.6689453125, 11.432373046875, 12.19580078125, 12.959228515625, 13.72265625, 14.486083984375, 15.24951171875, 16.012939453125, 16.7763671875, 17.539794921875, 18.30322265625, 19.066650390625, 19.830078125, 20.593505859375, 21.35693359375, 22.120361328125, 22.8837890625, 23.647216796875, 24.41064453125, 25.174072265625, 25.9375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 5.0, 6.0, 8.0, 9.0, 14.0, 11.0, 16.0, 28.0, 36.0, 57.0, 84.0, 150.0, 260.0, 498.0, 956.0, 2292.0, 5777.0, 17626.0, 63992.0, 339511.0, 516883.0, 70328.0, 18996.0, 6364.0, 2430.0, 1041.0, 494.0, 257.0, 111.0, 90.0, 52.0, 45.0, 41.0, 15.0, 15.0, 13.0, 11.0, 9.0, 10.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-89.75, -86.9482421875, -84.146484375, -81.3447265625, -78.54296875, -75.7412109375, -72.939453125, -70.1376953125, -67.3359375, -64.5341796875, -61.732421875, -58.9306640625, -56.12890625, -53.3271484375, -50.525390625, -47.7236328125, -44.921875, -42.1201171875, -39.318359375, -36.5166015625, -33.71484375, -30.9130859375, -28.111328125, -25.3095703125, -22.5078125, -19.7060546875, -16.904296875, -14.1025390625, -11.30078125, -8.4990234375, -5.697265625, -2.8955078125, -0.09375, 2.7080078125, 5.509765625, 8.3115234375, 11.11328125, 13.9150390625, 16.716796875, 19.5185546875, 22.3203125, 25.1220703125, 27.923828125, 30.7255859375, 33.52734375, 36.3291015625, 39.130859375, 41.9326171875, 44.734375, 47.5361328125, 50.337890625, 53.1396484375, 55.94140625, 58.7431640625, 61.544921875, 64.3466796875, 67.1484375, 69.9501953125, 72.751953125, 75.5537109375, 78.35546875, 81.1572265625, 83.958984375, 86.7607421875, 89.5625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 9.0, 12.0, 18.0, 11.0, 19.0, 26.0, 26.0, 27.0, 32.0, 39.0, 52.0, 38.0, 64.0, 53.0, 49.0, 54.0, 52.0, 56.0, 54.0, 49.0, 29.0, 30.0, 29.0, 14.0, 26.0, 17.0, 27.0, 18.0, 13.0, 10.0, 9.0, 11.0, 8.0, 2.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-113.9375, -110.5439453125, -107.150390625, -103.7568359375, -100.36328125, -96.9697265625, -93.576171875, -90.1826171875, -86.7890625, -83.3955078125, -80.001953125, -76.6083984375, -73.21484375, -69.8212890625, -66.427734375, -63.0341796875, -59.640625, -56.2470703125, -52.853515625, -49.4599609375, -46.06640625, -42.6728515625, -39.279296875, -35.8857421875, -32.4921875, -29.0986328125, -25.705078125, -22.3115234375, -18.91796875, -15.5244140625, -12.130859375, -8.7373046875, -5.34375, -1.9501953125, 1.443359375, 4.8369140625, 8.23046875, 11.6240234375, 15.017578125, 18.4111328125, 21.8046875, 25.1982421875, 28.591796875, 31.9853515625, 35.37890625, 38.7724609375, 42.166015625, 45.5595703125, 48.953125, 52.3466796875, 55.740234375, 59.1337890625, 62.52734375, 65.9208984375, 69.314453125, 72.7080078125, 76.1015625, 79.4951171875, 82.888671875, 86.2822265625, 89.67578125, 93.0693359375, 96.462890625, 99.8564453125, 103.25]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 7.0, 7.0, 12.0, 17.0, 23.0, 22.0, 45.0, 68.0, 98.0, 107.0, 185.0, 288.0, 421.0, 657.0, 1068.0, 1898.0, 3800.0, 8748.0, 28149.0, 150930.0, 716328.0, 99110.0, 21337.0, 7538.0, 3259.0, 1723.0, 967.0, 590.0, 385.0, 253.0, 171.0, 102.0, 68.0, 42.0, 29.0, 30.0, 16.0, 16.0, 9.0, 9.0, 3.0, 5.0, 6.0, 4.0, 8.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.078125, -29.018798828125, -27.95947265625, -26.900146484375, -25.8408203125, -24.781494140625, -23.72216796875, -22.662841796875, -21.603515625, -20.544189453125, -19.48486328125, -18.425537109375, -17.3662109375, -16.306884765625, -15.24755859375, -14.188232421875, -13.12890625, -12.069580078125, -11.01025390625, -9.950927734375, -8.8916015625, -7.832275390625, -6.77294921875, -5.713623046875, -4.654296875, -3.594970703125, -2.53564453125, -1.476318359375, -0.4169921875, 0.642333984375, 1.70166015625, 2.760986328125, 3.8203125, 4.879638671875, 5.93896484375, 6.998291015625, 8.0576171875, 9.116943359375, 10.17626953125, 11.235595703125, 12.294921875, 13.354248046875, 14.41357421875, 15.472900390625, 16.5322265625, 17.591552734375, 18.65087890625, 19.710205078125, 20.76953125, 21.828857421875, 22.88818359375, 23.947509765625, 25.0068359375, 26.066162109375, 27.12548828125, 28.184814453125, 29.244140625, 30.303466796875, 31.36279296875, 32.422119140625, 33.4814453125, 34.540771484375, 35.60009765625, 36.659423828125, 37.71875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 1.0, 2.0, 5.0, 3.0, 5.0, 11.0, 19.0, 27.0, 32.0, 49.0, 91.0, 194.0, 201.0, 133.0, 90.0, 40.0, 34.0, 22.0, 21.0, 9.0, 6.0, 6.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0087738037109375, -0.008453011512756348, -0.008132219314575195, -0.007811427116394043, -0.007490634918212891, -0.007169842720031738, -0.006849050521850586, -0.006528258323669434, -0.006207466125488281, -0.005886673927307129, -0.0055658817291259766, -0.005245089530944824, -0.004924297332763672, -0.0046035051345825195, -0.004282712936401367, -0.003961920738220215, -0.0036411285400390625, -0.00332033634185791, -0.002999544143676758, -0.0026787519454956055, -0.002357959747314453, -0.0020371675491333008, -0.0017163753509521484, -0.001395583152770996, -0.0010747909545898438, -0.0007539987564086914, -0.00043320655822753906, -0.00011241436004638672, 0.00020837783813476562, 0.000529170036315918, 0.0008499622344970703, 0.0011707544326782227, 0.001491546630859375, 0.0018123388290405273, 0.0021331310272216797, 0.002453923225402832, 0.0027747154235839844, 0.0030955076217651367, 0.003416299819946289, 0.0037370920181274414, 0.004057884216308594, 0.004378676414489746, 0.0046994686126708984, 0.005020260810852051, 0.005341053009033203, 0.0056618452072143555, 0.005982637405395508, 0.00630342960357666, 0.0066242218017578125, 0.006945013999938965, 0.007265806198120117, 0.0075865983963012695, 0.007907390594482422, 0.008228182792663574, 0.008548974990844727, 0.008869767189025879, 0.009190559387207031, 0.009511351585388184, 0.009832143783569336, 0.010152935981750488, 0.01047372817993164, 0.010794520378112793, 0.011115312576293945, 0.011436104774475098, 0.01175689697265625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 1.0, 7.0, 9.0, 15.0, 26.0, 41.0, 63.0, 95.0, 179.0, 320.0, 644.0, 1548.0, 4264.0, 17798.0, 172670.0, 782686.0, 54547.0, 8916.0, 2595.0, 1032.0, 492.0, 251.0, 137.0, 93.0, 58.0, 15.0, 22.0, 6.0, 9.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.03125, -45.3681640625, -43.705078125, -42.0419921875, -40.37890625, -38.7158203125, -37.052734375, -35.3896484375, -33.7265625, -32.0634765625, -30.400390625, -28.7373046875, -27.07421875, -25.4111328125, -23.748046875, -22.0849609375, -20.421875, -18.7587890625, -17.095703125, -15.4326171875, -13.76953125, -12.1064453125, -10.443359375, -8.7802734375, -7.1171875, -5.4541015625, -3.791015625, -2.1279296875, -0.46484375, 1.1982421875, 2.861328125, 4.5244140625, 6.1875, 7.8505859375, 9.513671875, 11.1767578125, 12.83984375, 14.5029296875, 16.166015625, 17.8291015625, 19.4921875, 21.1552734375, 22.818359375, 24.4814453125, 26.14453125, 27.8076171875, 29.470703125, 31.1337890625, 32.796875, 34.4599609375, 36.123046875, 37.7861328125, 39.44921875, 41.1123046875, 42.775390625, 44.4384765625, 46.1015625, 47.7646484375, 49.427734375, 51.0908203125, 52.75390625, 54.4169921875, 56.080078125, 57.7431640625, 59.40625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 13.0, 16.0, 9.0, 18.0, 35.0, 52.0, 53.0, 92.0, 117.0, 131.0, 130.0, 103.0, 63.0, 60.0, 42.0, 21.0, 10.0, 8.0, 3.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.71875, -34.4677734375, -33.216796875, -31.9658203125, -30.71484375, -29.4638671875, -28.212890625, -26.9619140625, -25.7109375, -24.4599609375, -23.208984375, -21.9580078125, -20.70703125, -19.4560546875, -18.205078125, -16.9541015625, -15.703125, -14.4521484375, -13.201171875, -11.9501953125, -10.69921875, -9.4482421875, -8.197265625, -6.9462890625, -5.6953125, -4.4443359375, -3.193359375, -1.9423828125, -0.69140625, 0.5595703125, 1.810546875, 3.0615234375, 4.3125, 5.5634765625, 6.814453125, 8.0654296875, 9.31640625, 10.5673828125, 11.818359375, 13.0693359375, 14.3203125, 15.5712890625, 16.822265625, 18.0732421875, 19.32421875, 20.5751953125, 21.826171875, 23.0771484375, 24.328125, 25.5791015625, 26.830078125, 28.0810546875, 29.33203125, 30.5830078125, 31.833984375, 33.0849609375, 34.3359375, 35.5869140625, 36.837890625, 38.0888671875, 39.33984375, 40.5908203125, 41.841796875, 43.0927734375, 44.34375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 9.0, 20.0, 13.0, 46.0, 90.0, 92.0, 211.0, 227.0, 100.0, 64.0, 43.0, 24.0, 21.0, 8.0, 7.0, 5.0, 3.0, 6.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-731.3955688476562, -710.4580688476562, -689.5205078125, -668.5830078125, -647.6455078125, -626.7080078125, -605.7704467773438, -584.8329467773438, -563.8953857421875, -542.9578857421875, -522.0203247070312, -501.08282470703125, -480.14532470703125, -459.2077941894531, -438.270263671875, -417.332763671875, -396.395263671875, -375.4577331542969, -354.5202331542969, -333.58270263671875, -312.64520263671875, -291.7076721191406, -270.7701416015625, -249.83262634277344, -228.89511108398438, -207.9575958251953, -187.02008056640625, -166.08255004882812, -145.14503479003906, -124.20751953125, -103.2699966430664, -82.33247375488281, -61.3948974609375, -40.45737838745117, -19.519859313964844, 1.4176597595214844, 22.355178833007812, 43.292694091796875, 64.23021697998047, 85.16773986816406, 106.10525512695312, 127.04277038574219, 147.98028564453125, 168.91781616210938, 189.85533142089844, 210.7928466796875, 231.73037719726562, 252.6678924560547, 273.60540771484375, 294.5429382324219, 315.4804382324219, 336.41796875, 357.35546875, 378.2929992675781, 399.23052978515625, 420.16802978515625, 441.1055603027344, 462.0430908203125, 482.9805908203125, 503.9181213378906, 524.8556518554688, 545.7931518554688, 566.7306518554688, 587.668212890625, 608.605712890625]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 6.0, 8.0, 12.0, 19.0, 11.0, 16.0, 16.0, 19.0, 28.0, 36.0, 33.0, 17.0, 31.0, 45.0, 49.0, 86.0, 80.0, 79.0, 59.0, 52.0, 38.0, 38.0, 31.0, 23.0, 21.0, 36.0, 20.0, 14.0, 14.0, 14.0, 15.0, 5.0, 6.0, 6.0, 7.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-516.142578125, -502.32147216796875, -488.5003662109375, -474.67926025390625, -460.858154296875, -447.03704833984375, -433.2159118652344, -419.3948059082031, -405.5736999511719, -391.7525939941406, -377.9314880371094, -364.1103820800781, -350.28924560546875, -336.4681396484375, -322.64703369140625, -308.825927734375, -295.00482177734375, -281.1837158203125, -267.36260986328125, -253.54148864746094, -239.7203826904297, -225.89927673339844, -212.07815551757812, -198.25704956054688, -184.43594360351562, -170.61483764648438, -156.79373168945312, -142.9726104736328, -129.15150451660156, -115.33039855957031, -101.50928497314453, -87.68817138671875, -73.8670654296875, -60.045955657958984, -46.22484588623047, -32.40373611450195, -18.582626342773438, -4.7615203857421875, 9.059593200683594, 22.880706787109375, 36.701812744140625, 50.52292251586914, 64.34403228759766, 78.16514587402344, 91.98625183105469, 105.80735778808594, 119.62847137451172, 133.4495849609375, 147.27069091796875, 161.091796875, 174.91290283203125, 188.73402404785156, 202.5551300048828, 216.37623596191406, 230.19735717773438, 244.01846313476562, 257.8395690917969, 271.6606750488281, 285.4817810058594, 299.3028869628906, 313.1240234375, 326.94512939453125, 340.7662353515625, 354.58734130859375, 368.408447265625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 6.0, 9.0, 11.0, 12.0, 14.0, 17.0, 35.0, 39.0, 50.0, 83.0, 104.0, 138.0, 165.0, 274.0, 342.0, 537.0, 827.0, 1451.0, 2578.0, 5486.0, 19532.0, 315848.0, 3706948.0, 117010.0, 12782.0, 4330.0, 2132.0, 1172.0, 732.0, 488.0, 301.0, 234.0, 155.0, 105.0, 94.0, 59.0, 52.0, 30.0, 24.0, 16.0, 19.0, 10.0, 11.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-83.0625, -80.49609375, -77.9296875, -75.36328125, -72.796875, -70.23046875, -67.6640625, -65.09765625, -62.53125, -59.96484375, -57.3984375, -54.83203125, -52.265625, -49.69921875, -47.1328125, -44.56640625, -42.0, -39.43359375, -36.8671875, -34.30078125, -31.734375, -29.16796875, -26.6015625, -24.03515625, -21.46875, -18.90234375, -16.3359375, -13.76953125, -11.203125, -8.63671875, -6.0703125, -3.50390625, -0.9375, 1.62890625, 4.1953125, 6.76171875, 9.328125, 11.89453125, 14.4609375, 17.02734375, 19.59375, 22.16015625, 24.7265625, 27.29296875, 29.859375, 32.42578125, 34.9921875, 37.55859375, 40.125, 42.69140625, 45.2578125, 47.82421875, 50.390625, 52.95703125, 55.5234375, 58.08984375, 60.65625, 63.22265625, 65.7890625, 68.35546875, 70.921875, 73.48828125, 76.0546875, 78.62109375, 81.1875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 3.0, 6.0, 5.0, 11.0, 8.0, 14.0, 14.0, 17.0, 9.0, 18.0, 19.0, 23.0, 35.0, 39.0, 28.0, 25.0, 38.0, 46.0, 31.0, 46.0, 58.0, 34.0, 50.0, 37.0, 35.0, 41.0, 52.0, 36.0, 28.0, 31.0, 28.0, 14.0, 12.0, 23.0, 16.0, 11.0, 10.0, 11.0, 3.0, 8.0, 5.0, 5.0, 0.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.359375, -22.601806640625, -21.84423828125, -21.086669921875, -20.3291015625, -19.571533203125, -18.81396484375, -18.056396484375, -17.298828125, -16.541259765625, -15.78369140625, -15.026123046875, -14.2685546875, -13.510986328125, -12.75341796875, -11.995849609375, -11.23828125, -10.480712890625, -9.72314453125, -8.965576171875, -8.2080078125, -7.450439453125, -6.69287109375, -5.935302734375, -5.177734375, -4.420166015625, -3.66259765625, -2.905029296875, -2.1474609375, -1.389892578125, -0.63232421875, 0.125244140625, 0.8828125, 1.640380859375, 2.39794921875, 3.155517578125, 3.9130859375, 4.670654296875, 5.42822265625, 6.185791015625, 6.943359375, 7.700927734375, 8.45849609375, 9.216064453125, 9.9736328125, 10.731201171875, 11.48876953125, 12.246337890625, 13.00390625, 13.761474609375, 14.51904296875, 15.276611328125, 16.0341796875, 16.791748046875, 17.54931640625, 18.306884765625, 19.064453125, 19.822021484375, 20.57958984375, 21.337158203125, 22.0947265625, 22.852294921875, 23.60986328125, 24.367431640625, 25.125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 10.0, 10.0, 10.0, 34.0, 36.0, 70.0, 109.0, 261.0, 545.0, 1388.0, 3990.0, 17057.0, 1812097.0, 2334533.0, 17492.0, 4057.0, 1377.0, 570.0, 281.0, 133.0, 74.0, 46.0, 23.0, 24.0, 13.0, 8.0, 7.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-161.375, -156.486328125, -151.59765625, -146.708984375, -141.8203125, -136.931640625, -132.04296875, -127.154296875, -122.265625, -117.376953125, -112.48828125, -107.599609375, -102.7109375, -97.822265625, -92.93359375, -88.044921875, -83.15625, -78.267578125, -73.37890625, -68.490234375, -63.6015625, -58.712890625, -53.82421875, -48.935546875, -44.046875, -39.158203125, -34.26953125, -29.380859375, -24.4921875, -19.603515625, -14.71484375, -9.826171875, -4.9375, -0.048828125, 4.83984375, 9.728515625, 14.6171875, 19.505859375, 24.39453125, 29.283203125, 34.171875, 39.060546875, 43.94921875, 48.837890625, 53.7265625, 58.615234375, 63.50390625, 68.392578125, 73.28125, 78.169921875, 83.05859375, 87.947265625, 92.8359375, 97.724609375, 102.61328125, 107.501953125, 112.390625, 117.279296875, 122.16796875, 127.056640625, 131.9453125, 136.833984375, 141.72265625, 146.611328125, 151.5]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 4.0, 8.0, 9.0, 7.0, 13.0, 28.0, 44.0, 49.0, 164.0, 397.0, 1193.0, 1340.0, 462.0, 167.0, 75.0, 51.0, 18.0, 12.0, 8.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-105.4375, -102.341796875, -99.24609375, -96.150390625, -93.0546875, -89.958984375, -86.86328125, -83.767578125, -80.671875, -77.576171875, -74.48046875, -71.384765625, -68.2890625, -65.193359375, -62.09765625, -59.001953125, -55.90625, -52.810546875, -49.71484375, -46.619140625, -43.5234375, -40.427734375, -37.33203125, -34.236328125, -31.140625, -28.044921875, -24.94921875, -21.853515625, -18.7578125, -15.662109375, -12.56640625, -9.470703125, -6.375, -3.279296875, -0.18359375, 2.912109375, 6.0078125, 9.103515625, 12.19921875, 15.294921875, 18.390625, 21.486328125, 24.58203125, 27.677734375, 30.7734375, 33.869140625, 36.96484375, 40.060546875, 43.15625, 46.251953125, 49.34765625, 52.443359375, 55.5390625, 58.634765625, 61.73046875, 64.826171875, 67.921875, 71.017578125, 74.11328125, 77.208984375, 80.3046875, 83.400390625, 86.49609375, 89.591796875, 92.6875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 12.0, 19.0, 36.0, 73.0, 168.0, 244.0, 197.0, 118.0, 49.0, 30.0, 21.0, 12.0, 7.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-929.636962890625, -907.412841796875, -885.1887817382812, -862.9646606445312, -840.7406005859375, -818.5164794921875, -796.2923583984375, -774.0682373046875, -751.8441772460938, -729.6200561523438, -707.39599609375, -685.171875, -662.94775390625, -640.7236938476562, -618.4995727539062, -596.2755126953125, -574.0513916015625, -551.8272705078125, -529.6032104492188, -507.37908935546875, -485.1549987792969, -462.930908203125, -440.706787109375, -418.4826965332031, -396.25860595703125, -374.0345153808594, -351.8104248046875, -329.5863037109375, -307.3622131347656, -285.13812255859375, -262.91400146484375, -240.68991088867188, -218.46578979492188, -196.24169921875, -174.01759338378906, -151.79348754882812, -129.56939697265625, -107.34529876708984, -85.12120056152344, -62.8970947265625, -40.673004150390625, -18.44890594482422, 3.7751922607421875, 25.999290466308594, 48.223388671875, 70.4474868774414, 92.67158508300781, 114.89569091796875, 137.11978149414062, 159.3438720703125, 181.56797790527344, 203.79208374023438, 226.01617431640625, 248.24026489257812, 270.46435546875, 292.6884765625, 314.9125671386719, 337.13665771484375, 359.36077880859375, 381.5848693847656, 403.8089599609375, 426.0330505371094, 448.25714111328125, 470.48126220703125, 492.7053527832031]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 2.0, 8.0, 4.0, 8.0, 8.0, 6.0, 10.0, 16.0, 5.0, 16.0, 12.0, 19.0, 20.0, 12.0, 23.0, 28.0, 27.0, 19.0, 34.0, 40.0, 34.0, 41.0, 46.0, 38.0, 38.0, 42.0, 46.0, 35.0, 29.0, 34.0, 33.0, 38.0, 19.0, 22.0, 27.0, 23.0, 12.0, 16.0, 16.0, 12.0, 10.0, 7.0, 11.0, 10.0, 9.0, 9.0, 5.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-209.38430786132812, -202.33154296875, -195.27879333496094, -188.2260284423828, -181.17327880859375, -174.12051391601562, -167.0677490234375, -160.01498413085938, -152.9622344970703, -145.9094696044922, -138.85671997070312, -131.803955078125, -124.7511978149414, -117.69844055175781, -110.64567565917969, -103.5929183959961, -96.5401611328125, -89.4874038696289, -82.43464660644531, -75.38188171386719, -68.3291244506836, -61.2763671875, -54.22360610961914, -47.17084503173828, -40.11808776855469, -33.065330505371094, -26.012569427490234, -18.959810256958008, -11.907051086425781, -4.8542938232421875, 2.198467254638672, 9.251228332519531, 16.303985595703125, 23.35674476623535, 30.409503936767578, 37.46226501464844, 44.51502227783203, 51.567779541015625, 58.620540618896484, 65.67330169677734, 72.72605895996094, 79.77881622314453, 86.83157348632812, 93.88433837890625, 100.93709564208984, 107.98985290527344, 115.04261779785156, 122.09537506103516, 129.14813232421875, 136.20089721679688, 143.25364685058594, 150.30641174316406, 157.35916137695312, 164.41192626953125, 171.46469116210938, 178.5174560546875, 185.57020568847656, 192.6229705810547, 199.67572021484375, 206.72848510742188, 213.78125, 220.83399963378906, 227.8867645263672, 234.93951416015625, 241.99227905273438]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 9.0, 10.0, 18.0, 24.0, 24.0, 41.0, 45.0, 52.0, 88.0, 109.0, 179.0, 239.0, 380.0, 577.0, 880.0, 1440.0, 2359.0, 4169.0, 8102.0, 17474.0, 41335.0, 118152.0, 396617.0, 301580.0, 90096.0, 33801.0, 14295.0, 6993.0, 3690.0, 2143.0, 1245.0, 816.0, 500.0, 319.0, 240.0, 155.0, 86.0, 94.0, 46.0, 35.0, 30.0, 14.0, 11.0, 12.0, 15.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-67.5625, -65.443359375, -63.32421875, -61.205078125, -59.0859375, -56.966796875, -54.84765625, -52.728515625, -50.609375, -48.490234375, -46.37109375, -44.251953125, -42.1328125, -40.013671875, -37.89453125, -35.775390625, -33.65625, -31.537109375, -29.41796875, -27.298828125, -25.1796875, -23.060546875, -20.94140625, -18.822265625, -16.703125, -14.583984375, -12.46484375, -10.345703125, -8.2265625, -6.107421875, -3.98828125, -1.869140625, 0.25, 2.369140625, 4.48828125, 6.607421875, 8.7265625, 10.845703125, 12.96484375, 15.083984375, 17.203125, 19.322265625, 21.44140625, 23.560546875, 25.6796875, 27.798828125, 29.91796875, 32.037109375, 34.15625, 36.275390625, 38.39453125, 40.513671875, 42.6328125, 44.751953125, 46.87109375, 48.990234375, 51.109375, 53.228515625, 55.34765625, 57.466796875, 59.5859375, 61.705078125, 63.82421875, 65.943359375, 68.0625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 3.0, 8.0, 7.0, 12.0, 9.0, 24.0, 14.0, 22.0, 24.0, 26.0, 27.0, 39.0, 38.0, 54.0, 44.0, 50.0, 56.0, 63.0, 57.0, 52.0, 50.0, 44.0, 49.0, 38.0, 35.0, 38.0, 20.0, 17.0, 19.0, 16.0, 14.0, 13.0, 5.0, 4.0, 4.0, 3.0, 1.0, 5.0, 3.0, 0.0, 0.0, 2.0], "bins": [-40.46875, -39.444580078125, -38.42041015625, -37.396240234375, -36.3720703125, -35.347900390625, -34.32373046875, -33.299560546875, -32.275390625, -31.251220703125, -30.22705078125, -29.202880859375, -28.1787109375, -27.154541015625, -26.13037109375, -25.106201171875, -24.08203125, -23.057861328125, -22.03369140625, -21.009521484375, -19.9853515625, -18.961181640625, -17.93701171875, -16.912841796875, -15.888671875, -14.864501953125, -13.84033203125, -12.816162109375, -11.7919921875, -10.767822265625, -9.74365234375, -8.719482421875, -7.6953125, -6.671142578125, -5.64697265625, -4.622802734375, -3.5986328125, -2.574462890625, -1.55029296875, -0.526123046875, 0.498046875, 1.522216796875, 2.54638671875, 3.570556640625, 4.5947265625, 5.618896484375, 6.64306640625, 7.667236328125, 8.69140625, 9.715576171875, 10.73974609375, 11.763916015625, 12.7880859375, 13.812255859375, 14.83642578125, 15.860595703125, 16.884765625, 17.908935546875, 18.93310546875, 19.957275390625, 20.9814453125, 22.005615234375, 23.02978515625, 24.053955078125, 25.078125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 7.0, 6.0, 5.0, 14.0, 12.0, 22.0, 32.0, 44.0, 65.0, 96.0, 153.0, 251.0, 503.0, 954.0, 2453.0, 6984.0, 28936.0, 216876.0, 713223.0, 59382.0, 12003.0, 3638.0, 1399.0, 631.0, 331.0, 168.0, 123.0, 82.0, 50.0, 26.0, 21.0, 23.0, 10.0, 11.0, 7.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.9375, -104.2412109375, -100.544921875, -96.8486328125, -93.15234375, -89.4560546875, -85.759765625, -82.0634765625, -78.3671875, -74.6708984375, -70.974609375, -67.2783203125, -63.58203125, -59.8857421875, -56.189453125, -52.4931640625, -48.796875, -45.1005859375, -41.404296875, -37.7080078125, -34.01171875, -30.3154296875, -26.619140625, -22.9228515625, -19.2265625, -15.5302734375, -11.833984375, -8.1376953125, -4.44140625, -0.7451171875, 2.951171875, 6.6474609375, 10.34375, 14.0400390625, 17.736328125, 21.4326171875, 25.12890625, 28.8251953125, 32.521484375, 36.2177734375, 39.9140625, 43.6103515625, 47.306640625, 51.0029296875, 54.69921875, 58.3955078125, 62.091796875, 65.7880859375, 69.484375, 73.1806640625, 76.876953125, 80.5732421875, 84.26953125, 87.9658203125, 91.662109375, 95.3583984375, 99.0546875, 102.7509765625, 106.447265625, 110.1435546875, 113.83984375, 117.5361328125, 121.232421875, 124.9287109375, 128.625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 1.0, 4.0, 6.0, 7.0, 12.0, 11.0, 13.0, 20.0, 26.0, 28.0, 54.0, 54.0, 53.0, 50.0, 56.0, 63.0, 65.0, 54.0, 54.0, 60.0, 56.0, 48.0, 30.0, 31.0, 31.0, 19.0, 16.0, 17.0, 17.0, 16.0, 8.0, 9.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.25, -103.046875, -98.84375, -94.640625, -90.4375, -86.234375, -82.03125, -77.828125, -73.625, -69.421875, -65.21875, -61.015625, -56.8125, -52.609375, -48.40625, -44.203125, -40.0, -35.796875, -31.59375, -27.390625, -23.1875, -18.984375, -14.78125, -10.578125, -6.375, -2.171875, 2.03125, 6.234375, 10.4375, 14.640625, 18.84375, 23.046875, 27.25, 31.453125, 35.65625, 39.859375, 44.0625, 48.265625, 52.46875, 56.671875, 60.875, 65.078125, 69.28125, 73.484375, 77.6875, 81.890625, 86.09375, 90.296875, 94.5, 98.703125, 102.90625, 107.109375, 111.3125, 115.515625, 119.71875, 123.921875, 128.125, 132.328125, 136.53125, 140.734375, 144.9375, 149.140625, 153.34375, 157.546875, 161.75]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 7.0, 15.0, 11.0, 21.0, 35.0, 38.0, 75.0, 144.0, 244.0, 463.0, 923.0, 2175.0, 6129.0, 22284.0, 151271.0, 782373.0, 62542.0, 12803.0, 3883.0, 1591.0, 708.0, 350.0, 199.0, 100.0, 63.0, 34.0, 23.0, 16.0, 12.0, 6.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.21875, -41.837890625, -40.45703125, -39.076171875, -37.6953125, -36.314453125, -34.93359375, -33.552734375, -32.171875, -30.791015625, -29.41015625, -28.029296875, -26.6484375, -25.267578125, -23.88671875, -22.505859375, -21.125, -19.744140625, -18.36328125, -16.982421875, -15.6015625, -14.220703125, -12.83984375, -11.458984375, -10.078125, -8.697265625, -7.31640625, -5.935546875, -4.5546875, -3.173828125, -1.79296875, -0.412109375, 0.96875, 2.349609375, 3.73046875, 5.111328125, 6.4921875, 7.873046875, 9.25390625, 10.634765625, 12.015625, 13.396484375, 14.77734375, 16.158203125, 17.5390625, 18.919921875, 20.30078125, 21.681640625, 23.0625, 24.443359375, 25.82421875, 27.205078125, 28.5859375, 29.966796875, 31.34765625, 32.728515625, 34.109375, 35.490234375, 36.87109375, 38.251953125, 39.6328125, 41.013671875, 42.39453125, 43.775390625, 45.15625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 5.0, 3.0, 6.0, 5.0, 11.0, 9.0, 21.0, 17.0, 29.0, 45.0, 38.0, 51.0, 71.0, 93.0, 129.0, 97.0, 83.0, 51.0, 48.0, 36.0, 27.0, 19.0, 24.0, 24.0, 14.0, 4.0, 8.0, 9.0, 4.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.005367279052734375, -0.0052290260791778564, -0.005090773105621338, -0.004952520132064819, -0.004814267158508301, -0.004676014184951782, -0.004537761211395264, -0.004399508237838745, -0.0042612552642822266, -0.004123002290725708, -0.0039847493171691895, -0.003846496343612671, -0.0037082433700561523, -0.003569990396499634, -0.0034317374229431152, -0.0032934844493865967, -0.003155231475830078, -0.0030169785022735596, -0.002878725528717041, -0.0027404725551605225, -0.002602219581604004, -0.0024639666080474854, -0.002325713634490967, -0.0021874606609344482, -0.0020492076873779297, -0.0019109547138214111, -0.0017727017402648926, -0.001634448766708374, -0.0014961957931518555, -0.001357942819595337, -0.0012196898460388184, -0.0010814368724822998, -0.0009431838989257812, -0.0008049309253692627, -0.0006666779518127441, -0.0005284249782562256, -0.00039017200469970703, -0.0002519190311431885, -0.00011366605758666992, 2.4586915969848633e-05, 0.0001628398895263672, 0.00030109286308288574, 0.0004393458366394043, 0.0005775988101959229, 0.0007158517837524414, 0.00085410475730896, 0.0009923577308654785, 0.001130610704421997, 0.0012688636779785156, 0.0014071166515350342, 0.0015453696250915527, 0.0016836225986480713, 0.0018218755722045898, 0.0019601285457611084, 0.002098381519317627, 0.0022366344928741455, 0.002374887466430664, 0.0025131404399871826, 0.002651393413543701, 0.0027896463871002197, 0.0029278993606567383, 0.003066152334213257, 0.0032044053077697754, 0.003342658281326294, 0.0034809112548828125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 6.0, 5.0, 11.0, 20.0, 29.0, 45.0, 85.0, 151.0, 264.0, 471.0, 916.0, 1929.0, 4797.0, 15077.0, 79805.0, 803712.0, 112446.0, 18622.0, 5647.0, 2217.0, 1031.0, 577.0, 289.0, 145.0, 103.0, 57.0, 35.0, 18.0, 10.0, 8.0, 3.0, 5.0, 7.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-44.40625, -43.0, -41.59375, -40.1875, -38.78125, -37.375, -35.96875, -34.5625, -33.15625, -31.75, -30.34375, -28.9375, -27.53125, -26.125, -24.71875, -23.3125, -21.90625, -20.5, -19.09375, -17.6875, -16.28125, -14.875, -13.46875, -12.0625, -10.65625, -9.25, -7.84375, -6.4375, -5.03125, -3.625, -2.21875, -0.8125, 0.59375, 2.0, 3.40625, 4.8125, 6.21875, 7.625, 9.03125, 10.4375, 11.84375, 13.25, 14.65625, 16.0625, 17.46875, 18.875, 20.28125, 21.6875, 23.09375, 24.5, 25.90625, 27.3125, 28.71875, 30.125, 31.53125, 32.9375, 34.34375, 35.75, 37.15625, 38.5625, 39.96875, 41.375, 42.78125, 44.1875, 45.59375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 14.0, 14.0, 23.0, 27.0, 39.0, 51.0, 73.0, 104.0, 156.0, 142.0, 85.0, 59.0, 60.0, 45.0, 24.0, 14.0, 13.0, 12.0, 4.0, 3.0, 3.0, 5.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.65625, -35.29150390625, -33.9267578125, -32.56201171875, -31.197265625, -29.83251953125, -28.4677734375, -27.10302734375, -25.73828125, -24.37353515625, -23.0087890625, -21.64404296875, -20.279296875, -18.91455078125, -17.5498046875, -16.18505859375, -14.8203125, -13.45556640625, -12.0908203125, -10.72607421875, -9.361328125, -7.99658203125, -6.6318359375, -5.26708984375, -3.90234375, -2.53759765625, -1.1728515625, 0.19189453125, 1.556640625, 2.92138671875, 4.2861328125, 5.65087890625, 7.015625, 8.38037109375, 9.7451171875, 11.10986328125, 12.474609375, 13.83935546875, 15.2041015625, 16.56884765625, 17.93359375, 19.29833984375, 20.6630859375, 22.02783203125, 23.392578125, 24.75732421875, 26.1220703125, 27.48681640625, 28.8515625, 30.21630859375, 31.5810546875, 32.94580078125, 34.310546875, 35.67529296875, 37.0400390625, 38.40478515625, 39.76953125, 41.13427734375, 42.4990234375, 43.86376953125, 45.228515625, 46.59326171875, 47.9580078125, 49.32275390625, 50.6875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 17.0, 29.0, 71.0, 247.0, 508.0, 104.0, 24.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3007.800537109375, -2947.953857421875, -2888.107177734375, -2828.26025390625, -2768.41357421875, -2708.56689453125, -2648.72021484375, -2588.873291015625, -2529.026611328125, -2469.179931640625, -2409.333251953125, -2349.486328125, -2289.6396484375, -2229.79296875, -2169.9462890625, -2110.099365234375, -2050.252685546875, -1990.406005859375, -1930.5592041015625, -1870.7125244140625, -1810.86572265625, -1751.01904296875, -1691.1722412109375, -1631.3255615234375, -1571.4788818359375, -1511.6322021484375, -1451.785400390625, -1391.938720703125, -1332.0919189453125, -1272.2452392578125, -1212.3984375, -1152.5517578125, -1092.7049560546875, -1032.8582763671875, -973.011474609375, -913.1647338867188, -853.3179931640625, -793.4713134765625, -733.62451171875, -673.77783203125, -613.9310302734375, -554.0842895507812, -494.237548828125, -434.39080810546875, -374.5440673828125, -314.6973571777344, -254.85061645507812, -195.00387573242188, -135.15716552734375, -75.3104248046875, -15.463691711425781, 44.38304138183594, 104.22978210449219, 164.07650756835938, 223.92324829101562, 283.7699890136719, 343.6167297363281, 403.4634704589844, 463.3102111816406, 523.1569213867188, 583.003662109375, 642.8504028320312, 702.6971435546875, 762.5438842773438, 822.390625]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 8.0, 8.0, 10.0, 10.0, 12.0, 19.0, 23.0, 23.0, 22.0, 21.0, 29.0, 33.0, 39.0, 48.0, 60.0, 80.0, 95.0, 82.0, 58.0, 39.0, 29.0, 31.0, 32.0, 28.0, 14.0, 22.0, 27.0, 12.0, 12.0, 11.0, 8.0, 8.0, 6.0, 12.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-458.272216796875, -443.7381591796875, -429.2041015625, -414.6700439453125, -400.135986328125, -385.6019287109375, -371.06787109375, -356.5338439941406, -341.9997863769531, -327.4657287597656, -312.9316711425781, -298.3976135253906, -283.8635559082031, -269.32952880859375, -254.7954559326172, -240.26141357421875, -225.7273406982422, -211.1932830810547, -196.6592254638672, -182.12518310546875, -167.59112548828125, -153.05706787109375, -138.52301025390625, -123.98896026611328, -109.45490264892578, -94.92084503173828, -80.38679504394531, -65.85273742675781, -51.31868362426758, -36.784629821777344, -22.250572204589844, -7.716522216796875, 6.817535400390625, 21.35158920288086, 35.885643005371094, 50.419700622558594, 64.95375061035156, 79.48780822753906, 94.02186584472656, 108.55591583251953, 123.08997344970703, 137.6240234375, 152.1580810546875, 166.692138671875, 181.2261962890625, 195.76025390625, 210.2943115234375, 224.82835388183594, 239.36241149902344, 253.89646911621094, 268.4305114746094, 282.9645690917969, 297.4986267089844, 312.0326843261719, 326.5667419433594, 341.1007995605469, 355.6348571777344, 370.1689147949219, 384.7029724121094, 399.2370300292969, 413.7710876464844, 428.30511474609375, 442.83917236328125, 457.37322998046875, 471.90728759765625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 6.0, 11.0, 7.0, 15.0, 17.0, 30.0, 29.0, 43.0, 54.0, 77.0, 100.0, 138.0, 203.0, 323.0, 515.0, 1021.0, 2083.0, 5491.0, 50747.0, 4024462.0, 97592.0, 6340.0, 2255.0, 1062.0, 578.0, 308.0, 222.0, 143.0, 105.0, 64.0, 65.0, 33.0, 35.0, 24.0, 20.0, 17.0, 14.0, 10.0, 8.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-154.75, -149.515625, -144.28125, -139.046875, -133.8125, -128.578125, -123.34375, -118.109375, -112.875, -107.640625, -102.40625, -97.171875, -91.9375, -86.703125, -81.46875, -76.234375, -71.0, -65.765625, -60.53125, -55.296875, -50.0625, -44.828125, -39.59375, -34.359375, -29.125, -23.890625, -18.65625, -13.421875, -8.1875, -2.953125, 2.28125, 7.515625, 12.75, 17.984375, 23.21875, 28.453125, 33.6875, 38.921875, 44.15625, 49.390625, 54.625, 59.859375, 65.09375, 70.328125, 75.5625, 80.796875, 86.03125, 91.265625, 96.5, 101.734375, 106.96875, 112.203125, 117.4375, 122.671875, 127.90625, 133.140625, 138.375, 143.609375, 148.84375, 154.078125, 159.3125, 164.546875, 169.78125, 175.015625, 180.25]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 4.0, 7.0, 4.0, 3.0, 11.0, 4.0, 10.0, 7.0, 16.0, 10.0, 21.0, 16.0, 18.0, 21.0, 16.0, 29.0, 20.0, 35.0, 41.0, 22.0, 39.0, 33.0, 44.0, 51.0, 54.0, 39.0, 40.0, 38.0, 38.0, 37.0, 29.0, 28.0, 29.0, 24.0, 16.0, 19.0, 9.0, 23.0, 21.0, 12.0, 10.0, 9.0, 15.0, 7.0, 2.0, 1.0, 5.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-23.34375, -22.600341796875, -21.85693359375, -21.113525390625, -20.3701171875, -19.626708984375, -18.88330078125, -18.139892578125, -17.396484375, -16.653076171875, -15.90966796875, -15.166259765625, -14.4228515625, -13.679443359375, -12.93603515625, -12.192626953125, -11.44921875, -10.705810546875, -9.96240234375, -9.218994140625, -8.4755859375, -7.732177734375, -6.98876953125, -6.245361328125, -5.501953125, -4.758544921875, -4.01513671875, -3.271728515625, -2.5283203125, -1.784912109375, -1.04150390625, -0.298095703125, 0.4453125, 1.188720703125, 1.93212890625, 2.675537109375, 3.4189453125, 4.162353515625, 4.90576171875, 5.649169921875, 6.392578125, 7.135986328125, 7.87939453125, 8.622802734375, 9.3662109375, 10.109619140625, 10.85302734375, 11.596435546875, 12.33984375, 13.083251953125, 13.82666015625, 14.570068359375, 15.3134765625, 16.056884765625, 16.80029296875, 17.543701171875, 18.287109375, 19.030517578125, 19.77392578125, 20.517333984375, 21.2607421875, 22.004150390625, 22.74755859375, 23.490966796875, 24.234375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 3.0, 7.0, 4.0, 10.0, 10.0, 20.0, 22.0, 41.0, 68.0, 163.0, 310.0, 844.0, 2833.0, 14014.0, 2657828.0, 1500971.0, 12977.0, 2660.0, 866.0, 303.0, 125.0, 83.0, 36.0, 25.0, 21.0, 7.0, 9.0, 3.0, 5.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-240.0, -232.72265625, -225.4453125, -218.16796875, -210.890625, -203.61328125, -196.3359375, -189.05859375, -181.78125, -174.50390625, -167.2265625, -159.94921875, -152.671875, -145.39453125, -138.1171875, -130.83984375, -123.5625, -116.28515625, -109.0078125, -101.73046875, -94.453125, -87.17578125, -79.8984375, -72.62109375, -65.34375, -58.06640625, -50.7890625, -43.51171875, -36.234375, -28.95703125, -21.6796875, -14.40234375, -7.125, 0.15234375, 7.4296875, 14.70703125, 21.984375, 29.26171875, 36.5390625, 43.81640625, 51.09375, 58.37109375, 65.6484375, 72.92578125, 80.203125, 87.48046875, 94.7578125, 102.03515625, 109.3125, 116.58984375, 123.8671875, 131.14453125, 138.421875, 145.69921875, 152.9765625, 160.25390625, 167.53125, 174.80859375, 182.0859375, 189.36328125, 196.640625, 203.91796875, 211.1953125, 218.47265625, 225.75]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 4.0, 6.0, 9.0, 17.0, 23.0, 48.0, 124.0, 309.0, 876.0, 1577.0, 644.0, 194.0, 85.0, 50.0, 27.0, 27.0, 7.0, 10.0, 10.0, 6.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.875, -136.521484375, -132.16796875, -127.814453125, -123.4609375, -119.107421875, -114.75390625, -110.400390625, -106.046875, -101.693359375, -97.33984375, -92.986328125, -88.6328125, -84.279296875, -79.92578125, -75.572265625, -71.21875, -66.865234375, -62.51171875, -58.158203125, -53.8046875, -49.451171875, -45.09765625, -40.744140625, -36.390625, -32.037109375, -27.68359375, -23.330078125, -18.9765625, -14.623046875, -10.26953125, -5.916015625, -1.5625, 2.791015625, 7.14453125, 11.498046875, 15.8515625, 20.205078125, 24.55859375, 28.912109375, 33.265625, 37.619140625, 41.97265625, 46.326171875, 50.6796875, 55.033203125, 59.38671875, 63.740234375, 68.09375, 72.447265625, 76.80078125, 81.154296875, 85.5078125, 89.861328125, 94.21484375, 98.568359375, 102.921875, 107.275390625, 111.62890625, 115.982421875, 120.3359375, 124.689453125, 129.04296875, 133.396484375, 137.75]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 6.0, 5.0, 17.0, 38.0, 106.0, 303.0, 323.0, 127.0, 45.0, 21.0, 9.0, 12.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-518.0655517578125, -471.11444091796875, -424.163330078125, -377.2121887207031, -330.2610778808594, -283.3099670410156, -236.35882568359375, -189.40771484375, -142.45660400390625, -95.50548553466797, -48.55436706542969, -1.603240966796875, 45.347869873046875, 92.29898071289062, 139.2501220703125, 186.20123291015625, 233.15234375, 280.10345458984375, 327.0545654296875, 374.0057067871094, 420.9568176269531, 467.9079284667969, 514.8590698242188, 561.8101806640625, 608.7612915039062, 655.71240234375, 702.6635131835938, 749.6146240234375, 796.5657958984375, 843.516845703125, 890.468017578125, 937.4191284179688, 984.370361328125, 1031.321533203125, 1078.2725830078125, 1125.2237548828125, 1172.1748046875, 1219.1259765625, 1266.0771484375, 1313.0281982421875, 1359.979248046875, 1406.930419921875, 1453.8814697265625, 1500.8326416015625, 1547.78369140625, 1594.73486328125, 1641.68603515625, 1688.6370849609375, 1735.5882568359375, 1782.5394287109375, 1829.490478515625, 1876.441650390625, 1923.3927001953125, 1970.3438720703125, 2017.294921875, 2064.24609375, 2111.197265625, 2158.1484375, 2205.099609375, 2252.050537109375, 2299.001708984375, 2345.952880859375, 2392.904052734375, 2439.85498046875, 2486.80615234375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 4.0, 6.0, 6.0, 6.0, 9.0, 9.0, 11.0, 15.0, 24.0, 38.0, 17.0, 28.0, 31.0, 41.0, 48.0, 34.0, 46.0, 37.0, 28.0, 44.0, 49.0, 31.0, 39.0, 40.0, 38.0, 36.0, 43.0, 37.0, 39.0, 24.0, 15.0, 20.0, 27.0, 15.0, 11.0, 10.0, 7.0, 10.0, 8.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-346.2876892089844, -335.70721435546875, -325.12677001953125, -314.54632568359375, -303.9658508300781, -293.3853759765625, -282.804931640625, -272.2244873046875, -261.6440124511719, -251.0635528564453, -240.48309326171875, -229.9026336669922, -219.32217407226562, -208.74171447753906, -198.1612548828125, -187.58079528808594, -177.00033569335938, -166.4198760986328, -155.83941650390625, -145.2589569091797, -134.67849731445312, -124.09803771972656, -113.517578125, -102.93711853027344, -92.35665893554688, -81.77619934082031, -71.19573974609375, -60.61528015136719, -50.034820556640625, -39.45436096191406, -28.8739013671875, -18.293441772460938, -7.712982177734375, 2.8674774169921875, 13.44793701171875, 24.028396606445312, 34.608856201171875, 45.18931579589844, 55.769775390625, 66.35023498535156, 76.93069458007812, 87.51115417480469, 98.09161376953125, 108.67207336425781, 119.25253295898438, 129.83299255371094, 140.4134521484375, 150.99391174316406, 161.57437133789062, 172.1548309326172, 182.73529052734375, 193.3157501220703, 203.89620971679688, 214.47666931152344, 225.05712890625, 235.63758850097656, 246.21804809570312, 256.79852294921875, 267.37896728515625, 277.95941162109375, 288.5398864746094, 299.120361328125, 309.7008056640625, 320.28125, 330.8617248535156]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 1.0, 2.0, 7.0, 10.0, 10.0, 8.0, 11.0, 19.0, 24.0, 53.0, 68.0, 96.0, 164.0, 268.0, 414.0, 702.0, 1131.0, 1734.0, 3178.0, 5413.0, 10109.0, 19351.0, 41889.0, 102215.0, 316010.0, 345544.0, 110591.0, 44415.0, 20591.0, 10469.0, 5894.0, 3234.0, 1857.0, 1136.0, 735.0, 425.0, 267.0, 193.0, 131.0, 60.0, 40.0, 25.0, 22.0, 13.0, 9.0, 6.0, 5.0, 2.0, 1.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-52.5, -50.80859375, -49.1171875, -47.42578125, -45.734375, -44.04296875, -42.3515625, -40.66015625, -38.96875, -37.27734375, -35.5859375, -33.89453125, -32.203125, -30.51171875, -28.8203125, -27.12890625, -25.4375, -23.74609375, -22.0546875, -20.36328125, -18.671875, -16.98046875, -15.2890625, -13.59765625, -11.90625, -10.21484375, -8.5234375, -6.83203125, -5.140625, -3.44921875, -1.7578125, -0.06640625, 1.625, 3.31640625, 5.0078125, 6.69921875, 8.390625, 10.08203125, 11.7734375, 13.46484375, 15.15625, 16.84765625, 18.5390625, 20.23046875, 21.921875, 23.61328125, 25.3046875, 26.99609375, 28.6875, 30.37890625, 32.0703125, 33.76171875, 35.453125, 37.14453125, 38.8359375, 40.52734375, 42.21875, 43.91015625, 45.6015625, 47.29296875, 48.984375, 50.67578125, 52.3671875, 54.05859375, 55.75]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 8.0, 3.0, 7.0, 14.0, 10.0, 11.0, 18.0, 19.0, 19.0, 28.0, 36.0, 21.0, 40.0, 49.0, 42.0, 34.0, 44.0, 49.0, 50.0, 42.0, 49.0, 44.0, 56.0, 34.0, 29.0, 34.0, 38.0, 24.0, 25.0, 21.0, 20.0, 12.0, 13.0, 9.0, 9.0, 8.0, 9.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-29.96875, -29.021728515625, -28.07470703125, -27.127685546875, -26.1806640625, -25.233642578125, -24.28662109375, -23.339599609375, -22.392578125, -21.445556640625, -20.49853515625, -19.551513671875, -18.6044921875, -17.657470703125, -16.71044921875, -15.763427734375, -14.81640625, -13.869384765625, -12.92236328125, -11.975341796875, -11.0283203125, -10.081298828125, -9.13427734375, -8.187255859375, -7.240234375, -6.293212890625, -5.34619140625, -4.399169921875, -3.4521484375, -2.505126953125, -1.55810546875, -0.611083984375, 0.3359375, 1.282958984375, 2.22998046875, 3.177001953125, 4.1240234375, 5.071044921875, 6.01806640625, 6.965087890625, 7.912109375, 8.859130859375, 9.80615234375, 10.753173828125, 11.7001953125, 12.647216796875, 13.59423828125, 14.541259765625, 15.48828125, 16.435302734375, 17.38232421875, 18.329345703125, 19.2763671875, 20.223388671875, 21.17041015625, 22.117431640625, 23.064453125, 24.011474609375, 24.95849609375, 25.905517578125, 26.8525390625, 27.799560546875, 28.74658203125, 29.693603515625, 30.640625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 10.0, 8.0, 15.0, 13.0, 19.0, 29.0, 42.0, 45.0, 62.0, 78.0, 114.0, 169.0, 187.0, 274.0, 417.0, 650.0, 1287.0, 3168.0, 11487.0, 67731.0, 816987.0, 120546.0, 16857.0, 4302.0, 1612.0, 763.0, 505.0, 312.0, 216.0, 159.0, 104.0, 89.0, 82.0, 53.0, 34.0, 20.0, 26.0, 17.0, 18.0, 9.0, 7.0, 4.0, 7.0, 8.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-115.9375, -112.3837890625, -108.830078125, -105.2763671875, -101.72265625, -98.1689453125, -94.615234375, -91.0615234375, -87.5078125, -83.9541015625, -80.400390625, -76.8466796875, -73.29296875, -69.7392578125, -66.185546875, -62.6318359375, -59.078125, -55.5244140625, -51.970703125, -48.4169921875, -44.86328125, -41.3095703125, -37.755859375, -34.2021484375, -30.6484375, -27.0947265625, -23.541015625, -19.9873046875, -16.43359375, -12.8798828125, -9.326171875, -5.7724609375, -2.21875, 1.3349609375, 4.888671875, 8.4423828125, 11.99609375, 15.5498046875, 19.103515625, 22.6572265625, 26.2109375, 29.7646484375, 33.318359375, 36.8720703125, 40.42578125, 43.9794921875, 47.533203125, 51.0869140625, 54.640625, 58.1943359375, 61.748046875, 65.3017578125, 68.85546875, 72.4091796875, 75.962890625, 79.5166015625, 83.0703125, 86.6240234375, 90.177734375, 93.7314453125, 97.28515625, 100.8388671875, 104.392578125, 107.9462890625, 111.5]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 4.0, 8.0, 9.0, 12.0, 9.0, 16.0, 15.0, 15.0, 17.0, 25.0, 24.0, 30.0, 33.0, 35.0, 48.0, 53.0, 56.0, 52.0, 41.0, 67.0, 52.0, 53.0, 38.0, 41.0, 30.0, 25.0, 35.0, 21.0, 30.0, 16.0, 15.0, 9.0, 8.0, 13.0, 10.0, 4.0, 4.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-122.375, -118.705078125, -115.03515625, -111.365234375, -107.6953125, -104.025390625, -100.35546875, -96.685546875, -93.015625, -89.345703125, -85.67578125, -82.005859375, -78.3359375, -74.666015625, -70.99609375, -67.326171875, -63.65625, -59.986328125, -56.31640625, -52.646484375, -48.9765625, -45.306640625, -41.63671875, -37.966796875, -34.296875, -30.626953125, -26.95703125, -23.287109375, -19.6171875, -15.947265625, -12.27734375, -8.607421875, -4.9375, -1.267578125, 2.40234375, 6.072265625, 9.7421875, 13.412109375, 17.08203125, 20.751953125, 24.421875, 28.091796875, 31.76171875, 35.431640625, 39.1015625, 42.771484375, 46.44140625, 50.111328125, 53.78125, 57.451171875, 61.12109375, 64.791015625, 68.4609375, 72.130859375, 75.80078125, 79.470703125, 83.140625, 86.810546875, 90.48046875, 94.150390625, 97.8203125, 101.490234375, 105.16015625, 108.830078125, 112.5]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 8.0, 4.0, 10.0, 15.0, 14.0, 17.0, 32.0, 43.0, 60.0, 84.0, 113.0, 157.0, 243.0, 458.0, 806.0, 1901.0, 4693.0, 14168.0, 57892.0, 663583.0, 245804.0, 40673.0, 10585.0, 3715.0, 1558.0, 740.0, 424.0, 234.0, 141.0, 100.0, 73.0, 52.0, 36.0, 17.0, 20.0, 11.0, 16.0, 10.0, 11.0, 9.0, 6.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.640625, -20.031494140625, -19.42236328125, -18.813232421875, -18.2041015625, -17.594970703125, -16.98583984375, -16.376708984375, -15.767578125, -15.158447265625, -14.54931640625, -13.940185546875, -13.3310546875, -12.721923828125, -12.11279296875, -11.503662109375, -10.89453125, -10.285400390625, -9.67626953125, -9.067138671875, -8.4580078125, -7.848876953125, -7.23974609375, -6.630615234375, -6.021484375, -5.412353515625, -4.80322265625, -4.194091796875, -3.5849609375, -2.975830078125, -2.36669921875, -1.757568359375, -1.1484375, -0.539306640625, 0.06982421875, 0.678955078125, 1.2880859375, 1.897216796875, 2.50634765625, 3.115478515625, 3.724609375, 4.333740234375, 4.94287109375, 5.552001953125, 6.1611328125, 6.770263671875, 7.37939453125, 7.988525390625, 8.59765625, 9.206787109375, 9.81591796875, 10.425048828125, 11.0341796875, 11.643310546875, 12.25244140625, 12.861572265625, 13.470703125, 14.079833984375, 14.68896484375, 15.298095703125, 15.9072265625, 16.516357421875, 17.12548828125, 17.734619140625, 18.34375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 9.0, 4.0, 4.0, 17.0, 18.0, 27.0, 30.0, 42.0, 66.0, 91.0, 143.0, 140.0, 106.0, 71.0, 57.0, 52.0, 24.0, 25.0, 21.0, 8.0, 12.0, 10.0, 5.0, 3.0, 1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004322052001953125, -0.004174530506134033, -0.004027009010314941, -0.0038794875144958496, -0.003731966018676758, -0.003584444522857666, -0.0034369230270385742, -0.0032894015312194824, -0.0031418800354003906, -0.002994358539581299, -0.002846837043762207, -0.0026993155479431152, -0.0025517940521240234, -0.0024042725563049316, -0.00225675106048584, -0.002109229564666748, -0.0019617080688476562, -0.0018141865730285645, -0.0016666650772094727, -0.0015191435813903809, -0.001371622085571289, -0.0012241005897521973, -0.0010765790939331055, -0.0009290575981140137, -0.0007815361022949219, -0.0006340146064758301, -0.0004864931106567383, -0.0003389716148376465, -0.0001914501190185547, -4.392862319946289e-05, 0.0001035928726196289, 0.0002511143684387207, 0.0003986358642578125, 0.0005461573600769043, 0.0006936788558959961, 0.0008412003517150879, 0.0009887218475341797, 0.0011362433433532715, 0.0012837648391723633, 0.001431286334991455, 0.0015788078308105469, 0.0017263293266296387, 0.0018738508224487305, 0.0020213723182678223, 0.002168893814086914, 0.002316415309906006, 0.0024639368057250977, 0.0026114583015441895, 0.0027589797973632812, 0.002906501293182373, 0.003054022789001465, 0.0032015442848205566, 0.0033490657806396484, 0.0034965872764587402, 0.003644108772277832, 0.003791630268096924, 0.003939151763916016, 0.004086673259735107, 0.004234194755554199, 0.004381716251373291, 0.004529237747192383, 0.004676759243011475, 0.004824280738830566, 0.004971802234649658, 0.00511932373046875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 2.0, 11.0, 8.0, 12.0, 16.0, 23.0, 28.0, 43.0, 54.0, 67.0, 106.0, 171.0, 304.0, 498.0, 889.0, 1855.0, 4035.0, 10318.0, 33425.0, 175533.0, 714973.0, 74993.0, 18901.0, 6401.0, 2845.0, 1243.0, 710.0, 386.0, 198.0, 162.0, 94.0, 60.0, 54.0, 35.0, 25.0, 20.0, 13.0, 11.0, 3.0, 9.0, 0.0, 3.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-22.65625, -21.9951171875, -21.333984375, -20.6728515625, -20.01171875, -19.3505859375, -18.689453125, -18.0283203125, -17.3671875, -16.7060546875, -16.044921875, -15.3837890625, -14.72265625, -14.0615234375, -13.400390625, -12.7392578125, -12.078125, -11.4169921875, -10.755859375, -10.0947265625, -9.43359375, -8.7724609375, -8.111328125, -7.4501953125, -6.7890625, -6.1279296875, -5.466796875, -4.8056640625, -4.14453125, -3.4833984375, -2.822265625, -2.1611328125, -1.5, -0.8388671875, -0.177734375, 0.4833984375, 1.14453125, 1.8056640625, 2.466796875, 3.1279296875, 3.7890625, 4.4501953125, 5.111328125, 5.7724609375, 6.43359375, 7.0947265625, 7.755859375, 8.4169921875, 9.078125, 9.7392578125, 10.400390625, 11.0615234375, 11.72265625, 12.3837890625, 13.044921875, 13.7060546875, 14.3671875, 15.0283203125, 15.689453125, 16.3505859375, 17.01171875, 17.6728515625, 18.333984375, 18.9951171875, 19.65625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 8.0, 6.0, 14.0, 8.0, 11.0, 21.0, 16.0, 18.0, 22.0, 43.0, 30.0, 43.0, 67.0, 45.0, 62.0, 61.0, 72.0, 65.0, 71.0, 49.0, 50.0, 41.0, 23.0, 23.0, 16.0, 12.0, 15.0, 15.0, 13.0, 8.0, 9.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 5.0, 0.0, 1.0, 1.0], "bins": [-17.09375, -16.60400390625, -16.1142578125, -15.62451171875, -15.134765625, -14.64501953125, -14.1552734375, -13.66552734375, -13.17578125, -12.68603515625, -12.1962890625, -11.70654296875, -11.216796875, -10.72705078125, -10.2373046875, -9.74755859375, -9.2578125, -8.76806640625, -8.2783203125, -7.78857421875, -7.298828125, -6.80908203125, -6.3193359375, -5.82958984375, -5.33984375, -4.85009765625, -4.3603515625, -3.87060546875, -3.380859375, -2.89111328125, -2.4013671875, -1.91162109375, -1.421875, -0.93212890625, -0.4423828125, 0.04736328125, 0.537109375, 1.02685546875, 1.5166015625, 2.00634765625, 2.49609375, 2.98583984375, 3.4755859375, 3.96533203125, 4.455078125, 4.94482421875, 5.4345703125, 5.92431640625, 6.4140625, 6.90380859375, 7.3935546875, 7.88330078125, 8.373046875, 8.86279296875, 9.3525390625, 9.84228515625, 10.33203125, 10.82177734375, 11.3115234375, 11.80126953125, 12.291015625, 12.78076171875, 13.2705078125, 13.76025390625, 14.25]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 6.0, 5.0, 21.0, 41.0, 121.0, 412.0, 238.0, 86.0, 36.0, 19.0, 10.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1199.6812744140625, -1164.2996826171875, -1128.91796875, -1093.536376953125, -1058.15478515625, -1022.7731323242188, -987.3914794921875, -952.0098876953125, -916.6282348632812, -881.24658203125, -845.864990234375, -810.4833374023438, -775.1016845703125, -739.7200927734375, -704.3384399414062, -668.956787109375, -633.5751953125, -598.1935424804688, -562.8119506835938, -527.4302978515625, -492.0486755371094, -456.66705322265625, -421.285400390625, -385.9037780761719, -350.52215576171875, -315.1405334472656, -279.7589111328125, -244.37725830078125, -208.99563598632812, -173.614013671875, -138.2323760986328, -102.85073852539062, -67.468994140625, -32.087364196777344, 3.2942657470703125, 38.67589569091797, 74.05752563476562, 109.43914794921875, 144.82078552246094, 180.20242309570312, 215.58404541015625, 250.96566772460938, 286.3472900390625, 321.72894287109375, 357.1105651855469, 392.4921875, 427.87384033203125, 463.2554626464844, 498.6370849609375, 534.0187377929688, 569.4003295898438, 604.781982421875, 640.16357421875, 675.5452270507812, 710.9268798828125, 746.3084716796875, 781.6901245117188, 817.07177734375, 852.453369140625, 887.8350219726562, 923.2166748046875, 958.5982666015625, 993.9799194335938, 1029.361572265625, 1064.7431640625]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 7.0, 8.0, 10.0, 6.0, 15.0, 15.0, 15.0, 22.0, 19.0, 19.0, 20.0, 19.0, 21.0, 30.0, 27.0, 42.0, 64.0, 101.0, 136.0, 95.0, 46.0, 28.0, 38.0, 28.0, 27.0, 13.0, 21.0, 19.0, 15.0, 8.0, 10.0, 16.0, 8.0, 12.0, 9.0, 7.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-416.2005920410156, -400.39788818359375, -384.59515380859375, -368.7924499511719, -352.9897155761719, -337.18701171875, -321.38427734375, -305.5815734863281, -289.77886962890625, -273.9761657714844, -258.1734313964844, -242.3707275390625, -226.5679931640625, -210.76528930664062, -194.9625701904297, -179.15985107421875, -163.35711669921875, -147.5543975830078, -131.75167846679688, -115.94896697998047, -100.14624786376953, -84.3435287475586, -68.54081726074219, -52.73809814453125, -36.93537902832031, -21.132661819458008, -5.329944610595703, 10.472770690917969, 26.275489807128906, 42.078208923339844, 57.88092041015625, 73.68363952636719, 89.48638916015625, 105.28910827636719, 121.09182739257812, 136.89453125, 152.697265625, 168.49996948242188, 184.3026885986328, 200.10540771484375, 215.9081268310547, 231.71084594726562, 247.51356506347656, 263.3162841796875, 279.1189880371094, 294.9217224121094, 310.72442626953125, 326.52716064453125, 342.3298645019531, 358.132568359375, 373.935302734375, 389.7380065917969, 405.5407409667969, 421.34344482421875, 437.14617919921875, 452.9488830566406, 468.7515869140625, 484.5542907714844, 500.3570251464844, 516.1597290039062, 531.9624633789062, 547.7651977539062, 563.56787109375, 579.37060546875, 595.17333984375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 9.0, 6.0, 11.0, 11.0, 11.0, 25.0, 32.0, 35.0, 41.0, 62.0, 71.0, 126.0, 203.0, 265.0, 357.0, 548.0, 858.0, 1267.0, 1956.0, 3228.0, 5906.0, 11870.0, 30536.0, 122628.0, 771674.0, 2344489.0, 714922.0, 127144.0, 29969.0, 11614.0, 5677.0, 3141.0, 1900.0, 1183.0, 773.0, 518.0, 353.0, 226.0, 199.0, 128.0, 93.0, 45.0, 55.0, 44.0, 21.0, 13.0, 11.0, 7.0, 9.0, 6.0, 4.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-49.28125, -47.55126953125, -45.8212890625, -44.09130859375, -42.361328125, -40.63134765625, -38.9013671875, -37.17138671875, -35.44140625, -33.71142578125, -31.9814453125, -30.25146484375, -28.521484375, -26.79150390625, -25.0615234375, -23.33154296875, -21.6015625, -19.87158203125, -18.1416015625, -16.41162109375, -14.681640625, -12.95166015625, -11.2216796875, -9.49169921875, -7.76171875, -6.03173828125, -4.3017578125, -2.57177734375, -0.841796875, 0.88818359375, 2.6181640625, 4.34814453125, 6.078125, 7.80810546875, 9.5380859375, 11.26806640625, 12.998046875, 14.72802734375, 16.4580078125, 18.18798828125, 19.91796875, 21.64794921875, 23.3779296875, 25.10791015625, 26.837890625, 28.56787109375, 30.2978515625, 32.02783203125, 33.7578125, 35.48779296875, 37.2177734375, 38.94775390625, 40.677734375, 42.40771484375, 44.1376953125, 45.86767578125, 47.59765625, 49.32763671875, 51.0576171875, 52.78759765625, 54.517578125, 56.24755859375, 57.9775390625, 59.70751953125, 61.4375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 5.0, 12.0, 9.0, 12.0, 7.0, 18.0, 15.0, 14.0, 15.0, 22.0, 26.0, 23.0, 40.0, 31.0, 40.0, 50.0, 36.0, 38.0, 36.0, 43.0, 42.0, 44.0, 48.0, 41.0, 35.0, 31.0, 45.0, 31.0, 30.0, 21.0, 27.0, 13.0, 18.0, 17.0, 12.0, 10.0, 7.0, 7.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-26.15625, -25.300537109375, -24.44482421875, -23.589111328125, -22.7333984375, -21.877685546875, -21.02197265625, -20.166259765625, -19.310546875, -18.454833984375, -17.59912109375, -16.743408203125, -15.8876953125, -15.031982421875, -14.17626953125, -13.320556640625, -12.46484375, -11.609130859375, -10.75341796875, -9.897705078125, -9.0419921875, -8.186279296875, -7.33056640625, -6.474853515625, -5.619140625, -4.763427734375, -3.90771484375, -3.052001953125, -2.1962890625, -1.340576171875, -0.48486328125, 0.370849609375, 1.2265625, 2.082275390625, 2.93798828125, 3.793701171875, 4.6494140625, 5.505126953125, 6.36083984375, 7.216552734375, 8.072265625, 8.927978515625, 9.78369140625, 10.639404296875, 11.4951171875, 12.350830078125, 13.20654296875, 14.062255859375, 14.91796875, 15.773681640625, 16.62939453125, 17.485107421875, 18.3408203125, 19.196533203125, 20.05224609375, 20.907958984375, 21.763671875, 22.619384765625, 23.47509765625, 24.330810546875, 25.1865234375, 26.042236328125, 26.89794921875, 27.753662109375, 28.609375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 9.0, 11.0, 42.0, 60.0, 119.0, 267.0, 628.0, 2765.0, 87807.0, 4090849.0, 9603.0, 1369.0, 412.0, 168.0, 86.0, 38.0, 20.0, 10.0, 7.0, 3.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-446.0, -433.34765625, -420.6953125, -408.04296875, -395.390625, -382.73828125, -370.0859375, -357.43359375, -344.78125, -332.12890625, -319.4765625, -306.82421875, -294.171875, -281.51953125, -268.8671875, -256.21484375, -243.5625, -230.91015625, -218.2578125, -205.60546875, -192.953125, -180.30078125, -167.6484375, -154.99609375, -142.34375, -129.69140625, -117.0390625, -104.38671875, -91.734375, -79.08203125, -66.4296875, -53.77734375, -41.125, -28.47265625, -15.8203125, -3.16796875, 9.484375, 22.13671875, 34.7890625, 47.44140625, 60.09375, 72.74609375, 85.3984375, 98.05078125, 110.703125, 123.35546875, 136.0078125, 148.66015625, 161.3125, 173.96484375, 186.6171875, 199.26953125, 211.921875, 224.57421875, 237.2265625, 249.87890625, 262.53125, 275.18359375, 287.8359375, 300.48828125, 313.140625, 325.79296875, 338.4453125, 351.09765625, 363.75]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 13.0, 22.0, 18.0, 45.0, 75.0, 138.0, 279.0, 746.0, 1378.0, 725.0, 311.0, 141.0, 74.0, 43.0, 31.0, 22.0, 10.0, 6.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.4375, -117.0908203125, -110.744140625, -104.3974609375, -98.05078125, -91.7041015625, -85.357421875, -79.0107421875, -72.6640625, -66.3173828125, -59.970703125, -53.6240234375, -47.27734375, -40.9306640625, -34.583984375, -28.2373046875, -21.890625, -15.5439453125, -9.197265625, -2.8505859375, 3.49609375, 9.8427734375, 16.189453125, 22.5361328125, 28.8828125, 35.2294921875, 41.576171875, 47.9228515625, 54.26953125, 60.6162109375, 66.962890625, 73.3095703125, 79.65625, 86.0029296875, 92.349609375, 98.6962890625, 105.04296875, 111.3896484375, 117.736328125, 124.0830078125, 130.4296875, 136.7763671875, 143.123046875, 149.4697265625, 155.81640625, 162.1630859375, 168.509765625, 174.8564453125, 181.203125, 187.5498046875, 193.896484375, 200.2431640625, 206.58984375, 212.9365234375, 219.283203125, 225.6298828125, 231.9765625, 238.3232421875, 244.669921875, 251.0166015625, 257.36328125, 263.7099609375, 270.056640625, 276.4033203125, 282.75]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 7.0, 7.0, 23.0, 38.0, 86.0, 169.0, 279.0, 166.0, 92.0, 53.0, 29.0, 21.0, 13.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-971.4273071289062, -923.8911743164062, -876.3550415039062, -828.8189086914062, -781.2827758789062, -733.7466430664062, -686.21044921875, -638.67431640625, -591.13818359375, -543.60205078125, -496.06591796875, -448.52978515625, -400.99365234375, -353.45751953125, -305.9213562011719, -258.3852233886719, -210.84912109375, -163.31298828125, -115.77684783935547, -68.24070739746094, -20.704574584960938, 26.831558227539062, 74.36770629882812, 121.90383911132812, 169.43997192382812, 216.97610473632812, 264.5122375488281, 312.04840087890625, 359.58453369140625, 407.12066650390625, 454.65679931640625, 502.19293212890625, 549.7291259765625, 597.2652587890625, 644.8013916015625, 692.3375244140625, 739.8736572265625, 787.4097900390625, 834.9459228515625, 882.4820556640625, 930.0181884765625, 977.5543212890625, 1025.0904541015625, 1072.6265869140625, 1120.1627197265625, 1167.6988525390625, 1215.2349853515625, 1262.7711181640625, 1310.307373046875, 1357.843505859375, 1405.379638671875, 1452.915771484375, 1500.451904296875, 1547.988037109375, 1595.524169921875, 1643.060302734375, 1690.596435546875, 1738.132568359375, 1785.668701171875, 1833.204833984375, 1880.740966796875, 1928.277099609375, 1975.813232421875, 2023.349365234375, 2070.885498046875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 7.0, 7.0, 11.0, 9.0, 18.0, 20.0, 18.0, 34.0, 30.0, 36.0, 35.0, 49.0, 37.0, 42.0, 48.0, 64.0, 73.0, 68.0, 70.0, 53.0, 56.0, 41.0, 34.0, 28.0, 21.0, 21.0, 22.0, 12.0, 9.0, 11.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-873.4290771484375, -850.9620971679688, -828.4951782226562, -806.0281982421875, -783.561279296875, -761.0942993164062, -738.6273193359375, -716.160400390625, -693.6934814453125, -671.2265014648438, -648.7595825195312, -626.2926025390625, -603.82568359375, -581.3587036132812, -558.8917236328125, -536.4248046875, -513.9578247070312, -491.4908752441406, -469.02392578125, -446.55694580078125, -424.09002685546875, -401.623046875, -379.1560974121094, -356.68914794921875, -334.2221984863281, -311.7552490234375, -289.2882995605469, -266.82135009765625, -244.35438537597656, -221.88743591308594, -199.42047119140625, -176.95352172851562, -154.486572265625, -132.01962280273438, -109.55266571044922, -87.08570861816406, -64.61875915527344, -42.15180969238281, -19.684844970703125, 2.7821044921875, 25.249053955078125, 47.716007232666016, 70.1829605102539, 92.64991760253906, 115.11686706542969, 137.5838165283203, 160.05078125, 182.51773071289062, 204.98468017578125, 227.45162963867188, 249.9185791015625, 272.38555908203125, 294.85247802734375, 317.3194580078125, 339.7864074707031, 362.25335693359375, 384.7203063964844, 407.187255859375, 429.6542053222656, 452.12115478515625, 474.588134765625, 497.0550537109375, 519.5220336914062, 541.989013671875, 564.4559326171875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 5.0, 5.0, 6.0, 7.0, 11.0, 15.0, 27.0, 33.0, 70.0, 77.0, 132.0, 192.0, 263.0, 452.0, 781.0, 1265.0, 2160.0, 4088.0, 8046.0, 17176.0, 42621.0, 140713.0, 631030.0, 126392.0, 39624.0, 16441.0, 7680.0, 3915.0, 2135.0, 1221.0, 705.0, 433.0, 288.0, 171.0, 123.0, 83.0, 60.0, 30.0, 14.0, 17.0, 16.0, 10.0, 7.0, 3.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.46875, -50.62548828125, -48.7822265625, -46.93896484375, -45.095703125, -43.25244140625, -41.4091796875, -39.56591796875, -37.72265625, -35.87939453125, -34.0361328125, -32.19287109375, -30.349609375, -28.50634765625, -26.6630859375, -24.81982421875, -22.9765625, -21.13330078125, -19.2900390625, -17.44677734375, -15.603515625, -13.76025390625, -11.9169921875, -10.07373046875, -8.23046875, -6.38720703125, -4.5439453125, -2.70068359375, -0.857421875, 0.98583984375, 2.8291015625, 4.67236328125, 6.515625, 8.35888671875, 10.2021484375, 12.04541015625, 13.888671875, 15.73193359375, 17.5751953125, 19.41845703125, 21.26171875, 23.10498046875, 24.9482421875, 26.79150390625, 28.634765625, 30.47802734375, 32.3212890625, 34.16455078125, 36.0078125, 37.85107421875, 39.6943359375, 41.53759765625, 43.380859375, 45.22412109375, 47.0673828125, 48.91064453125, 50.75390625, 52.59716796875, 54.4404296875, 56.28369140625, 58.126953125, 59.97021484375, 61.8134765625, 63.65673828125, 65.5]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 9.0, 4.0, 2.0, 6.0, 10.0, 15.0, 15.0, 23.0, 20.0, 31.0, 33.0, 31.0, 50.0, 55.0, 52.0, 66.0, 71.0, 54.0, 62.0, 55.0, 60.0, 52.0, 36.0, 52.0, 32.0, 24.0, 20.0, 18.0, 18.0, 7.0, 5.0, 6.0, 3.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.78125, -43.29296875, -41.8046875, -40.31640625, -38.828125, -37.33984375, -35.8515625, -34.36328125, -32.875, -31.38671875, -29.8984375, -28.41015625, -26.921875, -25.43359375, -23.9453125, -22.45703125, -20.96875, -19.48046875, -17.9921875, -16.50390625, -15.015625, -13.52734375, -12.0390625, -10.55078125, -9.0625, -7.57421875, -6.0859375, -4.59765625, -3.109375, -1.62109375, -0.1328125, 1.35546875, 2.84375, 4.33203125, 5.8203125, 7.30859375, 8.796875, 10.28515625, 11.7734375, 13.26171875, 14.75, 16.23828125, 17.7265625, 19.21484375, 20.703125, 22.19140625, 23.6796875, 25.16796875, 26.65625, 28.14453125, 29.6328125, 31.12109375, 32.609375, 34.09765625, 35.5859375, 37.07421875, 38.5625, 40.05078125, 41.5390625, 43.02734375, 44.515625, 46.00390625, 47.4921875, 48.98046875, 50.46875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 6.0, 11.0, 8.0, 14.0, 27.0, 28.0, 33.0, 62.0, 69.0, 96.0, 145.0, 216.0, 401.0, 740.0, 1636.0, 5081.0, 23857.0, 813837.0, 178433.0, 16887.0, 4005.0, 1385.0, 626.0, 315.0, 195.0, 128.0, 86.0, 63.0, 42.0, 29.0, 20.0, 22.0, 8.0, 8.0, 6.0, 5.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-95.25, -92.2646484375, -89.279296875, -86.2939453125, -83.30859375, -80.3232421875, -77.337890625, -74.3525390625, -71.3671875, -68.3818359375, -65.396484375, -62.4111328125, -59.42578125, -56.4404296875, -53.455078125, -50.4697265625, -47.484375, -44.4990234375, -41.513671875, -38.5283203125, -35.54296875, -32.5576171875, -29.572265625, -26.5869140625, -23.6015625, -20.6162109375, -17.630859375, -14.6455078125, -11.66015625, -8.6748046875, -5.689453125, -2.7041015625, 0.28125, 3.2666015625, 6.251953125, 9.2373046875, 12.22265625, 15.2080078125, 18.193359375, 21.1787109375, 24.1640625, 27.1494140625, 30.134765625, 33.1201171875, 36.10546875, 39.0908203125, 42.076171875, 45.0615234375, 48.046875, 51.0322265625, 54.017578125, 57.0029296875, 59.98828125, 62.9736328125, 65.958984375, 68.9443359375, 71.9296875, 74.9150390625, 77.900390625, 80.8857421875, 83.87109375, 86.8564453125, 89.841796875, 92.8271484375, 95.8125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 1.0, 5.0, 6.0, 7.0, 13.0, 7.0, 16.0, 16.0, 17.0, 21.0, 15.0, 29.0, 39.0, 33.0, 50.0, 69.0, 62.0, 82.0, 78.0, 74.0, 59.0, 57.0, 43.0, 34.0, 31.0, 26.0, 22.0, 16.0, 13.0, 10.0, 12.0, 6.0, 4.0, 7.0, 5.0, 6.0, 1.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-166.625, -161.4609375, -156.296875, -151.1328125, -145.96875, -140.8046875, -135.640625, -130.4765625, -125.3125, -120.1484375, -114.984375, -109.8203125, -104.65625, -99.4921875, -94.328125, -89.1640625, -84.0, -78.8359375, -73.671875, -68.5078125, -63.34375, -58.1796875, -53.015625, -47.8515625, -42.6875, -37.5234375, -32.359375, -27.1953125, -22.03125, -16.8671875, -11.703125, -6.5390625, -1.375, 3.7890625, 8.953125, 14.1171875, 19.28125, 24.4453125, 29.609375, 34.7734375, 39.9375, 45.1015625, 50.265625, 55.4296875, 60.59375, 65.7578125, 70.921875, 76.0859375, 81.25, 86.4140625, 91.578125, 96.7421875, 101.90625, 107.0703125, 112.234375, 117.3984375, 122.5625, 127.7265625, 132.890625, 138.0546875, 143.21875, 148.3828125, 153.546875, 158.7109375, 163.875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 3.0, 9.0, 8.0, 17.0, 19.0, 26.0, 39.0, 62.0, 93.0, 149.0, 210.0, 398.0, 894.0, 2034.0, 5670.0, 23190.0, 722608.0, 262342.0, 21410.0, 5469.0, 1959.0, 836.0, 440.0, 257.0, 141.0, 84.0, 55.0, 36.0, 35.0, 16.0, 4.0, 8.0, 8.0, 4.0, 2.0, 5.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.3984375, -12.9659423828125, -12.533447265625, -12.1009521484375, -11.66845703125, -11.2359619140625, -10.803466796875, -10.3709716796875, -9.9384765625, -9.5059814453125, -9.073486328125, -8.6409912109375, -8.20849609375, -7.7760009765625, -7.343505859375, -6.9110107421875, -6.478515625, -6.0460205078125, -5.613525390625, -5.1810302734375, -4.74853515625, -4.3160400390625, -3.883544921875, -3.4510498046875, -3.0185546875, -2.5860595703125, -2.153564453125, -1.7210693359375, -1.28857421875, -0.8560791015625, -0.423583984375, 0.0089111328125, 0.44140625, 0.8739013671875, 1.306396484375, 1.7388916015625, 2.17138671875, 2.6038818359375, 3.036376953125, 3.4688720703125, 3.9013671875, 4.3338623046875, 4.766357421875, 5.1988525390625, 5.63134765625, 6.0638427734375, 6.496337890625, 6.9288330078125, 7.361328125, 7.7938232421875, 8.226318359375, 8.6588134765625, 9.09130859375, 9.5238037109375, 9.956298828125, 10.3887939453125, 10.8212890625, 11.2537841796875, 11.686279296875, 12.1187744140625, 12.55126953125, 12.9837646484375, 13.416259765625, 13.8487548828125, 14.28125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 5.0, 9.0, 5.0, 4.0, 11.0, 11.0, 7.0, 21.0, 30.0, 41.0, 58.0, 84.0, 181.0, 197.0, 122.0, 58.0, 47.0, 23.0, 19.0, 11.0, 10.0, 7.0, 6.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.00472259521484375, -0.0046134889125823975, -0.004504382610321045, -0.004395276308059692, -0.00428617000579834, -0.004177063703536987, -0.004067957401275635, -0.003958851099014282, -0.0038497447967529297, -0.003740638494491577, -0.0036315321922302246, -0.003522425889968872, -0.0034133195877075195, -0.003304213285446167, -0.0031951069831848145, -0.003086000680923462, -0.0029768943786621094, -0.002867788076400757, -0.0027586817741394043, -0.0026495754718780518, -0.0025404691696166992, -0.0024313628673553467, -0.002322256565093994, -0.0022131502628326416, -0.002104043960571289, -0.0019949376583099365, -0.001885831356048584, -0.0017767250537872314, -0.001667618751525879, -0.0015585124492645264, -0.0014494061470031738, -0.0013402998447418213, -0.0012311935424804688, -0.0011220872402191162, -0.0010129809379577637, -0.0009038746356964111, -0.0007947683334350586, -0.0006856620311737061, -0.0005765557289123535, -0.000467449426651001, -0.00035834312438964844, -0.0002492368221282959, -0.00014013051986694336, -3.102421760559082e-05, 7.808208465576172e-05, 0.00018718838691711426, 0.0002962946891784668, 0.00040540099143981934, 0.0005145072937011719, 0.0006236135959625244, 0.000732719898223877, 0.0008418262004852295, 0.000950932502746582, 0.0010600388050079346, 0.0011691451072692871, 0.0012782514095306396, 0.0013873577117919922, 0.0014964640140533447, 0.0016055703163146973, 0.0017146766185760498, 0.0018237829208374023, 0.0019328892230987549, 0.0020419955253601074, 0.00215110182762146, 0.0022602081298828125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 6.0, 7.0, 6.0, 13.0, 16.0, 24.0, 47.0, 41.0, 64.0, 89.0, 119.0, 195.0, 280.0, 406.0, 657.0, 1041.0, 1789.0, 3249.0, 6555.0, 15433.0, 52629.0, 787507.0, 132314.0, 25919.0, 9537.0, 4393.0, 2352.0, 1406.0, 752.0, 518.0, 321.0, 248.0, 158.0, 128.0, 85.0, 58.0, 41.0, 30.0, 17.0, 33.0, 19.0, 12.0, 7.0, 7.0, 1.0, 8.0, 5.0, 8.0, 3.0, 2.0, 1.0], "bins": [-10.8203125, -10.5089111328125, -10.197509765625, -9.8861083984375, -9.57470703125, -9.2633056640625, -8.951904296875, -8.6405029296875, -8.3291015625, -8.0177001953125, -7.706298828125, -7.3948974609375, -7.08349609375, -6.7720947265625, -6.460693359375, -6.1492919921875, -5.837890625, -5.5264892578125, -5.215087890625, -4.9036865234375, -4.59228515625, -4.2808837890625, -3.969482421875, -3.6580810546875, -3.3466796875, -3.0352783203125, -2.723876953125, -2.4124755859375, -2.10107421875, -1.7896728515625, -1.478271484375, -1.1668701171875, -0.85546875, -0.5440673828125, -0.232666015625, 0.0787353515625, 0.39013671875, 0.7015380859375, 1.012939453125, 1.3243408203125, 1.6357421875, 1.9471435546875, 2.258544921875, 2.5699462890625, 2.88134765625, 3.1927490234375, 3.504150390625, 3.8155517578125, 4.126953125, 4.4383544921875, 4.749755859375, 5.0611572265625, 5.37255859375, 5.6839599609375, 5.995361328125, 6.3067626953125, 6.6181640625, 6.9295654296875, 7.240966796875, 7.5523681640625, 7.86376953125, 8.1751708984375, 8.486572265625, 8.7979736328125, 9.109375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 6.0, 6.0, 8.0, 6.0, 9.0, 11.0, 16.0, 18.0, 16.0, 23.0, 29.0, 32.0, 51.0, 64.0, 69.0, 122.0, 91.0, 85.0, 71.0, 52.0, 35.0, 26.0, 25.0, 20.0, 9.0, 14.0, 7.0, 9.0, 9.0, 6.0, 6.0, 4.0, 8.0, 9.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.7578125, -10.4315185546875, -10.105224609375, -9.7789306640625, -9.45263671875, -9.1263427734375, -8.800048828125, -8.4737548828125, -8.1474609375, -7.8211669921875, -7.494873046875, -7.1685791015625, -6.84228515625, -6.5159912109375, -6.189697265625, -5.8634033203125, -5.537109375, -5.2108154296875, -4.884521484375, -4.5582275390625, -4.23193359375, -3.9056396484375, -3.579345703125, -3.2530517578125, -2.9267578125, -2.6004638671875, -2.274169921875, -1.9478759765625, -1.62158203125, -1.2952880859375, -0.968994140625, -0.6427001953125, -0.31640625, 0.0098876953125, 0.336181640625, 0.6624755859375, 0.98876953125, 1.3150634765625, 1.641357421875, 1.9676513671875, 2.2939453125, 2.6202392578125, 2.946533203125, 3.2728271484375, 3.59912109375, 3.9254150390625, 4.251708984375, 4.5780029296875, 4.904296875, 5.2305908203125, 5.556884765625, 5.8831787109375, 6.20947265625, 6.5357666015625, 6.862060546875, 7.1883544921875, 7.5146484375, 7.8409423828125, 8.167236328125, 8.4935302734375, 8.81982421875, 9.1461181640625, 9.472412109375, 9.7987060546875, 10.125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 6.0, 10.0, 9.0, 12.0, 22.0, 36.0, 52.0, 88.0, 424.0, 147.0, 59.0, 33.0, 35.0, 19.0, 21.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-404.6357421875, -390.5158996582031, -376.3960876464844, -362.2762451171875, -348.15643310546875, -334.0365905761719, -319.916748046875, -305.79693603515625, -291.6770935058594, -277.5572509765625, -263.43743896484375, -249.31759643554688, -235.19776916503906, -221.07794189453125, -206.95811462402344, -192.83828735351562, -178.7184600830078, -164.5986328125, -150.4788055419922, -136.35897827148438, -122.2391357421875, -108.11930847167969, -93.99948120117188, -79.87964630126953, -65.75981903076172, -51.63998794555664, -37.52015686035156, -23.40032958984375, -9.280498504638672, 4.839332580566406, 18.95915985107422, 33.07899475097656, 47.198822021484375, 61.31865310668945, 75.43848419189453, 89.55831146240234, 103.67814636230469, 117.7979736328125, 131.9178009033203, 146.03762817382812, 160.157470703125, 174.2772979736328, 188.39712524414062, 202.5169677734375, 216.6367950439453, 230.75662231445312, 244.87644958496094, 258.99627685546875, 273.1160888671875, 287.2359313964844, 301.3557434082031, 315.4755859375, 329.59539794921875, 343.7152404785156, 357.8350830078125, 371.95489501953125, 386.0747375488281, 400.194580078125, 414.31439208984375, 428.4342346191406, 442.5540466308594, 456.67388916015625, 470.793701171875, 484.9135437011719, 499.03338623046875]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 6.0, 9.0, 9.0, 12.0, 10.0, 14.0, 14.0, 12.0, 15.0, 19.0, 21.0, 19.0, 26.0, 30.0, 108.0, 251.0, 139.0, 46.0, 35.0, 32.0, 28.0, 21.0, 10.0, 20.0, 18.0, 9.0, 9.0, 13.0, 20.0, 9.0, 5.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-497.37481689453125, -482.1007080078125, -466.82659912109375, -451.552490234375, -436.2783508300781, -421.0042419433594, -405.7301330566406, -390.4560241699219, -375.181884765625, -359.90777587890625, -344.6336669921875, -329.35955810546875, -314.0854187011719, -298.8113098144531, -283.5372009277344, -268.2630920410156, -252.98898315429688, -237.71487426757812, -222.4407501220703, -207.16664123535156, -191.89251708984375, -176.618408203125, -161.34429931640625, -146.0701904296875, -130.7960662841797, -115.5219497680664, -100.24783325195312, -84.97372436523438, -69.6996078491211, -54.42549133300781, -39.15138244628906, -23.87726593017578, -8.6031494140625, 6.670965194702148, 21.945079803466797, 37.21919250488281, 52.493309020996094, 67.76742553710938, 83.04153442382812, 98.3156509399414, 113.58976745605469, 128.86387634277344, 144.13800048828125, 159.412109375, 174.68621826171875, 189.96034240722656, 205.2344512939453, 220.50857543945312, 235.78268432617188, 251.05679321289062, 266.3309020996094, 281.60504150390625, 296.879150390625, 312.15325927734375, 327.4273681640625, 342.70147705078125, 357.9755859375, 373.24969482421875, 388.5238037109375, 403.79791259765625, 419.0720520019531, 434.3461608886719, 449.6202697753906, 464.8943786621094, 480.16851806640625]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 0.0, 3.0, 5.0, 4.0, 1.0, 4.0, 6.0, 11.0, 17.0, 13.0, 17.0, 22.0, 28.0, 30.0, 33.0, 62.0, 89.0, 318.0, 70.0, 44.0, 39.0, 45.0, 29.0, 30.0, 20.0, 14.0, 12.0, 10.0, 11.0, 4.0, 3.0, 5.0, 3.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.59375, -45.06591796875, -43.5380859375, -42.01025390625, -40.482421875, -38.95458984375, -37.4267578125, -35.89892578125, -34.37109375, -32.84326171875, -31.3154296875, -29.78759765625, -28.259765625, -26.73193359375, -25.2041015625, -23.67626953125, -22.1484375, -20.62060546875, -19.0927734375, -17.56494140625, -16.037109375, -14.50927734375, -12.9814453125, -11.45361328125, -9.92578125, -8.39794921875, -6.8701171875, -5.34228515625, -3.814453125, -2.28662109375, -0.7587890625, 0.76904296875, 2.296875, 3.82470703125, 5.3525390625, 6.88037109375, 8.408203125, 9.93603515625, 11.4638671875, 12.99169921875, 14.51953125, 16.04736328125, 17.5751953125, 19.10302734375, 20.630859375, 22.15869140625, 23.6865234375, 25.21435546875, 26.7421875, 28.27001953125, 29.7978515625, 31.32568359375, 32.853515625, 34.38134765625, 35.9091796875, 37.43701171875, 38.96484375, 40.49267578125, 42.0205078125, 43.54833984375, 45.076171875, 46.60400390625, 48.1318359375, 49.65966796875, 51.1875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 12.0, 14.0, 10.0, 28.0, 47.0, 54.0, 89.0, 155.0, 285.0, 684.0, 1814.0, 6236.0, 207326.0, 8160244.0, 7950.0, 2031.0, 806.0, 347.0, 164.0, 95.0, 47.0, 30.0, 32.0, 24.0, 10.0, 7.0, 7.0, 10.0, 2.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-398.8013916015625, -387.4292907714844, -376.0572204589844, -364.68511962890625, -353.31304931640625, -341.9409484863281, -330.56884765625, -319.19677734375, -307.8246765136719, -296.45257568359375, -285.08050537109375, -273.7084045410156, -262.3363342285156, -250.9642333984375, -239.59214782714844, -228.22006225585938, -216.8479766845703, -205.47589111328125, -194.1038055419922, -182.73171997070312, -171.359619140625, -159.98753356933594, -148.61544799804688, -137.24334716796875, -125.87126922607422, -114.49918365478516, -103.12709045410156, -91.7550048828125, -80.38291931152344, -69.01082611083984, -57.63874053955078, -46.26664733886719, -34.894561767578125, -23.522472381591797, -12.150384902954102, -0.7782974243164062, 10.593791961669922, 21.96588134765625, 33.33796691894531, 44.710060119628906, 56.08214569091797, 67.45423126220703, 78.82632446289062, 90.19841003417969, 101.57049560546875, 112.94258880615234, 124.3146743774414, 135.686767578125, 147.05885314941406, 158.43093872070312, 169.8030242919922, 181.17510986328125, 192.54721069335938, 203.91929626464844, 215.2913818359375, 226.66348266601562, 238.03555297851562, 249.4076385498047, 260.77972412109375, 272.1518249511719, 283.5238952636719, 294.89599609375, 306.26806640625, 317.6401672363281, 329.01226806640625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 3.0, 7.0, 3.0, 7.0, 3.0, 6.0, 1.0, 10.0, 4.0, 4.0, 9.0, 6.0, 3.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-549.675048828125, -529.4202880859375, -509.1654968261719, -488.91070556640625, -468.65594482421875, -448.40118408203125, -428.1463928222656, -407.8916015625, -387.6368408203125, -367.382080078125, -347.1272888183594, -326.87249755859375, -306.61773681640625, -286.36297607421875, -266.1081848144531, -245.85340881347656, -225.5986328125, -205.34385681152344, -185.08908081054688, -164.8343048095703, -144.57952880859375, -124.32475280761719, -104.06997680664062, -83.81520080566406, -63.5604248046875, -43.30564880371094, -23.050872802734375, -2.7960968017578125, 17.45867919921875, 37.71345520019531, 57.968231201171875, 78.22300720214844, 98.477783203125, 118.73255920410156, 138.98733520507812, 159.2421112060547, 179.49688720703125, 199.7516632080078, 220.00643920898438, 240.26121520996094, 260.5159912109375, 280.770751953125, 301.0255432128906, 321.28033447265625, 341.53509521484375, 361.78985595703125, 382.0446472167969, 402.2994384765625, 422.55419921875, 442.8089599609375, 463.0637512207031, 483.31854248046875, 503.57330322265625, 523.8280639648438, 544.0828857421875, 564.337646484375, 584.5924072265625, 604.84716796875, 625.1019287109375, 645.3567504882812, 665.6115112304688, 685.8662719726562, 706.12109375, 726.3758544921875, 746.630615234375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 7.0, 10.0, 15.0, 19.0, 22.0, 33.0, 36.0, 48.0, 101.0, 133.0, 160.0, 281.0, 458.0, 810.0, 1514.0, 3299.0, 8687.0, 29188.0, 133097.0, 252087.0, 66896.0, 16871.0, 5551.0, 2215.0, 1175.0, 590.0, 380.0, 204.0, 112.0, 78.0, 62.0, 35.0, 22.0, 17.0, 18.0, 6.0, 8.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-456.0, -444.390625, -432.78125, -421.171875, -409.5625, -397.953125, -386.34375, -374.734375, -363.125, -351.515625, -339.90625, -328.296875, -316.6875, -305.078125, -293.46875, -281.859375, -270.25, -258.640625, -247.03125, -235.421875, -223.8125, -212.203125, -200.59375, -188.984375, -177.375, -165.765625, -154.15625, -142.546875, -130.9375, -119.328125, -107.71875, -96.109375, -84.5, -72.890625, -61.28125, -49.671875, -38.0625, -26.453125, -14.84375, -3.234375, 8.375, 19.984375, 31.59375, 43.203125, 54.8125, 66.421875, 78.03125, 89.640625, 101.25, 112.859375, 124.46875, 136.078125, 147.6875, 159.296875, 170.90625, 182.515625, 194.125, 205.734375, 217.34375, 228.953125, 240.5625, 252.171875, 263.78125, 275.390625, 287.0]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 8.0, 5.0, 6.0, 10.0, 19.0, 15.0, 27.0, 26.0, 29.0, 46.0, 69.0, 83.0, 67.0, 62.0, 73.0, 69.0, 61.0, 59.0, 52.0, 44.0, 33.0, 32.0, 23.0, 12.0, 12.0, 13.0, 9.0, 8.0, 4.0, 4.0, 2.0, 6.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-53.65625, -52.21826171875, -50.7802734375, -49.34228515625, -47.904296875, -46.46630859375, -45.0283203125, -43.59033203125, -42.15234375, -40.71435546875, -39.2763671875, -37.83837890625, -36.400390625, -34.96240234375, -33.5244140625, -32.08642578125, -30.6484375, -29.21044921875, -27.7724609375, -26.33447265625, -24.896484375, -23.45849609375, -22.0205078125, -20.58251953125, -19.14453125, -17.70654296875, -16.2685546875, -14.83056640625, -13.392578125, -11.95458984375, -10.5166015625, -9.07861328125, -7.640625, -6.20263671875, -4.7646484375, -3.32666015625, -1.888671875, -0.45068359375, 0.9873046875, 2.42529296875, 3.86328125, 5.30126953125, 6.7392578125, 8.17724609375, 9.615234375, 11.05322265625, 12.4912109375, 13.92919921875, 15.3671875, 16.80517578125, 18.2431640625, 19.68115234375, 21.119140625, 22.55712890625, 23.9951171875, 25.43310546875, 26.87109375, 28.30908203125, 29.7470703125, 31.18505859375, 32.623046875, 34.06103515625, 35.4990234375, 36.93701171875, 38.375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 8.0, 16.0, 10.0, 19.0, 42.0, 39.0, 101.0, 91.0, 61.0, 37.0, 22.0, 13.0, 4.0, 8.0, 5.0, 6.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-438.2787780761719, -424.8531494140625, -411.4275207519531, -398.00189208984375, -384.57623291015625, -371.150634765625, -357.7249755859375, -344.2993469238281, -330.87371826171875, -317.4480895996094, -304.0224609375, -290.5968322753906, -277.17120361328125, -263.74554443359375, -250.31991577148438, -236.894287109375, -223.46865844726562, -210.04302978515625, -196.61740112304688, -183.19175720214844, -169.76612854003906, -156.3404998779297, -142.91485595703125, -129.48922729492188, -116.0635986328125, -102.63796997070312, -89.21233367919922, -75.78669738769531, -62.36106872558594, -48.93544006347656, -35.509803771972656, -22.08416748046875, -8.6585693359375, 4.767063140869141, 18.19269561767578, 31.618328094482422, 45.04396057128906, 58.46958923339844, 71.89522552490234, 85.32086181640625, 98.74649047851562, 112.172119140625, 125.5977554321289, 139.0233917236328, 152.4490203857422, 165.87464904785156, 179.30029296875, 192.72592163085938, 206.15155029296875, 219.57717895507812, 233.0028076171875, 246.42845153808594, 259.85406494140625, 273.27972412109375, 286.7053527832031, 300.1309814453125, 313.5566101074219, 326.98223876953125, 340.4078674316406, 353.83349609375, 367.2591552734375, 380.68475341796875, 394.11041259765625, 407.5360412597656, 420.961669921875]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 3.0, 4.0, 4.0, 3.0, 11.0, 22.0, 29.0, 43.0, 45.0, 62.0, 64.0, 48.0, 38.0, 20.0, 13.0, 12.0, 8.0, 6.0, 4.0, 6.0, 2.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-238.9586639404297, -232.17811584472656, -225.3975830078125, -218.61703491210938, -211.83648681640625, -205.0559539794922, -198.27540588378906, -191.494873046875, -184.71432495117188, -177.93377685546875, -171.1532440185547, -164.37269592285156, -157.59214782714844, -150.81161499023438, -144.03106689453125, -137.25051879882812, -130.469970703125, -123.6894302368164, -116.90888214111328, -110.12834167480469, -103.3478012084961, -96.5672607421875, -89.78671264648438, -83.00617218017578, -76.22563171386719, -69.4450912475586, -62.664546966552734, -55.884002685546875, -49.10346221923828, -42.32291793823242, -35.54237365722656, -28.76183319091797, -21.981292724609375, -15.200750350952148, -8.420207023620605, -1.6396636962890625, 5.140878677368164, 11.92142105102539, 18.70196533203125, 25.482505798339844, 32.2630500793457, 39.04359436035156, 45.824134826660156, 52.604679107666016, 59.385223388671875, 66.16576385498047, 72.94630432128906, 79.72685241699219, 86.50739288330078, 93.28793334960938, 100.0684814453125, 106.8490219116211, 113.62956237792969, 120.41011047363281, 127.1906509399414, 133.97119140625, 140.75173950195312, 147.53228759765625, 154.3128204345703, 161.09336853027344, 167.87391662597656, 174.65444946289062, 181.43499755859375, 188.21554565429688, 194.99607849121094]}, "eval/loss": 6.144236087799072, "eval/wer": 1.5985872174931048, "eval/runtime": 1314.1566, "eval/samples_per_second": 2.01, "eval/steps_per_second": 0.252} \ No newline at end of file