diff --git "a/wandb/run-20220302_000300-2ebwk6gp/files/wandb-summary.json" "b/wandb/run-20220302_000300-2ebwk6gp/files/wandb-summary.json" --- "a/wandb/run-20220302_000300-2ebwk6gp/files/wandb-summary.json" +++ "b/wandb/run-20220302_000300-2ebwk6gp/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.425, "train/learning_rate": 2.8011611030478957e-05, "train/epoch": 0.84, "train/global_step": 1000, "_runtime": 5740, "_timestamp": 1646185121, "_step": 1001, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 315.0, 699.0, 2.0, 0.0, 1.0], "bins": [-924.809326171875, -909.4195556640625, -894.02978515625, -878.6399536132812, -863.2501831054688, -847.8604125976562, -832.4706420898438, -817.080810546875, -801.6910400390625, -786.30126953125, -770.9114990234375, -755.5216674804688, -740.1318969726562, -724.7421264648438, -709.3523559570312, -693.9625244140625, -678.57275390625, -663.1829833984375, -647.793212890625, -632.4033813476562, -617.0136108398438, -601.6238403320312, -586.2340698242188, -570.84423828125, -555.4544677734375, -540.064697265625, -524.6749267578125, -509.2851257324219, -493.89532470703125, -478.50555419921875, -463.1157531738281, -447.7259826660156, -432.336181640625, -416.9464111328125, -401.5566101074219, -386.1668395996094, -370.77703857421875, -355.38726806640625, -339.9974670410156, -324.6076965332031, -309.2179260253906, -293.8281555175781, -278.4383544921875, -263.048583984375, -247.65878295898438, -232.26901245117188, -216.87921142578125, -201.48944091796875, -186.09963989257812, -170.70985412597656, -155.320068359375, -139.93028259277344, -124.54049682617188, -109.15071868896484, -93.76093292236328, -78.37114715576172, -62.98135757446289, -47.59157180786133, -32.20178985595703, -16.81200408935547, -1.4222183227539062, 13.96756362915039, 29.357349395751953, 44.747135162353516, 60.13692092895508]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 6.0, 10.0, 5.0, 14.0, 21.0, 29.0, 35.0, 44.0, 45.0, 57.0, 57.0, 62.0, 54.0, 65.0, 84.0, 73.0, 51.0, 71.0, 53.0, 51.0, 30.0, 17.0, 24.0, 11.0, 8.0, 8.0, 6.0, 5.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.4429931640625, -79.00655364990234, -76.57011413574219, -74.13367462158203, -71.69723510742188, -69.26079559326172, -66.82435607910156, -64.3879165649414, -61.95147705078125, -59.515037536621094, -57.07859802246094, -54.64215850830078, -52.205718994140625, -49.76927947998047, -47.33283996582031, -44.896400451660156, -42.4599609375, -40.023521423339844, -37.58708190917969, -35.15064239501953, -32.714202880859375, -30.27776336669922, -27.841323852539062, -25.404884338378906, -22.96844482421875, -20.532005310058594, -18.095565795898438, -15.659126281738281, -13.222686767578125, -10.786247253417969, -8.349807739257812, -5.913368225097656, -3.4769287109375, -1.0404891967773438, 1.3959503173828125, 3.8323898315429688, 6.268829345703125, 8.705268859863281, 11.141708374023438, 13.578147888183594, 16.01458740234375, 18.451026916503906, 20.887466430664062, 23.32390594482422, 25.760345458984375, 28.19678497314453, 30.633224487304688, 33.069664001464844, 35.506103515625, 37.942543029785156, 40.37898254394531, 42.81542205810547, 45.251861572265625, 47.68830108642578, 50.12474060058594, 52.561180114746094, 54.99761962890625, 57.434059143066406, 59.87049865722656, 62.30693817138672, 64.74337768554688, 67.17981719970703, 69.61625671386719, 72.05269622802734, 74.4891357421875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 8.0, 7.0, 7.0, 8.0, 6.0, 9.0, 12.0, 34.0, 24.0, 37.0, 25.0, 35.0, 31.0, 50.0, 40.0, 48.0, 45.0, 39.0, 52.0, 50.0, 55.0, 47.0, 49.0, 46.0, 41.0, 37.0, 34.0, 28.0, 28.0, 20.0, 12.0, 7.0, 12.0, 7.0, 7.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.75390625, -1.687469482421875, -1.62103271484375, -1.554595947265625, -1.4881591796875, -1.421722412109375, -1.35528564453125, -1.288848876953125, -1.222412109375, -1.155975341796875, -1.08953857421875, -1.023101806640625, -0.9566650390625, -0.890228271484375, -0.82379150390625, -0.757354736328125, -0.69091796875, -0.624481201171875, -0.55804443359375, -0.491607666015625, -0.4251708984375, -0.358734130859375, -0.29229736328125, -0.225860595703125, -0.159423828125, -0.092987060546875, -0.02655029296875, 0.039886474609375, 0.1063232421875, 0.172760009765625, 0.23919677734375, 0.305633544921875, 0.3720703125, 0.438507080078125, 0.50494384765625, 0.571380615234375, 0.6378173828125, 0.704254150390625, 0.77069091796875, 0.837127685546875, 0.903564453125, 0.970001220703125, 1.03643798828125, 1.102874755859375, 1.1693115234375, 1.235748291015625, 1.30218505859375, 1.368621826171875, 1.43505859375, 1.501495361328125, 1.56793212890625, 1.634368896484375, 1.7008056640625, 1.767242431640625, 1.83367919921875, 1.900115966796875, 1.966552734375, 2.032989501953125, 2.09942626953125, 2.165863037109375, 2.2322998046875, 2.298736572265625, 2.36517333984375, 2.431610107421875, 2.498046875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 4.0, 8.0, 15.0, 19.0, 26.0, 39.0, 54.0, 76.0, 129.0, 157.0, 255.0, 384.0, 630.0, 1084.0, 2168.0, 5136.0, 18434.0, 108915.0, 1991648.0, 1932368.0, 104808.0, 17783.0, 5253.0, 2074.0, 1064.0, 605.0, 373.0, 244.0, 160.0, 115.0, 61.0, 49.0, 43.0, 26.0, 20.0, 14.0, 13.0, 5.0, 9.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.1640625, -8.8245849609375, -8.485107421875, -8.1456298828125, -7.80615234375, -7.4666748046875, -7.127197265625, -6.7877197265625, -6.4482421875, -6.1087646484375, -5.769287109375, -5.4298095703125, -5.09033203125, -4.7508544921875, -4.411376953125, -4.0718994140625, -3.732421875, -3.3929443359375, -3.053466796875, -2.7139892578125, -2.37451171875, -2.0350341796875, -1.695556640625, -1.3560791015625, -1.0166015625, -0.6771240234375, -0.337646484375, 0.0018310546875, 0.34130859375, 0.6807861328125, 1.020263671875, 1.3597412109375, 1.69921875, 2.0386962890625, 2.378173828125, 2.7176513671875, 3.05712890625, 3.3966064453125, 3.736083984375, 4.0755615234375, 4.4150390625, 4.7545166015625, 5.093994140625, 5.4334716796875, 5.77294921875, 6.1124267578125, 6.451904296875, 6.7913818359375, 7.130859375, 7.4703369140625, 7.809814453125, 8.1492919921875, 8.48876953125, 8.8282470703125, 9.167724609375, 9.5072021484375, 9.8466796875, 10.1861572265625, 10.525634765625, 10.8651123046875, 11.20458984375, 11.5440673828125, 11.883544921875, 12.2230224609375, 12.5625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 17.0, 55.0, 113.0, 321.0, 722.0, 1254.0, 878.0, 418.0, 179.0, 62.0, 23.0, 15.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.6875, -29.00830078125, -28.3291015625, -27.64990234375, -26.970703125, -26.29150390625, -25.6123046875, -24.93310546875, -24.25390625, -23.57470703125, -22.8955078125, -22.21630859375, -21.537109375, -20.85791015625, -20.1787109375, -19.49951171875, -18.8203125, -18.14111328125, -17.4619140625, -16.78271484375, -16.103515625, -15.42431640625, -14.7451171875, -14.06591796875, -13.38671875, -12.70751953125, -12.0283203125, -11.34912109375, -10.669921875, -9.99072265625, -9.3115234375, -8.63232421875, -7.953125, -7.27392578125, -6.5947265625, -5.91552734375, -5.236328125, -4.55712890625, -3.8779296875, -3.19873046875, -2.51953125, -1.84033203125, -1.1611328125, -0.48193359375, 0.197265625, 0.87646484375, 1.5556640625, 2.23486328125, 2.9140625, 3.59326171875, 4.2724609375, 4.95166015625, 5.630859375, 6.31005859375, 6.9892578125, 7.66845703125, 8.34765625, 9.02685546875, 9.7060546875, 10.38525390625, 11.064453125, 11.74365234375, 12.4228515625, 13.10205078125, 13.78125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 10.0, 22.0, 60.0, 184.0, 600.0, 2690.0, 2091270.0, 2095917.0, 2577.0, 637.0, 183.0, 72.0, 26.0, 13.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.8125, -78.287109375, -75.76171875, -73.236328125, -70.7109375, -68.185546875, -65.66015625, -63.134765625, -60.609375, -58.083984375, -55.55859375, -53.033203125, -50.5078125, -47.982421875, -45.45703125, -42.931640625, -40.40625, -37.880859375, -35.35546875, -32.830078125, -30.3046875, -27.779296875, -25.25390625, -22.728515625, -20.203125, -17.677734375, -15.15234375, -12.626953125, -10.1015625, -7.576171875, -5.05078125, -2.525390625, 0.0, 2.525390625, 5.05078125, 7.576171875, 10.1015625, 12.626953125, 15.15234375, 17.677734375, 20.203125, 22.728515625, 25.25390625, 27.779296875, 30.3046875, 32.830078125, 35.35546875, 37.880859375, 40.40625, 42.931640625, 45.45703125, 47.982421875, 50.5078125, 53.033203125, 55.55859375, 58.083984375, 60.609375, 63.134765625, 65.66015625, 68.185546875, 70.7109375, 73.236328125, 75.76171875, 78.287109375, 80.8125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 517.0, 481.0, 9.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.01999282836914, -24.805633544921875, -16.59127426147461, -8.376914978027344, -0.16255569458007812, 8.051803588867188, 16.266162872314453, 24.48052215576172, 32.694881439208984, 40.90924072265625, 49.123600006103516, 57.33795928955078, 65.55232238769531, 73.76667785644531, 81.98103332519531, 90.19539642333984, 98.40975952148438, 106.62411499023438, 114.8384780883789, 123.05284118652344, 131.26719665527344, 139.48155212402344, 147.6959228515625, 155.9102783203125, 164.1246337890625, 172.3389892578125, 180.5533447265625, 188.76771545410156, 196.98207092285156, 205.19642639160156, 213.41079711914062, 221.62515258789062, 229.83950805664062, 238.05386352539062, 246.26821899414062, 254.4825897216797, 262.69696044921875, 270.91131591796875, 279.12567138671875, 287.34002685546875, 295.55438232421875, 303.76873779296875, 311.98309326171875, 320.19744873046875, 328.41180419921875, 336.6261901855469, 344.8405456542969, 353.0549011230469, 361.2692565917969, 369.4836120605469, 377.6979675292969, 385.9123229980469, 394.126708984375, 402.341064453125, 410.555419921875, 418.769775390625, 426.984130859375, 435.198486328125, 443.412841796875, 451.627197265625, 459.841552734375, 468.0559387207031, 476.2702941894531, 484.4846496582031, 492.6990051269531]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 6.0, 13.0, 9.0, 29.0, 17.0, 24.0, 30.0, 42.0, 38.0, 33.0, 46.0, 60.0, 43.0, 34.0, 57.0, 44.0, 57.0, 68.0, 37.0, 49.0, 35.0, 40.0, 33.0, 27.0, 32.0, 20.0, 15.0, 9.0, 11.0, 10.0, 11.0, 7.0, 5.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.7867431640625, -36.5736083984375, -35.3604736328125, -34.147342681884766, -32.934207916259766, -31.721073150634766, -30.5079402923584, -29.29480743408203, -28.08167266845703, -26.86853790283203, -25.655405044555664, -24.442272186279297, -23.229137420654297, -22.016002655029297, -20.80286979675293, -19.589736938476562, -18.376602172851562, -17.163467407226562, -15.950334548950195, -14.737200736999512, -13.524066925048828, -12.310933113098145, -11.097799301147461, -9.884665489196777, -8.671531677246094, -7.45839786529541, -6.245264053344727, -5.032130241394043, -3.8189964294433594, -2.605862617492676, -1.3927288055419922, -0.1795949935913086, 1.033538818359375, 2.2466726303100586, 3.459806442260742, 4.672940254211426, 5.886074066162109, 7.099207878112793, 8.312341690063477, 9.52547550201416, 10.738609313964844, 11.951743125915527, 13.164876937866211, 14.378010749816895, 15.591144561767578, 16.804279327392578, 18.017412185668945, 19.230545043945312, 20.443679809570312, 21.656814575195312, 22.86994743347168, 24.083080291748047, 25.296215057373047, 26.509349822998047, 27.722482681274414, 28.93561553955078, 30.14875030517578, 31.36188507080078, 32.57501983642578, 33.788150787353516, 35.001285552978516, 36.214420318603516, 37.42755126953125, 38.64068603515625, 39.85382080078125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 3.0, 3.0, 3.0, 9.0, 9.0, 8.0, 8.0, 13.0, 11.0, 11.0, 21.0, 27.0, 24.0, 22.0, 36.0, 31.0, 33.0, 21.0, 36.0, 30.0, 33.0, 36.0, 41.0, 38.0, 35.0, 38.0, 26.0, 39.0, 42.0, 27.0, 39.0, 34.0, 23.0, 36.0, 33.0, 21.0, 15.0, 12.0, 13.0, 16.0, 6.0, 11.0, 4.0, 7.0, 3.0, 1.0, 7.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7119140625, -1.6591644287109375, -1.606414794921875, -1.5536651611328125, -1.50091552734375, -1.4481658935546875, -1.395416259765625, -1.3426666259765625, -1.2899169921875, -1.2371673583984375, -1.184417724609375, -1.1316680908203125, -1.07891845703125, -1.0261688232421875, -0.973419189453125, -0.9206695556640625, -0.867919921875, -0.8151702880859375, -0.762420654296875, -0.7096710205078125, -0.65692138671875, -0.6041717529296875, -0.551422119140625, -0.4986724853515625, -0.4459228515625, -0.3931732177734375, -0.340423583984375, -0.2876739501953125, -0.23492431640625, -0.1821746826171875, -0.129425048828125, -0.0766754150390625, -0.02392578125, 0.0288238525390625, 0.081573486328125, 0.1343231201171875, 0.18707275390625, 0.2398223876953125, 0.292572021484375, 0.3453216552734375, 0.3980712890625, 0.4508209228515625, 0.503570556640625, 0.5563201904296875, 0.60906982421875, 0.6618194580078125, 0.714569091796875, 0.7673187255859375, 0.820068359375, 0.8728179931640625, 0.925567626953125, 0.9783172607421875, 1.03106689453125, 1.0838165283203125, 1.136566162109375, 1.1893157958984375, 1.2420654296875, 1.2948150634765625, 1.347564697265625, 1.4003143310546875, 1.45306396484375, 1.5058135986328125, 1.558563232421875, 1.6113128662109375, 1.6640625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 7.0, 6.0, 6.0, 14.0, 15.0, 17.0, 18.0, 39.0, 43.0, 82.0, 96.0, 132.0, 178.0, 289.0, 414.0, 624.0, 895.0, 1355.0, 1949.0, 3118.0, 4879.0, 7756.0, 12476.0, 20125.0, 32929.0, 54153.0, 88061.0, 133396.0, 179180.0, 171905.0, 124449.0, 80253.0, 49670.0, 30297.0, 18277.0, 11331.0, 7024.0, 4444.0, 2866.0, 1875.0, 1313.0, 841.0, 567.0, 386.0, 230.0, 187.0, 118.0, 87.0, 60.0, 47.0, 25.0, 22.0, 16.0, 6.0, 7.0, 5.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.1917724609375, -0.18535995483398438, -0.17894744873046875, -0.17253494262695312, -0.1661224365234375, -0.15970993041992188, -0.15329742431640625, -0.14688491821289062, -0.140472412109375, -0.13405990600585938, -0.12764739990234375, -0.12123489379882812, -0.1148223876953125, -0.10840988159179688, -0.10199737548828125, -0.09558486938476562, -0.08917236328125, -0.08275985717773438, -0.07634735107421875, -0.06993484497070312, -0.0635223388671875, -0.057109832763671875, -0.05069732666015625, -0.044284820556640625, -0.037872314453125, -0.031459808349609375, -0.02504730224609375, -0.018634796142578125, -0.0122222900390625, -0.005809783935546875, 0.00060272216796875, 0.007015228271484375, 0.013427734375, 0.019840240478515625, 0.02625274658203125, 0.032665252685546875, 0.0390777587890625, 0.045490264892578125, 0.05190277099609375, 0.058315277099609375, 0.064727783203125, 0.07114028930664062, 0.07755279541015625, 0.08396530151367188, 0.0903778076171875, 0.09679031372070312, 0.10320281982421875, 0.10961532592773438, 0.11602783203125, 0.12244033813476562, 0.12885284423828125, 0.13526535034179688, 0.1416778564453125, 0.14809036254882812, 0.15450286865234375, 0.16091537475585938, 0.167327880859375, 0.17374038696289062, 0.18015289306640625, 0.18656539916992188, 0.1929779052734375, 0.19939041137695312, 0.20580291748046875, 0.21221542358398438, 0.2186279296875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 0.0, 4.0, 5.0, 0.0, 7.0, 5.0, 10.0, 9.0, 7.0, 12.0, 14.0, 11.0, 17.0, 17.0, 26.0, 21.0, 25.0, 23.0, 38.0, 27.0, 24.0, 39.0, 38.0, 39.0, 30.0, 1063.0, 43.0, 42.0, 52.0, 52.0, 31.0, 32.0, 39.0, 26.0, 34.0, 28.0, 26.0, 21.0, 17.0, 15.0, 15.0, 10.0, 10.0, 4.0, 12.0, 5.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0673828125, -1.0301361083984375, -0.992889404296875, -0.9556427001953125, -0.91839599609375, -0.8811492919921875, -0.843902587890625, -0.8066558837890625, -0.7694091796875, -0.7321624755859375, -0.694915771484375, -0.6576690673828125, -0.62042236328125, -0.5831756591796875, -0.545928955078125, -0.5086822509765625, -0.471435546875, -0.4341888427734375, -0.396942138671875, -0.3596954345703125, -0.32244873046875, -0.2852020263671875, -0.247955322265625, -0.2107086181640625, -0.1734619140625, -0.1362152099609375, -0.098968505859375, -0.0617218017578125, -0.02447509765625, 0.0127716064453125, 0.050018310546875, 0.0872650146484375, 0.12451171875, 0.1617584228515625, 0.199005126953125, 0.2362518310546875, 0.27349853515625, 0.3107452392578125, 0.347991943359375, 0.3852386474609375, 0.4224853515625, 0.4597320556640625, 0.496978759765625, 0.5342254638671875, 0.57147216796875, 0.6087188720703125, 0.645965576171875, 0.6832122802734375, 0.720458984375, 0.7577056884765625, 0.794952392578125, 0.8321990966796875, 0.86944580078125, 0.9066925048828125, 0.943939208984375, 0.9811859130859375, 1.0184326171875, 1.0556793212890625, 1.092926025390625, 1.1301727294921875, 1.16741943359375, 1.2046661376953125, 1.241912841796875, 1.2791595458984375, 1.31640625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 8.0, 14.0, 10.0, 21.0, 41.0, 49.0, 69.0, 101.0, 162.0, 239.0, 413.0, 665.0, 943.0, 1488.0, 2373.0, 3818.0, 5807.0, 9319.0, 14640.0, 22717.0, 35626.0, 53727.0, 80071.0, 112617.0, 211470.0, 1116423.0, 136070.0, 97470.0, 66432.0, 44427.0, 28890.0, 18489.0, 11784.0, 7540.0, 4748.0, 2993.0, 1909.0, 1277.0, 800.0, 479.0, 348.0, 213.0, 143.0, 94.0, 69.0, 45.0, 27.0, 19.0, 18.0, 8.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.117919921875, -0.11437511444091797, -0.11083030700683594, -0.1072854995727539, -0.10374069213867188, -0.10019588470458984, -0.09665107727050781, -0.09310626983642578, -0.08956146240234375, -0.08601665496826172, -0.08247184753417969, -0.07892704010009766, -0.07538223266601562, -0.0718374252319336, -0.06829261779785156, -0.06474781036376953, -0.0612030029296875, -0.05765819549560547, -0.05411338806152344, -0.050568580627441406, -0.047023773193359375, -0.043478965759277344, -0.03993415832519531, -0.03638935089111328, -0.03284454345703125, -0.02929973602294922, -0.025754928588867188, -0.022210121154785156, -0.018665313720703125, -0.015120506286621094, -0.011575698852539062, -0.008030891418457031, -0.004486083984375, -0.0009412765502929688, 0.0026035308837890625, 0.006148338317871094, 0.009693145751953125, 0.013237953186035156, 0.016782760620117188, 0.02032756805419922, 0.02387237548828125, 0.02741718292236328, 0.030961990356445312, 0.034506797790527344, 0.038051605224609375, 0.041596412658691406, 0.04514122009277344, 0.04868602752685547, 0.0522308349609375, 0.05577564239501953, 0.05932044982910156, 0.0628652572631836, 0.06641006469726562, 0.06995487213134766, 0.07349967956542969, 0.07704448699951172, 0.08058929443359375, 0.08413410186767578, 0.08767890930175781, 0.09122371673583984, 0.09476852416992188, 0.0983133316040039, 0.10185813903808594, 0.10540294647216797, 0.10894775390625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 1.0, 1.0, 6.0, 6.0, 5.0, 5.0, 2.0, 11.0, 16.0, 12.0, 11.0, 18.0, 16.0, 16.0, 31.0, 22.0, 30.0, 39.0, 28.0, 44.0, 51.0, 81.0, 95.0, 74.0, 50.0, 58.0, 47.0, 30.0, 27.0, 20.0, 21.0, 18.0, 25.0, 18.0, 10.0, 12.0, 11.0, 8.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005962371826171875, -0.005777239799499512, -0.0055921077728271484, -0.005406975746154785, -0.005221843719482422, -0.005036711692810059, -0.004851579666137695, -0.004666447639465332, -0.004481315612792969, -0.0042961835861206055, -0.004111051559448242, -0.003925919532775879, -0.0037407875061035156, -0.0035556554794311523, -0.003370523452758789, -0.0031853914260864258, -0.0030002593994140625, -0.0028151273727416992, -0.002629995346069336, -0.0024448633193969727, -0.0022597312927246094, -0.002074599266052246, -0.0018894672393798828, -0.0017043352127075195, -0.0015192031860351562, -0.001334071159362793, -0.0011489391326904297, -0.0009638071060180664, -0.0007786750793457031, -0.0005935430526733398, -0.00040841102600097656, -0.00022327899932861328, -3.814697265625e-05, 0.00014698505401611328, 0.00033211708068847656, 0.0005172491073608398, 0.0007023811340332031, 0.0008875131607055664, 0.0010726451873779297, 0.001257777214050293, 0.0014429092407226562, 0.0016280412673950195, 0.0018131732940673828, 0.001998305320739746, 0.0021834373474121094, 0.0023685693740844727, 0.002553701400756836, 0.0027388334274291992, 0.0029239654541015625, 0.0031090974807739258, 0.003294229507446289, 0.0034793615341186523, 0.0036644935607910156, 0.003849625587463379, 0.004034757614135742, 0.0042198896408081055, 0.004405021667480469, 0.004590153694152832, 0.004775285720825195, 0.004960417747497559, 0.005145549774169922, 0.005330681800842285, 0.0055158138275146484, 0.005700945854187012, 0.005886077880859375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 2.0, 3.0, 4.0, 2.0, 3.0, 5.0, 5.0, 7.0, 9.0, 5.0, 15.0, 23.0, 33.0, 23.0, 32.0, 55.0, 87.0, 113.0, 177.0, 245.0, 401.0, 860.0, 59303.0, 983680.0, 1947.0, 530.0, 305.0, 189.0, 140.0, 78.0, 66.0, 42.0, 38.0, 16.0, 14.0, 16.0, 23.0, 12.0, 16.0, 5.0, 6.0, 7.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1776123046875, -0.17083168029785156, -0.16405105590820312, -0.1572704315185547, -0.15048980712890625, -0.1437091827392578, -0.13692855834960938, -0.13014793395996094, -0.1233673095703125, -0.11658668518066406, -0.10980606079101562, -0.10302543640136719, -0.09624481201171875, -0.08946418762207031, -0.08268356323242188, -0.07590293884277344, -0.069122314453125, -0.06234169006347656, -0.055561065673828125, -0.04878044128417969, -0.04199981689453125, -0.03521919250488281, -0.028438568115234375, -0.021657943725585938, -0.0148773193359375, -0.008096694946289062, -0.001316070556640625, 0.0054645538330078125, 0.01224517822265625, 0.019025802612304688, 0.025806427001953125, 0.03258705139160156, 0.03936767578125, 0.04614830017089844, 0.052928924560546875, 0.05970954895019531, 0.06649017333984375, 0.07327079772949219, 0.08005142211914062, 0.08683204650878906, 0.0936126708984375, 0.10039329528808594, 0.10717391967773438, 0.11395454406738281, 0.12073516845703125, 0.1275157928466797, 0.13429641723632812, 0.14107704162597656, 0.147857666015625, 0.15463829040527344, 0.16141891479492188, 0.1681995391845703, 0.17498016357421875, 0.1817607879638672, 0.18854141235351562, 0.19532203674316406, 0.2021026611328125, 0.20888328552246094, 0.21566390991210938, 0.2224445343017578, 0.22922515869140625, 0.2360057830810547, 0.24278640747070312, 0.24956703186035156, 0.25634765625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 7.0, 159.0, 838.0, 8.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3295329213142395, -0.32378077507019043, -0.31802862882614136, -0.3122764825820923, -0.3065243661403656, -0.30077221989631653, -0.29502007365226746, -0.2892679274082184, -0.2835157811641693, -0.27776363492012024, -0.27201148867607117, -0.2662593424320221, -0.2605072259902954, -0.25475507974624634, -0.24900293350219727, -0.2432507872581482, -0.23749864101409912, -0.23174649477005005, -0.22599436342716217, -0.2202422171831131, -0.21449007093906403, -0.20873792469501495, -0.20298579335212708, -0.197233647108078, -0.19148151576519012, -0.18572936952114105, -0.17997723817825317, -0.1742250919342041, -0.16847294569015503, -0.16272079944610596, -0.15696866810321808, -0.151216521859169, -0.14546436071395874, -0.13971221446990967, -0.1339600831270218, -0.12820793688297272, -0.12245579063892365, -0.11670365184545517, -0.1109515130519867, -0.10519936680793762, -0.09944723546504974, -0.09369509667158127, -0.0879429504275322, -0.08219081163406372, -0.07643866539001465, -0.07068652659654617, -0.0649343878030777, -0.059182241559028625, -0.05343009531497955, -0.04767795279622078, -0.041925810277462006, -0.03617367148399353, -0.030421527102589607, -0.024669384583830833, -0.01891724392771721, -0.013165101408958435, -0.007412958890199661, -0.0016608168371021748, 0.004091325215995312, 0.009843466803431511, 0.015595609322190285, 0.02134775184094906, 0.027099892497062683, 0.03285203501582146, 0.03860417753458023]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 13.0, 5.0, 12.0, 13.0, 18.0, 20.0, 20.0, 28.0, 34.0, 34.0, 50.0, 48.0, 58.0, 52.0, 44.0, 56.0, 44.0, 46.0, 62.0, 43.0, 37.0, 62.0, 34.0, 30.0, 33.0, 28.0, 21.0, 11.0, 8.0, 10.0, 5.0, 8.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0075286030769348145, -0.0073126088827848434, -0.0070966146886348724, -0.006880620494484901, -0.00666462630033493, -0.006448632106184959, -0.006232637912034988, -0.006016643717885017, -0.005800649523735046, -0.005584655329585075, -0.005368661135435104, -0.005152666941285133, -0.004936672747135162, -0.004720678552985191, -0.00450468435883522, -0.004288690164685249, -0.004072695970535278, -0.0038567017763853073, -0.0036407075822353363, -0.0034247133880853653, -0.0032087191939353943, -0.0029927249997854233, -0.0027767308056354523, -0.0025607366114854813, -0.0023447424173355103, -0.0021287482231855392, -0.0019127540290355682, -0.0016967598348855972, -0.0014807656407356262, -0.0012647714465856552, -0.0010487772524356842, -0.0008327830582857132, -0.0006167888641357422, -0.0004007946699857712, -0.00018480047583580017, 3.119371831417084e-05, 0.00024718791246414185, 0.00046318210661411285, 0.0006791763007640839, 0.0008951704949140549, 0.0011111646890640259, 0.0013271588832139969, 0.001543153077363968, 0.001759147271513939, 0.00197514146566391, 0.002191135659813881, 0.002407129853963852, 0.002623124048113823, 0.002839118242263794, 0.003055112436413765, 0.003271106630563736, 0.003487100824713707, 0.003703095018863678, 0.003919089213013649, 0.00413508340716362, 0.004351077601313591, 0.004567071795463562, 0.004783065989613533, 0.004999060183763504, 0.005215054377913475, 0.005431048572063446, 0.005647042766213417, 0.005863036960363388, 0.006079031154513359, 0.00629502534866333]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 3.0, 3.0, 3.0, 9.0, 9.0, 8.0, 8.0, 13.0, 11.0, 11.0, 21.0, 27.0, 24.0, 22.0, 35.0, 32.0, 33.0, 21.0, 36.0, 30.0, 33.0, 36.0, 41.0, 38.0, 35.0, 38.0, 26.0, 39.0, 42.0, 27.0, 39.0, 34.0, 23.0, 36.0, 33.0, 21.0, 15.0, 11.0, 14.0, 16.0, 6.0, 11.0, 4.0, 7.0, 3.0, 1.0, 7.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7119140625, -1.6591644287109375, -1.606414794921875, -1.5536651611328125, -1.50091552734375, -1.4481658935546875, -1.395416259765625, -1.3426666259765625, -1.2899169921875, -1.2371673583984375, -1.184417724609375, -1.1316680908203125, -1.07891845703125, -1.0261688232421875, -0.973419189453125, -0.9206695556640625, -0.867919921875, -0.8151702880859375, -0.762420654296875, -0.7096710205078125, -0.65692138671875, -0.6041717529296875, -0.551422119140625, -0.4986724853515625, -0.4459228515625, -0.3931732177734375, -0.340423583984375, -0.2876739501953125, -0.23492431640625, -0.1821746826171875, -0.129425048828125, -0.0766754150390625, -0.02392578125, 0.0288238525390625, 0.081573486328125, 0.1343231201171875, 0.18707275390625, 0.2398223876953125, 0.292572021484375, 0.3453216552734375, 0.3980712890625, 0.4508209228515625, 0.503570556640625, 0.5563201904296875, 0.60906982421875, 0.6618194580078125, 0.714569091796875, 0.7673187255859375, 0.820068359375, 0.8728179931640625, 0.925567626953125, 0.9783172607421875, 1.03106689453125, 1.0838165283203125, 1.136566162109375, 1.1893157958984375, 1.2420654296875, 1.2948150634765625, 1.347564697265625, 1.4003143310546875, 1.45306396484375, 1.5058135986328125, 1.558563232421875, 1.6113128662109375, 1.6640625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 7.0, 14.0, 15.0, 22.0, 21.0, 36.0, 45.0, 55.0, 79.0, 111.0, 158.0, 208.0, 339.0, 423.0, 633.0, 787.0, 1168.0, 1621.0, 2233.0, 3423.0, 5167.0, 8224.0, 14527.0, 34417.0, 131603.0, 506480.0, 236784.0, 51958.0, 19152.0, 9659.0, 6007.0, 4064.0, 2620.0, 1847.0, 1374.0, 923.0, 665.0, 457.0, 340.0, 239.0, 174.0, 139.0, 91.0, 67.0, 39.0, 43.0, 28.0, 24.0, 14.0, 5.0, 12.0, 8.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-6.5625, -6.3553466796875, -6.148193359375, -5.9410400390625, -5.73388671875, -5.5267333984375, -5.319580078125, -5.1124267578125, -4.9052734375, -4.6981201171875, -4.490966796875, -4.2838134765625, -4.07666015625, -3.8695068359375, -3.662353515625, -3.4552001953125, -3.248046875, -3.0408935546875, -2.833740234375, -2.6265869140625, -2.41943359375, -2.2122802734375, -2.005126953125, -1.7979736328125, -1.5908203125, -1.3836669921875, -1.176513671875, -0.9693603515625, -0.76220703125, -0.5550537109375, -0.347900390625, -0.1407470703125, 0.06640625, 0.2735595703125, 0.480712890625, 0.6878662109375, 0.89501953125, 1.1021728515625, 1.309326171875, 1.5164794921875, 1.7236328125, 1.9307861328125, 2.137939453125, 2.3450927734375, 2.55224609375, 2.7593994140625, 2.966552734375, 3.1737060546875, 3.380859375, 3.5880126953125, 3.795166015625, 4.0023193359375, 4.20947265625, 4.4166259765625, 4.623779296875, 4.8309326171875, 5.0380859375, 5.2452392578125, 5.452392578125, 5.6595458984375, 5.86669921875, 6.0738525390625, 6.281005859375, 6.4881591796875, 6.6953125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 9.0, 10.0, 12.0, 20.0, 24.0, 23.0, 20.0, 26.0, 30.0, 49.0, 36.0, 44.0, 66.0, 83.0, 121.0, 247.0, 1460.0, 233.0, 132.0, 74.0, 57.0, 34.0, 43.0, 23.0, 25.0, 33.0, 20.0, 21.0, 21.0, 17.0, 12.0, 4.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.078125, -6.865966796875, -6.65380859375, -6.441650390625, -6.2294921875, -6.017333984375, -5.80517578125, -5.593017578125, -5.380859375, -5.168701171875, -4.95654296875, -4.744384765625, -4.5322265625, -4.320068359375, -4.10791015625, -3.895751953125, -3.68359375, -3.471435546875, -3.25927734375, -3.047119140625, -2.8349609375, -2.622802734375, -2.41064453125, -2.198486328125, -1.986328125, -1.774169921875, -1.56201171875, -1.349853515625, -1.1376953125, -0.925537109375, -0.71337890625, -0.501220703125, -0.2890625, -0.076904296875, 0.13525390625, 0.347412109375, 0.5595703125, 0.771728515625, 0.98388671875, 1.196044921875, 1.408203125, 1.620361328125, 1.83251953125, 2.044677734375, 2.2568359375, 2.468994140625, 2.68115234375, 2.893310546875, 3.10546875, 3.317626953125, 3.52978515625, 3.741943359375, 3.9541015625, 4.166259765625, 4.37841796875, 4.590576171875, 4.802734375, 5.014892578125, 5.22705078125, 5.439208984375, 5.6513671875, 5.863525390625, 6.07568359375, 6.287841796875, 6.5]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 8.0, 16.0, 11.0, 7.0, 21.0, 22.0, 19.0, 24.0, 24.0, 39.0, 40.0, 63.0, 130.0, 378.0, 1913.0, 710634.0, 2428859.0, 2544.0, 437.0, 158.0, 78.0, 53.0, 36.0, 41.0, 27.0, 22.0, 16.0, 20.0, 19.0, 8.0, 15.0, 7.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.53125, -27.58203125, -26.6328125, -25.68359375, -24.734375, -23.78515625, -22.8359375, -21.88671875, -20.9375, -19.98828125, -19.0390625, -18.08984375, -17.140625, -16.19140625, -15.2421875, -14.29296875, -13.34375, -12.39453125, -11.4453125, -10.49609375, -9.546875, -8.59765625, -7.6484375, -6.69921875, -5.75, -4.80078125, -3.8515625, -2.90234375, -1.953125, -1.00390625, -0.0546875, 0.89453125, 1.84375, 2.79296875, 3.7421875, 4.69140625, 5.640625, 6.58984375, 7.5390625, 8.48828125, 9.4375, 10.38671875, 11.3359375, 12.28515625, 13.234375, 14.18359375, 15.1328125, 16.08203125, 17.03125, 17.98046875, 18.9296875, 19.87890625, 20.828125, 21.77734375, 22.7265625, 23.67578125, 24.625, 25.57421875, 26.5234375, 27.47265625, 28.421875, 29.37109375, 30.3203125, 31.26953125, 32.21875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 400.0, 617.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-253.70907592773438, -249.2605743408203, -244.81207275390625, -240.36358642578125, -235.9150848388672, -231.46658325195312, -227.01808166503906, -222.569580078125, -218.12107849121094, -213.67257690429688, -209.2240753173828, -204.77557373046875, -200.32708740234375, -195.8785858154297, -191.43008422851562, -186.98158264160156, -182.5330810546875, -178.08457946777344, -173.63607788085938, -169.18759155273438, -164.7390899658203, -160.29058837890625, -155.8420867919922, -151.39358520507812, -146.94509887695312, -142.49659729003906, -138.048095703125, -133.599609375, -129.15110778808594, -124.70260620117188, -120.25410461425781, -115.80560302734375, -111.35710906982422, -106.90860748291016, -102.46011352539062, -98.01161193847656, -93.5631103515625, -89.11460876464844, -84.6661148071289, -80.21761322021484, -75.76911926269531, -71.32061767578125, -66.87212371826172, -62.423622131347656, -57.975120544433594, -53.5266227722168, -49.078125, -44.62962341308594, -40.181121826171875, -35.73262405395508, -31.284122467041016, -26.83562469482422, -22.38712501525879, -17.93862533569336, -13.490127563476562, -9.041627883911133, -4.593128204345703, -0.14462900161743164, 4.30387020111084, 8.752368927001953, 13.200868606567383, 17.649368286132812, 22.09786605834961, 26.54636573791504, 30.99486541748047]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 6.0, 8.0, 5.0, 6.0, 9.0, 15.0, 9.0, 15.0, 23.0, 14.0, 25.0, 18.0, 19.0, 30.0, 35.0, 32.0, 42.0, 53.0, 43.0, 55.0, 46.0, 47.0, 43.0, 27.0, 37.0, 32.0, 25.0, 42.0, 23.0, 28.0, 29.0, 31.0, 27.0, 17.0, 18.0, 10.0, 16.0, 17.0, 4.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.899330139160156, -17.330888748168945, -16.762449264526367, -16.194007873535156, -15.625568389892578, -15.057126998901367, -14.488686561584473, -13.920246124267578, -13.351805686950684, -12.783365249633789, -12.214924812316895, -11.646484375, -11.078042984008789, -10.509603500366211, -9.941162109375, -9.372721672058105, -8.804281234741211, -8.235840797424316, -7.667400360107422, -7.098959445953369, -6.530519008636475, -5.96207857131958, -5.393637657165527, -4.825197219848633, -4.256756782531738, -3.6883163452148438, -3.11987566947937, -2.5514349937438965, -1.982994556427002, -1.4145541191101074, -0.8461134433746338, -0.27767276763916016, 0.2907676696777344, 0.8592082262039185, 1.4276487827301025, 1.9960893392562866, 2.5645298957824707, 3.1329703330993652, 3.701411008834839, 4.2698516845703125, 4.838292121887207, 5.406732559204102, 5.975172996520996, 6.543613910675049, 7.112054347991943, 7.680494785308838, 8.24893569946289, 8.817376136779785, 9.38581657409668, 9.954257011413574, 10.522697448730469, 11.091137886047363, 11.659578323364258, 12.228019714355469, 12.796460151672363, 13.364900588989258, 13.933341026306152, 14.501781463623047, 15.070221900939941, 15.638662338256836, 16.207103729248047, 16.775543212890625, 17.343984603881836, 17.912425994873047, 18.480865478515625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 7.0, 4.0, 2.0, 6.0, 5.0, 11.0, 13.0, 13.0, 11.0, 16.0, 22.0, 16.0, 22.0, 23.0, 34.0, 42.0, 23.0, 28.0, 26.0, 37.0, 32.0, 40.0, 33.0, 45.0, 33.0, 29.0, 25.0, 39.0, 41.0, 32.0, 30.0, 31.0, 30.0, 26.0, 31.0, 31.0, 14.0, 22.0, 9.0, 7.0, 10.0, 9.0, 9.0, 3.0, 10.0, 6.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.76953125, -1.7151031494140625, -1.660675048828125, -1.6062469482421875, -1.55181884765625, -1.4973907470703125, -1.442962646484375, -1.3885345458984375, -1.3341064453125, -1.2796783447265625, -1.225250244140625, -1.1708221435546875, -1.11639404296875, -1.0619659423828125, -1.007537841796875, -0.9531097412109375, -0.898681640625, -0.8442535400390625, -0.789825439453125, -0.7353973388671875, -0.68096923828125, -0.6265411376953125, -0.572113037109375, -0.5176849365234375, -0.4632568359375, -0.4088287353515625, -0.354400634765625, -0.2999725341796875, -0.24554443359375, -0.1911163330078125, -0.136688232421875, -0.0822601318359375, -0.02783203125, 0.0265960693359375, 0.081024169921875, 0.1354522705078125, 0.18988037109375, 0.2443084716796875, 0.298736572265625, 0.3531646728515625, 0.4075927734375, 0.4620208740234375, 0.516448974609375, 0.5708770751953125, 0.62530517578125, 0.6797332763671875, 0.734161376953125, 0.7885894775390625, 0.843017578125, 0.8974456787109375, 0.951873779296875, 1.0063018798828125, 1.06072998046875, 1.1151580810546875, 1.169586181640625, 1.2240142822265625, 1.2784423828125, 1.3328704833984375, 1.387298583984375, 1.4417266845703125, 1.49615478515625, 1.5505828857421875, 1.605010986328125, 1.6594390869140625, 1.7138671875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 4.0, 3.0, 4.0, 9.0, 13.0, 13.0, 16.0, 25.0, 39.0, 44.0, 60.0, 73.0, 109.0, 155.0, 218.0, 306.0, 513.0, 843.0, 1930.0, 4881.0, 16376.0, 74737.0, 568988.0, 2975987.0, 462145.0, 63793.0, 14436.0, 4426.0, 1772.0, 839.0, 470.0, 295.0, 215.0, 151.0, 131.0, 61.0, 51.0, 48.0, 23.0, 27.0, 23.0, 6.0, 5.0, 6.0, 5.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4375, -9.146728515625, -8.85595703125, -8.565185546875, -8.2744140625, -7.983642578125, -7.69287109375, -7.402099609375, -7.111328125, -6.820556640625, -6.52978515625, -6.239013671875, -5.9482421875, -5.657470703125, -5.36669921875, -5.075927734375, -4.78515625, -4.494384765625, -4.20361328125, -3.912841796875, -3.6220703125, -3.331298828125, -3.04052734375, -2.749755859375, -2.458984375, -2.168212890625, -1.87744140625, -1.586669921875, -1.2958984375, -1.005126953125, -0.71435546875, -0.423583984375, -0.1328125, 0.157958984375, 0.44873046875, 0.739501953125, 1.0302734375, 1.321044921875, 1.61181640625, 1.902587890625, 2.193359375, 2.484130859375, 2.77490234375, 3.065673828125, 3.3564453125, 3.647216796875, 3.93798828125, 4.228759765625, 4.51953125, 4.810302734375, 5.10107421875, 5.391845703125, 5.6826171875, 5.973388671875, 6.26416015625, 6.554931640625, 6.845703125, 7.136474609375, 7.42724609375, 7.718017578125, 8.0087890625, 8.299560546875, 8.59033203125, 8.881103515625, 9.171875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 12.0, 5.0, 18.0, 31.0, 47.0, 58.0, 115.0, 144.0, 235.0, 279.0, 412.0, 569.0, 604.0, 482.0, 337.0, 248.0, 151.0, 111.0, 84.0, 44.0, 27.0, 18.0, 16.0, 7.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.6953125, -9.384765625, -9.07421875, -8.763671875, -8.453125, -8.142578125, -7.83203125, -7.521484375, -7.2109375, -6.900390625, -6.58984375, -6.279296875, -5.96875, -5.658203125, -5.34765625, -5.037109375, -4.7265625, -4.416015625, -4.10546875, -3.794921875, -3.484375, -3.173828125, -2.86328125, -2.552734375, -2.2421875, -1.931640625, -1.62109375, -1.310546875, -1.0, -0.689453125, -0.37890625, -0.068359375, 0.2421875, 0.552734375, 0.86328125, 1.173828125, 1.484375, 1.794921875, 2.10546875, 2.416015625, 2.7265625, 3.037109375, 3.34765625, 3.658203125, 3.96875, 4.279296875, 4.58984375, 4.900390625, 5.2109375, 5.521484375, 5.83203125, 6.142578125, 6.453125, 6.763671875, 7.07421875, 7.384765625, 7.6953125, 8.005859375, 8.31640625, 8.626953125, 8.9375, 9.248046875, 9.55859375, 9.869140625, 10.1796875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 9.0, 14.0, 25.0, 30.0, 66.0, 131.0, 245.0, 559.0, 2054.0, 46336.0, 3951724.0, 188214.0, 3312.0, 856.0, 316.0, 177.0, 72.0, 54.0, 21.0, 23.0, 15.0, 9.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.6875, -39.4775390625, -38.267578125, -37.0576171875, -35.84765625, -34.6376953125, -33.427734375, -32.2177734375, -31.0078125, -29.7978515625, -28.587890625, -27.3779296875, -26.16796875, -24.9580078125, -23.748046875, -22.5380859375, -21.328125, -20.1181640625, -18.908203125, -17.6982421875, -16.48828125, -15.2783203125, -14.068359375, -12.8583984375, -11.6484375, -10.4384765625, -9.228515625, -8.0185546875, -6.80859375, -5.5986328125, -4.388671875, -3.1787109375, -1.96875, -0.7587890625, 0.451171875, 1.6611328125, 2.87109375, 4.0810546875, 5.291015625, 6.5009765625, 7.7109375, 8.9208984375, 10.130859375, 11.3408203125, 12.55078125, 13.7607421875, 14.970703125, 16.1806640625, 17.390625, 18.6005859375, 19.810546875, 21.0205078125, 22.23046875, 23.4404296875, 24.650390625, 25.8603515625, 27.0703125, 28.2802734375, 29.490234375, 30.7001953125, 31.91015625, 33.1201171875, 34.330078125, 35.5400390625, 36.75]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 21.0, 102.0, 196.0, 279.0, 235.0, 116.0, 46.0, 7.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.661731719970703, -28.421232223510742, -26.18073081970215, -23.940231323242188, -21.699729919433594, -19.459230422973633, -17.218730926513672, -14.978230476379395, -12.737730026245117, -10.49722957611084, -8.256729125976562, -6.016229629516602, -3.775729179382324, -1.5352287292480469, 0.7052707672119141, 2.9457712173461914, 5.186271667480469, 7.426772117614746, 9.667272567749023, 11.907772064208984, 14.148272514343262, 16.38877296447754, 18.6292724609375, 20.869773864746094, 23.110273361206055, 25.350772857666016, 27.59127426147461, 29.83177375793457, 32.07227325439453, 34.312774658203125, 36.55327606201172, 38.79377365112305, 41.034271240234375, 43.27477264404297, 45.5152702331543, 47.75577163696289, 49.996273040771484, 52.23677062988281, 54.477272033691406, 56.7177734375, 58.958274841308594, 61.19877624511719, 63.439273834228516, 65.67977905273438, 67.92027282714844, 70.16077423095703, 72.40127563476562, 74.64177703857422, 76.88227844238281, 79.1227798461914, 81.36328125, 83.60377502441406, 85.84427642822266, 88.08477783203125, 90.32527923583984, 92.56578063964844, 94.8062744140625, 97.0467758178711, 99.28727722167969, 101.52777099609375, 103.76827239990234, 106.00877380371094, 108.24927520751953, 110.48977661132812, 112.73027801513672]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 6.0, 6.0, 8.0, 6.0, 14.0, 16.0, 20.0, 12.0, 17.0, 22.0, 26.0, 35.0, 35.0, 19.0, 35.0, 36.0, 37.0, 34.0, 42.0, 37.0, 37.0, 40.0, 43.0, 40.0, 30.0, 38.0, 35.0, 34.0, 38.0, 26.0, 20.0, 22.0, 27.0, 18.0, 18.0, 16.0, 10.0, 9.0, 6.0, 9.0, 6.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.72325897216797, -25.89497947692871, -25.066699981689453, -24.238420486450195, -23.410140991210938, -22.581859588623047, -21.75358009338379, -20.92530059814453, -20.097021102905273, -19.268741607666016, -18.440462112426758, -17.6121826171875, -16.78390121459961, -15.955622673034668, -15.127342224121094, -14.299062728881836, -13.470783233642578, -12.64250373840332, -11.814224243164062, -10.985943794250488, -10.15766429901123, -9.329384803771973, -8.501104354858398, -7.672824859619141, -6.844545364379883, -6.016265869140625, -5.187985897064209, -4.359705924987793, -3.531426429748535, -2.7031469345092773, -1.8748669624328613, -1.0465869903564453, -0.2183074951171875, 0.6099722385406494, 1.4382519721984863, 2.2665317058563232, 3.09481143951416, 3.923090934753418, 4.751370906829834, 5.57965087890625, 6.407930374145508, 7.236209869384766, 8.064489364624023, 8.892769813537598, 9.721049308776855, 10.549328804016113, 11.377609252929688, 12.205888748168945, 13.034168243408203, 13.862447738647461, 14.690727233886719, 15.519007682800293, 16.347286224365234, 17.175567626953125, 18.003847122192383, 18.83212661743164, 19.6604061126709, 20.488685607910156, 21.316965103149414, 22.145244598388672, 22.973526000976562, 23.801803588867188, 24.630084991455078, 25.458364486694336, 26.286643981933594]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 10.0, 11.0, 12.0, 11.0, 8.0, 14.0, 15.0, 30.0, 25.0, 17.0, 22.0, 27.0, 35.0, 30.0, 41.0, 50.0, 41.0, 30.0, 41.0, 47.0, 45.0, 38.0, 30.0, 38.0, 31.0, 47.0, 35.0, 31.0, 25.0, 32.0, 25.0, 17.0, 23.0, 15.0, 9.0, 10.0, 8.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.06640625, -2.002410888671875, -1.93841552734375, -1.874420166015625, -1.8104248046875, -1.746429443359375, -1.68243408203125, -1.618438720703125, -1.554443359375, -1.490447998046875, -1.42645263671875, -1.362457275390625, -1.2984619140625, -1.234466552734375, -1.17047119140625, -1.106475830078125, -1.04248046875, -0.978485107421875, -0.91448974609375, -0.850494384765625, -0.7864990234375, -0.722503662109375, -0.65850830078125, -0.594512939453125, -0.530517578125, -0.466522216796875, -0.40252685546875, -0.338531494140625, -0.2745361328125, -0.210540771484375, -0.14654541015625, -0.082550048828125, -0.0185546875, 0.045440673828125, 0.10943603515625, 0.173431396484375, 0.2374267578125, 0.301422119140625, 0.36541748046875, 0.429412841796875, 0.493408203125, 0.557403564453125, 0.62139892578125, 0.685394287109375, 0.7493896484375, 0.813385009765625, 0.87738037109375, 0.941375732421875, 1.00537109375, 1.069366455078125, 1.13336181640625, 1.197357177734375, 1.2613525390625, 1.325347900390625, 1.38934326171875, 1.453338623046875, 1.517333984375, 1.581329345703125, 1.64532470703125, 1.709320068359375, 1.7733154296875, 1.837310791015625, 1.90130615234375, 1.965301513671875, 2.029296875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 7.0, 10.0, 13.0, 14.0, 27.0, 35.0, 57.0, 65.0, 101.0, 142.0, 202.0, 290.0, 439.0, 644.0, 976.0, 1447.0, 2256.0, 3403.0, 5552.0, 8513.0, 13515.0, 21449.0, 34230.0, 53312.0, 82613.0, 121307.0, 158333.0, 163230.0, 128775.0, 89217.0, 57611.0, 36601.0, 23169.0, 14848.0, 9284.0, 5772.0, 3828.0, 2446.0, 1539.0, 1076.0, 678.0, 470.0, 321.0, 216.0, 174.0, 115.0, 92.0, 59.0, 24.0, 23.0, 16.0, 12.0, 13.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.1871337890625, -0.18111419677734375, -0.1750946044921875, -0.16907501220703125, -0.163055419921875, -0.15703582763671875, -0.1510162353515625, -0.14499664306640625, -0.13897705078125, -0.13295745849609375, -0.1269378662109375, -0.12091827392578125, -0.114898681640625, -0.10887908935546875, -0.1028594970703125, -0.09683990478515625, -0.0908203125, -0.08480072021484375, -0.0787811279296875, -0.07276153564453125, -0.066741943359375, -0.06072235107421875, -0.0547027587890625, -0.04868316650390625, -0.04266357421875, -0.03664398193359375, -0.0306243896484375, -0.02460479736328125, -0.018585205078125, -0.01256561279296875, -0.0065460205078125, -0.00052642822265625, 0.0054931640625, 0.01151275634765625, 0.0175323486328125, 0.02355194091796875, 0.029571533203125, 0.03559112548828125, 0.0416107177734375, 0.04763031005859375, 0.05364990234375, 0.05966949462890625, 0.0656890869140625, 0.07170867919921875, 0.077728271484375, 0.08374786376953125, 0.0897674560546875, 0.09578704833984375, 0.101806640625, 0.10782623291015625, 0.1138458251953125, 0.11986541748046875, 0.125885009765625, 0.13190460205078125, 0.1379241943359375, 0.14394378662109375, 0.14996337890625, 0.15598297119140625, 0.1620025634765625, 0.16802215576171875, 0.174041748046875, 0.18006134033203125, 0.1860809326171875, 0.19210052490234375, 0.1981201171875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 9.0, 8.0, 8.0, 6.0, 5.0, 19.0, 17.0, 25.0, 16.0, 19.0, 34.0, 33.0, 43.0, 42.0, 37.0, 48.0, 53.0, 57.0, 1073.0, 41.0, 46.0, 43.0, 45.0, 48.0, 35.0, 28.0, 24.0, 28.0, 32.0, 20.0, 23.0, 13.0, 8.0, 8.0, 11.0, 7.0, 4.0, 3.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.39453125, -1.3473663330078125, -1.300201416015625, -1.2530364990234375, -1.20587158203125, -1.1587066650390625, -1.111541748046875, -1.0643768310546875, -1.0172119140625, -0.9700469970703125, -0.922882080078125, -0.8757171630859375, -0.82855224609375, -0.7813873291015625, -0.734222412109375, -0.6870574951171875, -0.639892578125, -0.5927276611328125, -0.545562744140625, -0.4983978271484375, -0.45123291015625, -0.4040679931640625, -0.356903076171875, -0.3097381591796875, -0.2625732421875, -0.2154083251953125, -0.168243408203125, -0.1210784912109375, -0.07391357421875, -0.0267486572265625, 0.020416259765625, 0.0675811767578125, 0.11474609375, 0.1619110107421875, 0.209075927734375, 0.2562408447265625, 0.30340576171875, 0.3505706787109375, 0.397735595703125, 0.4449005126953125, 0.4920654296875, 0.5392303466796875, 0.586395263671875, 0.6335601806640625, 0.68072509765625, 0.7278900146484375, 0.775054931640625, 0.8222198486328125, 0.869384765625, 0.9165496826171875, 0.963714599609375, 1.0108795166015625, 1.05804443359375, 1.1052093505859375, 1.152374267578125, 1.1995391845703125, 1.2467041015625, 1.2938690185546875, 1.341033935546875, 1.3881988525390625, 1.43536376953125, 1.4825286865234375, 1.529693603515625, 1.5768585205078125, 1.6240234375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 13.0, 17.0, 28.0, 33.0, 69.0, 107.0, 146.0, 225.0, 371.0, 498.0, 869.0, 1341.0, 2033.0, 3163.0, 4902.0, 7767.0, 11944.0, 18922.0, 28700.0, 43129.0, 64940.0, 92264.0, 122989.0, 1048813.0, 274049.0, 114356.0, 84647.0, 59048.0, 39327.0, 25696.0, 16510.0, 10781.0, 6882.0, 4603.0, 2913.0, 1732.0, 1211.0, 742.0, 448.0, 321.0, 209.0, 133.0, 92.0, 59.0, 29.0, 22.0, 13.0, 6.0, 7.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.1220703125, -0.11835670471191406, -0.11464309692382812, -0.11092948913574219, -0.10721588134765625, -0.10350227355957031, -0.09978866577148438, -0.09607505798339844, -0.0923614501953125, -0.08864784240722656, -0.08493423461914062, -0.08122062683105469, -0.07750701904296875, -0.07379341125488281, -0.07007980346679688, -0.06636619567871094, -0.062652587890625, -0.05893898010253906, -0.055225372314453125, -0.05151176452636719, -0.04779815673828125, -0.04408454895019531, -0.040370941162109375, -0.03665733337402344, -0.0329437255859375, -0.029230117797851562, -0.025516510009765625, -0.021802902221679688, -0.01808929443359375, -0.014375686645507812, -0.010662078857421875, -0.0069484710693359375, -0.00323486328125, 0.0004787445068359375, 0.004192352294921875, 0.007905960083007812, 0.01161956787109375, 0.015333175659179688, 0.019046783447265625, 0.022760391235351562, 0.0264739990234375, 0.030187606811523438, 0.033901214599609375, 0.03761482238769531, 0.04132843017578125, 0.04504203796386719, 0.048755645751953125, 0.05246925354003906, 0.056182861328125, 0.05989646911621094, 0.06361007690429688, 0.06732368469238281, 0.07103729248046875, 0.07475090026855469, 0.07846450805664062, 0.08217811584472656, 0.0858917236328125, 0.08960533142089844, 0.09331893920898438, 0.09703254699707031, 0.10074615478515625, 0.10445976257324219, 0.10817337036132812, 0.11188697814941406, 0.1156005859375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 8.0, 8.0, 8.0, 4.0, 13.0, 12.0, 14.0, 19.0, 20.0, 36.0, 38.0, 59.0, 74.0, 141.0, 181.0, 89.0, 64.0, 23.0, 34.0, 30.0, 23.0, 20.0, 13.0, 9.0, 9.0, 8.0, 5.0, 9.0, 7.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007171630859375, -0.006925463676452637, -0.0066792964935302734, -0.00643312931060791, -0.006186962127685547, -0.005940794944763184, -0.00569462776184082, -0.005448460578918457, -0.005202293395996094, -0.0049561262130737305, -0.004709959030151367, -0.004463791847229004, -0.004217624664306641, -0.003971457481384277, -0.003725290298461914, -0.0034791231155395508, -0.0032329559326171875, -0.0029867887496948242, -0.002740621566772461, -0.0024944543838500977, -0.0022482872009277344, -0.002002120018005371, -0.0017559528350830078, -0.0015097856521606445, -0.0012636184692382812, -0.001017451286315918, -0.0007712841033935547, -0.0005251169204711914, -0.0002789497375488281, -3.2782554626464844e-05, 0.00021338462829589844, 0.0004595518112182617, 0.000705718994140625, 0.0009518861770629883, 0.0011980533599853516, 0.0014442205429077148, 0.0016903877258300781, 0.0019365549087524414, 0.0021827220916748047, 0.002428889274597168, 0.0026750564575195312, 0.0029212236404418945, 0.003167390823364258, 0.003413558006286621, 0.0036597251892089844, 0.0039058923721313477, 0.004152059555053711, 0.004398226737976074, 0.0046443939208984375, 0.004890561103820801, 0.005136728286743164, 0.005382895469665527, 0.005629062652587891, 0.005875229835510254, 0.006121397018432617, 0.0063675642013549805, 0.006613731384277344, 0.006859898567199707, 0.00710606575012207, 0.007352232933044434, 0.007598400115966797, 0.00784456729888916, 0.008090734481811523, 0.008336901664733887, 0.00858306884765625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 9.0, 8.0, 13.0, 10.0, 16.0, 16.0, 19.0, 33.0, 52.0, 88.0, 131.0, 213.0, 528.0, 6422.0, 1038784.0, 1287.0, 373.0, 185.0, 112.0, 68.0, 49.0, 30.0, 16.0, 20.0, 15.0, 3.0, 18.0, 6.0, 4.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.289306640625, -0.28061676025390625, -0.2719268798828125, -0.26323699951171875, -0.254547119140625, -0.24585723876953125, -0.2371673583984375, -0.22847747802734375, -0.21978759765625, -0.21109771728515625, -0.2024078369140625, -0.19371795654296875, -0.185028076171875, -0.17633819580078125, -0.1676483154296875, -0.15895843505859375, -0.1502685546875, -0.14157867431640625, -0.1328887939453125, -0.12419891357421875, -0.115509033203125, -0.10681915283203125, -0.0981292724609375, -0.08943939208984375, -0.08074951171875, -0.07205963134765625, -0.0633697509765625, -0.05467987060546875, -0.045989990234375, -0.03730010986328125, -0.0286102294921875, -0.01992034912109375, -0.01123046875, -0.00254058837890625, 0.0061492919921875, 0.01483917236328125, 0.023529052734375, 0.03221893310546875, 0.0409088134765625, 0.04959869384765625, 0.05828857421875, 0.06697845458984375, 0.0756683349609375, 0.08435821533203125, 0.093048095703125, 0.10173797607421875, 0.1104278564453125, 0.11911773681640625, 0.1278076171875, 0.13649749755859375, 0.1451873779296875, 0.15387725830078125, 0.162567138671875, 0.17125701904296875, 0.1799468994140625, 0.18863677978515625, 0.19732666015625, 0.20601654052734375, 0.2147064208984375, 0.22339630126953125, 0.232086181640625, 0.24077606201171875, 0.2494659423828125, 0.25815582275390625, 0.266845703125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 16.0, 761.0, 237.0], "bins": [-0.28093189001083374, -0.27646803855895996, -0.2720041871070862, -0.26754030585289, -0.26307645440101624, -0.25861260294914246, -0.2541487514972687, -0.2496848851442337, -0.24522101879119873, -0.24075716733932495, -0.23629330098628998, -0.2318294495344162, -0.22736558318138123, -0.22290173172950745, -0.21843786537647247, -0.2139740139245987, -0.20951014757156372, -0.20504629611968994, -0.20058242976665497, -0.1961185783147812, -0.19165471196174622, -0.18719086050987244, -0.18272699415683746, -0.17826314270496368, -0.1737992912530899, -0.16933543980121613, -0.16487157344818115, -0.16040772199630737, -0.1559438556432724, -0.15148000419139862, -0.14701613783836365, -0.14255228638648987, -0.1380884349346161, -0.1336245834827423, -0.12916071712970734, -0.12469685822725296, -0.12023299932479858, -0.11576914042234421, -0.11130528151988983, -0.10684143006801605, -0.10237756371498108, -0.0979137048125267, -0.09344984591007233, -0.08898598700761795, -0.08452212810516357, -0.0800582692027092, -0.07559441030025482, -0.07113055884838104, -0.06666669994592667, -0.06220284104347229, -0.057738982141017914, -0.05327512323856354, -0.04881126433610916, -0.044347405433654785, -0.03988355025649071, -0.03541969135403633, -0.030955830588936806, -0.02649197168648243, -0.022028114646673203, -0.017564255744218826, -0.01310039684176445, -0.008636537939310074, -0.004172680899500847, 0.00029117800295352936, 0.004755036905407906]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 4.0, 1.0, 1.0, 3.0, 6.0, 13.0, 15.0, 12.0, 11.0, 24.0, 19.0, 36.0, 42.0, 42.0, 32.0, 59.0, 46.0, 41.0, 42.0, 57.0, 52.0, 49.0, 41.0, 47.0, 48.0, 40.0, 47.0, 32.0, 28.0, 23.0, 22.0, 19.0, 16.0, 11.0, 7.0, 5.0, 4.0, 7.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006202518939971924, -0.00593939796090126, -0.005676276981830597, -0.0054131560027599335, -0.00515003502368927, -0.004886914044618607, -0.004623793065547943, -0.00436067208647728, -0.004097551107406616, -0.0038344301283359528, -0.0035713091492652893, -0.003308188170194626, -0.0030450671911239624, -0.002781946212053299, -0.0025188252329826355, -0.002255704253911972, -0.0019925832748413086, -0.0017294622957706451, -0.0014663413166999817, -0.0012032203376293182, -0.0009400993585586548, -0.0006769783794879913, -0.0004138574004173279, -0.00015073642134666443, 0.00011238455772399902, 0.0003755055367946625, 0.0006386265158653259, 0.0009017474949359894, 0.0011648684740066528, 0.0014279894530773163, 0.0016911104321479797, 0.001954231411218643, 0.0022173523902893066, 0.00248047336935997, 0.0027435943484306335, 0.003006715327501297, 0.0032698363065719604, 0.003532957285642624, 0.0037960782647132874, 0.004059199243783951, 0.004322320222854614, 0.004585441201925278, 0.004848562180995941, 0.005111683160066605, 0.005374804139137268, 0.0056379251182079315, 0.005901046097278595, 0.006164167076349258, 0.006427288055419922, 0.006690409034490585, 0.006953530013561249, 0.007216650992631912, 0.007479771971702576, 0.007742892950773239, 0.008006013929843903, 0.008269134908914566, 0.00853225588798523, 0.008795376867055893, 0.009058497846126556, 0.00932161882519722, 0.009584739804267883, 0.009847860783338547, 0.01011098176240921, 0.010374102741479874, 0.010637223720550537]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 10.0, 11.0, 12.0, 11.0, 8.0, 14.0, 15.0, 30.0, 25.0, 17.0, 22.0, 27.0, 35.0, 30.0, 41.0, 50.0, 41.0, 30.0, 41.0, 47.0, 45.0, 37.0, 31.0, 38.0, 31.0, 47.0, 35.0, 31.0, 25.0, 32.0, 26.0, 16.0, 23.0, 15.0, 9.0, 10.0, 8.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.06640625, -2.002410888671875, -1.93841552734375, -1.874420166015625, -1.8104248046875, -1.746429443359375, -1.68243408203125, -1.618438720703125, -1.554443359375, -1.490447998046875, -1.42645263671875, -1.362457275390625, -1.2984619140625, -1.234466552734375, -1.17047119140625, -1.106475830078125, -1.04248046875, -0.978485107421875, -0.91448974609375, -0.850494384765625, -0.7864990234375, -0.722503662109375, -0.65850830078125, -0.594512939453125, -0.530517578125, -0.466522216796875, -0.40252685546875, -0.338531494140625, -0.2745361328125, -0.210540771484375, -0.14654541015625, -0.082550048828125, -0.0185546875, 0.045440673828125, 0.10943603515625, 0.173431396484375, 0.2374267578125, 0.301422119140625, 0.36541748046875, 0.429412841796875, 0.493408203125, 0.557403564453125, 0.62139892578125, 0.685394287109375, 0.7493896484375, 0.813385009765625, 0.87738037109375, 0.941375732421875, 1.00537109375, 1.069366455078125, 1.13336181640625, 1.197357177734375, 1.2613525390625, 1.325347900390625, 1.38934326171875, 1.453338623046875, 1.517333984375, 1.581329345703125, 1.64532470703125, 1.709320068359375, 1.7733154296875, 1.837310791015625, 1.90130615234375, 1.965301513671875, 2.029296875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 3.0, 4.0, 4.0, 0.0, 6.0, 19.0, 22.0, 26.0, 26.0, 37.0, 52.0, 71.0, 79.0, 131.0, 177.0, 291.0, 385.0, 748.0, 1242.0, 2454.0, 5404.0, 12601.0, 31297.0, 84443.0, 226633.0, 368865.0, 194277.0, 71695.0, 26747.0, 10797.0, 4652.0, 2232.0, 1165.0, 682.0, 372.0, 296.0, 161.0, 128.0, 98.0, 83.0, 40.0, 38.0, 12.0, 19.0, 19.0, 17.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.947265625, -1.885284423828125, -1.82330322265625, -1.761322021484375, -1.6993408203125, -1.637359619140625, -1.57537841796875, -1.513397216796875, -1.451416015625, -1.389434814453125, -1.32745361328125, -1.265472412109375, -1.2034912109375, -1.141510009765625, -1.07952880859375, -1.017547607421875, -0.95556640625, -0.893585205078125, -0.83160400390625, -0.769622802734375, -0.7076416015625, -0.645660400390625, -0.58367919921875, -0.521697998046875, -0.459716796875, -0.397735595703125, -0.33575439453125, -0.273773193359375, -0.2117919921875, -0.149810791015625, -0.08782958984375, -0.025848388671875, 0.0361328125, 0.098114013671875, 0.16009521484375, 0.222076416015625, 0.2840576171875, 0.346038818359375, 0.40802001953125, 0.470001220703125, 0.531982421875, 0.593963623046875, 0.65594482421875, 0.717926025390625, 0.7799072265625, 0.841888427734375, 0.90386962890625, 0.965850830078125, 1.02783203125, 1.089813232421875, 1.15179443359375, 1.213775634765625, 1.2757568359375, 1.337738037109375, 1.39971923828125, 1.461700439453125, 1.523681640625, 1.585662841796875, 1.64764404296875, 1.709625244140625, 1.7716064453125, 1.833587646484375, 1.89556884765625, 1.957550048828125, 2.01953125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 3.0, 19.0, 14.0, 20.0, 19.0, 19.0, 21.0, 31.0, 19.0, 43.0, 27.0, 36.0, 40.0, 46.0, 66.0, 108.0, 409.0, 1496.0, 152.0, 65.0, 62.0, 38.0, 29.0, 39.0, 31.0, 34.0, 21.0, 33.0, 14.0, 18.0, 13.0, 16.0, 5.0, 6.0, 5.0, 6.0, 3.0, 1.0, 5.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-7.8046875, -7.5758056640625, -7.346923828125, -7.1180419921875, -6.88916015625, -6.6602783203125, -6.431396484375, -6.2025146484375, -5.9736328125, -5.7447509765625, -5.515869140625, -5.2869873046875, -5.05810546875, -4.8292236328125, -4.600341796875, -4.3714599609375, -4.142578125, -3.9136962890625, -3.684814453125, -3.4559326171875, -3.22705078125, -2.9981689453125, -2.769287109375, -2.5404052734375, -2.3115234375, -2.0826416015625, -1.853759765625, -1.6248779296875, -1.39599609375, -1.1671142578125, -0.938232421875, -0.7093505859375, -0.48046875, -0.2515869140625, -0.022705078125, 0.2061767578125, 0.43505859375, 0.6639404296875, 0.892822265625, 1.1217041015625, 1.3505859375, 1.5794677734375, 1.808349609375, 2.0372314453125, 2.26611328125, 2.4949951171875, 2.723876953125, 2.9527587890625, 3.181640625, 3.4105224609375, 3.639404296875, 3.8682861328125, 4.09716796875, 4.3260498046875, 4.554931640625, 4.7838134765625, 5.0126953125, 5.2415771484375, 5.470458984375, 5.6993408203125, 5.92822265625, 6.1571044921875, 6.385986328125, 6.6148681640625, 6.84375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 4.0, 2.0, 5.0, 5.0, 6.0, 14.0, 18.0, 17.0, 11.0, 23.0, 29.0, 41.0, 41.0, 39.0, 80.0, 73.0, 183.0, 374.0, 1166.0, 13615.0, 3066045.0, 60979.0, 1709.0, 493.0, 228.0, 130.0, 71.0, 54.0, 44.0, 33.0, 27.0, 25.0, 24.0, 14.0, 22.0, 20.0, 8.0, 8.0, 5.0, 4.0, 6.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.296875, -14.8133544921875, -14.329833984375, -13.8463134765625, -13.36279296875, -12.8792724609375, -12.395751953125, -11.9122314453125, -11.4287109375, -10.9451904296875, -10.461669921875, -9.9781494140625, -9.49462890625, -9.0111083984375, -8.527587890625, -8.0440673828125, -7.560546875, -7.0770263671875, -6.593505859375, -6.1099853515625, -5.62646484375, -5.1429443359375, -4.659423828125, -4.1759033203125, -3.6923828125, -3.2088623046875, -2.725341796875, -2.2418212890625, -1.75830078125, -1.2747802734375, -0.791259765625, -0.3077392578125, 0.17578125, 0.6593017578125, 1.142822265625, 1.6263427734375, 2.10986328125, 2.5933837890625, 3.076904296875, 3.5604248046875, 4.0439453125, 4.5274658203125, 5.010986328125, 5.4945068359375, 5.97802734375, 6.4615478515625, 6.945068359375, 7.4285888671875, 7.912109375, 8.3956298828125, 8.879150390625, 9.3626708984375, 9.84619140625, 10.3297119140625, 10.813232421875, 11.2967529296875, 11.7802734375, 12.2637939453125, 12.747314453125, 13.2308349609375, 13.71435546875, 14.1978759765625, 14.681396484375, 15.1649169921875, 15.6484375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 108.0, 562.0, 317.0, 22.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.971656799316406, -5.762825965881348, -4.553994655609131, -3.345163583755493, -2.1363325119018555, -0.9275016784667969, 0.2813296318054199, 1.4901609420776367, 2.6989917755126953, 3.907822847366333, 5.116653919219971, 6.3254852294921875, 7.534316062927246, 8.743146896362305, 9.95197868347168, 11.160809516906738, 12.369640350341797, 13.578471183776855, 14.787302017211914, 15.996133804321289, 17.20496368408203, 18.413795471191406, 19.62262725830078, 20.831459045410156, 22.0402889251709, 23.249120712280273, 24.457950592041016, 25.66678237915039, 26.875614166259766, 28.084444046020508, 29.293275833129883, 30.502105712890625, 31.7109375, 32.919769287109375, 34.12860107421875, 35.33742904663086, 36.546260833740234, 37.75509262084961, 38.963924407958984, 40.17275619506836, 41.38158416748047, 42.590415954589844, 43.79924774169922, 45.00807571411133, 46.2169075012207, 47.42573928833008, 48.63457107543945, 49.84340286254883, 51.0522346496582, 52.26106643676758, 53.46989822387695, 54.67872619628906, 55.88755798339844, 57.09638977050781, 58.30522155761719, 59.51405334472656, 60.72288513183594, 61.93171691894531, 63.14054870605469, 64.34938049316406, 65.55821228027344, 66.76704406738281, 67.97586822509766, 69.18470001220703, 70.3935317993164]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 2.0, 5.0, 3.0, 10.0, 6.0, 13.0, 10.0, 9.0, 16.0, 10.0, 29.0, 18.0, 29.0, 22.0, 32.0, 35.0, 34.0, 36.0, 50.0, 42.0, 45.0, 41.0, 48.0, 40.0, 43.0, 36.0, 30.0, 42.0, 39.0, 33.0, 32.0, 19.0, 23.0, 19.0, 26.0, 12.0, 9.0, 10.0, 9.0, 4.0, 13.0, 3.0, 9.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-23.55523681640625, -22.84619903564453, -22.137161254882812, -21.428123474121094, -20.719085693359375, -20.010046005249023, -19.301008224487305, -18.591970443725586, -17.882932662963867, -17.17389488220215, -16.46485710144043, -15.755818367004395, -15.046780586242676, -14.337742805480957, -13.628704071044922, -12.919666290283203, -12.210628509521484, -11.501590728759766, -10.792552947998047, -10.083514213562012, -9.374476432800293, -8.665438652038574, -7.956400394439697, -7.24736213684082, -6.538324356079102, -5.829286575317383, -5.120248317718506, -4.411210060119629, -3.70217227935791, -2.9931342601776123, -2.2840962409973145, -1.5750579833984375, -0.8660202026367188, -0.1569821834564209, 0.552055835723877, 1.2610938549041748, 1.9701318740844727, 2.6791698932647705, 3.3882079124450684, 4.097246170043945, 4.806283950805664, 5.515321731567383, 6.22435998916626, 6.933398246765137, 7.6424360275268555, 8.351473808288574, 9.06051254272461, 9.769550323486328, 10.478588104248047, 11.187625885009766, 11.896663665771484, 12.60570240020752, 13.314740180969238, 14.023777961730957, 14.732816696166992, 15.441854476928711, 16.15089225769043, 16.85993003845215, 17.568967819213867, 18.278005599975586, 18.987045288085938, 19.696083068847656, 20.405120849609375, 21.114158630371094, 21.823196411132812]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 10.0, 9.0, 9.0, 10.0, 14.0, 13.0, 16.0, 17.0, 27.0, 19.0, 23.0, 21.0, 35.0, 36.0, 27.0, 45.0, 48.0, 32.0, 36.0, 45.0, 42.0, 49.0, 35.0, 26.0, 37.0, 44.0, 38.0, 32.0, 24.0, 28.0, 29.0, 24.0, 22.0, 18.0, 12.0, 11.0, 8.0, 7.0, 8.0, 8.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1328125, -2.06787109375, -2.0029296875, -1.93798828125, -1.873046875, -1.80810546875, -1.7431640625, -1.67822265625, -1.61328125, -1.54833984375, -1.4833984375, -1.41845703125, -1.353515625, -1.28857421875, -1.2236328125, -1.15869140625, -1.09375, -1.02880859375, -0.9638671875, -0.89892578125, -0.833984375, -0.76904296875, -0.7041015625, -0.63916015625, -0.57421875, -0.50927734375, -0.4443359375, -0.37939453125, -0.314453125, -0.24951171875, -0.1845703125, -0.11962890625, -0.0546875, 0.01025390625, 0.0751953125, 0.14013671875, 0.205078125, 0.27001953125, 0.3349609375, 0.39990234375, 0.46484375, 0.52978515625, 0.5947265625, 0.65966796875, 0.724609375, 0.78955078125, 0.8544921875, 0.91943359375, 0.984375, 1.04931640625, 1.1142578125, 1.17919921875, 1.244140625, 1.30908203125, 1.3740234375, 1.43896484375, 1.50390625, 1.56884765625, 1.6337890625, 1.69873046875, 1.763671875, 1.82861328125, 1.8935546875, 1.95849609375, 2.0234375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 7.0, 2.0, 7.0, 12.0, 11.0, 12.0, 22.0, 30.0, 21.0, 29.0, 40.0, 51.0, 50.0, 64.0, 68.0, 113.0, 229.0, 588.0, 1873.0, 7451.0, 36612.0, 258101.0, 2544837.0, 1204600.0, 113815.0, 18920.0, 4259.0, 1274.0, 460.0, 211.0, 123.0, 91.0, 71.0, 44.0, 30.0, 30.0, 25.0, 20.0, 16.0, 18.0, 12.0, 14.0, 6.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.3515625, -8.0889892578125, -7.826416015625, -7.5638427734375, -7.30126953125, -7.0386962890625, -6.776123046875, -6.5135498046875, -6.2509765625, -5.9884033203125, -5.725830078125, -5.4632568359375, -5.20068359375, -4.9381103515625, -4.675537109375, -4.4129638671875, -4.150390625, -3.8878173828125, -3.625244140625, -3.3626708984375, -3.10009765625, -2.8375244140625, -2.574951171875, -2.3123779296875, -2.0498046875, -1.7872314453125, -1.524658203125, -1.2620849609375, -0.99951171875, -0.7369384765625, -0.474365234375, -0.2117919921875, 0.05078125, 0.3133544921875, 0.575927734375, 0.8385009765625, 1.10107421875, 1.3636474609375, 1.626220703125, 1.8887939453125, 2.1513671875, 2.4139404296875, 2.676513671875, 2.9390869140625, 3.20166015625, 3.4642333984375, 3.726806640625, 3.9893798828125, 4.251953125, 4.5145263671875, 4.777099609375, 5.0396728515625, 5.30224609375, 5.5648193359375, 5.827392578125, 6.0899658203125, 6.3525390625, 6.6151123046875, 6.877685546875, 7.1402587890625, 7.40283203125, 7.6654052734375, 7.927978515625, 8.1905517578125, 8.453125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 11.0, 10.0, 17.0, 16.0, 27.0, 37.0, 67.0, 89.0, 126.0, 168.0, 234.0, 305.0, 428.0, 477.0, 474.0, 429.0, 338.0, 242.0, 176.0, 127.0, 83.0, 54.0, 44.0, 26.0, 18.0, 11.0, 15.0, 5.0, 4.0, 3.0, 2.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.01953125, -6.75994873046875, -6.5003662109375, -6.24078369140625, -5.981201171875, -5.72161865234375, -5.4620361328125, -5.20245361328125, -4.94287109375, -4.68328857421875, -4.4237060546875, -4.16412353515625, -3.904541015625, -3.64495849609375, -3.3853759765625, -3.12579345703125, -2.8662109375, -2.60662841796875, -2.3470458984375, -2.08746337890625, -1.827880859375, -1.56829833984375, -1.3087158203125, -1.04913330078125, -0.78955078125, -0.52996826171875, -0.2703857421875, -0.01080322265625, 0.248779296875, 0.50836181640625, 0.7679443359375, 1.02752685546875, 1.287109375, 1.54669189453125, 1.8062744140625, 2.06585693359375, 2.325439453125, 2.58502197265625, 2.8446044921875, 3.10418701171875, 3.36376953125, 3.62335205078125, 3.8829345703125, 4.14251708984375, 4.402099609375, 4.66168212890625, 4.9212646484375, 5.18084716796875, 5.4404296875, 5.70001220703125, 5.9595947265625, 6.21917724609375, 6.478759765625, 6.73834228515625, 6.9979248046875, 7.25750732421875, 7.51708984375, 7.77667236328125, 8.0362548828125, 8.29583740234375, 8.555419921875, 8.81500244140625, 9.0745849609375, 9.33416748046875, 9.59375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 10.0, 16.0, 21.0, 43.0, 57.0, 92.0, 164.0, 343.0, 746.0, 1983.0, 9619.0, 109748.0, 2353032.0, 1630309.0, 77478.0, 7629.0, 1678.0, 599.0, 299.0, 153.0, 98.0, 62.0, 27.0, 17.0, 15.0, 6.0, 12.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.96875, -21.357421875, -20.74609375, -20.134765625, -19.5234375, -18.912109375, -18.30078125, -17.689453125, -17.078125, -16.466796875, -15.85546875, -15.244140625, -14.6328125, -14.021484375, -13.41015625, -12.798828125, -12.1875, -11.576171875, -10.96484375, -10.353515625, -9.7421875, -9.130859375, -8.51953125, -7.908203125, -7.296875, -6.685546875, -6.07421875, -5.462890625, -4.8515625, -4.240234375, -3.62890625, -3.017578125, -2.40625, -1.794921875, -1.18359375, -0.572265625, 0.0390625, 0.650390625, 1.26171875, 1.873046875, 2.484375, 3.095703125, 3.70703125, 4.318359375, 4.9296875, 5.541015625, 6.15234375, 6.763671875, 7.375, 7.986328125, 8.59765625, 9.208984375, 9.8203125, 10.431640625, 11.04296875, 11.654296875, 12.265625, 12.876953125, 13.48828125, 14.099609375, 14.7109375, 15.322265625, 15.93359375, 16.544921875, 17.15625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 19.0, 71.0, 134.0, 248.0, 256.0, 165.0, 79.0, 28.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.081417083740234, -36.6553840637207, -34.229347229003906, -31.803314208984375, -29.37727928161621, -26.951244354248047, -24.525211334228516, -22.09917640686035, -19.673141479492188, -17.247106552124023, -14.821072578430176, -12.395038604736328, -9.969003677368164, -7.54296875, -5.116934776306152, -2.6909008026123047, -0.2648658752441406, 2.1611685752868652, 4.587203025817871, 7.013237476348877, 9.439271926879883, 11.865306854248047, 14.291340827941895, 16.717374801635742, 19.143409729003906, 21.56944465637207, 23.995479583740234, 26.421512603759766, 28.84754753112793, 31.273582458496094, 33.699615478515625, 36.125648498535156, 38.55168914794922, 40.97772216796875, 43.40375900268555, 45.82979202270508, 48.255828857421875, 50.681861877441406, 53.10789489746094, 55.53392791748047, 57.959964752197266, 60.3859977722168, 62.812034606933594, 65.23806762695312, 67.66410064697266, 70.09013366699219, 72.51617431640625, 74.94220733642578, 77.36824035644531, 79.79427337646484, 82.22030639648438, 84.64634704589844, 87.07238006591797, 89.4984130859375, 91.92444610595703, 94.35047912597656, 96.77651977539062, 99.20255279541016, 101.62858581542969, 104.05462646484375, 106.48065948486328, 108.90669250488281, 111.33272552490234, 113.75875854492188, 116.1847915649414]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 0.0, 6.0, 8.0, 5.0, 3.0, 3.0, 6.0, 9.0, 16.0, 8.0, 17.0, 13.0, 18.0, 18.0, 18.0, 43.0, 27.0, 33.0, 43.0, 30.0, 54.0, 45.0, 29.0, 47.0, 39.0, 37.0, 24.0, 45.0, 32.0, 32.0, 37.0, 39.0, 30.0, 27.0, 21.0, 18.0, 21.0, 26.0, 19.0, 15.0, 11.0, 9.0, 8.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.880813598632812, -20.142555236816406, -19.404296875, -18.666038513183594, -17.927780151367188, -17.18952178955078, -16.451263427734375, -15.713005065917969, -14.974746704101562, -14.236488342285156, -13.49822998046875, -12.759971618652344, -12.021713256835938, -11.283454895019531, -10.545196533203125, -9.806938171386719, -9.068679809570312, -8.330421447753906, -7.5921630859375, -6.853904724121094, -6.1156463623046875, -5.377388000488281, -4.639129638671875, -3.9008712768554688, -3.1626129150390625, -2.4243545532226562, -1.68609619140625, -0.9478378295898438, -0.2095794677734375, 0.5286788940429688, 1.266937255859375, 2.0051956176757812, 2.7434539794921875, 3.4817123413085938, 4.219970703125, 4.958229064941406, 5.6964874267578125, 6.434745788574219, 7.173004150390625, 7.911262512207031, 8.649520874023438, 9.387779235839844, 10.12603759765625, 10.864295959472656, 11.602554321289062, 12.340812683105469, 13.079071044921875, 13.817329406738281, 14.555587768554688, 15.293846130371094, 16.0321044921875, 16.770362854003906, 17.508621215820312, 18.24687957763672, 18.985137939453125, 19.72339630126953, 20.461654663085938, 21.199913024902344, 21.93817138671875, 22.676429748535156, 23.414688110351562, 24.15294647216797, 24.891204833984375, 25.62946319580078, 26.367721557617188]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 6.0, 8.0, 10.0, 9.0, 9.0, 16.0, 17.0, 19.0, 17.0, 22.0, 18.0, 30.0, 33.0, 26.0, 25.0, 42.0, 41.0, 30.0, 43.0, 54.0, 51.0, 47.0, 33.0, 45.0, 33.0, 46.0, 35.0, 30.0, 23.0, 27.0, 21.0, 30.0, 16.0, 17.0, 26.0, 6.0, 14.0, 8.0, 4.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.298828125, -2.23004150390625, -2.1612548828125, -2.09246826171875, -2.023681640625, -1.95489501953125, -1.8861083984375, -1.81732177734375, -1.74853515625, -1.67974853515625, -1.6109619140625, -1.54217529296875, -1.473388671875, -1.40460205078125, -1.3358154296875, -1.26702880859375, -1.1982421875, -1.12945556640625, -1.0606689453125, -0.99188232421875, -0.923095703125, -0.85430908203125, -0.7855224609375, -0.71673583984375, -0.64794921875, -0.57916259765625, -0.5103759765625, -0.44158935546875, -0.372802734375, -0.30401611328125, -0.2352294921875, -0.16644287109375, -0.09765625, -0.02886962890625, 0.0399169921875, 0.10870361328125, 0.177490234375, 0.24627685546875, 0.3150634765625, 0.38385009765625, 0.45263671875, 0.52142333984375, 0.5902099609375, 0.65899658203125, 0.727783203125, 0.79656982421875, 0.8653564453125, 0.93414306640625, 1.0029296875, 1.07171630859375, 1.1405029296875, 1.20928955078125, 1.278076171875, 1.34686279296875, 1.4156494140625, 1.48443603515625, 1.55322265625, 1.62200927734375, 1.6907958984375, 1.75958251953125, 1.828369140625, 1.89715576171875, 1.9659423828125, 2.03472900390625, 2.103515625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 8.0, 7.0, 6.0, 5.0, 10.0, 23.0, 36.0, 50.0, 53.0, 90.0, 155.0, 195.0, 311.0, 538.0, 926.0, 1432.0, 2454.0, 4059.0, 6995.0, 12201.0, 21406.0, 37095.0, 65279.0, 109068.0, 167167.0, 201985.0, 163470.0, 105555.0, 62820.0, 36194.0, 20663.0, 11662.0, 6696.0, 3861.0, 2250.0, 1371.0, 829.0, 519.0, 390.0, 216.0, 140.0, 98.0, 80.0, 60.0, 27.0, 22.0, 23.0, 16.0, 14.0, 13.0, 10.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.249755859375, -0.2420635223388672, -0.23437118530273438, -0.22667884826660156, -0.21898651123046875, -0.21129417419433594, -0.20360183715820312, -0.1959095001220703, -0.1882171630859375, -0.1805248260498047, -0.17283248901367188, -0.16514015197753906, -0.15744781494140625, -0.14975547790527344, -0.14206314086914062, -0.1343708038330078, -0.126678466796875, -0.11898612976074219, -0.11129379272460938, -0.10360145568847656, -0.09590911865234375, -0.08821678161621094, -0.08052444458007812, -0.07283210754394531, -0.0651397705078125, -0.05744743347167969, -0.049755096435546875, -0.04206275939941406, -0.03437042236328125, -0.026678085327148438, -0.018985748291015625, -0.011293411254882812, -0.00360107421875, 0.0040912628173828125, 0.011783599853515625, 0.019475936889648438, 0.02716827392578125, 0.03486061096191406, 0.042552947998046875, 0.05024528503417969, 0.0579376220703125, 0.06562995910644531, 0.07332229614257812, 0.08101463317871094, 0.08870697021484375, 0.09639930725097656, 0.10409164428710938, 0.11178398132324219, 0.119476318359375, 0.1271686553955078, 0.13486099243164062, 0.14255332946777344, 0.15024566650390625, 0.15793800354003906, 0.16563034057617188, 0.1733226776123047, 0.1810150146484375, 0.1887073516845703, 0.19639968872070312, 0.20409202575683594, 0.21178436279296875, 0.21947669982910156, 0.22716903686523438, 0.2348613739013672, 0.2425537109375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 3.0, 3.0, 7.0, 12.0, 8.0, 6.0, 14.0, 19.0, 6.0, 16.0, 6.0, 28.0, 18.0, 18.0, 24.0, 32.0, 33.0, 38.0, 37.0, 38.0, 43.0, 37.0, 39.0, 1054.0, 45.0, 36.0, 40.0, 41.0, 38.0, 24.0, 31.0, 23.0, 34.0, 23.0, 30.0, 17.0, 22.0, 17.0, 15.0, 12.0, 6.0, 10.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.326171875, -1.2820587158203125, -1.237945556640625, -1.1938323974609375, -1.14971923828125, -1.1056060791015625, -1.061492919921875, -1.0173797607421875, -0.9732666015625, -0.9291534423828125, -0.885040283203125, -0.8409271240234375, -0.79681396484375, -0.7527008056640625, -0.708587646484375, -0.6644744873046875, -0.620361328125, -0.5762481689453125, -0.532135009765625, -0.4880218505859375, -0.44390869140625, -0.3997955322265625, -0.355682373046875, -0.3115692138671875, -0.2674560546875, -0.2233428955078125, -0.179229736328125, -0.1351165771484375, -0.09100341796875, -0.0468902587890625, -0.002777099609375, 0.0413360595703125, 0.08544921875, 0.1295623779296875, 0.173675537109375, 0.2177886962890625, 0.26190185546875, 0.3060150146484375, 0.350128173828125, 0.3942413330078125, 0.4383544921875, 0.4824676513671875, 0.526580810546875, 0.5706939697265625, 0.61480712890625, 0.6589202880859375, 0.703033447265625, 0.7471466064453125, 0.791259765625, 0.8353729248046875, 0.879486083984375, 0.9235992431640625, 0.96771240234375, 1.0118255615234375, 1.055938720703125, 1.1000518798828125, 1.1441650390625, 1.1882781982421875, 1.232391357421875, 1.2765045166015625, 1.32061767578125, 1.3647308349609375, 1.408843994140625, 1.4529571533203125, 1.4970703125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 6.0, 5.0, 9.0, 22.0, 22.0, 32.0, 54.0, 89.0, 110.0, 192.0, 256.0, 416.0, 620.0, 914.0, 1514.0, 2233.0, 3428.0, 5151.0, 8128.0, 12722.0, 19324.0, 28964.0, 43851.0, 63639.0, 88532.0, 117569.0, 787983.0, 521285.0, 115115.0, 87754.0, 62387.0, 42753.0, 28508.0, 18707.0, 12207.0, 7958.0, 5107.0, 3372.0, 2088.0, 1381.0, 946.0, 645.0, 367.0, 263.0, 187.0, 98.0, 69.0, 59.0, 30.0, 29.0, 12.0, 15.0, 2.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.11224365234375, -0.10849857330322266, -0.10475349426269531, -0.10100841522216797, -0.09726333618164062, -0.09351825714111328, -0.08977317810058594, -0.0860280990600586, -0.08228302001953125, -0.0785379409790039, -0.07479286193847656, -0.07104778289794922, -0.06730270385742188, -0.06355762481689453, -0.05981254577636719, -0.056067466735839844, -0.0523223876953125, -0.048577308654785156, -0.04483222961425781, -0.04108715057373047, -0.037342071533203125, -0.03359699249267578, -0.029851913452148438, -0.026106834411621094, -0.02236175537109375, -0.018616676330566406, -0.014871597290039062, -0.011126518249511719, -0.007381439208984375, -0.0036363601684570312, 0.0001087188720703125, 0.0038537979125976562, 0.007598876953125, 0.011343955993652344, 0.015089035034179688, 0.01883411407470703, 0.022579193115234375, 0.02632427215576172, 0.030069351196289062, 0.033814430236816406, 0.03755950927734375, 0.041304588317871094, 0.04504966735839844, 0.04879474639892578, 0.052539825439453125, 0.05628490447998047, 0.06002998352050781, 0.06377506256103516, 0.0675201416015625, 0.07126522064208984, 0.07501029968261719, 0.07875537872314453, 0.08250045776367188, 0.08624553680419922, 0.08999061584472656, 0.0937356948852539, 0.09748077392578125, 0.1012258529663086, 0.10497093200683594, 0.10871601104736328, 0.11246109008789062, 0.11620616912841797, 0.11995124816894531, 0.12369632720947266, 0.12744140625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 9.0, 7.0, 9.0, 23.0, 21.0, 27.0, 30.0, 48.0, 72.0, 136.0, 252.0, 120.0, 75.0, 30.0, 34.0, 29.0, 25.0, 10.0, 14.0, 9.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01226043701171875, -0.011882305145263672, -0.011504173278808594, -0.011126041412353516, -0.010747909545898438, -0.01036977767944336, -0.009991645812988281, -0.009613513946533203, -0.009235382080078125, -0.008857250213623047, -0.008479118347167969, -0.00810098648071289, -0.0077228546142578125, -0.007344722747802734, -0.006966590881347656, -0.006588459014892578, -0.0062103271484375, -0.005832195281982422, -0.005454063415527344, -0.005075931549072266, -0.0046977996826171875, -0.004319667816162109, -0.003941535949707031, -0.003563404083251953, -0.003185272216796875, -0.002807140350341797, -0.0024290084838867188, -0.0020508766174316406, -0.0016727447509765625, -0.0012946128845214844, -0.0009164810180664062, -0.0005383491516113281, -0.00016021728515625, 0.00021791458129882812, 0.0005960464477539062, 0.0009741783142089844, 0.0013523101806640625, 0.0017304420471191406, 0.0021085739135742188, 0.002486705780029297, 0.002864837646484375, 0.003242969512939453, 0.0036211013793945312, 0.003999233245849609, 0.0043773651123046875, 0.004755496978759766, 0.005133628845214844, 0.005511760711669922, 0.005889892578125, 0.006268024444580078, 0.006646156311035156, 0.007024288177490234, 0.0074024200439453125, 0.007780551910400391, 0.008158683776855469, 0.008536815643310547, 0.008914947509765625, 0.009293079376220703, 0.009671211242675781, 0.01004934310913086, 0.010427474975585938, 0.010805606842041016, 0.011183738708496094, 0.011561870574951172, 0.01194000244140625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 8.0, 6.0, 9.0, 11.0, 19.0, 15.0, 23.0, 17.0, 31.0, 41.0, 50.0, 92.0, 139.0, 195.0, 318.0, 710.0, 4018.0, 651953.0, 385617.0, 3622.0, 690.0, 310.0, 186.0, 122.0, 85.0, 50.0, 43.0, 27.0, 26.0, 17.0, 12.0, 13.0, 12.0, 10.0, 7.0, 8.0, 8.0, 4.0, 4.0, 2.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.22021484375, -0.21373367309570312, -0.20725250244140625, -0.20077133178710938, -0.1942901611328125, -0.18780899047851562, -0.18132781982421875, -0.17484664916992188, -0.168365478515625, -0.16188430786132812, -0.15540313720703125, -0.14892196655273438, -0.1424407958984375, -0.13595962524414062, -0.12947845458984375, -0.12299728393554688, -0.11651611328125, -0.11003494262695312, -0.10355377197265625, -0.09707260131835938, -0.0905914306640625, -0.08411026000976562, -0.07762908935546875, -0.07114791870117188, -0.064666748046875, -0.058185577392578125, -0.05170440673828125, -0.045223236083984375, -0.0387420654296875, -0.032260894775390625, -0.02577972412109375, -0.019298553466796875, -0.0128173828125, -0.006336212158203125, 0.00014495849609375, 0.006626129150390625, 0.0131072998046875, 0.019588470458984375, 0.02606964111328125, 0.032550811767578125, 0.039031982421875, 0.045513153076171875, 0.05199432373046875, 0.058475494384765625, 0.0649566650390625, 0.07143783569335938, 0.07791900634765625, 0.08440017700195312, 0.09088134765625, 0.09736251831054688, 0.10384368896484375, 0.11032485961914062, 0.1168060302734375, 0.12328720092773438, 0.12976837158203125, 0.13624954223632812, 0.142730712890625, 0.14921188354492188, 0.15569305419921875, 0.16217422485351562, 0.1686553955078125, 0.17513656616210938, 0.18161773681640625, 0.18809890747070312, 0.194580078125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 24.0, 66.0, 412.0, 444.0, 55.0, 9.0], "bins": [-0.21687912940979004, -0.21332520246505737, -0.2097712755203247, -0.20621734857559204, -0.20266342163085938, -0.1991094946861267, -0.19555556774139404, -0.19200164079666138, -0.1884477138519287, -0.18489378690719604, -0.18133985996246338, -0.1777859330177307, -0.17423200607299805, -0.17067807912826538, -0.16712415218353271, -0.16357022523880005, -0.16001631319522858, -0.1564623862504959, -0.15290845930576324, -0.14935453236103058, -0.1458006054162979, -0.14224667847156525, -0.13869275152683258, -0.1351388394832611, -0.13158491253852844, -0.12803098559379578, -0.12447705864906311, -0.12092313170433044, -0.11736920475959778, -0.11381527781486511, -0.11026135832071304, -0.10670743137598038, -0.10315349698066711, -0.09959957003593445, -0.09604564309120178, -0.09249171614646912, -0.08893778920173645, -0.08538386225700378, -0.08182994276285172, -0.07827601581811905, -0.07472209632396698, -0.07116816937923431, -0.06761424243450165, -0.06406031548976898, -0.060506392270326614, -0.05695246532559395, -0.05339854210615158, -0.049844615161418915, -0.04629068449139595, -0.042736757546663284, -0.03918283432722092, -0.03562890738248825, -0.032074980437755585, -0.02852105349302292, -0.024967128410935402, -0.021413203328847885, -0.01785927638411522, -0.014305350370705128, -0.010751424357295036, -0.007197498343884945, -0.0036435723304748535, -8.96453857421875e-05, 0.0034642796963453293, 0.007018204778432846, 0.010572131723165512]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 4.0, 7.0, 6.0, 10.0, 7.0, 17.0, 11.0, 16.0, 19.0, 22.0, 23.0, 17.0, 34.0, 37.0, 38.0, 34.0, 40.0, 37.0, 47.0, 44.0, 38.0, 52.0, 42.0, 42.0, 46.0, 30.0, 21.0, 37.0, 23.0, 31.0, 24.0, 22.0, 24.0, 14.0, 14.0, 12.0, 12.0, 10.0, 8.0, 6.0, 5.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0042945146560668945, -0.004139101132750511, -0.003983687609434128, -0.0038282740861177444, -0.003672860562801361, -0.0035174470394849777, -0.0033620335161685944, -0.003206619992852211, -0.0030512064695358276, -0.0028957929462194443, -0.002740379422903061, -0.0025849658995866776, -0.002429552376270294, -0.002274138852953911, -0.0021187253296375275, -0.001963311806321144, -0.0018078982830047607, -0.0016524847596883774, -0.001497071236371994, -0.0013416577130556107, -0.0011862441897392273, -0.001030830666422844, -0.0008754171431064606, -0.0007200036197900772, -0.0005645900964736938, -0.0004091765731573105, -0.0002537630498409271, -9.834952652454376e-05, 5.70639967918396e-05, 0.00021247752010822296, 0.0003678910434246063, 0.0005233045667409897, 0.000678718090057373, 0.0008341316133737564, 0.0009895451366901398, 0.0011449586600065231, 0.0013003721833229065, 0.0014557857066392899, 0.0016111992299556732, 0.0017666127532720566, 0.00192202627658844, 0.0020774397999048233, 0.0022328533232212067, 0.00238826684653759, 0.0025436803698539734, 0.0026990938931703568, 0.00285450741648674, 0.0030099209398031235, 0.003165334463119507, 0.00332074798643589, 0.0034761615097522736, 0.003631575033068657, 0.0037869885563850403, 0.003942402079701424, 0.004097815603017807, 0.00425322912633419, 0.004408642649650574, 0.004564056172966957, 0.0047194696962833405, 0.004874883219599724, 0.005030296742916107, 0.0051857102662324905, 0.005341123789548874, 0.005496537312865257, 0.005651950836181641]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 6.0, 8.0, 10.0, 9.0, 9.0, 16.0, 17.0, 19.0, 17.0, 22.0, 18.0, 30.0, 33.0, 26.0, 25.0, 42.0, 41.0, 30.0, 43.0, 52.0, 53.0, 47.0, 32.0, 45.0, 32.0, 45.0, 38.0, 30.0, 23.0, 27.0, 21.0, 28.0, 18.0, 17.0, 25.0, 7.0, 14.0, 8.0, 4.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.298828125, -2.230072021484375, -2.16131591796875, -2.092559814453125, -2.0238037109375, -1.955047607421875, -1.88629150390625, -1.817535400390625, -1.748779296875, -1.680023193359375, -1.61126708984375, -1.542510986328125, -1.4737548828125, -1.404998779296875, -1.33624267578125, -1.267486572265625, -1.19873046875, -1.129974365234375, -1.06121826171875, -0.992462158203125, -0.9237060546875, -0.854949951171875, -0.78619384765625, -0.717437744140625, -0.648681640625, -0.579925537109375, -0.51116943359375, -0.442413330078125, -0.3736572265625, -0.304901123046875, -0.23614501953125, -0.167388916015625, -0.0986328125, -0.029876708984375, 0.03887939453125, 0.107635498046875, 0.1763916015625, 0.245147705078125, 0.31390380859375, 0.382659912109375, 0.451416015625, 0.520172119140625, 0.58892822265625, 0.657684326171875, 0.7264404296875, 0.795196533203125, 0.86395263671875, 0.932708740234375, 1.00146484375, 1.070220947265625, 1.13897705078125, 1.207733154296875, 1.2764892578125, 1.345245361328125, 1.41400146484375, 1.482757568359375, 1.551513671875, 1.620269775390625, 1.68902587890625, 1.757781982421875, 1.8265380859375, 1.895294189453125, 1.96405029296875, 2.032806396484375, 2.1015625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 4.0, 18.0, 15.0, 41.0, 46.0, 73.0, 132.0, 187.0, 276.0, 420.0, 665.0, 994.0, 1591.0, 2431.0, 3792.0, 6061.0, 10133.0, 18502.0, 37262.0, 88424.0, 238020.0, 356693.0, 158297.0, 61065.0, 27069.0, 14335.0, 8204.0, 4800.0, 3143.0, 2028.0, 1320.0, 888.0, 589.0, 373.0, 252.0, 140.0, 100.0, 63.0, 45.0, 28.0, 13.0, 12.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.9951171875, -1.941619873046875, -1.88812255859375, -1.834625244140625, -1.7811279296875, -1.727630615234375, -1.67413330078125, -1.620635986328125, -1.567138671875, -1.513641357421875, -1.46014404296875, -1.406646728515625, -1.3531494140625, -1.299652099609375, -1.24615478515625, -1.192657470703125, -1.13916015625, -1.085662841796875, -1.03216552734375, -0.978668212890625, -0.9251708984375, -0.871673583984375, -0.81817626953125, -0.764678955078125, -0.711181640625, -0.657684326171875, -0.60418701171875, -0.550689697265625, -0.4971923828125, -0.443695068359375, -0.39019775390625, -0.336700439453125, -0.283203125, -0.229705810546875, -0.17620849609375, -0.122711181640625, -0.0692138671875, -0.015716552734375, 0.03778076171875, 0.091278076171875, 0.144775390625, 0.198272705078125, 0.25177001953125, 0.305267333984375, 0.3587646484375, 0.412261962890625, 0.46575927734375, 0.519256591796875, 0.57275390625, 0.626251220703125, 0.67974853515625, 0.733245849609375, 0.7867431640625, 0.840240478515625, 0.89373779296875, 0.947235107421875, 1.000732421875, 1.054229736328125, 1.10772705078125, 1.161224365234375, 1.2147216796875, 1.268218994140625, 1.32171630859375, 1.375213623046875, 1.4287109375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 2.0, 7.0, 3.0, 5.0, 9.0, 10.0, 17.0, 17.0, 12.0, 24.0, 19.0, 22.0, 22.0, 25.0, 42.0, 33.0, 46.0, 37.0, 52.0, 61.0, 171.0, 1524.0, 350.0, 110.0, 63.0, 43.0, 37.0, 34.0, 31.0, 27.0, 27.0, 29.0, 18.0, 21.0, 16.0, 13.0, 12.0, 6.0, 12.0, 11.0, 10.0, 4.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.99609375, -7.7528076171875, -7.509521484375, -7.2662353515625, -7.02294921875, -6.7796630859375, -6.536376953125, -6.2930908203125, -6.0498046875, -5.8065185546875, -5.563232421875, -5.3199462890625, -5.07666015625, -4.8333740234375, -4.590087890625, -4.3468017578125, -4.103515625, -3.8602294921875, -3.616943359375, -3.3736572265625, -3.13037109375, -2.8870849609375, -2.643798828125, -2.4005126953125, -2.1572265625, -1.9139404296875, -1.670654296875, -1.4273681640625, -1.18408203125, -0.9407958984375, -0.697509765625, -0.4542236328125, -0.2109375, 0.0323486328125, 0.275634765625, 0.5189208984375, 0.76220703125, 1.0054931640625, 1.248779296875, 1.4920654296875, 1.7353515625, 1.9786376953125, 2.221923828125, 2.4652099609375, 2.70849609375, 2.9517822265625, 3.195068359375, 3.4383544921875, 3.681640625, 3.9249267578125, 4.168212890625, 4.4114990234375, 4.65478515625, 4.8980712890625, 5.141357421875, 5.3846435546875, 5.6279296875, 5.8712158203125, 6.114501953125, 6.3577880859375, 6.60107421875, 6.8443603515625, 7.087646484375, 7.3309326171875, 7.57421875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 5.0, 0.0, 4.0, 3.0, 6.0, 4.0, 7.0, 7.0, 11.0, 9.0, 13.0, 11.0, 24.0, 21.0, 25.0, 36.0, 43.0, 68.0, 88.0, 132.0, 235.0, 455.0, 1271.0, 8314.0, 203147.0, 2877153.0, 48882.0, 3906.0, 841.0, 365.0, 169.0, 114.0, 80.0, 44.0, 37.0, 29.0, 24.0, 25.0, 30.0, 17.0, 10.0, 11.0, 10.0, 4.0, 3.0, 9.0, 8.0, 1.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.578125, -11.1832275390625, -10.788330078125, -10.3934326171875, -9.99853515625, -9.6036376953125, -9.208740234375, -8.8138427734375, -8.4189453125, -8.0240478515625, -7.629150390625, -7.2342529296875, -6.83935546875, -6.4444580078125, -6.049560546875, -5.6546630859375, -5.259765625, -4.8648681640625, -4.469970703125, -4.0750732421875, -3.68017578125, -3.2852783203125, -2.890380859375, -2.4954833984375, -2.1005859375, -1.7056884765625, -1.310791015625, -0.9158935546875, -0.52099609375, -0.1260986328125, 0.268798828125, 0.6636962890625, 1.05859375, 1.4534912109375, 1.848388671875, 2.2432861328125, 2.63818359375, 3.0330810546875, 3.427978515625, 3.8228759765625, 4.2177734375, 4.6126708984375, 5.007568359375, 5.4024658203125, 5.79736328125, 6.1922607421875, 6.587158203125, 6.9820556640625, 7.376953125, 7.7718505859375, 8.166748046875, 8.5616455078125, 8.95654296875, 9.3514404296875, 9.746337890625, 10.1412353515625, 10.5361328125, 10.9310302734375, 11.325927734375, 11.7208251953125, 12.11572265625, 12.5106201171875, 12.905517578125, 13.3004150390625, 13.6953125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 385.0, 631.0, 2.0, 0.0, 0.0, 1.0], "bins": [-253.60528564453125, -249.31167602539062, -245.01806640625, -240.7244415283203, -236.4308319091797, -232.13722229003906, -227.84361267089844, -223.5500030517578, -219.25637817382812, -214.9627685546875, -210.66915893554688, -206.3755340576172, -202.08192443847656, -197.78831481933594, -193.4947052001953, -189.2010955810547, -184.90748596191406, -180.61387634277344, -176.3202667236328, -172.02664184570312, -167.7330322265625, -163.43942260742188, -159.14581298828125, -154.85220336914062, -150.55859375, -146.26498413085938, -141.97137451171875, -137.67774963378906, -133.38414001464844, -129.0905303955078, -124.79692077636719, -120.50331115722656, -116.20967864990234, -111.91606903076172, -107.62245178222656, -103.32884216308594, -99.03523254394531, -94.74161529541016, -90.44800567626953, -86.15438842773438, -81.86077880859375, -77.56716918945312, -73.27355194091797, -68.97994232177734, -64.68632507324219, -60.39271545410156, -56.09910583496094, -51.80549240112305, -47.511878967285156, -43.218265533447266, -38.924652099609375, -34.63104248046875, -30.33742904663086, -26.04381561279297, -21.75020408630371, -17.456592559814453, -13.162979125976562, -8.869366645812988, -4.575754165649414, -0.28214168548583984, 4.011470794677734, 8.305084228515625, 12.598695755004883, 16.89230728149414, 21.18592071533203]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 6.0, 7.0, 8.0, 8.0, 11.0, 9.0, 15.0, 9.0, 12.0, 19.0, 23.0, 25.0, 37.0, 27.0, 26.0, 31.0, 47.0, 34.0, 38.0, 45.0, 32.0, 50.0, 48.0, 26.0, 36.0, 40.0, 41.0, 42.0, 26.0, 37.0, 24.0, 33.0, 20.0, 20.0, 16.0, 14.0, 11.0, 6.0, 5.0, 9.0, 10.0, 5.0, 6.0, 1.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.641633987426758, -23.86092758178711, -23.08022117614746, -22.299514770507812, -21.518808364868164, -20.738101959228516, -19.957395553588867, -19.17668914794922, -18.39598274230957, -17.615276336669922, -16.834569931030273, -16.053863525390625, -15.273157119750977, -14.492450714111328, -13.71174430847168, -12.931037902832031, -12.150331497192383, -11.369625091552734, -10.588918685913086, -9.808212280273438, -9.027505874633789, -8.24679946899414, -7.466093063354492, -6.685386657714844, -5.904680252075195, -5.123973846435547, -4.343267440795898, -3.56256103515625, -2.7818546295166016, -2.001148223876953, -1.2204418182373047, -0.43973541259765625, 0.340972900390625, 1.1216793060302734, 1.9023857116699219, 2.6830921173095703, 3.4637985229492188, 4.244504928588867, 5.025211334228516, 5.805917739868164, 6.5866241455078125, 7.367330551147461, 8.14803695678711, 8.928743362426758, 9.709449768066406, 10.490156173706055, 11.270862579345703, 12.051568984985352, 12.832275390625, 13.612981796264648, 14.393688201904297, 15.174394607543945, 15.955101013183594, 16.735807418823242, 17.51651382446289, 18.29722023010254, 19.077926635742188, 19.858633041381836, 20.639339447021484, 21.420045852661133, 22.20075225830078, 22.98145866394043, 23.762165069580078, 24.542871475219727, 25.323577880859375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 7.0, 1.0, 5.0, 5.0, 13.0, 10.0, 12.0, 11.0, 16.0, 11.0, 25.0, 24.0, 24.0, 22.0, 25.0, 32.0, 32.0, 36.0, 31.0, 49.0, 42.0, 49.0, 46.0, 47.0, 36.0, 32.0, 32.0, 54.0, 45.0, 23.0, 22.0, 21.0, 26.0, 29.0, 18.0, 17.0, 15.0, 20.0, 10.0, 9.0, 7.0, 4.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.36328125, -2.29254150390625, -2.2218017578125, -2.15106201171875, -2.080322265625, -2.00958251953125, -1.9388427734375, -1.86810302734375, -1.79736328125, -1.72662353515625, -1.6558837890625, -1.58514404296875, -1.514404296875, -1.44366455078125, -1.3729248046875, -1.30218505859375, -1.2314453125, -1.16070556640625, -1.0899658203125, -1.01922607421875, -0.948486328125, -0.87774658203125, -0.8070068359375, -0.73626708984375, -0.66552734375, -0.59478759765625, -0.5240478515625, -0.45330810546875, -0.382568359375, -0.31182861328125, -0.2410888671875, -0.17034912109375, -0.099609375, -0.02886962890625, 0.0418701171875, 0.11260986328125, 0.183349609375, 0.25408935546875, 0.3248291015625, 0.39556884765625, 0.46630859375, 0.53704833984375, 0.6077880859375, 0.67852783203125, 0.749267578125, 0.82000732421875, 0.8907470703125, 0.96148681640625, 1.0322265625, 1.10296630859375, 1.1737060546875, 1.24444580078125, 1.315185546875, 1.38592529296875, 1.4566650390625, 1.52740478515625, 1.59814453125, 1.66888427734375, 1.7396240234375, 1.81036376953125, 1.881103515625, 1.95184326171875, 2.0225830078125, 2.09332275390625, 2.1640625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 7.0, 12.0, 7.0, 11.0, 8.0, 14.0, 15.0, 22.0, 31.0, 23.0, 36.0, 37.0, 83.0, 98.0, 131.0, 231.0, 640.0, 2543.0, 12839.0, 85243.0, 1174053.0, 2685708.0, 201230.0, 24785.0, 4504.0, 1027.0, 316.0, 176.0, 100.0, 72.0, 60.0, 47.0, 29.0, 20.0, 24.0, 19.0, 18.0, 10.0, 14.0, 5.0, 8.0, 4.0, 5.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-10.5, -10.19287109375, -9.8857421875, -9.57861328125, -9.271484375, -8.96435546875, -8.6572265625, -8.35009765625, -8.04296875, -7.73583984375, -7.4287109375, -7.12158203125, -6.814453125, -6.50732421875, -6.2001953125, -5.89306640625, -5.5859375, -5.27880859375, -4.9716796875, -4.66455078125, -4.357421875, -4.05029296875, -3.7431640625, -3.43603515625, -3.12890625, -2.82177734375, -2.5146484375, -2.20751953125, -1.900390625, -1.59326171875, -1.2861328125, -0.97900390625, -0.671875, -0.36474609375, -0.0576171875, 0.24951171875, 0.556640625, 0.86376953125, 1.1708984375, 1.47802734375, 1.78515625, 2.09228515625, 2.3994140625, 2.70654296875, 3.013671875, 3.32080078125, 3.6279296875, 3.93505859375, 4.2421875, 4.54931640625, 4.8564453125, 5.16357421875, 5.470703125, 5.77783203125, 6.0849609375, 6.39208984375, 6.69921875, 7.00634765625, 7.3134765625, 7.62060546875, 7.927734375, 8.23486328125, 8.5419921875, 8.84912109375, 9.15625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 13.0, 15.0, 18.0, 18.0, 36.0, 49.0, 64.0, 96.0, 146.0, 180.0, 235.0, 359.0, 458.0, 462.0, 498.0, 433.0, 297.0, 199.0, 147.0, 108.0, 62.0, 60.0, 37.0, 21.0, 22.0, 9.0, 10.0, 5.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-10.765625, -10.50750732421875, -10.2493896484375, -9.99127197265625, -9.733154296875, -9.47503662109375, -9.2169189453125, -8.95880126953125, -8.70068359375, -8.44256591796875, -8.1844482421875, -7.92633056640625, -7.668212890625, -7.41009521484375, -7.1519775390625, -6.89385986328125, -6.6357421875, -6.37762451171875, -6.1195068359375, -5.86138916015625, -5.603271484375, -5.34515380859375, -5.0870361328125, -4.82891845703125, -4.57080078125, -4.31268310546875, -4.0545654296875, -3.79644775390625, -3.538330078125, -3.28021240234375, -3.0220947265625, -2.76397705078125, -2.505859375, -2.24774169921875, -1.9896240234375, -1.73150634765625, -1.473388671875, -1.21527099609375, -0.9571533203125, -0.69903564453125, -0.44091796875, -0.18280029296875, 0.0753173828125, 0.33343505859375, 0.591552734375, 0.84967041015625, 1.1077880859375, 1.36590576171875, 1.6240234375, 1.88214111328125, 2.1402587890625, 2.39837646484375, 2.656494140625, 2.91461181640625, 3.1727294921875, 3.43084716796875, 3.68896484375, 3.94708251953125, 4.2052001953125, 4.46331787109375, 4.721435546875, 4.97955322265625, 5.2376708984375, 5.49578857421875, 5.75390625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 10.0, 7.0, 13.0, 12.0, 34.0, 53.0, 64.0, 123.0, 212.0, 381.0, 859.0, 3260.0, 37469.0, 1438805.0, 2640805.0, 65504.0, 4613.0, 964.0, 464.0, 246.0, 151.0, 68.0, 64.0, 41.0, 31.0, 11.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-25.1875, -24.42626953125, -23.6650390625, -22.90380859375, -22.142578125, -21.38134765625, -20.6201171875, -19.85888671875, -19.09765625, -18.33642578125, -17.5751953125, -16.81396484375, -16.052734375, -15.29150390625, -14.5302734375, -13.76904296875, -13.0078125, -12.24658203125, -11.4853515625, -10.72412109375, -9.962890625, -9.20166015625, -8.4404296875, -7.67919921875, -6.91796875, -6.15673828125, -5.3955078125, -4.63427734375, -3.873046875, -3.11181640625, -2.3505859375, -1.58935546875, -0.828125, -0.06689453125, 0.6943359375, 1.45556640625, 2.216796875, 2.97802734375, 3.7392578125, 4.50048828125, 5.26171875, 6.02294921875, 6.7841796875, 7.54541015625, 8.306640625, 9.06787109375, 9.8291015625, 10.59033203125, 11.3515625, 12.11279296875, 12.8740234375, 13.63525390625, 14.396484375, 15.15771484375, 15.9189453125, 16.68017578125, 17.44140625, 18.20263671875, 18.9638671875, 19.72509765625, 20.486328125, 21.24755859375, 22.0087890625, 22.77001953125, 23.53125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 9.0, 33.0, 92.0, 164.0, 225.0, 217.0, 150.0, 76.0, 31.0, 11.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.0709114074707, -55.74771499633789, -53.424522399902344, -51.10132598876953, -48.77812957763672, -46.454933166503906, -44.131736755371094, -41.80854415893555, -39.485347747802734, -37.16215133666992, -34.838958740234375, -32.51576232910156, -30.19256591796875, -27.869369506835938, -25.546175003051758, -23.222980499267578, -20.899784088134766, -18.576587677001953, -16.253393173217773, -13.930197715759277, -11.607002258300781, -9.283806800842285, -6.960611343383789, -4.637416839599609, -2.314220428466797, 0.008975028991699219, 2.3321704864501953, 4.655365943908691, 6.9785614013671875, 9.301756858825684, 11.62495231628418, 13.94814682006836, 16.271347045898438, 18.59454345703125, 20.91773796081543, 23.24093246459961, 25.564128875732422, 27.887325286865234, 30.210519790649414, 32.533714294433594, 34.856910705566406, 37.18010711669922, 39.50330352783203, 41.82649612426758, 44.14969253540039, 46.4728889465332, 48.79608154296875, 51.11927795410156, 53.442474365234375, 55.76567077636719, 58.0888671875, 60.41205978393555, 62.73525619506836, 65.0584487915039, 67.38164520263672, 69.70484161376953, 72.02803802490234, 74.35123443603516, 76.67443084716797, 78.99762725830078, 81.32081604003906, 83.64401245117188, 85.96720886230469, 88.2904052734375, 90.61360168457031]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 4.0, 4.0, 4.0, 10.0, 12.0, 17.0, 13.0, 16.0, 22.0, 11.0, 26.0, 24.0, 33.0, 32.0, 35.0, 33.0, 43.0, 30.0, 49.0, 36.0, 40.0, 53.0, 30.0, 38.0, 40.0, 42.0, 36.0, 31.0, 16.0, 29.0, 17.0, 31.0, 12.0, 17.0, 18.0, 16.0, 16.0, 11.0, 7.0, 8.0, 8.0, 10.0, 5.0, 5.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-24.102630615234375, -23.330764770507812, -22.558897018432617, -21.787031173706055, -21.01516342163086, -20.243297576904297, -19.4714298248291, -18.69956398010254, -17.927696228027344, -17.15583038330078, -16.383962631225586, -15.612095832824707, -14.840229034423828, -14.06836223602295, -13.29649543762207, -12.524629592895508, -11.752762794494629, -10.98089599609375, -10.209029197692871, -9.437162399291992, -8.665295600891113, -7.893428802490234, -7.121562480926514, -6.349695682525635, -5.577828884124756, -4.805962085723877, -4.034095287322998, -3.2622287273406982, -2.4903619289398193, -1.7184951305389404, -0.9466285705566406, -0.17476177215576172, 0.5971050262451172, 1.368971824645996, 2.140838623046875, 2.912705183029175, 3.6845719814300537, 4.456439018249512, 5.228305339813232, 6.000172138214111, 6.77203893661499, 7.543905735015869, 8.31577205657959, 9.087638854980469, 9.859505653381348, 10.631372451782227, 11.403239250183105, 12.175106048583984, 12.946972846984863, 13.718839645385742, 14.490706443786621, 15.2625732421875, 16.034439086914062, 16.806306838989258, 17.57817268371582, 18.350040435791016, 19.121906280517578, 19.89377212524414, 20.665639877319336, 21.4375057220459, 22.209373474121094, 22.981239318847656, 23.75310707092285, 24.524972915649414, 25.29684066772461]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 8.0, 5.0, 8.0, 13.0, 5.0, 19.0, 16.0, 18.0, 27.0, 23.0, 16.0, 29.0, 35.0, 34.0, 29.0, 42.0, 44.0, 54.0, 33.0, 42.0, 49.0, 34.0, 43.0, 42.0, 33.0, 37.0, 29.0, 32.0, 33.0, 29.0, 25.0, 16.0, 20.0, 18.0, 7.0, 15.0, 7.0, 5.0, 7.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.322265625, -2.24658203125, -2.1708984375, -2.09521484375, -2.01953125, -1.94384765625, -1.8681640625, -1.79248046875, -1.716796875, -1.64111328125, -1.5654296875, -1.48974609375, -1.4140625, -1.33837890625, -1.2626953125, -1.18701171875, -1.111328125, -1.03564453125, -0.9599609375, -0.88427734375, -0.80859375, -0.73291015625, -0.6572265625, -0.58154296875, -0.505859375, -0.43017578125, -0.3544921875, -0.27880859375, -0.203125, -0.12744140625, -0.0517578125, 0.02392578125, 0.099609375, 0.17529296875, 0.2509765625, 0.32666015625, 0.40234375, 0.47802734375, 0.5537109375, 0.62939453125, 0.705078125, 0.78076171875, 0.8564453125, 0.93212890625, 1.0078125, 1.08349609375, 1.1591796875, 1.23486328125, 1.310546875, 1.38623046875, 1.4619140625, 1.53759765625, 1.61328125, 1.68896484375, 1.7646484375, 1.84033203125, 1.916015625, 1.99169921875, 2.0673828125, 2.14306640625, 2.21875, 2.29443359375, 2.3701171875, 2.44580078125, 2.521484375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 0.0, 12.0, 14.0, 14.0, 25.0, 28.0, 35.0, 58.0, 71.0, 130.0, 224.0, 296.0, 449.0, 774.0, 1236.0, 2012.0, 3597.0, 6358.0, 11591.0, 21553.0, 40549.0, 75667.0, 135172.0, 208545.0, 216668.0, 144833.0, 81993.0, 44159.0, 23510.0, 12538.0, 6830.0, 3781.0, 2228.0, 1262.0, 817.0, 494.0, 318.0, 238.0, 133.0, 116.0, 70.0, 46.0, 46.0, 14.0, 22.0, 15.0, 6.0, 6.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.296142578125, -0.28629302978515625, -0.2764434814453125, -0.26659393310546875, -0.256744384765625, -0.24689483642578125, -0.2370452880859375, -0.22719573974609375, -0.21734619140625, -0.20749664306640625, -0.1976470947265625, -0.18779754638671875, -0.177947998046875, -0.16809844970703125, -0.1582489013671875, -0.14839935302734375, -0.1385498046875, -0.12870025634765625, -0.1188507080078125, -0.10900115966796875, -0.099151611328125, -0.08930206298828125, -0.0794525146484375, -0.06960296630859375, -0.05975341796875, -0.04990386962890625, -0.0400543212890625, -0.03020477294921875, -0.020355224609375, -0.01050567626953125, -0.0006561279296875, 0.00919342041015625, 0.01904296875, 0.02889251708984375, 0.0387420654296875, 0.04859161376953125, 0.058441162109375, 0.06829071044921875, 0.0781402587890625, 0.08798980712890625, 0.09783935546875, 0.10768890380859375, 0.1175384521484375, 0.12738800048828125, 0.137237548828125, 0.14708709716796875, 0.1569366455078125, 0.16678619384765625, 0.1766357421875, 0.18648529052734375, 0.1963348388671875, 0.20618438720703125, 0.216033935546875, 0.22588348388671875, 0.2357330322265625, 0.24558258056640625, 0.25543212890625, 0.26528167724609375, 0.2751312255859375, 0.28498077392578125, 0.294830322265625, 0.30467987060546875, 0.3145294189453125, 0.32437896728515625, 0.334228515625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 6.0, 9.0, 6.0, 10.0, 11.0, 15.0, 18.0, 26.0, 23.0, 30.0, 33.0, 19.0, 30.0, 32.0, 36.0, 29.0, 35.0, 31.0, 44.0, 1063.0, 41.0, 32.0, 43.0, 29.0, 40.0, 36.0, 50.0, 29.0, 33.0, 21.0, 22.0, 28.0, 17.0, 15.0, 12.0, 14.0, 10.0, 11.0, 11.0, 2.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.5537109375, -1.5048370361328125, -1.455963134765625, -1.4070892333984375, -1.35821533203125, -1.3093414306640625, -1.260467529296875, -1.2115936279296875, -1.1627197265625, -1.1138458251953125, -1.064971923828125, -1.0160980224609375, -0.96722412109375, -0.9183502197265625, -0.869476318359375, -0.8206024169921875, -0.771728515625, -0.7228546142578125, -0.673980712890625, -0.6251068115234375, -0.57623291015625, -0.5273590087890625, -0.478485107421875, -0.4296112060546875, -0.3807373046875, -0.3318634033203125, -0.282989501953125, -0.2341156005859375, -0.18524169921875, -0.1363677978515625, -0.087493896484375, -0.0386199951171875, 0.01025390625, 0.0591278076171875, 0.108001708984375, 0.1568756103515625, 0.20574951171875, 0.2546234130859375, 0.303497314453125, 0.3523712158203125, 0.4012451171875, 0.4501190185546875, 0.498992919921875, 0.5478668212890625, 0.59674072265625, 0.6456146240234375, 0.694488525390625, 0.7433624267578125, 0.792236328125, 0.8411102294921875, 0.889984130859375, 0.9388580322265625, 0.98773193359375, 1.0366058349609375, 1.085479736328125, 1.1343536376953125, 1.1832275390625, 1.2321014404296875, 1.280975341796875, 1.3298492431640625, 1.37872314453125, 1.4275970458984375, 1.476470947265625, 1.5253448486328125, 1.57421875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [8.0, 2.0, 5.0, 5.0, 12.0, 8.0, 16.0, 26.0, 29.0, 53.0, 67.0, 105.0, 148.0, 205.0, 326.0, 423.0, 634.0, 941.0, 1378.0, 1960.0, 2970.0, 4360.0, 6729.0, 9863.0, 15002.0, 21922.0, 32562.0, 47649.0, 68087.0, 91808.0, 123754.0, 1031802.0, 255653.0, 109352.0, 82323.0, 59437.0, 41300.0, 28192.0, 19019.0, 12817.0, 8563.0, 5684.0, 3822.0, 2590.0, 1740.0, 1183.0, 814.0, 550.0, 375.0, 275.0, 172.0, 136.0, 106.0, 64.0, 29.0, 34.0, 16.0, 10.0, 12.0, 4.0, 6.0, 10.0, 4.0, 1.0], "bins": [-0.1214599609375, -0.11764144897460938, -0.11382293701171875, -0.11000442504882812, -0.1061859130859375, -0.10236740112304688, -0.09854888916015625, -0.09473037719726562, -0.090911865234375, -0.08709335327148438, -0.08327484130859375, -0.07945632934570312, -0.0756378173828125, -0.07181930541992188, -0.06800079345703125, -0.06418228149414062, -0.06036376953125, -0.056545257568359375, -0.05272674560546875, -0.048908233642578125, -0.0450897216796875, -0.041271209716796875, -0.03745269775390625, -0.033634185791015625, -0.029815673828125, -0.025997161865234375, -0.02217864990234375, -0.018360137939453125, -0.0145416259765625, -0.010723114013671875, -0.00690460205078125, -0.003086090087890625, 0.000732421875, 0.004550933837890625, 0.00836944580078125, 0.012187957763671875, 0.0160064697265625, 0.019824981689453125, 0.02364349365234375, 0.027462005615234375, 0.031280517578125, 0.035099029541015625, 0.03891754150390625, 0.042736053466796875, 0.0465545654296875, 0.050373077392578125, 0.05419158935546875, 0.058010101318359375, 0.06182861328125, 0.06564712524414062, 0.06946563720703125, 0.07328414916992188, 0.0771026611328125, 0.08092117309570312, 0.08473968505859375, 0.08855819702148438, 0.092376708984375, 0.09619522094726562, 0.10001373291015625, 0.10383224487304688, 0.1076507568359375, 0.11146926879882812, 0.11528778076171875, 0.11910629272460938, 0.1229248046875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 5.0, 7.0, 7.0, 17.0, 18.0, 19.0, 30.0, 39.0, 36.0, 85.0, 192.0, 207.0, 117.0, 60.0, 42.0, 24.0, 20.0, 15.0, 10.0, 8.0, 14.0, 6.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02410888671875, -0.02331066131591797, -0.022512435913085938, -0.021714210510253906, -0.020915985107421875, -0.020117759704589844, -0.019319534301757812, -0.01852130889892578, -0.01772308349609375, -0.01692485809326172, -0.016126632690429688, -0.015328407287597656, -0.014530181884765625, -0.013731956481933594, -0.012933731079101562, -0.012135505676269531, -0.0113372802734375, -0.010539054870605469, -0.009740829467773438, -0.008942604064941406, -0.008144378662109375, -0.007346153259277344, -0.0065479278564453125, -0.005749702453613281, -0.00495147705078125, -0.004153251647949219, -0.0033550262451171875, -0.0025568008422851562, -0.001758575439453125, -0.0009603500366210938, -0.0001621246337890625, 0.0006361007690429688, 0.001434326171875, 0.0022325515747070312, 0.0030307769775390625, 0.0038290023803710938, 0.004627227783203125, 0.005425453186035156, 0.0062236785888671875, 0.007021903991699219, 0.00782012939453125, 0.008618354797363281, 0.009416580200195312, 0.010214805603027344, 0.011013031005859375, 0.011811256408691406, 0.012609481811523438, 0.013407707214355469, 0.0142059326171875, 0.015004158020019531, 0.015802383422851562, 0.016600608825683594, 0.017398834228515625, 0.018197059631347656, 0.018995285034179688, 0.01979351043701172, 0.02059173583984375, 0.02138996124267578, 0.022188186645507812, 0.022986412048339844, 0.023784637451171875, 0.024582862854003906, 0.025381088256835938, 0.02617931365966797, 0.0269775390625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 6.0, 9.0, 9.0, 18.0, 23.0, 32.0, 49.0, 83.0, 102.0, 142.0, 253.0, 630.0, 3947.0, 133412.0, 900243.0, 7671.0, 1072.0, 313.0, 139.0, 128.0, 67.0, 45.0, 38.0, 23.0, 15.0, 12.0, 16.0, 11.0, 6.0, 4.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.364013671875, -0.35193634033203125, -0.3398590087890625, -0.32778167724609375, -0.315704345703125, -0.30362701416015625, -0.2915496826171875, -0.27947235107421875, -0.26739501953125, -0.25531768798828125, -0.2432403564453125, -0.23116302490234375, -0.219085693359375, -0.20700836181640625, -0.1949310302734375, -0.18285369873046875, -0.1707763671875, -0.15869903564453125, -0.1466217041015625, -0.13454437255859375, -0.122467041015625, -0.11038970947265625, -0.0983123779296875, -0.08623504638671875, -0.07415771484375, -0.06208038330078125, -0.0500030517578125, -0.03792572021484375, -0.025848388671875, -0.01377105712890625, -0.0016937255859375, 0.01038360595703125, 0.0224609375, 0.03453826904296875, 0.0466156005859375, 0.05869293212890625, 0.070770263671875, 0.08284759521484375, 0.0949249267578125, 0.10700225830078125, 0.11907958984375, 0.13115692138671875, 0.1432342529296875, 0.15531158447265625, 0.167388916015625, 0.17946624755859375, 0.1915435791015625, 0.20362091064453125, 0.2156982421875, 0.22777557373046875, 0.2398529052734375, 0.25193023681640625, 0.264007568359375, 0.27608489990234375, 0.2881622314453125, 0.30023956298828125, 0.31231689453125, 0.32439422607421875, 0.3364715576171875, 0.34854888916015625, 0.360626220703125, 0.37270355224609375, 0.3847808837890625, 0.39685821533203125, 0.408935546875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 21.0, 36.0, 86.0, 278.0, 419.0, 117.0, 35.0, 11.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23239365220069885, -0.2279408872127533, -0.22348812222480774, -0.21903537213802338, -0.21458260715007782, -0.21012984216213226, -0.2056770920753479, -0.20122432708740234, -0.1967715620994568, -0.19231879711151123, -0.18786603212356567, -0.1834132820367813, -0.17896051704883575, -0.1745077520608902, -0.17005500197410583, -0.16560223698616028, -0.16114947199821472, -0.15669670701026917, -0.1522439420223236, -0.14779119193553925, -0.1433384269475937, -0.13888566195964813, -0.13443291187286377, -0.1299801468849182, -0.12552738189697266, -0.1210746169090271, -0.11662185937166214, -0.11216910183429718, -0.10771633684635162, -0.10326357185840607, -0.09881081432104111, -0.09435805678367615, -0.08990529179573059, -0.08545252680778503, -0.08099976927042007, -0.07654701173305511, -0.07209424674510956, -0.067641481757164, -0.06318872421979904, -0.058735962957143784, -0.054283205419778824, -0.049830444157123566, -0.04537768289446831, -0.04092492163181305, -0.03647216036915779, -0.03201939910650253, -0.027566637843847275, -0.023113876581192017, -0.01866111531853676, -0.0142083540558815, -0.009755592793226242, -0.005302831530570984, -0.0008500702679157257, 0.0036026909947395325, 0.00805545225739479, 0.012508213520050049, 0.016960974782705307, 0.021413736045360565, 0.025866497308015823, 0.03031925857067108, 0.03477201983332634, 0.0392247810959816, 0.043677542358636856, 0.048130303621292114, 0.05258306488394737]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 8.0, 8.0, 12.0, 5.0, 12.0, 15.0, 19.0, 17.0, 17.0, 19.0, 35.0, 35.0, 31.0, 41.0, 34.0, 46.0, 46.0, 38.0, 39.0, 39.0, 42.0, 41.0, 41.0, 57.0, 37.0, 34.0, 37.0, 27.0, 23.0, 29.0, 20.0, 16.0, 12.0, 18.0, 10.0, 6.0, 7.0, 10.0, 3.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.026595473289489746, -0.025811992585659027, -0.02502851001918316, -0.02424502745270729, -0.02346154674887657, -0.022678066045045853, -0.021894583478569984, -0.021111100912094116, -0.020327620208263397, -0.019544139504432678, -0.01876065693795681, -0.017977174371480942, -0.017193693667650223, -0.016410212963819504, -0.015626730397343636, -0.014843248762190342, -0.014059767127037048, -0.013276285491883755, -0.012492803856730461, -0.011709322221577168, -0.010925840586423874, -0.01014235895127058, -0.009358877316117287, -0.008575395680963993, -0.0077919140458106995, -0.007008432410657406, -0.006224950775504112, -0.005441469140350819, -0.004657987505197525, -0.0038745058700442314, -0.003091024234890938, -0.002307542599737644, -0.0015240609645843506, -0.000740579329431057, 4.290230572223663e-05, 0.0008263839408755302, 0.0016098655760288239, 0.0023933472111821175, 0.003176828846335411, 0.003960310481488705, 0.004743792116641998, 0.005527273751795292, 0.0063107553869485855, 0.007094237022101879, 0.007877718657255173, 0.008661200292408466, 0.00944468192756176, 0.010228163562715054, 0.011011645197868347, 0.01179512683302164, 0.012578608468174934, 0.013362090103328228, 0.014145571738481522, 0.014929053373634815, 0.01571253500878811, 0.016496017575263977, 0.017279498279094696, 0.018062978982925415, 0.018846461549401283, 0.01962994411587715, 0.02041342481970787, 0.02119690552353859, 0.021980388090014458, 0.022763870656490326, 0.023547351360321045]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 8.0, 5.0, 9.0, 12.0, 5.0, 20.0, 15.0, 19.0, 26.0, 24.0, 15.0, 29.0, 35.0, 36.0, 27.0, 44.0, 43.0, 53.0, 33.0, 42.0, 50.0, 35.0, 41.0, 42.0, 33.0, 37.0, 29.0, 33.0, 32.0, 29.0, 25.0, 17.0, 20.0, 17.0, 7.0, 15.0, 7.0, 5.0, 7.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3203125, -2.244659423828125, -2.16900634765625, -2.093353271484375, -2.0177001953125, -1.942047119140625, -1.86639404296875, -1.790740966796875, -1.715087890625, -1.639434814453125, -1.56378173828125, -1.488128662109375, -1.4124755859375, -1.336822509765625, -1.26116943359375, -1.185516357421875, -1.10986328125, -1.034210205078125, -0.95855712890625, -0.882904052734375, -0.8072509765625, -0.731597900390625, -0.65594482421875, -0.580291748046875, -0.504638671875, -0.428985595703125, -0.35333251953125, -0.277679443359375, -0.2020263671875, -0.126373291015625, -0.05072021484375, 0.024932861328125, 0.1005859375, 0.176239013671875, 0.25189208984375, 0.327545166015625, 0.4031982421875, 0.478851318359375, 0.55450439453125, 0.630157470703125, 0.705810546875, 0.781463623046875, 0.85711669921875, 0.932769775390625, 1.0084228515625, 1.084075927734375, 1.15972900390625, 1.235382080078125, 1.31103515625, 1.386688232421875, 1.46234130859375, 1.537994384765625, 1.6136474609375, 1.689300537109375, 1.76495361328125, 1.840606689453125, 1.916259765625, 1.991912841796875, 2.06756591796875, 2.143218994140625, 2.2188720703125, 2.294525146484375, 2.37017822265625, 2.445831298828125, 2.521484375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 6.0, 7.0, 19.0, 28.0, 40.0, 57.0, 74.0, 152.0, 226.0, 435.0, 768.0, 1346.0, 2499.0, 4769.0, 9164.0, 19646.0, 47151.0, 146020.0, 437697.0, 252319.0, 72424.0, 27687.0, 12506.0, 6174.0, 3249.0, 1752.0, 970.0, 547.0, 323.0, 179.0, 115.0, 72.0, 50.0, 21.0, 16.0, 10.0, 9.0, 4.0, 8.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.177734375, -2.113128662109375, -2.04852294921875, -1.983917236328125, -1.9193115234375, -1.854705810546875, -1.79010009765625, -1.725494384765625, -1.660888671875, -1.596282958984375, -1.53167724609375, -1.467071533203125, -1.4024658203125, -1.337860107421875, -1.27325439453125, -1.208648681640625, -1.14404296875, -1.079437255859375, -1.01483154296875, -0.950225830078125, -0.8856201171875, -0.821014404296875, -0.75640869140625, -0.691802978515625, -0.627197265625, -0.562591552734375, -0.49798583984375, -0.433380126953125, -0.3687744140625, -0.304168701171875, -0.23956298828125, -0.174957275390625, -0.1103515625, -0.045745849609375, 0.01885986328125, 0.083465576171875, 0.1480712890625, 0.212677001953125, 0.27728271484375, 0.341888427734375, 0.406494140625, 0.471099853515625, 0.53570556640625, 0.600311279296875, 0.6649169921875, 0.729522705078125, 0.79412841796875, 0.858734130859375, 0.92333984375, 0.987945556640625, 1.05255126953125, 1.117156982421875, 1.1817626953125, 1.246368408203125, 1.31097412109375, 1.375579833984375, 1.440185546875, 1.504791259765625, 1.56939697265625, 1.634002685546875, 1.6986083984375, 1.763214111328125, 1.82781982421875, 1.892425537109375, 1.95703125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 14.0, 10.0, 14.0, 17.0, 15.0, 14.0, 12.0, 24.0, 38.0, 36.0, 38.0, 39.0, 37.0, 52.0, 58.0, 107.0, 310.0, 1637.0, 122.0, 71.0, 41.0, 48.0, 50.0, 41.0, 33.0, 26.0, 25.0, 22.0, 24.0, 9.0, 16.0, 11.0, 9.0, 4.0, 4.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.421875, -8.142822265625, -7.86376953125, -7.584716796875, -7.3056640625, -7.026611328125, -6.74755859375, -6.468505859375, -6.189453125, -5.910400390625, -5.63134765625, -5.352294921875, -5.0732421875, -4.794189453125, -4.51513671875, -4.236083984375, -3.95703125, -3.677978515625, -3.39892578125, -3.119873046875, -2.8408203125, -2.561767578125, -2.28271484375, -2.003662109375, -1.724609375, -1.445556640625, -1.16650390625, -0.887451171875, -0.6083984375, -0.329345703125, -0.05029296875, 0.228759765625, 0.5078125, 0.786865234375, 1.06591796875, 1.344970703125, 1.6240234375, 1.903076171875, 2.18212890625, 2.461181640625, 2.740234375, 3.019287109375, 3.29833984375, 3.577392578125, 3.8564453125, 4.135498046875, 4.41455078125, 4.693603515625, 4.97265625, 5.251708984375, 5.53076171875, 5.809814453125, 6.0888671875, 6.367919921875, 6.64697265625, 6.926025390625, 7.205078125, 7.484130859375, 7.76318359375, 8.042236328125, 8.3212890625, 8.600341796875, 8.87939453125, 9.158447265625, 9.4375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 6.0, 8.0, 12.0, 16.0, 13.0, 28.0, 33.0, 26.0, 46.0, 61.0, 117.0, 167.0, 340.0, 737.0, 2079.0, 10937.0, 269908.0, 2828395.0, 26871.0, 3634.0, 1155.0, 440.0, 214.0, 123.0, 86.0, 56.0, 45.0, 29.0, 13.0, 21.0, 16.0, 18.0, 8.0, 16.0, 10.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6484375, -14.2071533203125, -13.765869140625, -13.3245849609375, -12.88330078125, -12.4420166015625, -12.000732421875, -11.5594482421875, -11.1181640625, -10.6768798828125, -10.235595703125, -9.7943115234375, -9.35302734375, -8.9117431640625, -8.470458984375, -8.0291748046875, -7.587890625, -7.1466064453125, -6.705322265625, -6.2640380859375, -5.82275390625, -5.3814697265625, -4.940185546875, -4.4989013671875, -4.0576171875, -3.6163330078125, -3.175048828125, -2.7337646484375, -2.29248046875, -1.8511962890625, -1.409912109375, -0.9686279296875, -0.52734375, -0.0860595703125, 0.355224609375, 0.7965087890625, 1.23779296875, 1.6790771484375, 2.120361328125, 2.5616455078125, 3.0029296875, 3.4442138671875, 3.885498046875, 4.3267822265625, 4.76806640625, 5.2093505859375, 5.650634765625, 6.0919189453125, 6.533203125, 6.9744873046875, 7.415771484375, 7.8570556640625, 8.29833984375, 8.7396240234375, 9.180908203125, 9.6221923828125, 10.0634765625, 10.5047607421875, 10.946044921875, 11.3873291015625, 11.82861328125, 12.2698974609375, 12.711181640625, 13.1524658203125, 13.59375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [58.0, 813.0, 148.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.236794471740723, -2.011749029159546, 1.2132964134216309, 4.438342094421387, 7.663387298583984, 10.888432502746582, 14.113478660583496, 17.338523864746094, 20.563568115234375, 23.78861427307129, 27.01365852355957, 30.238704681396484, 33.463748931884766, 36.68879699707031, 39.913841247558594, 43.138885498046875, 46.36393356323242, 49.5889778137207, 52.81402587890625, 56.03907012939453, 59.26411437988281, 62.489158630371094, 65.71420288085938, 68.93925476074219, 72.16429901123047, 75.38934326171875, 78.61438751220703, 81.83943176269531, 85.06448364257812, 88.2895278930664, 91.51457214355469, 94.73961639404297, 97.96465301513672, 101.189697265625, 104.41474151611328, 107.63978576660156, 110.86483764648438, 114.08988189697266, 117.31492614746094, 120.53997039794922, 123.7650146484375, 126.99005889892578, 130.21510314941406, 133.44015502929688, 136.66519165039062, 139.89024353027344, 143.11529541015625, 146.34033203125, 149.5653839111328, 152.79043579101562, 156.01547241210938, 159.2405242919922, 162.46556091308594, 165.69061279296875, 168.9156494140625, 172.1407012939453, 175.36573791503906, 178.59078979492188, 181.81582641601562, 185.04087829589844, 188.2659149169922, 191.490966796875, 194.71600341796875, 197.94105529785156, 201.16610717773438]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 6.0, 10.0, 10.0, 7.0, 5.0, 12.0, 20.0, 20.0, 12.0, 24.0, 31.0, 24.0, 26.0, 21.0, 28.0, 40.0, 39.0, 37.0, 44.0, 32.0, 59.0, 49.0, 53.0, 42.0, 36.0, 41.0, 30.0, 21.0, 24.0, 27.0, 24.0, 19.0, 26.0, 21.0, 10.0, 17.0, 8.0, 6.0, 10.0, 6.0, 6.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-24.72364616394043, -23.941390991210938, -23.159137725830078, -22.376882553100586, -21.594629287719727, -20.812374114990234, -20.030120849609375, -19.247865676879883, -18.46561050415039, -17.6833553314209, -16.90110206604004, -16.118846893310547, -15.336593627929688, -14.554338455200195, -13.77208423614502, -12.989830017089844, -12.207576751708984, -11.425322532653809, -10.643068313598633, -9.86081314086914, -9.078559875488281, -8.296304702758789, -7.514050483703613, -6.7317962646484375, -5.949542045593262, -5.167287826538086, -4.38503360748291, -3.602778911590576, -2.8205246925354004, -2.0382704734802246, -1.2560157775878906, -0.47376155853271484, 0.3084907531738281, 1.0907450914382935, 1.8729994297027588, 2.6552538871765137, 3.4375081062316895, 4.219762325286865, 5.002017021179199, 5.784271240234375, 6.566525459289551, 7.348779678344727, 8.131033897399902, 8.913288116455078, 9.69554328918457, 10.47779655456543, 11.260051727294922, 12.042305946350098, 12.824560165405273, 13.60681438446045, 14.389068603515625, 15.171323776245117, 15.953577041625977, 16.73583221435547, 17.518085479736328, 18.30034065246582, 19.082595825195312, 19.864850997924805, 20.647104263305664, 21.429359436035156, 22.211612701416016, 22.993867874145508, 23.776123046875, 24.55837631225586, 25.34062957763672]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 8.0, 5.0, 8.0, 11.0, 7.0, 12.0, 15.0, 23.0, 21.0, 23.0, 16.0, 20.0, 31.0, 42.0, 35.0, 36.0, 39.0, 52.0, 35.0, 50.0, 47.0, 36.0, 54.0, 48.0, 23.0, 39.0, 30.0, 37.0, 27.0, 29.0, 25.0, 22.0, 19.0, 17.0, 8.0, 14.0, 12.0, 6.0, 7.0, 1.0, 11.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.474609375, -2.395263671875, -2.31591796875, -2.236572265625, -2.1572265625, -2.077880859375, -1.99853515625, -1.919189453125, -1.83984375, -1.760498046875, -1.68115234375, -1.601806640625, -1.5224609375, -1.443115234375, -1.36376953125, -1.284423828125, -1.205078125, -1.125732421875, -1.04638671875, -0.967041015625, -0.8876953125, -0.808349609375, -0.72900390625, -0.649658203125, -0.5703125, -0.490966796875, -0.41162109375, -0.332275390625, -0.2529296875, -0.173583984375, -0.09423828125, -0.014892578125, 0.064453125, 0.143798828125, 0.22314453125, 0.302490234375, 0.3818359375, 0.461181640625, 0.54052734375, 0.619873046875, 0.69921875, 0.778564453125, 0.85791015625, 0.937255859375, 1.0166015625, 1.095947265625, 1.17529296875, 1.254638671875, 1.333984375, 1.413330078125, 1.49267578125, 1.572021484375, 1.6513671875, 1.730712890625, 1.81005859375, 1.889404296875, 1.96875, 2.048095703125, 2.12744140625, 2.206787109375, 2.2861328125, 2.365478515625, 2.44482421875, 2.524169921875, 2.603515625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 9.0, 8.0, 10.0, 10.0, 22.0, 30.0, 38.0, 70.0, 89.0, 157.0, 311.0, 632.0, 1368.0, 3724.0, 9869.0, 29048.0, 95279.0, 402491.0, 1883522.0, 1392218.0, 270645.0, 69992.0, 22017.0, 7617.0, 2786.0, 1132.0, 547.0, 232.0, 147.0, 76.0, 46.0, 35.0, 27.0, 24.0, 11.0, 9.0, 7.0, 9.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.66015625, -5.48797607421875, -5.3157958984375, -5.14361572265625, -4.971435546875, -4.79925537109375, -4.6270751953125, -4.45489501953125, -4.28271484375, -4.11053466796875, -3.9383544921875, -3.76617431640625, -3.593994140625, -3.42181396484375, -3.2496337890625, -3.07745361328125, -2.9052734375, -2.73309326171875, -2.5609130859375, -2.38873291015625, -2.216552734375, -2.04437255859375, -1.8721923828125, -1.70001220703125, -1.52783203125, -1.35565185546875, -1.1834716796875, -1.01129150390625, -0.839111328125, -0.66693115234375, -0.4947509765625, -0.32257080078125, -0.150390625, 0.02178955078125, 0.1939697265625, 0.36614990234375, 0.538330078125, 0.71051025390625, 0.8826904296875, 1.05487060546875, 1.22705078125, 1.39923095703125, 1.5714111328125, 1.74359130859375, 1.915771484375, 2.08795166015625, 2.2601318359375, 2.43231201171875, 2.6044921875, 2.77667236328125, 2.9488525390625, 3.12103271484375, 3.293212890625, 3.46539306640625, 3.6375732421875, 3.80975341796875, 3.98193359375, 4.15411376953125, 4.3262939453125, 4.49847412109375, 4.670654296875, 4.84283447265625, 5.0150146484375, 5.18719482421875, 5.359375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 13.0, 13.0, 21.0, 33.0, 55.0, 83.0, 146.0, 208.0, 337.0, 479.0, 677.0, 656.0, 450.0, 347.0, 204.0, 131.0, 83.0, 54.0, 21.0, 28.0, 10.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6171875, -11.263916015625, -10.91064453125, -10.557373046875, -10.2041015625, -9.850830078125, -9.49755859375, -9.144287109375, -8.791015625, -8.437744140625, -8.08447265625, -7.731201171875, -7.3779296875, -7.024658203125, -6.67138671875, -6.318115234375, -5.96484375, -5.611572265625, -5.25830078125, -4.905029296875, -4.5517578125, -4.198486328125, -3.84521484375, -3.491943359375, -3.138671875, -2.785400390625, -2.43212890625, -2.078857421875, -1.7255859375, -1.372314453125, -1.01904296875, -0.665771484375, -0.3125, 0.040771484375, 0.39404296875, 0.747314453125, 1.1005859375, 1.453857421875, 1.80712890625, 2.160400390625, 2.513671875, 2.866943359375, 3.22021484375, 3.573486328125, 3.9267578125, 4.280029296875, 4.63330078125, 4.986572265625, 5.33984375, 5.693115234375, 6.04638671875, 6.399658203125, 6.7529296875, 7.106201171875, 7.45947265625, 7.812744140625, 8.166015625, 8.519287109375, 8.87255859375, 9.225830078125, 9.5791015625, 9.932373046875, 10.28564453125, 10.638916015625, 10.9921875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 12.0, 14.0, 13.0, 21.0, 31.0, 43.0, 48.0, 72.0, 119.0, 184.0, 369.0, 594.0, 1315.0, 4420.0, 34572.0, 567870.0, 3276895.0, 282310.0, 19805.0, 3134.0, 1072.0, 554.0, 305.0, 161.0, 108.0, 72.0, 45.0, 32.0, 21.0, 19.0, 19.0, 10.0, 6.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.140625, -18.53076171875, -17.9208984375, -17.31103515625, -16.701171875, -16.09130859375, -15.4814453125, -14.87158203125, -14.26171875, -13.65185546875, -13.0419921875, -12.43212890625, -11.822265625, -11.21240234375, -10.6025390625, -9.99267578125, -9.3828125, -8.77294921875, -8.1630859375, -7.55322265625, -6.943359375, -6.33349609375, -5.7236328125, -5.11376953125, -4.50390625, -3.89404296875, -3.2841796875, -2.67431640625, -2.064453125, -1.45458984375, -0.8447265625, -0.23486328125, 0.375, 0.98486328125, 1.5947265625, 2.20458984375, 2.814453125, 3.42431640625, 4.0341796875, 4.64404296875, 5.25390625, 5.86376953125, 6.4736328125, 7.08349609375, 7.693359375, 8.30322265625, 8.9130859375, 9.52294921875, 10.1328125, 10.74267578125, 11.3525390625, 11.96240234375, 12.572265625, 13.18212890625, 13.7919921875, 14.40185546875, 15.01171875, 15.62158203125, 16.2314453125, 16.84130859375, 17.451171875, 18.06103515625, 18.6708984375, 19.28076171875, 19.890625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 10.0, 21.0, 49.0, 103.0, 185.0, 210.0, 228.0, 120.0, 59.0, 20.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.66728210449219, -113.12980651855469, -110.59233093261719, -108.05485534667969, -105.51737976074219, -102.97990417480469, -100.44242858886719, -97.90495300292969, -95.36747741699219, -92.83000183105469, -90.29252624511719, -87.75505065917969, -85.21757507324219, -82.68009948730469, -80.14262390136719, -77.60514831542969, -75.06767272949219, -72.53019714355469, -69.99272155761719, -67.45524597167969, -64.91777038574219, -62.38029479980469, -59.84281921386719, -57.30534362792969, -54.76787567138672, -52.23040008544922, -49.69292449951172, -47.15544891357422, -44.61797332763672, -42.08049774169922, -39.54302215576172, -37.00554656982422, -34.46806716918945, -31.930591583251953, -29.393115997314453, -26.855640411376953, -24.318164825439453, -21.780689239501953, -19.243215560913086, -16.705739974975586, -14.168264389038086, -11.630788803100586, -9.093313217163086, -6.555838584899902, -4.018362998962402, -1.4808874130249023, 1.0565872192382812, 3.5940628051757812, 6.131538391113281, 8.669013977050781, 11.206489562988281, 13.743964195251465, 16.28144073486328, 18.81891632080078, 21.35638999938965, 23.89386558532715, 26.43134117126465, 28.96881675720215, 31.50629234313965, 34.043766021728516, 36.581241607666016, 39.118717193603516, 41.656192779541016, 44.193668365478516, 46.731143951416016]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 1.0, 3.0, 8.0, 5.0, 8.0, 8.0, 8.0, 10.0, 17.0, 19.0, 19.0, 17.0, 29.0, 26.0, 35.0, 29.0, 30.0, 39.0, 32.0, 46.0, 40.0, 40.0, 33.0, 41.0, 34.0, 46.0, 31.0, 32.0, 36.0, 25.0, 27.0, 27.0, 39.0, 22.0, 21.0, 16.0, 19.0, 17.0, 15.0, 14.0, 7.0, 9.0, 7.0, 4.0, 4.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-26.786483764648438, -25.994264602661133, -25.202043533325195, -24.40982437133789, -23.617603302001953, -22.82538414001465, -22.033164978027344, -21.240943908691406, -20.4487247467041, -19.656505584716797, -18.86428451538086, -18.072065353393555, -17.27984619140625, -16.487625122070312, -15.695405960083008, -14.903185844421387, -14.110965728759766, -13.318745613098145, -12.526525497436523, -11.734306335449219, -10.942086219787598, -10.149866104125977, -9.357646942138672, -8.56542682647705, -7.77320671081543, -6.980986595153809, -6.188766956329346, -5.396547317504883, -4.604327201843262, -3.8121073246002197, -3.0198874473571777, -2.227667808532715, -1.4354476928710938, -0.6432278156280518, 0.14899206161499023, 0.9412119388580322, 1.7334318161010742, 2.525651693344116, 3.317871570587158, 4.110091209411621, 4.902311325073242, 5.694531440734863, 6.486751079559326, 7.278970718383789, 8.07119083404541, 8.863410949707031, 9.655630111694336, 10.447850227355957, 11.240070343017578, 12.0322904586792, 12.82451057434082, 13.616729736328125, 14.408949851989746, 15.201169967651367, 15.993389129638672, 16.78561019897461, 17.577829360961914, 18.37004852294922, 19.162269592285156, 19.95448875427246, 20.746707916259766, 21.538928985595703, 22.331148147583008, 23.123367309570312, 23.91558837890625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 8.0, 7.0, 7.0, 2.0, 9.0, 8.0, 17.0, 15.0, 17.0, 24.0, 23.0, 28.0, 33.0, 27.0, 42.0, 32.0, 41.0, 52.0, 44.0, 43.0, 56.0, 39.0, 53.0, 43.0, 45.0, 37.0, 41.0, 24.0, 21.0, 27.0, 22.0, 19.0, 18.0, 18.0, 16.0, 16.0, 8.0, 10.0, 4.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4765625, -2.388671875, -2.30078125, -2.212890625, -2.125, -2.037109375, -1.94921875, -1.861328125, -1.7734375, -1.685546875, -1.59765625, -1.509765625, -1.421875, -1.333984375, -1.24609375, -1.158203125, -1.0703125, -0.982421875, -0.89453125, -0.806640625, -0.71875, -0.630859375, -0.54296875, -0.455078125, -0.3671875, -0.279296875, -0.19140625, -0.103515625, -0.015625, 0.072265625, 0.16015625, 0.248046875, 0.3359375, 0.423828125, 0.51171875, 0.599609375, 0.6875, 0.775390625, 0.86328125, 0.951171875, 1.0390625, 1.126953125, 1.21484375, 1.302734375, 1.390625, 1.478515625, 1.56640625, 1.654296875, 1.7421875, 1.830078125, 1.91796875, 2.005859375, 2.09375, 2.181640625, 2.26953125, 2.357421875, 2.4453125, 2.533203125, 2.62109375, 2.708984375, 2.796875, 2.884765625, 2.97265625, 3.060546875, 3.1484375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 6.0, 17.0, 18.0, 21.0, 34.0, 39.0, 75.0, 109.0, 147.0, 190.0, 342.0, 494.0, 747.0, 1302.0, 2126.0, 3620.0, 6382.0, 10831.0, 19312.0, 33285.0, 58031.0, 96771.0, 152077.0, 199700.0, 174925.0, 117629.0, 71784.0, 41786.0, 23835.0, 13599.0, 7955.0, 4561.0, 2555.0, 1573.0, 1017.0, 573.0, 359.0, 218.0, 143.0, 123.0, 64.0, 43.0, 48.0, 25.0, 21.0, 9.0, 13.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.283203125, -0.27426910400390625, -0.2653350830078125, -0.25640106201171875, -0.247467041015625, -0.23853302001953125, -0.2295989990234375, -0.22066497802734375, -0.21173095703125, -0.20279693603515625, -0.1938629150390625, -0.18492889404296875, -0.175994873046875, -0.16706085205078125, -0.1581268310546875, -0.14919281005859375, -0.1402587890625, -0.13132476806640625, -0.1223907470703125, -0.11345672607421875, -0.104522705078125, -0.09558868408203125, -0.0866546630859375, -0.07772064208984375, -0.06878662109375, -0.05985260009765625, -0.0509185791015625, -0.04198455810546875, -0.033050537109375, -0.02411651611328125, -0.0151824951171875, -0.00624847412109375, 0.002685546875, 0.01161956787109375, 0.0205535888671875, 0.02948760986328125, 0.038421630859375, 0.04735565185546875, 0.0562896728515625, 0.06522369384765625, 0.07415771484375, 0.08309173583984375, 0.0920257568359375, 0.10095977783203125, 0.109893798828125, 0.11882781982421875, 0.1277618408203125, 0.13669586181640625, 0.1456298828125, 0.15456390380859375, 0.1634979248046875, 0.17243194580078125, 0.181365966796875, 0.19029998779296875, 0.1992340087890625, 0.20816802978515625, 0.21710205078125, 0.22603607177734375, 0.2349700927734375, 0.24390411376953125, 0.252838134765625, 0.26177215576171875, 0.2707061767578125, 0.27964019775390625, 0.28857421875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 4.0, 3.0, 10.0, 5.0, 4.0, 5.0, 11.0, 16.0, 8.0, 14.0, 23.0, 21.0, 24.0, 21.0, 25.0, 26.0, 28.0, 35.0, 30.0, 30.0, 38.0, 50.0, 28.0, 1062.0, 40.0, 37.0, 35.0, 36.0, 31.0, 41.0, 36.0, 27.0, 33.0, 25.0, 34.0, 21.0, 17.0, 11.0, 14.0, 14.0, 11.0, 11.0, 7.0, 5.0, 7.0, 3.0, 3.0, 0.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.6611328125, -1.61004638671875, -1.5589599609375, -1.50787353515625, -1.456787109375, -1.40570068359375, -1.3546142578125, -1.30352783203125, -1.25244140625, -1.20135498046875, -1.1502685546875, -1.09918212890625, -1.048095703125, -0.99700927734375, -0.9459228515625, -0.89483642578125, -0.84375, -0.79266357421875, -0.7415771484375, -0.69049072265625, -0.639404296875, -0.58831787109375, -0.5372314453125, -0.48614501953125, -0.43505859375, -0.38397216796875, -0.3328857421875, -0.28179931640625, -0.230712890625, -0.17962646484375, -0.1285400390625, -0.07745361328125, -0.0263671875, 0.02471923828125, 0.0758056640625, 0.12689208984375, 0.177978515625, 0.22906494140625, 0.2801513671875, 0.33123779296875, 0.38232421875, 0.43341064453125, 0.4844970703125, 0.53558349609375, 0.586669921875, 0.63775634765625, 0.6888427734375, 0.73992919921875, 0.791015625, 0.84210205078125, 0.8931884765625, 0.94427490234375, 0.995361328125, 1.04644775390625, 1.0975341796875, 1.14862060546875, 1.19970703125, 1.25079345703125, 1.3018798828125, 1.35296630859375, 1.404052734375, 1.45513916015625, 1.5062255859375, 1.55731201171875, 1.6083984375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 6.0, 8.0, 20.0, 29.0, 48.0, 79.0, 75.0, 128.0, 252.0, 367.0, 481.0, 763.0, 1144.0, 1785.0, 2723.0, 4141.0, 6336.0, 9802.0, 14873.0, 22953.0, 34989.0, 51665.0, 73258.0, 100185.0, 144784.0, 1122751.0, 163111.0, 103827.0, 76582.0, 53571.0, 36428.0, 24159.0, 15790.0, 10570.0, 6786.0, 4439.0, 2878.0, 1853.0, 1196.0, 777.0, 524.0, 346.0, 215.0, 163.0, 86.0, 73.0, 44.0, 23.0, 15.0, 13.0, 9.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.141357421875, -0.13701629638671875, -0.1326751708984375, -0.12833404541015625, -0.123992919921875, -0.11965179443359375, -0.1153106689453125, -0.11096954345703125, -0.10662841796875, -0.10228729248046875, -0.0979461669921875, -0.09360504150390625, -0.089263916015625, -0.08492279052734375, -0.0805816650390625, -0.07624053955078125, -0.0718994140625, -0.06755828857421875, -0.0632171630859375, -0.05887603759765625, -0.054534912109375, -0.05019378662109375, -0.0458526611328125, -0.04151153564453125, -0.03717041015625, -0.03282928466796875, -0.0284881591796875, -0.02414703369140625, -0.019805908203125, -0.01546478271484375, -0.0111236572265625, -0.00678253173828125, -0.00244140625, 0.00189971923828125, 0.0062408447265625, 0.01058197021484375, 0.014923095703125, 0.01926422119140625, 0.0236053466796875, 0.02794647216796875, 0.03228759765625, 0.03662872314453125, 0.0409698486328125, 0.04531097412109375, 0.049652099609375, 0.05399322509765625, 0.0583343505859375, 0.06267547607421875, 0.0670166015625, 0.07135772705078125, 0.0756988525390625, 0.08003997802734375, 0.084381103515625, 0.08872222900390625, 0.0930633544921875, 0.09740447998046875, 0.10174560546875, 0.10608673095703125, 0.1104278564453125, 0.11476898193359375, 0.119110107421875, 0.12345123291015625, 0.1277923583984375, 0.13213348388671875, 0.136474609375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 8.0, 8.0, 9.0, 8.0, 17.0, 30.0, 35.0, 69.0, 92.0, 96.0, 177.0, 115.0, 94.0, 68.0, 47.0, 26.0, 27.0, 10.0, 7.0, 10.0, 6.0, 3.0, 1.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0258941650390625, -0.0252077579498291, -0.024521350860595703, -0.023834943771362305, -0.023148536682128906, -0.022462129592895508, -0.02177572250366211, -0.02108931541442871, -0.020402908325195312, -0.019716501235961914, -0.019030094146728516, -0.018343687057495117, -0.01765727996826172, -0.01697087287902832, -0.016284465789794922, -0.015598058700561523, -0.014911651611328125, -0.014225244522094727, -0.013538837432861328, -0.01285243034362793, -0.012166023254394531, -0.011479616165161133, -0.010793209075927734, -0.010106801986694336, -0.009420394897460938, -0.008733987808227539, -0.00804758071899414, -0.007361173629760742, -0.006674766540527344, -0.005988359451293945, -0.005301952362060547, -0.0046155452728271484, -0.00392913818359375, -0.0032427310943603516, -0.002556324005126953, -0.0018699169158935547, -0.0011835098266601562, -0.0004971027374267578, 0.00018930435180664062, 0.0008757114410400391, 0.0015621185302734375, 0.002248525619506836, 0.0029349327087402344, 0.003621339797973633, 0.004307746887207031, 0.00499415397644043, 0.005680561065673828, 0.0063669681549072266, 0.007053375244140625, 0.0077397823333740234, 0.008426189422607422, 0.00911259651184082, 0.009799003601074219, 0.010485410690307617, 0.011171817779541016, 0.011858224868774414, 0.012544631958007812, 0.013231039047241211, 0.01391744613647461, 0.014603853225708008, 0.015290260314941406, 0.015976667404174805, 0.016663074493408203, 0.0173494815826416, 0.018035888671875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 3.0, 2.0, 2.0, 8.0, 9.0, 5.0, 15.0, 19.0, 18.0, 41.0, 49.0, 59.0, 92.0, 150.0, 315.0, 836.0, 8829.0, 985107.0, 50180.0, 1758.0, 464.0, 220.0, 116.0, 71.0, 45.0, 39.0, 27.0, 14.0, 11.0, 10.0, 5.0, 3.0, 8.0, 3.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31103515625, -0.2993888854980469, -0.28774261474609375, -0.2760963439941406, -0.2644500732421875, -0.2528038024902344, -0.24115753173828125, -0.22951126098632812, -0.217864990234375, -0.20621871948242188, -0.19457244873046875, -0.18292617797851562, -0.1712799072265625, -0.15963363647460938, -0.14798736572265625, -0.13634109497070312, -0.12469482421875, -0.11304855346679688, -0.10140228271484375, -0.08975601196289062, -0.0781097412109375, -0.06646347045898438, -0.05481719970703125, -0.043170928955078125, -0.031524658203125, -0.019878387451171875, -0.00823211669921875, 0.003414154052734375, 0.0150604248046875, 0.026706695556640625, 0.03835296630859375, 0.049999237060546875, 0.0616455078125, 0.07329177856445312, 0.08493804931640625, 0.09658432006835938, 0.1082305908203125, 0.11987686157226562, 0.13152313232421875, 0.14316940307617188, 0.154815673828125, 0.16646194458007812, 0.17810821533203125, 0.18975448608398438, 0.2014007568359375, 0.21304702758789062, 0.22469329833984375, 0.23633956909179688, 0.24798583984375, 0.2596321105957031, 0.27127838134765625, 0.2829246520996094, 0.2945709228515625, 0.3062171936035156, 0.31786346435546875, 0.3295097351074219, 0.341156005859375, 0.3528022766113281, 0.36444854736328125, 0.3760948181152344, 0.3877410888671875, 0.3993873596191406, 0.41103363037109375, 0.4226799011230469, 0.434326171875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 20.0, 34.0, 97.0, 260.0, 468.0, 97.0, 28.0, 5.0], "bins": [-0.26065051555633545, -0.2563200891017914, -0.2519896328449249, -0.24765920639038086, -0.2433287799358368, -0.23899833858013153, -0.23466789722442627, -0.2303374707698822, -0.22600702941417694, -0.22167658805847168, -0.2173461616039276, -0.21301572024822235, -0.2086852788925171, -0.20435485243797302, -0.20002441108226776, -0.1956939846277237, -0.19136354327201843, -0.18703310191631317, -0.1827026754617691, -0.17837223410606384, -0.17404180765151978, -0.16971136629581451, -0.16538092494010925, -0.16105049848556519, -0.15672005712985992, -0.15238961577415466, -0.1480591893196106, -0.14372874796390533, -0.13939830660820007, -0.135067880153656, -0.13073743879795074, -0.12640701234340668, -0.12207657098770142, -0.11774613708257675, -0.11341570317745209, -0.10908526182174683, -0.10475482791662216, -0.1004243940114975, -0.09609395265579224, -0.09176351875066757, -0.08743308484554291, -0.08310265094041824, -0.07877221703529358, -0.07444177567958832, -0.07011134177446365, -0.06578090786933899, -0.061450470238924026, -0.057120032608509064, -0.0527895987033844, -0.048459164798259735, -0.04412872716784477, -0.03979828953742981, -0.035467855632305145, -0.03113741986453533, -0.026806984096765518, -0.022476548328995705, -0.01814611442387104, -0.013815678656101227, -0.009485242888331413, -0.0051548071205616, -0.0008243713527917862, 0.0035060644149780273, 0.007836500182747841, 0.012166935950517654, 0.016497371718287468]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 8.0, 7.0, 14.0, 14.0, 14.0, 20.0, 17.0, 14.0, 22.0, 26.0, 26.0, 20.0, 29.0, 31.0, 32.0, 45.0, 36.0, 35.0, 46.0, 46.0, 49.0, 40.0, 43.0, 34.0, 44.0, 44.0, 29.0, 42.0, 25.0, 18.0, 14.0, 18.0, 26.0, 15.0, 11.0, 13.0, 9.0, 7.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02419579029083252, -0.023412737995386124, -0.02262968383729458, -0.021846629679203033, -0.021063577383756638, -0.02028052508831024, -0.019497470930218697, -0.01871441677212715, -0.017931364476680756, -0.01714831218123436, -0.016365258023142815, -0.015582204796373844, -0.014799151569604874, -0.014016098342835903, -0.013233045116066933, -0.012449991889297962, -0.011666938662528992, -0.010883885435760021, -0.01010083220899105, -0.00931777898222208, -0.00853472575545311, -0.007751672528684139, -0.006968619301915169, -0.006185566075146198, -0.005402512848377228, -0.004619459621608257, -0.003836406394839287, -0.0030533531680703163, -0.002270299941301346, -0.0014872467145323753, -0.0007041934877634048, 7.885973900556564e-05, 0.0008619129657745361, 0.0016449661925435066, 0.002428019419312477, 0.0032110726460814476, 0.003994125872850418, 0.004777179099619389, 0.005560232326388359, 0.0063432855531573296, 0.0071263387799263, 0.00790939200669527, 0.008692445233464241, 0.009475498460233212, 0.010258551687002182, 0.011041604913771152, 0.011824658140540123, 0.012607711367309093, 0.013390764594078064, 0.014173817820847034, 0.014956871047616005, 0.01573992520570755, 0.016522977501153946, 0.017306029796600342, 0.018089083954691887, 0.018872138112783432, 0.019655190408229828, 0.020438242703676224, 0.02122129686176777, 0.022004351019859314, 0.02278740331530571, 0.023570455610752106, 0.02435350976884365, 0.025136563926935196, 0.025919616222381592]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 8.0, 7.0, 7.0, 2.0, 9.0, 8.0, 17.0, 15.0, 18.0, 23.0, 23.0, 28.0, 32.0, 28.0, 42.0, 33.0, 40.0, 52.0, 44.0, 43.0, 56.0, 39.0, 52.0, 44.0, 45.0, 37.0, 41.0, 24.0, 21.0, 27.0, 22.0, 18.0, 19.0, 18.0, 16.0, 16.0, 7.0, 11.0, 4.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4765625, -2.388671875, -2.30078125, -2.212890625, -2.125, -2.037109375, -1.94921875, -1.861328125, -1.7734375, -1.685546875, -1.59765625, -1.509765625, -1.421875, -1.333984375, -1.24609375, -1.158203125, -1.0703125, -0.982421875, -0.89453125, -0.806640625, -0.71875, -0.630859375, -0.54296875, -0.455078125, -0.3671875, -0.279296875, -0.19140625, -0.103515625, -0.015625, 0.072265625, 0.16015625, 0.248046875, 0.3359375, 0.423828125, 0.51171875, 0.599609375, 0.6875, 0.775390625, 0.86328125, 0.951171875, 1.0390625, 1.126953125, 1.21484375, 1.302734375, 1.390625, 1.478515625, 1.56640625, 1.654296875, 1.7421875, 1.830078125, 1.91796875, 2.005859375, 2.09375, 2.181640625, 2.26953125, 2.357421875, 2.4453125, 2.533203125, 2.62109375, 2.708984375, 2.796875, 2.884765625, 2.97265625, 3.060546875, 3.1484375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 9.0, 8.0, 12.0, 23.0, 23.0, 42.0, 66.0, 105.0, 135.0, 207.0, 275.0, 548.0, 803.0, 1228.0, 1844.0, 2932.0, 5048.0, 8959.0, 16992.0, 36470.0, 88498.0, 235082.0, 364363.0, 163567.0, 62728.0, 27079.0, 13128.0, 7037.0, 4152.0, 2574.0, 1682.0, 1037.0, 635.0, 461.0, 298.0, 161.0, 126.0, 84.0, 56.0, 24.0, 21.0, 14.0, 8.0, 10.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1640625, -2.1009979248046875, -2.037933349609375, -1.9748687744140625, -1.91180419921875, -1.8487396240234375, -1.785675048828125, -1.7226104736328125, -1.6595458984375, -1.5964813232421875, -1.533416748046875, -1.4703521728515625, -1.40728759765625, -1.3442230224609375, -1.281158447265625, -1.2180938720703125, -1.155029296875, -1.0919647216796875, -1.028900146484375, -0.9658355712890625, -0.90277099609375, -0.8397064208984375, -0.776641845703125, -0.7135772705078125, -0.6505126953125, -0.5874481201171875, -0.524383544921875, -0.4613189697265625, -0.39825439453125, -0.3351898193359375, -0.272125244140625, -0.2090606689453125, -0.14599609375, -0.0829315185546875, -0.019866943359375, 0.0431976318359375, 0.10626220703125, 0.1693267822265625, 0.232391357421875, 0.2954559326171875, 0.3585205078125, 0.4215850830078125, 0.484649658203125, 0.5477142333984375, 0.61077880859375, 0.6738433837890625, 0.736907958984375, 0.7999725341796875, 0.863037109375, 0.9261016845703125, 0.989166259765625, 1.0522308349609375, 1.11529541015625, 1.1783599853515625, 1.241424560546875, 1.3044891357421875, 1.3675537109375, 1.4306182861328125, 1.493682861328125, 1.5567474365234375, 1.61981201171875, 1.6828765869140625, 1.745941162109375, 1.8090057373046875, 1.8720703125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 8.0, 8.0, 10.0, 10.0, 14.0, 9.0, 17.0, 25.0, 21.0, 34.0, 25.0, 40.0, 33.0, 48.0, 56.0, 47.0, 69.0, 215.0, 1669.0, 223.0, 80.0, 56.0, 43.0, 38.0, 36.0, 34.0, 30.0, 33.0, 27.0, 22.0, 10.0, 11.0, 10.0, 6.0, 6.0, 6.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.890625, -9.5660400390625, -9.241455078125, -8.9168701171875, -8.59228515625, -8.2677001953125, -7.943115234375, -7.6185302734375, -7.2939453125, -6.9693603515625, -6.644775390625, -6.3201904296875, -5.99560546875, -5.6710205078125, -5.346435546875, -5.0218505859375, -4.697265625, -4.3726806640625, -4.048095703125, -3.7235107421875, -3.39892578125, -3.0743408203125, -2.749755859375, -2.4251708984375, -2.1005859375, -1.7760009765625, -1.451416015625, -1.1268310546875, -0.80224609375, -0.4776611328125, -0.153076171875, 0.1715087890625, 0.49609375, 0.8206787109375, 1.145263671875, 1.4698486328125, 1.79443359375, 2.1190185546875, 2.443603515625, 2.7681884765625, 3.0927734375, 3.4173583984375, 3.741943359375, 4.0665283203125, 4.39111328125, 4.7156982421875, 5.040283203125, 5.3648681640625, 5.689453125, 6.0140380859375, 6.338623046875, 6.6632080078125, 6.98779296875, 7.3123779296875, 7.636962890625, 7.9615478515625, 8.2861328125, 8.6107177734375, 8.935302734375, 9.2598876953125, 9.58447265625, 9.9090576171875, 10.233642578125, 10.5582275390625, 10.8828125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 8.0, 12.0, 8.0, 17.0, 19.0, 24.0, 46.0, 39.0, 57.0, 87.0, 112.0, 176.0, 289.0, 780.0, 4458.0, 193378.0, 2922123.0, 21231.0, 1541.0, 454.0, 244.0, 169.0, 100.0, 73.0, 49.0, 48.0, 20.0, 36.0, 21.0, 14.0, 10.0, 13.0, 7.0, 8.0, 8.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.734375, -16.231201171875, -15.72802734375, -15.224853515625, -14.7216796875, -14.218505859375, -13.71533203125, -13.212158203125, -12.708984375, -12.205810546875, -11.70263671875, -11.199462890625, -10.6962890625, -10.193115234375, -9.68994140625, -9.186767578125, -8.68359375, -8.180419921875, -7.67724609375, -7.174072265625, -6.6708984375, -6.167724609375, -5.66455078125, -5.161376953125, -4.658203125, -4.155029296875, -3.65185546875, -3.148681640625, -2.6455078125, -2.142333984375, -1.63916015625, -1.135986328125, -0.6328125, -0.129638671875, 0.37353515625, 0.876708984375, 1.3798828125, 1.883056640625, 2.38623046875, 2.889404296875, 3.392578125, 3.895751953125, 4.39892578125, 4.902099609375, 5.4052734375, 5.908447265625, 6.41162109375, 6.914794921875, 7.41796875, 7.921142578125, 8.42431640625, 8.927490234375, 9.4306640625, 9.933837890625, 10.43701171875, 10.940185546875, 11.443359375, 11.946533203125, 12.44970703125, 12.952880859375, 13.4560546875, 13.959228515625, 14.46240234375, 14.965576171875, 15.46875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 104.0, 854.0, 59.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-205.0399627685547, -201.46641540527344, -197.8928680419922, -194.31932067871094, -190.7457733154297, -187.17222595214844, -183.5986785888672, -180.02511596679688, -176.45156860351562, -172.87802124023438, -169.30447387695312, -165.73092651367188, -162.15737915039062, -158.58383178710938, -155.01028442382812, -151.43673706054688, -147.86318969726562, -144.28964233398438, -140.71609497070312, -137.14254760742188, -133.56900024414062, -129.99545288085938, -126.4218978881836, -122.84835052490234, -119.2748031616211, -115.70125579833984, -112.1277084350586, -108.55416107177734, -104.98060607910156, -101.40705871582031, -97.83351135253906, -94.25996398925781, -90.68641662597656, -87.11286926269531, -83.53932189941406, -79.96577453613281, -76.39222717285156, -72.81867980957031, -69.24512481689453, -65.67157745361328, -62.09803009033203, -58.52448272705078, -54.95093536376953, -51.377384185791016, -47.803836822509766, -44.230289459228516, -40.65673828125, -37.08319091796875, -33.5096435546875, -29.93609619140625, -26.362546920776367, -22.788997650146484, -19.215450286865234, -15.641902923583984, -12.068353652954102, -8.494804382324219, -4.921257019042969, -1.3477087020874023, 2.225839614868164, 5.7993879318237305, 9.372936248779297, 12.946483612060547, 16.52003288269043, 20.093582153320312, 23.667129516601562]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 8.0, 8.0, 5.0, 7.0, 7.0, 7.0, 11.0, 9.0, 14.0, 17.0, 22.0, 26.0, 16.0, 22.0, 32.0, 24.0, 34.0, 26.0, 27.0, 40.0, 39.0, 32.0, 38.0, 33.0, 36.0, 35.0, 39.0, 28.0, 23.0, 20.0, 33.0, 22.0, 33.0, 22.0, 25.0, 18.0, 29.0, 22.0, 18.0, 19.0, 7.0, 14.0, 12.0, 10.0, 8.0, 6.0, 8.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.193906784057617, -24.39202308654785, -23.59014129638672, -22.788257598876953, -21.986373901367188, -21.184492111206055, -20.38260841369629, -19.580726623535156, -18.77884292602539, -17.976959228515625, -17.175077438354492, -16.373193740844727, -15.571310997009277, -14.769428253173828, -13.967544555664062, -13.165661811828613, -12.363779067993164, -11.561896324157715, -10.760013580322266, -9.9581298828125, -9.15624713897705, -8.354364395141602, -7.552481174468994, -6.750597953796387, -5.9487152099609375, -5.146832466125488, -4.344949245452881, -3.5430662631988525, -2.741183280944824, -1.939300537109375, -1.1374173164367676, -0.33553409576416016, 0.46634864807128906, 1.2682316303253174, 2.0701146125793457, 2.871997594833374, 3.6738805770874023, 4.475763320922852, 5.277646541595459, 6.079529762268066, 6.881412506103516, 7.683295249938965, 8.485177993774414, 9.28706169128418, 10.088944435119629, 10.890827178955078, 11.692710876464844, 12.494593620300293, 13.296476364135742, 14.098359107971191, 14.90024185180664, 15.702125549316406, 16.504009246826172, 17.305891036987305, 18.10777473449707, 18.909656524658203, 19.71154022216797, 20.513423919677734, 21.315305709838867, 22.117189407348633, 22.919071197509766, 23.72095489501953, 24.522838592529297, 25.324722290039062, 26.126604080200195]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 5.0, 9.0, 7.0, 4.0, 9.0, 10.0, 7.0, 13.0, 20.0, 18.0, 26.0, 22.0, 35.0, 29.0, 37.0, 32.0, 26.0, 42.0, 49.0, 46.0, 46.0, 43.0, 45.0, 52.0, 47.0, 40.0, 41.0, 29.0, 33.0, 31.0, 15.0, 16.0, 18.0, 22.0, 16.0, 16.0, 16.0, 9.0, 7.0, 5.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.447265625, -2.35968017578125, -2.2720947265625, -2.18450927734375, -2.096923828125, -2.00933837890625, -1.9217529296875, -1.83416748046875, -1.74658203125, -1.65899658203125, -1.5714111328125, -1.48382568359375, -1.396240234375, -1.30865478515625, -1.2210693359375, -1.13348388671875, -1.0458984375, -0.95831298828125, -0.8707275390625, -0.78314208984375, -0.695556640625, -0.60797119140625, -0.5203857421875, -0.43280029296875, -0.34521484375, -0.25762939453125, -0.1700439453125, -0.08245849609375, 0.005126953125, 0.09271240234375, 0.1802978515625, 0.26788330078125, 0.35546875, 0.44305419921875, 0.5306396484375, 0.61822509765625, 0.705810546875, 0.79339599609375, 0.8809814453125, 0.96856689453125, 1.05615234375, 1.14373779296875, 1.2313232421875, 1.31890869140625, 1.406494140625, 1.49407958984375, 1.5816650390625, 1.66925048828125, 1.7568359375, 1.84442138671875, 1.9320068359375, 2.01959228515625, 2.107177734375, 2.19476318359375, 2.2823486328125, 2.36993408203125, 2.45751953125, 2.54510498046875, 2.6326904296875, 2.72027587890625, 2.807861328125, 2.89544677734375, 2.9830322265625, 3.07061767578125, 3.158203125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 7.0, 9.0, 13.0, 15.0, 15.0, 24.0, 17.0, 44.0, 55.0, 100.0, 158.0, 314.0, 822.0, 2445.0, 9079.0, 38092.0, 192477.0, 1506660.0, 2088717.0, 286637.0, 51744.0, 11806.0, 3147.0, 983.0, 408.0, 181.0, 93.0, 46.0, 45.0, 17.0, 27.0, 12.0, 15.0, 12.0, 12.0, 6.0, 7.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2578125, -7.0167236328125, -6.775634765625, -6.5345458984375, -6.29345703125, -6.0523681640625, -5.811279296875, -5.5701904296875, -5.3291015625, -5.0880126953125, -4.846923828125, -4.6058349609375, -4.36474609375, -4.1236572265625, -3.882568359375, -3.6414794921875, -3.400390625, -3.1593017578125, -2.918212890625, -2.6771240234375, -2.43603515625, -2.1949462890625, -1.953857421875, -1.7127685546875, -1.4716796875, -1.2305908203125, -0.989501953125, -0.7484130859375, -0.50732421875, -0.2662353515625, -0.025146484375, 0.2159423828125, 0.45703125, 0.6981201171875, 0.939208984375, 1.1802978515625, 1.42138671875, 1.6624755859375, 1.903564453125, 2.1446533203125, 2.3857421875, 2.6268310546875, 2.867919921875, 3.1090087890625, 3.35009765625, 3.5911865234375, 3.832275390625, 4.0733642578125, 4.314453125, 4.5555419921875, 4.796630859375, 5.0377197265625, 5.27880859375, 5.5198974609375, 5.760986328125, 6.0020751953125, 6.2431640625, 6.4842529296875, 6.725341796875, 6.9664306640625, 7.20751953125, 7.4486083984375, 7.689697265625, 7.9307861328125, 8.171875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 7.0, 10.0, 17.0, 29.0, 28.0, 50.0, 90.0, 109.0, 170.0, 195.0, 305.0, 360.0, 498.0, 495.0, 463.0, 354.0, 287.0, 184.0, 122.0, 94.0, 63.0, 47.0, 28.0, 19.0, 12.0, 6.0, 7.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.234375, -9.9361572265625, -9.637939453125, -9.3397216796875, -9.04150390625, -8.7432861328125, -8.445068359375, -8.1468505859375, -7.8486328125, -7.5504150390625, -7.252197265625, -6.9539794921875, -6.65576171875, -6.3575439453125, -6.059326171875, -5.7611083984375, -5.462890625, -5.1646728515625, -4.866455078125, -4.5682373046875, -4.27001953125, -3.9718017578125, -3.673583984375, -3.3753662109375, -3.0771484375, -2.7789306640625, -2.480712890625, -2.1824951171875, -1.88427734375, -1.5860595703125, -1.287841796875, -0.9896240234375, -0.69140625, -0.3931884765625, -0.094970703125, 0.2032470703125, 0.50146484375, 0.7996826171875, 1.097900390625, 1.3961181640625, 1.6943359375, 1.9925537109375, 2.290771484375, 2.5889892578125, 2.88720703125, 3.1854248046875, 3.483642578125, 3.7818603515625, 4.080078125, 4.3782958984375, 4.676513671875, 4.9747314453125, 5.27294921875, 5.5711669921875, 5.869384765625, 6.1676025390625, 6.4658203125, 6.7640380859375, 7.062255859375, 7.3604736328125, 7.65869140625, 7.9569091796875, 8.255126953125, 8.5533447265625, 8.8515625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 4.0, 3.0, 4.0, 6.0, 8.0, 12.0, 14.0, 20.0, 45.0, 47.0, 81.0, 123.0, 181.0, 348.0, 775.0, 2150.0, 9191.0, 69064.0, 956510.0, 2888561.0, 237493.0, 23085.0, 4142.0, 1231.0, 503.0, 254.0, 134.0, 81.0, 75.0, 35.0, 28.0, 17.0, 11.0, 12.0, 16.0, 6.0, 7.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.71875, -18.15576171875, -17.5927734375, -17.02978515625, -16.466796875, -15.90380859375, -15.3408203125, -14.77783203125, -14.21484375, -13.65185546875, -13.0888671875, -12.52587890625, -11.962890625, -11.39990234375, -10.8369140625, -10.27392578125, -9.7109375, -9.14794921875, -8.5849609375, -8.02197265625, -7.458984375, -6.89599609375, -6.3330078125, -5.77001953125, -5.20703125, -4.64404296875, -4.0810546875, -3.51806640625, -2.955078125, -2.39208984375, -1.8291015625, -1.26611328125, -0.703125, -0.14013671875, 0.4228515625, 0.98583984375, 1.548828125, 2.11181640625, 2.6748046875, 3.23779296875, 3.80078125, 4.36376953125, 4.9267578125, 5.48974609375, 6.052734375, 6.61572265625, 7.1787109375, 7.74169921875, 8.3046875, 8.86767578125, 9.4306640625, 9.99365234375, 10.556640625, 11.11962890625, 11.6826171875, 12.24560546875, 12.80859375, 13.37158203125, 13.9345703125, 14.49755859375, 15.060546875, 15.62353515625, 16.1865234375, 16.74951171875, 17.3125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 9.0, 15.0, 11.0, 22.0, 23.0, 32.0, 33.0, 41.0, 56.0, 69.0, 79.0, 88.0, 84.0, 94.0, 70.0, 49.0, 65.0, 40.0, 28.0, 34.0, 17.0, 12.0, 8.0, 13.0, 8.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.96895217895508, -39.97862243652344, -38.98829650878906, -37.99796676635742, -37.00763702392578, -36.017311096191406, -35.026981353759766, -34.036651611328125, -33.04632568359375, -32.05599594116211, -31.0656681060791, -30.075340270996094, -29.085012435913086, -28.094682693481445, -27.104354858398438, -26.114025115966797, -25.123695373535156, -24.13336753845215, -23.143037796020508, -22.1527099609375, -21.162382125854492, -20.17205238342285, -19.181724548339844, -18.191394805908203, -17.201068878173828, -16.21074104309082, -15.220412254333496, -14.230083465576172, -13.239754676818848, -12.249425888061523, -11.259098052978516, -10.268769264221191, -9.278440475463867, -8.288111686706543, -7.297783374786377, -6.307455062866211, -5.317126274108887, -4.326797962188721, -3.3364696502685547, -2.3461408615112305, -1.3558125495910645, -0.3654840588569641, 0.6248444318771362, 1.6151728630065918, 2.605501413345337, 3.595829963684082, 4.586158275604248, 5.576487064361572, 6.566815376281738, 7.557143688201904, 8.54747200012207, 9.537800788879395, 10.528129577636719, 11.518457412719727, 12.50878620147705, 13.499114990234375, 14.489442825317383, 15.479771614074707, 16.47010040283203, 17.46042823791504, 18.450756072998047, 19.441085815429688, 20.431413650512695, 21.421741485595703, 22.412071228027344]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 8.0, 5.0, 13.0, 10.0, 16.0, 19.0, 13.0, 18.0, 21.0, 21.0, 33.0, 31.0, 34.0, 32.0, 45.0, 35.0, 45.0, 38.0, 45.0, 47.0, 44.0, 38.0, 46.0, 42.0, 40.0, 33.0, 25.0, 29.0, 33.0, 13.0, 11.0, 20.0, 18.0, 19.0, 10.0, 9.0, 8.0, 7.0, 9.0, 6.0, 6.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-27.64544677734375, -26.790151596069336, -25.934856414794922, -25.079561233520508, -24.224266052246094, -23.368968963623047, -22.513673782348633, -21.65837860107422, -20.803083419799805, -19.94778823852539, -19.092493057250977, -18.237197875976562, -17.381900787353516, -16.526607513427734, -15.671310424804688, -14.816015243530273, -13.96072006225586, -13.105424880981445, -12.250129699707031, -11.3948335647583, -10.539538383483887, -9.684243202209473, -8.828947067260742, -7.973651885986328, -7.118356704711914, -6.2630615234375, -5.407765865325928, -4.5524702072143555, -3.6971750259399414, -2.8418798446655273, -1.986584186553955, -1.1312885284423828, -0.27599334716796875, 0.5793020725250244, 1.4345974922180176, 2.2898929119110107, 3.145188331604004, 4.000483512878418, 4.85577917098999, 5.7110748291015625, 6.566370010375977, 7.421665191650391, 8.276960372924805, 9.132256507873535, 9.98755168914795, 10.842846870422363, 11.698143005371094, 12.553438186645508, 13.408733367919922, 14.264028549194336, 15.11932373046875, 15.97461986541748, 16.829914093017578, 17.685211181640625, 18.54050636291504, 19.395801544189453, 20.251096725463867, 21.10639190673828, 21.961687088012695, 22.81698226928711, 23.672279357910156, 24.527572631835938, 25.382869720458984, 26.2381649017334, 27.093460083007812]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 9.0, 11.0, 9.0, 5.0, 13.0, 19.0, 14.0, 15.0, 26.0, 24.0, 20.0, 32.0, 31.0, 40.0, 43.0, 28.0, 42.0, 35.0, 37.0, 44.0, 36.0, 47.0, 45.0, 50.0, 36.0, 30.0, 28.0, 29.0, 32.0, 27.0, 24.0, 23.0, 11.0, 19.0, 14.0, 6.0, 8.0, 8.0, 4.0, 4.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.583984375, -2.499298095703125, -2.41461181640625, -2.329925537109375, -2.2452392578125, -2.160552978515625, -2.07586669921875, -1.991180419921875, -1.906494140625, -1.821807861328125, -1.73712158203125, -1.652435302734375, -1.5677490234375, -1.483062744140625, -1.39837646484375, -1.313690185546875, -1.22900390625, -1.144317626953125, -1.05963134765625, -0.974945068359375, -0.8902587890625, -0.805572509765625, -0.72088623046875, -0.636199951171875, -0.551513671875, -0.466827392578125, -0.38214111328125, -0.297454833984375, -0.2127685546875, -0.128082275390625, -0.04339599609375, 0.041290283203125, 0.1259765625, 0.210662841796875, 0.29534912109375, 0.380035400390625, 0.4647216796875, 0.549407958984375, 0.63409423828125, 0.718780517578125, 0.803466796875, 0.888153076171875, 0.97283935546875, 1.057525634765625, 1.1422119140625, 1.226898193359375, 1.31158447265625, 1.396270751953125, 1.48095703125, 1.565643310546875, 1.65032958984375, 1.735015869140625, 1.8197021484375, 1.904388427734375, 1.98907470703125, 2.073760986328125, 2.158447265625, 2.243133544921875, 2.32781982421875, 2.412506103515625, 2.4971923828125, 2.581878662109375, 2.66656494140625, 2.751251220703125, 2.8359375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 9.0, 2.0, 11.0, 17.0, 16.0, 24.0, 38.0, 58.0, 73.0, 128.0, 183.0, 242.0, 362.0, 528.0, 814.0, 1292.0, 2181.0, 3794.0, 6861.0, 12989.0, 25007.0, 51117.0, 105546.0, 206548.0, 272404.0, 179259.0, 88920.0, 42786.0, 21735.0, 11037.0, 5903.0, 3248.0, 1942.0, 1222.0, 715.0, 486.0, 322.0, 248.0, 158.0, 104.0, 71.0, 54.0, 38.0, 26.0, 16.0, 13.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.51806640625, -0.5020675659179688, -0.4860687255859375, -0.47006988525390625, -0.454071044921875, -0.43807220458984375, -0.4220733642578125, -0.40607452392578125, -0.39007568359375, -0.37407684326171875, -0.3580780029296875, -0.34207916259765625, -0.326080322265625, -0.31008148193359375, -0.2940826416015625, -0.27808380126953125, -0.2620849609375, -0.24608612060546875, -0.2300872802734375, -0.21408843994140625, -0.198089599609375, -0.18209075927734375, -0.1660919189453125, -0.15009307861328125, -0.13409423828125, -0.11809539794921875, -0.1020965576171875, -0.08609771728515625, -0.070098876953125, -0.05410003662109375, -0.0381011962890625, -0.02210235595703125, -0.006103515625, 0.00989532470703125, 0.0258941650390625, 0.04189300537109375, 0.057891845703125, 0.07389068603515625, 0.0898895263671875, 0.10588836669921875, 0.12188720703125, 0.13788604736328125, 0.1538848876953125, 0.16988372802734375, 0.185882568359375, 0.20188140869140625, 0.2178802490234375, 0.23387908935546875, 0.2498779296875, 0.26587677001953125, 0.2818756103515625, 0.29787445068359375, 0.313873291015625, 0.32987213134765625, 0.3458709716796875, 0.36186981201171875, 0.37786865234375, 0.39386749267578125, 0.4098663330078125, 0.42586517333984375, 0.441864013671875, 0.45786285400390625, 0.4738616943359375, 0.48986053466796875, 0.505859375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 4.0, 5.0, 11.0, 7.0, 15.0, 6.0, 13.0, 11.0, 13.0, 22.0, 19.0, 17.0, 29.0, 28.0, 21.0, 25.0, 32.0, 21.0, 34.0, 47.0, 38.0, 1061.0, 33.0, 45.0, 43.0, 52.0, 39.0, 36.0, 30.0, 37.0, 33.0, 23.0, 23.0, 28.0, 15.0, 15.0, 15.0, 14.0, 21.0, 9.0, 8.0, 4.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-1.7939453125, -1.741058349609375, -1.68817138671875, -1.635284423828125, -1.5823974609375, -1.529510498046875, -1.47662353515625, -1.423736572265625, -1.370849609375, -1.317962646484375, -1.26507568359375, -1.212188720703125, -1.1593017578125, -1.106414794921875, -1.05352783203125, -1.000640869140625, -0.94775390625, -0.894866943359375, -0.84197998046875, -0.789093017578125, -0.7362060546875, -0.683319091796875, -0.63043212890625, -0.577545166015625, -0.524658203125, -0.471771240234375, -0.41888427734375, -0.365997314453125, -0.3131103515625, -0.260223388671875, -0.20733642578125, -0.154449462890625, -0.1015625, -0.048675537109375, 0.00421142578125, 0.057098388671875, 0.1099853515625, 0.162872314453125, 0.21575927734375, 0.268646240234375, 0.321533203125, 0.374420166015625, 0.42730712890625, 0.480194091796875, 0.5330810546875, 0.585968017578125, 0.63885498046875, 0.691741943359375, 0.74462890625, 0.797515869140625, 0.85040283203125, 0.903289794921875, 0.9561767578125, 1.009063720703125, 1.06195068359375, 1.114837646484375, 1.167724609375, 1.220611572265625, 1.27349853515625, 1.326385498046875, 1.3792724609375, 1.432159423828125, 1.48504638671875, 1.537933349609375, 1.5908203125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 2.0, 8.0, 13.0, 18.0, 28.0, 37.0, 55.0, 101.0, 128.0, 189.0, 329.0, 479.0, 878.0, 1317.0, 2340.0, 3840.0, 6812.0, 11779.0, 20758.0, 37286.0, 65183.0, 112199.0, 185956.0, 1206465.0, 181926.0, 110089.0, 64737.0, 36238.0, 20251.0, 11585.0, 6511.0, 3854.0, 2228.0, 1297.0, 837.0, 473.0, 313.0, 218.0, 112.0, 82.0, 60.0, 34.0, 28.0, 19.0, 17.0, 9.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.220703125, -0.21346282958984375, -0.2062225341796875, -0.19898223876953125, -0.191741943359375, -0.18450164794921875, -0.1772613525390625, -0.17002105712890625, -0.16278076171875, -0.15554046630859375, -0.1483001708984375, -0.14105987548828125, -0.133819580078125, -0.12657928466796875, -0.1193389892578125, -0.11209869384765625, -0.1048583984375, -0.09761810302734375, -0.0903778076171875, -0.08313751220703125, -0.075897216796875, -0.06865692138671875, -0.0614166259765625, -0.05417633056640625, -0.04693603515625, -0.03969573974609375, -0.0324554443359375, -0.02521514892578125, -0.017974853515625, -0.01073455810546875, -0.0034942626953125, 0.00374603271484375, 0.010986328125, 0.01822662353515625, 0.0254669189453125, 0.03270721435546875, 0.039947509765625, 0.04718780517578125, 0.0544281005859375, 0.06166839599609375, 0.06890869140625, 0.07614898681640625, 0.0833892822265625, 0.09062957763671875, 0.097869873046875, 0.10511016845703125, 0.1123504638671875, 0.11959075927734375, 0.1268310546875, 0.13407135009765625, 0.1413116455078125, 0.14855194091796875, 0.155792236328125, 0.16303253173828125, 0.1702728271484375, 0.17751312255859375, 0.18475341796875, 0.19199371337890625, 0.1992340087890625, 0.20647430419921875, 0.213714599609375, 0.22095489501953125, 0.2281951904296875, 0.23543548583984375, 0.24267578125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 6.0, 1.0, 8.0, 8.0, 4.0, 13.0, 17.0, 40.0, 45.0, 61.0, 82.0, 110.0, 198.0, 117.0, 81.0, 55.0, 52.0, 25.0, 13.0, 9.0, 9.0, 1.0, 2.0, 8.0, 6.0, 5.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0538330078125, -0.05235576629638672, -0.05087852478027344, -0.049401283264160156, -0.047924041748046875, -0.046446800231933594, -0.04496955871582031, -0.04349231719970703, -0.04201507568359375, -0.04053783416748047, -0.03906059265136719, -0.037583351135253906, -0.036106109619140625, -0.034628868103027344, -0.03315162658691406, -0.03167438507080078, -0.0301971435546875, -0.02871990203857422, -0.027242660522460938, -0.025765419006347656, -0.024288177490234375, -0.022810935974121094, -0.021333694458007812, -0.01985645294189453, -0.01837921142578125, -0.01690196990966797, -0.015424728393554688, -0.013947486877441406, -0.012470245361328125, -0.010993003845214844, -0.009515762329101562, -0.008038520812988281, -0.006561279296875, -0.005084037780761719, -0.0036067962646484375, -0.0021295547485351562, -0.000652313232421875, 0.0008249282836914062, 0.0023021697998046875, 0.0037794113159179688, 0.00525665283203125, 0.006733894348144531, 0.008211135864257812, 0.009688377380371094, 0.011165618896484375, 0.012642860412597656, 0.014120101928710938, 0.015597343444824219, 0.0170745849609375, 0.01855182647705078, 0.020029067993164062, 0.021506309509277344, 0.022983551025390625, 0.024460792541503906, 0.025938034057617188, 0.02741527557373047, 0.02889251708984375, 0.03036975860595703, 0.03184700012207031, 0.033324241638183594, 0.034801483154296875, 0.036278724670410156, 0.03775596618652344, 0.03923320770263672, 0.04071044921875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 11.0, 11.0, 16.0, 25.0, 31.0, 46.0, 57.0, 85.0, 143.0, 405.0, 1983.0, 21898.0, 973787.0, 45915.0, 3070.0, 525.0, 193.0, 112.0, 65.0, 50.0, 26.0, 20.0, 17.0, 11.0, 7.0, 7.0, 3.0, 3.0, 7.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64794921875, -0.624481201171875, -0.60101318359375, -0.577545166015625, -0.5540771484375, -0.530609130859375, -0.50714111328125, -0.483673095703125, -0.460205078125, -0.436737060546875, -0.41326904296875, -0.389801025390625, -0.3663330078125, -0.342864990234375, -0.31939697265625, -0.295928955078125, -0.2724609375, -0.248992919921875, -0.22552490234375, -0.202056884765625, -0.1785888671875, -0.155120849609375, -0.13165283203125, -0.108184814453125, -0.084716796875, -0.061248779296875, -0.03778076171875, -0.014312744140625, 0.0091552734375, 0.032623291015625, 0.05609130859375, 0.079559326171875, 0.10302734375, 0.126495361328125, 0.14996337890625, 0.173431396484375, 0.1968994140625, 0.220367431640625, 0.24383544921875, 0.267303466796875, 0.290771484375, 0.314239501953125, 0.33770751953125, 0.361175537109375, 0.3846435546875, 0.408111572265625, 0.43157958984375, 0.455047607421875, 0.478515625, 0.501983642578125, 0.52545166015625, 0.548919677734375, 0.5723876953125, 0.595855712890625, 0.61932373046875, 0.642791748046875, 0.666259765625, 0.689727783203125, 0.71319580078125, 0.736663818359375, 0.7601318359375, 0.783599853515625, 0.80706787109375, 0.830535888671875, 0.85400390625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 17.0, 54.0, 139.0, 481.0, 226.0, 65.0, 11.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37442389130592346, -0.3613996207714081, -0.3483753204345703, -0.33535104990005493, -0.32232677936553955, -0.30930250883102417, -0.2962782382965088, -0.283253937959671, -0.27022966742515564, -0.25720539689064026, -0.24418111145496368, -0.2311568260192871, -0.21813255548477173, -0.20510828495025635, -0.19208399951457977, -0.1790597140789032, -0.16603544354438782, -0.15301117300987244, -0.13998688757419586, -0.1269626021385193, -0.1139383316040039, -0.10091405361890793, -0.08788977563381195, -0.07486549764871597, -0.061841219663619995, -0.04881694167852402, -0.03579266369342804, -0.022768385708332062, -0.009744107723236084, 0.003280170261859894, 0.01630444824695587, 0.02932872623205185, 0.042353034019470215, 0.05537731200456619, 0.06840158998966217, 0.08142586797475815, 0.09445014595985413, 0.1074744239449501, 0.12049870193004608, 0.13352298736572266, 0.14654725790023804, 0.15957152843475342, 0.17259581387043, 0.18562009930610657, 0.19864436984062195, 0.21166864037513733, 0.2246929258108139, 0.23771721124649048, 0.25074148178100586, 0.26376575231552124, 0.2767900228500366, 0.2898143231868744, 0.30283859372138977, 0.31586286425590515, 0.3288871645927429, 0.3419114351272583, 0.3549357056617737, 0.36795997619628906, 0.38098424673080444, 0.3940085470676422, 0.4070328176021576, 0.420057088136673, 0.43308138847351074, 0.4461056590080261, 0.4591299295425415]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 13.0, 12.0, 12.0, 8.0, 8.0, 12.0, 22.0, 20.0, 18.0, 20.0, 26.0, 21.0, 42.0, 23.0, 39.0, 35.0, 41.0, 37.0, 28.0, 44.0, 45.0, 37.0, 29.0, 47.0, 36.0, 34.0, 39.0, 40.0, 30.0, 21.0, 26.0, 29.0, 14.0, 11.0, 22.0, 8.0, 9.0, 10.0, 6.0, 8.0, 4.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07403814792633057, -0.0719212219119072, -0.06980429589748383, -0.06768736988306046, -0.06557044386863708, -0.06345351785421371, -0.061336591839790344, -0.059219665825366974, -0.057102739810943604, -0.05498581379652023, -0.05286888778209686, -0.05075196176767349, -0.04863503575325012, -0.04651810973882675, -0.04440118372440338, -0.04228425770998001, -0.04016733169555664, -0.03805040568113327, -0.0359334796667099, -0.03381655365228653, -0.03169962763786316, -0.02958270162343979, -0.02746577560901642, -0.025348849594593048, -0.023231923580169678, -0.021114997565746307, -0.018998071551322937, -0.016881145536899567, -0.014764219522476196, -0.012647293508052826, -0.010530367493629456, -0.008413441479206085, -0.006296515464782715, -0.0041795894503593445, -0.002062663435935974, 5.426257848739624e-05, 0.0021711885929107666, 0.004288114607334137, 0.006405040621757507, 0.008521966636180878, 0.010638892650604248, 0.012755818665027618, 0.014872744679450989, 0.01698967069387436, 0.01910659670829773, 0.0212235227227211, 0.02334044873714447, 0.02545737475156784, 0.02757430076599121, 0.02969122678041458, 0.03180815279483795, 0.03392507880926132, 0.03604200482368469, 0.03815893083810806, 0.04027585685253143, 0.0423927828669548, 0.044509708881378174, 0.046626634895801544, 0.048743560910224915, 0.050860486924648285, 0.052977412939071655, 0.055094338953495026, 0.057211264967918396, 0.059328190982341766, 0.06144511699676514]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 9.0, 11.0, 8.0, 6.0, 12.0, 20.0, 14.0, 15.0, 26.0, 24.0, 20.0, 32.0, 34.0, 34.0, 43.0, 31.0, 41.0, 36.0, 36.0, 44.0, 36.0, 47.0, 46.0, 51.0, 34.0, 30.0, 29.0, 28.0, 33.0, 26.0, 25.0, 23.0, 11.0, 19.0, 14.0, 6.0, 8.0, 8.0, 4.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.583984375, -2.49932861328125, -2.4146728515625, -2.33001708984375, -2.245361328125, -2.16070556640625, -2.0760498046875, -1.99139404296875, -1.90673828125, -1.82208251953125, -1.7374267578125, -1.65277099609375, -1.568115234375, -1.48345947265625, -1.3988037109375, -1.31414794921875, -1.2294921875, -1.14483642578125, -1.0601806640625, -0.97552490234375, -0.890869140625, -0.80621337890625, -0.7215576171875, -0.63690185546875, -0.55224609375, -0.46759033203125, -0.3829345703125, -0.29827880859375, -0.213623046875, -0.12896728515625, -0.0443115234375, 0.04034423828125, 0.125, 0.20965576171875, 0.2943115234375, 0.37896728515625, 0.463623046875, 0.54827880859375, 0.6329345703125, 0.71759033203125, 0.80224609375, 0.88690185546875, 0.9715576171875, 1.05621337890625, 1.140869140625, 1.22552490234375, 1.3101806640625, 1.39483642578125, 1.4794921875, 1.56414794921875, 1.6488037109375, 1.73345947265625, 1.818115234375, 1.90277099609375, 1.9874267578125, 2.07208251953125, 2.15673828125, 2.24139404296875, 2.3260498046875, 2.41070556640625, 2.495361328125, 2.58001708984375, 2.6646728515625, 2.74932861328125, 2.833984375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 1.0, 7.0, 4.0, 7.0, 6.0, 11.0, 12.0, 21.0, 29.0, 48.0, 79.0, 99.0, 126.0, 235.0, 304.0, 519.0, 747.0, 1127.0, 1861.0, 2672.0, 4259.0, 7388.0, 13999.0, 30669.0, 76629.0, 268961.0, 447266.0, 109498.0, 41046.0, 17724.0, 8941.0, 5097.0, 3162.0, 2037.0, 1330.0, 859.0, 604.0, 367.0, 260.0, 178.0, 127.0, 82.0, 52.0, 36.0, 23.0, 18.0, 10.0, 11.0, 9.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.947265625, -2.846221923828125, -2.74517822265625, -2.644134521484375, -2.5430908203125, -2.442047119140625, -2.34100341796875, -2.239959716796875, -2.138916015625, -2.037872314453125, -1.93682861328125, -1.835784912109375, -1.7347412109375, -1.633697509765625, -1.53265380859375, -1.431610107421875, -1.33056640625, -1.229522705078125, -1.12847900390625, -1.027435302734375, -0.9263916015625, -0.825347900390625, -0.72430419921875, -0.623260498046875, -0.522216796875, -0.421173095703125, -0.32012939453125, -0.219085693359375, -0.1180419921875, -0.016998291015625, 0.08404541015625, 0.185089111328125, 0.2861328125, 0.387176513671875, 0.48822021484375, 0.589263916015625, 0.6903076171875, 0.791351318359375, 0.89239501953125, 0.993438720703125, 1.094482421875, 1.195526123046875, 1.29656982421875, 1.397613525390625, 1.4986572265625, 1.599700927734375, 1.70074462890625, 1.801788330078125, 1.90283203125, 2.003875732421875, 2.10491943359375, 2.205963134765625, 2.3070068359375, 2.408050537109375, 2.50909423828125, 2.610137939453125, 2.711181640625, 2.812225341796875, 2.91326904296875, 3.014312744140625, 3.1153564453125, 3.216400146484375, 3.31744384765625, 3.418487548828125, 3.51953125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 3.0, 2.0, 10.0, 3.0, 3.0, 12.0, 6.0, 6.0, 10.0, 12.0, 18.0, 18.0, 25.0, 27.0, 18.0, 25.0, 38.0, 32.0, 24.0, 36.0, 43.0, 60.0, 108.0, 232.0, 1555.0, 216.0, 79.0, 61.0, 46.0, 36.0, 44.0, 40.0, 25.0, 33.0, 27.0, 19.0, 16.0, 13.0, 13.0, 10.0, 8.0, 8.0, 6.0, 8.0, 8.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.9375, -8.6619873046875, -8.386474609375, -8.1109619140625, -7.83544921875, -7.5599365234375, -7.284423828125, -7.0089111328125, -6.7333984375, -6.4578857421875, -6.182373046875, -5.9068603515625, -5.63134765625, -5.3558349609375, -5.080322265625, -4.8048095703125, -4.529296875, -4.2537841796875, -3.978271484375, -3.7027587890625, -3.42724609375, -3.1517333984375, -2.876220703125, -2.6007080078125, -2.3251953125, -2.0496826171875, -1.774169921875, -1.4986572265625, -1.22314453125, -0.9476318359375, -0.672119140625, -0.3966064453125, -0.12109375, 0.1544189453125, 0.429931640625, 0.7054443359375, 0.98095703125, 1.2564697265625, 1.531982421875, 1.8074951171875, 2.0830078125, 2.3585205078125, 2.634033203125, 2.9095458984375, 3.18505859375, 3.4605712890625, 3.736083984375, 4.0115966796875, 4.287109375, 4.5626220703125, 4.838134765625, 5.1136474609375, 5.38916015625, 5.6646728515625, 5.940185546875, 6.2156982421875, 6.4912109375, 6.7667236328125, 7.042236328125, 7.3177490234375, 7.59326171875, 7.8687744140625, 8.144287109375, 8.4197998046875, 8.6953125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 7.0, 5.0, 7.0, 9.0, 21.0, 12.0, 17.0, 20.0, 36.0, 59.0, 79.0, 97.0, 152.0, 225.0, 558.0, 2278.0, 16994.0, 2027140.0, 1079829.0, 14795.0, 2011.0, 523.0, 231.0, 152.0, 110.0, 83.0, 66.0, 45.0, 32.0, 22.0, 20.0, 9.0, 12.0, 13.0, 8.0, 5.0, 5.0, 5.0, 11.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.453125, -17.83740234375, -17.2216796875, -16.60595703125, -15.990234375, -15.37451171875, -14.7587890625, -14.14306640625, -13.52734375, -12.91162109375, -12.2958984375, -11.68017578125, -11.064453125, -10.44873046875, -9.8330078125, -9.21728515625, -8.6015625, -7.98583984375, -7.3701171875, -6.75439453125, -6.138671875, -5.52294921875, -4.9072265625, -4.29150390625, -3.67578125, -3.06005859375, -2.4443359375, -1.82861328125, -1.212890625, -0.59716796875, 0.0185546875, 0.63427734375, 1.25, 1.86572265625, 2.4814453125, 3.09716796875, 3.712890625, 4.32861328125, 4.9443359375, 5.56005859375, 6.17578125, 6.79150390625, 7.4072265625, 8.02294921875, 8.638671875, 9.25439453125, 9.8701171875, 10.48583984375, 11.1015625, 11.71728515625, 12.3330078125, 12.94873046875, 13.564453125, 14.18017578125, 14.7958984375, 15.41162109375, 16.02734375, 16.64306640625, 17.2587890625, 17.87451171875, 18.490234375, 19.10595703125, 19.7216796875, 20.33740234375, 20.953125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 21.0, 169.0, 428.0, 298.0, 87.0, 8.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.80569458007812, -64.01609802246094, -62.226505279541016, -60.436912536621094, -58.647315979003906, -56.85771942138672, -55.0681266784668, -53.278533935546875, -51.48893737792969, -49.6993408203125, -47.90974807739258, -46.120155334472656, -44.33055877685547, -42.54096221923828, -40.75136947631836, -38.96177673339844, -37.17218017578125, -35.38258361816406, -33.59299087524414, -31.803396224975586, -30.01380157470703, -28.224206924438477, -26.434612274169922, -24.645017623901367, -22.855422973632812, -21.065828323364258, -19.276233673095703, -17.48663902282715, -15.697044372558594, -13.907449722290039, -12.117855072021484, -10.32826042175293, -8.53866195678711, -6.749067306518555, -4.95947265625, -3.1698780059814453, -1.3802833557128906, 0.40931129455566406, 2.1989059448242188, 3.9885005950927734, 5.778095245361328, 7.567689895629883, 9.357284545898438, 11.146879196166992, 12.936473846435547, 14.726068496704102, 16.515663146972656, 18.30525779724121, 20.094852447509766, 21.88444709777832, 23.674041748046875, 25.46363639831543, 27.253231048583984, 29.04282569885254, 30.832420349121094, 32.62201690673828, 34.4116096496582, 36.201202392578125, 37.99079895019531, 39.7803955078125, 41.56998825073242, 43.359580993652344, 45.14917755126953, 46.93877410888672, 48.72836685180664]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 5.0, 3.0, 3.0, 3.0, 6.0, 4.0, 6.0, 10.0, 12.0, 13.0, 14.0, 15.0, 24.0, 18.0, 23.0, 17.0, 38.0, 29.0, 31.0, 30.0, 35.0, 38.0, 33.0, 41.0, 37.0, 40.0, 37.0, 38.0, 38.0, 27.0, 35.0, 23.0, 27.0, 27.0, 23.0, 26.0, 27.0, 25.0, 13.0, 13.0, 13.0, 15.0, 9.0, 13.0, 12.0, 6.0, 11.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-23.7745361328125, -22.986364364624023, -22.198190689086914, -21.410018920898438, -20.621845245361328, -19.83367347717285, -19.045501708984375, -18.257328033447266, -17.469154357910156, -16.68098258972168, -15.89280891418457, -15.104637145996094, -14.316463470458984, -13.528291702270508, -12.740118980407715, -11.951946258544922, -11.163774490356445, -10.375601768493652, -9.58742904663086, -8.799257278442383, -8.011083602905273, -7.222911357879639, -6.434739112854004, -5.646566390991211, -4.858393669128418, -4.070220947265625, -3.282048463821411, -2.4938759803771973, -1.7057032585144043, -0.9175305366516113, -0.12935829162597656, 0.6588144302368164, 1.4469871520996094, 2.2351598739624023, 3.023332357406616, 3.81150484085083, 4.599677562713623, 5.387850284576416, 6.176022529602051, 6.964195251464844, 7.752367973327637, 8.54054069519043, 9.328713417053223, 10.116886138916016, 10.905057907104492, 11.693231582641602, 12.481403350830078, 13.269576072692871, 14.057748794555664, 14.845921516418457, 15.63409423828125, 16.422266006469727, 17.210439682006836, 17.998611450195312, 18.786785125732422, 19.5749568939209, 20.363128662109375, 21.15130043029785, 21.93947410583496, 22.727645874023438, 23.515819549560547, 24.303991317749023, 25.0921630859375, 25.88033676147461, 26.66851043701172]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 4.0, 7.0, 13.0, 6.0, 13.0, 8.0, 14.0, 18.0, 22.0, 18.0, 21.0, 28.0, 30.0, 29.0, 37.0, 43.0, 35.0, 29.0, 37.0, 46.0, 51.0, 38.0, 44.0, 44.0, 43.0, 34.0, 31.0, 28.0, 32.0, 31.0, 35.0, 19.0, 18.0, 14.0, 14.0, 12.0, 10.0, 7.0, 6.0, 3.0, 8.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.76171875, -2.673492431640625, -2.58526611328125, -2.497039794921875, -2.4088134765625, -2.320587158203125, -2.23236083984375, -2.144134521484375, -2.055908203125, -1.967681884765625, -1.87945556640625, -1.791229248046875, -1.7030029296875, -1.614776611328125, -1.52655029296875, -1.438323974609375, -1.35009765625, -1.261871337890625, -1.17364501953125, -1.085418701171875, -0.9971923828125, -0.908966064453125, -0.82073974609375, -0.732513427734375, -0.644287109375, -0.556060791015625, -0.46783447265625, -0.379608154296875, -0.2913818359375, -0.203155517578125, -0.11492919921875, -0.026702880859375, 0.0615234375, 0.149749755859375, 0.23797607421875, 0.326202392578125, 0.4144287109375, 0.502655029296875, 0.59088134765625, 0.679107666015625, 0.767333984375, 0.855560302734375, 0.94378662109375, 1.032012939453125, 1.1202392578125, 1.208465576171875, 1.29669189453125, 1.384918212890625, 1.47314453125, 1.561370849609375, 1.64959716796875, 1.737823486328125, 1.8260498046875, 1.914276123046875, 2.00250244140625, 2.090728759765625, 2.178955078125, 2.267181396484375, 2.35540771484375, 2.443634033203125, 2.5318603515625, 2.620086669921875, 2.70831298828125, 2.796539306640625, 2.884765625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 16.0, 20.0, 23.0, 27.0, 71.0, 72.0, 82.0, 137.0, 203.0, 307.0, 480.0, 829.0, 1449.0, 2613.0, 4626.0, 8957.0, 17850.0, 35473.0, 77356.0, 184494.0, 496548.0, 1182247.0, 1251447.0, 557067.0, 207864.0, 85490.0, 38688.0, 18746.0, 9659.0, 4893.0, 2701.0, 1552.0, 861.0, 536.0, 294.0, 206.0, 120.0, 80.0, 62.0, 41.0, 18.0, 29.0, 15.0, 14.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3984375, -3.285369873046875, -3.17230224609375, -3.059234619140625, -2.9461669921875, -2.833099365234375, -2.72003173828125, -2.606964111328125, -2.493896484375, -2.380828857421875, -2.26776123046875, -2.154693603515625, -2.0416259765625, -1.928558349609375, -1.81549072265625, -1.702423095703125, -1.58935546875, -1.476287841796875, -1.36322021484375, -1.250152587890625, -1.1370849609375, -1.024017333984375, -0.91094970703125, -0.797882080078125, -0.684814453125, -0.571746826171875, -0.45867919921875, -0.345611572265625, -0.2325439453125, -0.119476318359375, -0.00640869140625, 0.106658935546875, 0.2197265625, 0.332794189453125, 0.44586181640625, 0.558929443359375, 0.6719970703125, 0.785064697265625, 0.89813232421875, 1.011199951171875, 1.124267578125, 1.237335205078125, 1.35040283203125, 1.463470458984375, 1.5765380859375, 1.689605712890625, 1.80267333984375, 1.915740966796875, 2.02880859375, 2.141876220703125, 2.25494384765625, 2.368011474609375, 2.4810791015625, 2.594146728515625, 2.70721435546875, 2.820281982421875, 2.933349609375, 3.046417236328125, 3.15948486328125, 3.272552490234375, 3.3856201171875, 3.498687744140625, 3.61175537109375, 3.724822998046875, 3.837890625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 8.0, 7.0, 6.0, 9.0, 11.0, 14.0, 30.0, 31.0, 38.0, 62.0, 97.0, 133.0, 168.0, 223.0, 287.0, 361.0, 454.0, 451.0, 398.0, 305.0, 253.0, 194.0, 141.0, 99.0, 77.0, 57.0, 48.0, 31.0, 18.0, 20.0, 12.0, 7.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.671875, -9.41192626953125, -9.1519775390625, -8.89202880859375, -8.632080078125, -8.37213134765625, -8.1121826171875, -7.85223388671875, -7.59228515625, -7.33233642578125, -7.0723876953125, -6.81243896484375, -6.552490234375, -6.29254150390625, -6.0325927734375, -5.77264404296875, -5.5126953125, -5.25274658203125, -4.9927978515625, -4.73284912109375, -4.472900390625, -4.21295166015625, -3.9530029296875, -3.69305419921875, -3.43310546875, -3.17315673828125, -2.9132080078125, -2.65325927734375, -2.393310546875, -2.13336181640625, -1.8734130859375, -1.61346435546875, -1.353515625, -1.09356689453125, -0.8336181640625, -0.57366943359375, -0.313720703125, -0.05377197265625, 0.2061767578125, 0.46612548828125, 0.72607421875, 0.98602294921875, 1.2459716796875, 1.50592041015625, 1.765869140625, 2.02581787109375, 2.2857666015625, 2.54571533203125, 2.8056640625, 3.06561279296875, 3.3255615234375, 3.58551025390625, 3.845458984375, 4.10540771484375, 4.3653564453125, 4.62530517578125, 4.88525390625, 5.14520263671875, 5.4051513671875, 5.66510009765625, 5.925048828125, 6.18499755859375, 6.4449462890625, 6.70489501953125, 6.96484375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 5.0, 11.0, 10.0, 16.0, 22.0, 30.0, 46.0, 72.0, 74.0, 133.0, 228.0, 587.0, 1670.0, 6909.0, 54013.0, 774209.0, 3048161.0, 278297.0, 23881.0, 3925.0, 1063.0, 343.0, 205.0, 104.0, 70.0, 51.0, 47.0, 29.0, 16.0, 14.0, 11.0, 8.0, 7.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.578125, -22.00390625, -21.4296875, -20.85546875, -20.28125, -19.70703125, -19.1328125, -18.55859375, -17.984375, -17.41015625, -16.8359375, -16.26171875, -15.6875, -15.11328125, -14.5390625, -13.96484375, -13.390625, -12.81640625, -12.2421875, -11.66796875, -11.09375, -10.51953125, -9.9453125, -9.37109375, -8.796875, -8.22265625, -7.6484375, -7.07421875, -6.5, -5.92578125, -5.3515625, -4.77734375, -4.203125, -3.62890625, -3.0546875, -2.48046875, -1.90625, -1.33203125, -0.7578125, -0.18359375, 0.390625, 0.96484375, 1.5390625, 2.11328125, 2.6875, 3.26171875, 3.8359375, 4.41015625, 4.984375, 5.55859375, 6.1328125, 6.70703125, 7.28125, 7.85546875, 8.4296875, 9.00390625, 9.578125, 10.15234375, 10.7265625, 11.30078125, 11.875, 12.44921875, 13.0234375, 13.59765625, 14.171875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 20.0, 69.0, 121.0, 189.0, 226.0, 184.0, 124.0, 54.0, 10.0, 9.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-143.73486328125, -140.88414001464844, -138.03343200683594, -135.18270874023438, -132.3319854736328, -129.4812774658203, -126.63055419921875, -123.77983093261719, -120.92911529541016, -118.07839965820312, -115.22767639160156, -112.37696075439453, -109.5262451171875, -106.67552185058594, -103.8248062133789, -100.97409057617188, -98.12336730957031, -95.27265167236328, -92.42192840576172, -89.57121276855469, -86.72048950195312, -83.8697738647461, -81.01905822753906, -78.1683349609375, -75.31761932373047, -72.46690368652344, -69.61618041992188, -66.76546478271484, -63.91474533081055, -61.06402587890625, -58.21331024169922, -55.36259078979492, -52.511863708496094, -49.6611442565918, -46.8104248046875, -43.95970916748047, -41.10898971557617, -38.258270263671875, -35.407554626464844, -32.55683517456055, -29.70611572265625, -26.855396270751953, -24.00467872619629, -21.153961181640625, -18.303241729736328, -15.452523231506348, -12.601804733276367, -9.751087188720703, -6.900367736816406, -4.049649238586426, -1.1989307403564453, 1.6517877578735352, 4.502506256103516, 7.353224754333496, 10.203943252563477, 13.05466079711914, 15.905380249023438, 18.756099700927734, 21.6068172454834, 24.457534790039062, 27.30825424194336, 30.158973693847656, 33.00968933105469, 35.860408782958984, 38.71112823486328]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 3.0, 6.0, 7.0, 12.0, 6.0, 11.0, 20.0, 17.0, 20.0, 19.0, 16.0, 38.0, 22.0, 32.0, 36.0, 34.0, 44.0, 48.0, 53.0, 45.0, 46.0, 48.0, 46.0, 37.0, 32.0, 49.0, 30.0, 36.0, 27.0, 30.0, 24.0, 17.0, 17.0, 14.0, 16.0, 12.0, 10.0, 7.0, 9.0, 2.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.827207565307617, -28.90460777282715, -27.982009887695312, -27.059410095214844, -26.136810302734375, -25.21421241760254, -24.29161262512207, -23.369014739990234, -22.446414947509766, -21.523815155029297, -20.60121726989746, -19.678617477416992, -18.756019592285156, -17.833419799804688, -16.91082000732422, -15.988221168518066, -15.065622329711914, -14.143023490905762, -13.22042465209961, -12.29782485961914, -11.375226020812988, -10.452627182006836, -9.530027389526367, -8.607428550720215, -7.6848297119140625, -6.76223087310791, -5.8396315574646, -4.917032241821289, -3.9944334030151367, -3.0718345642089844, -2.149235248565674, -1.2266359329223633, -0.30403900146484375, 0.6185600757598877, 1.5411591529846191, 2.4637582302093506, 3.386357307434082, 4.308956146240234, 5.231555461883545, 6.1541547775268555, 7.076753616333008, 7.99935245513916, 8.921951293945312, 9.844551086425781, 10.767149925231934, 11.689748764038086, 12.612348556518555, 13.534947395324707, 14.45754623413086, 15.380145072937012, 16.302743911743164, 17.225343704223633, 18.14794158935547, 19.070541381835938, 19.993141174316406, 20.915740966796875, 21.83833885192871, 22.76093864440918, 23.683536529541016, 24.606136322021484, 25.528736114501953, 26.45133399963379, 27.373933792114258, 28.296531677246094, 29.219131469726562]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 6.0, 3.0, 5.0, 6.0, 8.0, 6.0, 6.0, 6.0, 14.0, 11.0, 15.0, 17.0, 17.0, 26.0, 31.0, 30.0, 22.0, 24.0, 28.0, 37.0, 46.0, 35.0, 37.0, 34.0, 40.0, 39.0, 40.0, 30.0, 44.0, 45.0, 43.0, 37.0, 28.0, 23.0, 33.0, 18.0, 24.0, 17.0, 13.0, 14.0, 8.0, 7.0, 7.0, 9.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0], "bins": [-3.08203125, -2.992523193359375, -2.90301513671875, -2.813507080078125, -2.7239990234375, -2.634490966796875, -2.54498291015625, -2.455474853515625, -2.365966796875, -2.276458740234375, -2.18695068359375, -2.097442626953125, -2.0079345703125, -1.918426513671875, -1.82891845703125, -1.739410400390625, -1.64990234375, -1.560394287109375, -1.47088623046875, -1.381378173828125, -1.2918701171875, -1.202362060546875, -1.11285400390625, -1.023345947265625, -0.933837890625, -0.844329833984375, -0.75482177734375, -0.665313720703125, -0.5758056640625, -0.486297607421875, -0.39678955078125, -0.307281494140625, -0.2177734375, -0.128265380859375, -0.03875732421875, 0.050750732421875, 0.1402587890625, 0.229766845703125, 0.31927490234375, 0.408782958984375, 0.498291015625, 0.587799072265625, 0.67730712890625, 0.766815185546875, 0.8563232421875, 0.945831298828125, 1.03533935546875, 1.124847412109375, 1.21435546875, 1.303863525390625, 1.39337158203125, 1.482879638671875, 1.5723876953125, 1.661895751953125, 1.75140380859375, 1.840911865234375, 1.930419921875, 2.019927978515625, 2.10943603515625, 2.198944091796875, 2.2884521484375, 2.377960205078125, 2.46746826171875, 2.556976318359375, 2.646484375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 4.0, 7.0, 6.0, 16.0, 25.0, 35.0, 50.0, 67.0, 115.0, 157.0, 269.0, 462.0, 752.0, 1348.0, 2663.0, 4834.0, 9997.0, 20850.0, 44922.0, 94461.0, 191720.0, 283800.0, 200282.0, 100493.0, 47251.0, 22005.0, 10651.0, 5167.0, 2670.0, 1414.0, 769.0, 487.0, 288.0, 177.0, 123.0, 71.0, 44.0, 32.0, 22.0, 15.0, 13.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5966796875, -0.578887939453125, -0.56109619140625, -0.543304443359375, -0.5255126953125, -0.507720947265625, -0.48992919921875, -0.472137451171875, -0.454345703125, -0.436553955078125, -0.41876220703125, -0.400970458984375, -0.3831787109375, -0.365386962890625, -0.34759521484375, -0.329803466796875, -0.31201171875, -0.294219970703125, -0.27642822265625, -0.258636474609375, -0.2408447265625, -0.223052978515625, -0.20526123046875, -0.187469482421875, -0.169677734375, -0.151885986328125, -0.13409423828125, -0.116302490234375, -0.0985107421875, -0.080718994140625, -0.06292724609375, -0.045135498046875, -0.02734375, -0.009552001953125, 0.00823974609375, 0.026031494140625, 0.0438232421875, 0.061614990234375, 0.07940673828125, 0.097198486328125, 0.114990234375, 0.132781982421875, 0.15057373046875, 0.168365478515625, 0.1861572265625, 0.203948974609375, 0.22174072265625, 0.239532470703125, 0.25732421875, 0.275115966796875, 0.29290771484375, 0.310699462890625, 0.3284912109375, 0.346282958984375, 0.36407470703125, 0.381866455078125, 0.399658203125, 0.417449951171875, 0.43524169921875, 0.453033447265625, 0.4708251953125, 0.488616943359375, 0.50640869140625, 0.524200439453125, 0.5419921875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 11.0, 7.0, 8.0, 8.0, 14.0, 13.0, 14.0, 11.0, 14.0, 22.0, 20.0, 26.0, 35.0, 32.0, 31.0, 31.0, 40.0, 40.0, 41.0, 41.0, 1058.0, 37.0, 42.0, 33.0, 43.0, 26.0, 38.0, 43.0, 28.0, 29.0, 36.0, 26.0, 22.0, 22.0, 11.0, 13.0, 13.0, 7.0, 14.0, 3.0, 4.0, 3.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-2.072265625, -2.013580322265625, -1.95489501953125, -1.896209716796875, -1.8375244140625, -1.778839111328125, -1.72015380859375, -1.661468505859375, -1.602783203125, -1.544097900390625, -1.48541259765625, -1.426727294921875, -1.3680419921875, -1.309356689453125, -1.25067138671875, -1.191986083984375, -1.13330078125, -1.074615478515625, -1.01593017578125, -0.957244873046875, -0.8985595703125, -0.839874267578125, -0.78118896484375, -0.722503662109375, -0.663818359375, -0.605133056640625, -0.54644775390625, -0.487762451171875, -0.4290771484375, -0.370391845703125, -0.31170654296875, -0.253021240234375, -0.1943359375, -0.135650634765625, -0.07696533203125, -0.018280029296875, 0.0404052734375, 0.099090576171875, 0.15777587890625, 0.216461181640625, 0.275146484375, 0.333831787109375, 0.39251708984375, 0.451202392578125, 0.5098876953125, 0.568572998046875, 0.62725830078125, 0.685943603515625, 0.74462890625, 0.803314208984375, 0.86199951171875, 0.920684814453125, 0.9793701171875, 1.038055419921875, 1.09674072265625, 1.155426025390625, 1.214111328125, 1.272796630859375, 1.33148193359375, 1.390167236328125, 1.4488525390625, 1.507537841796875, 1.56622314453125, 1.624908447265625, 1.68359375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 16.0, 17.0, 27.0, 33.0, 71.0, 102.0, 157.0, 213.0, 298.0, 535.0, 750.0, 1181.0, 1746.0, 2607.0, 4157.0, 6378.0, 10081.0, 15378.0, 24318.0, 37077.0, 56205.0, 82852.0, 120236.0, 315583.0, 994387.0, 140391.0, 94765.0, 64685.0, 42767.0, 28185.0, 18453.0, 11744.0, 7633.0, 4930.0, 3133.0, 2038.0, 1331.0, 900.0, 555.0, 402.0, 285.0, 160.0, 125.0, 81.0, 51.0, 34.0, 29.0, 20.0, 15.0, 9.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1768798828125, -0.1712055206298828, -0.16553115844726562, -0.15985679626464844, -0.15418243408203125, -0.14850807189941406, -0.14283370971679688, -0.1371593475341797, -0.1314849853515625, -0.1258106231689453, -0.12013626098632812, -0.11446189880371094, -0.10878753662109375, -0.10311317443847656, -0.09743881225585938, -0.09176445007324219, -0.086090087890625, -0.08041572570800781, -0.07474136352539062, -0.06906700134277344, -0.06339263916015625, -0.05771827697753906, -0.052043914794921875, -0.04636955261230469, -0.0406951904296875, -0.03502082824707031, -0.029346466064453125, -0.023672103881835938, -0.01799774169921875, -0.012323379516601562, -0.006649017333984375, -0.0009746551513671875, 0.00469970703125, 0.010374069213867188, 0.016048431396484375, 0.021722793579101562, 0.02739715576171875, 0.03307151794433594, 0.038745880126953125, 0.04442024230957031, 0.0500946044921875, 0.05576896667480469, 0.061443328857421875, 0.06711769104003906, 0.07279205322265625, 0.07846641540527344, 0.08414077758789062, 0.08981513977050781, 0.095489501953125, 0.10116386413574219, 0.10683822631835938, 0.11251258850097656, 0.11818695068359375, 0.12386131286621094, 0.12953567504882812, 0.1352100372314453, 0.1408843994140625, 0.1465587615966797, 0.15223312377929688, 0.15790748596191406, 0.16358184814453125, 0.16925621032714844, 0.17493057250976562, 0.1806049346923828, 0.186279296875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 8.0, 5.0, 9.0, 10.0, 14.0, 18.0, 28.0, 39.0, 34.0, 74.0, 93.0, 141.0, 124.0, 103.0, 91.0, 45.0, 37.0, 24.0, 26.0, 13.0, 10.0, 16.0, 9.0, 9.0, 9.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062408447265625, -0.06041383743286133, -0.058419227600097656, -0.056424617767333984, -0.05443000793457031, -0.05243539810180664, -0.05044078826904297, -0.0484461784362793, -0.046451568603515625, -0.04445695877075195, -0.04246234893798828, -0.04046773910522461, -0.03847312927246094, -0.036478519439697266, -0.034483909606933594, -0.03248929977416992, -0.03049468994140625, -0.028500080108642578, -0.026505470275878906, -0.024510860443115234, -0.022516250610351562, -0.02052164077758789, -0.01852703094482422, -0.016532421112060547, -0.014537811279296875, -0.012543201446533203, -0.010548591613769531, -0.00855398178100586, -0.0065593719482421875, -0.004564762115478516, -0.0025701522827148438, -0.0005755424499511719, 0.0014190673828125, 0.003413677215576172, 0.005408287048339844, 0.007402896881103516, 0.009397506713867188, 0.01139211654663086, 0.013386726379394531, 0.015381336212158203, 0.017375946044921875, 0.019370555877685547, 0.02136516571044922, 0.02335977554321289, 0.025354385375976562, 0.027348995208740234, 0.029343605041503906, 0.03133821487426758, 0.03333282470703125, 0.03532743453979492, 0.037322044372558594, 0.039316654205322266, 0.04131126403808594, 0.04330587387084961, 0.04530048370361328, 0.04729509353637695, 0.049289703369140625, 0.0512843132019043, 0.05327892303466797, 0.05527353286743164, 0.05726814270019531, 0.059262752532958984, 0.061257362365722656, 0.06325197219848633, 0.06524658203125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 9.0, 6.0, 6.0, 17.0, 14.0, 18.0, 26.0, 27.0, 48.0, 75.0, 87.0, 167.0, 455.0, 1630.0, 16537.0, 1000254.0, 26140.0, 1991.0, 489.0, 196.0, 92.0, 108.0, 49.0, 29.0, 24.0, 13.0, 9.0, 13.0, 8.0, 4.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9736328125, -0.9437332153320312, -0.9138336181640625, -0.8839340209960938, -0.854034423828125, -0.8241348266601562, -0.7942352294921875, -0.7643356323242188, -0.73443603515625, -0.7045364379882812, -0.6746368408203125, -0.6447372436523438, -0.614837646484375, -0.5849380493164062, -0.5550384521484375, -0.5251388549804688, -0.4952392578125, -0.46533966064453125, -0.4354400634765625, -0.40554046630859375, -0.375640869140625, -0.34574127197265625, -0.3158416748046875, -0.28594207763671875, -0.25604248046875, -0.22614288330078125, -0.1962432861328125, -0.16634368896484375, -0.136444091796875, -0.10654449462890625, -0.0766448974609375, -0.04674530029296875, -0.016845703125, 0.01305389404296875, 0.0429534912109375, 0.07285308837890625, 0.102752685546875, 0.13265228271484375, 0.1625518798828125, 0.19245147705078125, 0.22235107421875, 0.25225067138671875, 0.2821502685546875, 0.31204986572265625, 0.341949462890625, 0.37184906005859375, 0.4017486572265625, 0.43164825439453125, 0.4615478515625, 0.49144744873046875, 0.5213470458984375, 0.5512466430664062, 0.581146240234375, 0.6110458374023438, 0.6409454345703125, 0.6708450317382812, 0.70074462890625, 0.7306442260742188, 0.7605438232421875, 0.7904434204101562, 0.820343017578125, 0.8502426147460938, 0.8801422119140625, 0.9100418090820312, 0.93994140625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 10.0, 18.0, 50.0, 201.0, 554.0, 132.0, 28.0, 10.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6166738271713257, -0.6017930507659912, -0.5869122743606567, -0.5720314383506775, -0.557150661945343, -0.5422698855400085, -0.5273891091346741, -0.5125083327293396, -0.49762752652168274, -0.48274675011634827, -0.4678659439086914, -0.45298516750335693, -0.4381043612957001, -0.4232235848903656, -0.40834277868270874, -0.39346200227737427, -0.3785812258720398, -0.3637004494667053, -0.34881964325904846, -0.333938866853714, -0.31905806064605713, -0.30417728424072266, -0.2892965078353882, -0.2744157016277313, -0.25953489542007446, -0.2446541041135788, -0.22977331280708313, -0.21489253640174866, -0.200011745095253, -0.18513095378875732, -0.17025016248226166, -0.155369371175766, -0.14048859477043152, -0.12560780346393585, -0.11072701960802078, -0.09584622830152512, -0.08096544444561005, -0.06608465313911438, -0.05120386183261871, -0.036323077976703644, -0.021442286670207977, -0.006561498157680035, 0.008319290354847908, 0.023200079798698425, 0.03808086737990379, 0.05296165496110916, 0.06784244626760483, 0.0827232301235199, 0.09760402143001556, 0.11248481273651123, 0.1273656040430069, 0.14224639534950256, 0.15712717175483704, 0.1720079630613327, 0.18688875436782837, 0.20176953077316284, 0.2166503369808197, 0.23153112828731537, 0.24641191959381104, 0.2612926959991455, 0.27617350220680237, 0.29105427861213684, 0.3059350848197937, 0.3208158612251282, 0.33569663763046265]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 4.0, 4.0, 5.0, 12.0, 13.0, 12.0, 8.0, 12.0, 20.0, 15.0, 20.0, 18.0, 32.0, 30.0, 27.0, 26.0, 28.0, 30.0, 34.0, 34.0, 34.0, 46.0, 36.0, 44.0, 31.0, 34.0, 39.0, 29.0, 35.0, 31.0, 27.0, 30.0, 26.0, 15.0, 21.0, 16.0, 22.0, 13.0, 11.0, 14.0, 12.0, 7.0, 8.0, 8.0, 6.0, 6.0, 3.0, 2.0, 3.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.08392399549484253, -0.08129259943962097, -0.07866121083498001, -0.07602982223033905, -0.07339842617511749, -0.07076703011989594, -0.06813564151525497, -0.06550425291061401, -0.06287285685539246, -0.0602414645254612, -0.05761007219552994, -0.05497867986559868, -0.05234728753566742, -0.04971589520573616, -0.0470845028758049, -0.04445311054587364, -0.04182171821594238, -0.039190325886011124, -0.036558933556079865, -0.033927541226148605, -0.031296148896217346, -0.028664756566286087, -0.026033364236354828, -0.02340197190642357, -0.02077057957649231, -0.01813918724656105, -0.015507794916629791, -0.012876402586698532, -0.010245010256767273, -0.007613617926836014, -0.004982225596904755, -0.0023508332669734955, 0.00028055906295776367, 0.002911951392889023, 0.005543343722820282, 0.008174736052751541, 0.0108061283826828, 0.01343752071261406, 0.01606891304254532, 0.018700305372476578, 0.021331697702407837, 0.023963090032339096, 0.026594482362270355, 0.029225874692201614, 0.031857267022132874, 0.03448865935206413, 0.03712005168199539, 0.03975144401192665, 0.04238283634185791, 0.04501422867178917, 0.04764562100172043, 0.05027701333165169, 0.05290840566158295, 0.055539797991514206, 0.058171190321445465, 0.060802582651376724, 0.06343397498130798, 0.06606537103652954, 0.0686967596411705, 0.07132814824581146, 0.07395954430103302, 0.07659094035625458, 0.07922232896089554, 0.0818537175655365, 0.08448511362075806]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 6.0, 3.0, 5.0, 6.0, 8.0, 6.0, 6.0, 7.0, 13.0, 12.0, 14.0, 17.0, 18.0, 25.0, 30.0, 33.0, 20.0, 24.0, 27.0, 39.0, 46.0, 36.0, 34.0, 35.0, 39.0, 44.0, 36.0, 29.0, 44.0, 51.0, 39.0, 36.0, 28.0, 26.0, 30.0, 18.0, 24.0, 17.0, 12.0, 16.0, 7.0, 6.0, 8.0, 9.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0], "bins": [-3.08203125, -2.99249267578125, -2.9029541015625, -2.81341552734375, -2.723876953125, -2.63433837890625, -2.5447998046875, -2.45526123046875, -2.36572265625, -2.27618408203125, -2.1866455078125, -2.09710693359375, -2.007568359375, -1.91802978515625, -1.8284912109375, -1.73895263671875, -1.6494140625, -1.55987548828125, -1.4703369140625, -1.38079833984375, -1.291259765625, -1.20172119140625, -1.1121826171875, -1.02264404296875, -0.93310546875, -0.84356689453125, -0.7540283203125, -0.66448974609375, -0.574951171875, -0.48541259765625, -0.3958740234375, -0.30633544921875, -0.216796875, -0.12725830078125, -0.0377197265625, 0.05181884765625, 0.141357421875, 0.23089599609375, 0.3204345703125, 0.40997314453125, 0.49951171875, 0.58905029296875, 0.6785888671875, 0.76812744140625, 0.857666015625, 0.94720458984375, 1.0367431640625, 1.12628173828125, 1.2158203125, 1.30535888671875, 1.3948974609375, 1.48443603515625, 1.573974609375, 1.66351318359375, 1.7530517578125, 1.84259033203125, 1.93212890625, 2.02166748046875, 2.1112060546875, 2.20074462890625, 2.290283203125, 2.37982177734375, 2.4693603515625, 2.55889892578125, 2.6484375]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 7.0, 8.0, 25.0, 23.0, 32.0, 38.0, 79.0, 94.0, 136.0, 208.0, 263.0, 401.0, 583.0, 847.0, 1246.0, 1906.0, 2927.0, 4847.0, 8974.0, 17122.0, 37591.0, 93770.0, 266215.0, 365524.0, 141602.0, 53153.0, 23090.0, 11276.0, 6156.0, 3620.0, 2297.0, 1422.0, 965.0, 626.0, 424.0, 295.0, 232.0, 155.0, 115.0, 76.0, 55.0, 38.0, 19.0, 28.0, 13.0, 10.0, 10.0, 6.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.501953125, -2.416259765625, -2.33056640625, -2.244873046875, -2.1591796875, -2.073486328125, -1.98779296875, -1.902099609375, -1.81640625, -1.730712890625, -1.64501953125, -1.559326171875, -1.4736328125, -1.387939453125, -1.30224609375, -1.216552734375, -1.130859375, -1.045166015625, -0.95947265625, -0.873779296875, -0.7880859375, -0.702392578125, -0.61669921875, -0.531005859375, -0.4453125, -0.359619140625, -0.27392578125, -0.188232421875, -0.1025390625, -0.016845703125, 0.06884765625, 0.154541015625, 0.240234375, 0.325927734375, 0.41162109375, 0.497314453125, 0.5830078125, 0.668701171875, 0.75439453125, 0.840087890625, 0.92578125, 1.011474609375, 1.09716796875, 1.182861328125, 1.2685546875, 1.354248046875, 1.43994140625, 1.525634765625, 1.611328125, 1.697021484375, 1.78271484375, 1.868408203125, 1.9541015625, 2.039794921875, 2.12548828125, 2.211181640625, 2.296875, 2.382568359375, 2.46826171875, 2.553955078125, 2.6396484375, 2.725341796875, 2.81103515625, 2.896728515625, 2.982421875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 10.0, 8.0, 9.0, 8.0, 17.0, 19.0, 29.0, 33.0, 38.0, 37.0, 40.0, 40.0, 40.0, 66.0, 118.0, 406.0, 1567.0, 144.0, 77.0, 55.0, 46.0, 43.0, 46.0, 34.0, 22.0, 23.0, 20.0, 8.0, 13.0, 9.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.796875, -14.3494873046875, -13.902099609375, -13.4547119140625, -13.00732421875, -12.5599365234375, -12.112548828125, -11.6651611328125, -11.2177734375, -10.7703857421875, -10.322998046875, -9.8756103515625, -9.42822265625, -8.9808349609375, -8.533447265625, -8.0860595703125, -7.638671875, -7.1912841796875, -6.743896484375, -6.2965087890625, -5.84912109375, -5.4017333984375, -4.954345703125, -4.5069580078125, -4.0595703125, -3.6121826171875, -3.164794921875, -2.7174072265625, -2.27001953125, -1.8226318359375, -1.375244140625, -0.9278564453125, -0.48046875, -0.0330810546875, 0.414306640625, 0.8616943359375, 1.30908203125, 1.7564697265625, 2.203857421875, 2.6512451171875, 3.0986328125, 3.5460205078125, 3.993408203125, 4.4407958984375, 4.88818359375, 5.3355712890625, 5.782958984375, 6.2303466796875, 6.677734375, 7.1251220703125, 7.572509765625, 8.0198974609375, 8.46728515625, 8.9146728515625, 9.362060546875, 9.8094482421875, 10.2568359375, 10.7042236328125, 11.151611328125, 11.5989990234375, 12.04638671875, 12.4937744140625, 12.941162109375, 13.3885498046875, 13.8359375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 8.0, 3.0, 5.0, 11.0, 11.0, 13.0, 14.0, 21.0, 33.0, 41.0, 68.0, 92.0, 128.0, 197.0, 361.0, 918.0, 11552.0, 3021584.0, 106889.0, 2430.0, 496.0, 265.0, 157.0, 105.0, 75.0, 61.0, 46.0, 30.0, 22.0, 20.0, 14.0, 10.0, 8.0, 8.0, 4.0, 2.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.59375, -26.696044921875, -25.79833984375, -24.900634765625, -24.0029296875, -23.105224609375, -22.20751953125, -21.309814453125, -20.412109375, -19.514404296875, -18.61669921875, -17.718994140625, -16.8212890625, -15.923583984375, -15.02587890625, -14.128173828125, -13.23046875, -12.332763671875, -11.43505859375, -10.537353515625, -9.6396484375, -8.741943359375, -7.84423828125, -6.946533203125, -6.048828125, -5.151123046875, -4.25341796875, -3.355712890625, -2.4580078125, -1.560302734375, -0.66259765625, 0.235107421875, 1.1328125, 2.030517578125, 2.92822265625, 3.825927734375, 4.7236328125, 5.621337890625, 6.51904296875, 7.416748046875, 8.314453125, 9.212158203125, 10.10986328125, 11.007568359375, 11.9052734375, 12.802978515625, 13.70068359375, 14.598388671875, 15.49609375, 16.393798828125, 17.29150390625, 18.189208984375, 19.0869140625, 19.984619140625, 20.88232421875, 21.780029296875, 22.677734375, 23.575439453125, 24.47314453125, 25.370849609375, 26.2685546875, 27.166259765625, 28.06396484375, 28.961669921875, 29.859375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 112.0, 873.0, 31.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-274.7069396972656, -269.7449035644531, -264.78289794921875, -259.82086181640625, -254.8588409423828, -249.89682006835938, -244.93478393554688, -239.97276306152344, -235.0107421875, -230.04872131347656, -225.08670043945312, -220.12466430664062, -215.1626434326172, -210.20062255859375, -205.23858642578125, -200.2765655517578, -195.31454467773438, -190.35252380371094, -185.3905029296875, -180.428466796875, -175.46644592285156, -170.50442504882812, -165.54238891601562, -160.5803680419922, -155.61834716796875, -150.6563262939453, -145.69430541992188, -140.73226928710938, -135.77024841308594, -130.8082275390625, -125.84619903564453, -120.88417053222656, -115.9221420288086, -110.96011352539062, -105.99809265136719, -101.03607177734375, -96.07404327392578, -91.11201477050781, -86.14999389648438, -81.18797302246094, -76.22594451904297, -71.263916015625, -66.30189514160156, -61.33987045288086, -56.377845764160156, -51.41582107543945, -46.45379638671875, -41.49177169799805, -36.529747009277344, -31.56772232055664, -26.605697631835938, -21.643672943115234, -16.68164825439453, -11.719623565673828, -6.757598876953125, -1.7955741882324219, 3.1664505004882812, 8.128475189208984, 13.090499877929688, 18.05252456665039, 23.014549255371094, 27.976573944091797, 32.9385986328125, 37.9006233215332, 42.862648010253906]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 2.0, 4.0, 13.0, 9.0, 12.0, 20.0, 16.0, 10.0, 16.0, 20.0, 27.0, 28.0, 31.0, 32.0, 29.0, 35.0, 31.0, 55.0, 40.0, 29.0, 30.0, 39.0, 30.0, 38.0, 45.0, 31.0, 39.0, 22.0, 35.0, 24.0, 25.0, 19.0, 17.0, 25.0, 20.0, 11.0, 15.0, 9.0, 12.0, 12.0, 12.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0], "bins": [-26.7233943939209, -25.895402908325195, -25.06740951538086, -24.239418029785156, -23.411426544189453, -22.583433151245117, -21.755441665649414, -20.927448272705078, -20.099456787109375, -19.271465301513672, -18.443471908569336, -17.615480422973633, -16.787487030029297, -15.959495544433594, -15.13150405883789, -14.303511619567871, -13.475519180297852, -12.647526741027832, -11.819534301757812, -10.99154281616211, -10.16355037689209, -9.33555793762207, -8.507566452026367, -7.679574012756348, -6.851581573486328, -6.023589134216309, -5.195597171783447, -4.367605209350586, -3.5396127700805664, -2.711620330810547, -1.8836283683776855, -1.0556364059448242, -0.22764205932617188, 0.6003501415252686, 1.428342342376709, 2.2563345432281494, 3.08432674407959, 3.9123191833496094, 4.740311145782471, 5.568303108215332, 6.396295547485352, 7.224287986755371, 8.05228042602539, 8.880271911621094, 9.708264350891113, 10.536256790161133, 11.364248275756836, 12.192240715026855, 13.020233154296875, 13.848225593566895, 14.676218032836914, 15.504209518432617, 16.332202911376953, 17.160194396972656, 17.98818588256836, 18.816177368164062, 19.6441707611084, 20.4721622467041, 21.300155639648438, 22.12814712524414, 22.956138610839844, 23.78413200378418, 24.612123489379883, 25.44011688232422, 26.268108367919922]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 2.0, 6.0, 8.0, 7.0, 4.0, 4.0, 10.0, 5.0, 15.0, 14.0, 17.0, 20.0, 20.0, 28.0, 25.0, 32.0, 25.0, 27.0, 24.0, 40.0, 36.0, 49.0, 35.0, 39.0, 37.0, 42.0, 41.0, 32.0, 36.0, 36.0, 44.0, 43.0, 18.0, 30.0, 25.0, 23.0, 12.0, 21.0, 16.0, 7.0, 8.0, 9.0, 9.0, 3.0, 7.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0], "bins": [-3.12890625, -3.0364990234375, -2.944091796875, -2.8516845703125, -2.75927734375, -2.6668701171875, -2.574462890625, -2.4820556640625, -2.3896484375, -2.2972412109375, -2.204833984375, -2.1124267578125, -2.02001953125, -1.9276123046875, -1.835205078125, -1.7427978515625, -1.650390625, -1.5579833984375, -1.465576171875, -1.3731689453125, -1.28076171875, -1.1883544921875, -1.095947265625, -1.0035400390625, -0.9111328125, -0.8187255859375, -0.726318359375, -0.6339111328125, -0.54150390625, -0.4490966796875, -0.356689453125, -0.2642822265625, -0.171875, -0.0794677734375, 0.012939453125, 0.1053466796875, 0.19775390625, 0.2901611328125, 0.382568359375, 0.4749755859375, 0.5673828125, 0.6597900390625, 0.752197265625, 0.8446044921875, 0.93701171875, 1.0294189453125, 1.121826171875, 1.2142333984375, 1.306640625, 1.3990478515625, 1.491455078125, 1.5838623046875, 1.67626953125, 1.7686767578125, 1.861083984375, 1.9534912109375, 2.0458984375, 2.1383056640625, 2.230712890625, 2.3231201171875, 2.41552734375, 2.5079345703125, 2.600341796875, 2.6927490234375, 2.78515625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 8.0, 2.0, 4.0, 3.0, 5.0, 11.0, 12.0, 10.0, 15.0, 11.0, 19.0, 30.0, 42.0, 38.0, 53.0, 72.0, 91.0, 144.0, 249.0, 758.0, 2719.0, 13801.0, 106990.0, 1601750.0, 2281803.0, 160994.0, 19296.0, 3473.0, 933.0, 343.0, 159.0, 111.0, 69.0, 48.0, 48.0, 33.0, 27.0, 20.0, 22.0, 11.0, 10.0, 10.0, 12.0, 9.0, 5.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.6328125, -11.270263671875, -10.90771484375, -10.545166015625, -10.1826171875, -9.820068359375, -9.45751953125, -9.094970703125, -8.732421875, -8.369873046875, -8.00732421875, -7.644775390625, -7.2822265625, -6.919677734375, -6.55712890625, -6.194580078125, -5.83203125, -5.469482421875, -5.10693359375, -4.744384765625, -4.3818359375, -4.019287109375, -3.65673828125, -3.294189453125, -2.931640625, -2.569091796875, -2.20654296875, -1.843994140625, -1.4814453125, -1.118896484375, -0.75634765625, -0.393798828125, -0.03125, 0.331298828125, 0.69384765625, 1.056396484375, 1.4189453125, 1.781494140625, 2.14404296875, 2.506591796875, 2.869140625, 3.231689453125, 3.59423828125, 3.956787109375, 4.3193359375, 4.681884765625, 5.04443359375, 5.406982421875, 5.76953125, 6.132080078125, 6.49462890625, 6.857177734375, 7.2197265625, 7.582275390625, 7.94482421875, 8.307373046875, 8.669921875, 9.032470703125, 9.39501953125, 9.757568359375, 10.1201171875, 10.482666015625, 10.84521484375, 11.207763671875, 11.5703125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 9.0, 14.0, 14.0, 12.0, 24.0, 34.0, 51.0, 68.0, 99.0, 128.0, 170.0, 264.0, 336.0, 394.0, 507.0, 450.0, 400.0, 290.0, 199.0, 182.0, 125.0, 69.0, 70.0, 59.0, 31.0, 26.0, 18.0, 7.0, 4.0, 10.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9296875, -9.6448974609375, -9.360107421875, -9.0753173828125, -8.79052734375, -8.5057373046875, -8.220947265625, -7.9361572265625, -7.6513671875, -7.3665771484375, -7.081787109375, -6.7969970703125, -6.51220703125, -6.2274169921875, -5.942626953125, -5.6578369140625, -5.373046875, -5.0882568359375, -4.803466796875, -4.5186767578125, -4.23388671875, -3.9490966796875, -3.664306640625, -3.3795166015625, -3.0947265625, -2.8099365234375, -2.525146484375, -2.2403564453125, -1.95556640625, -1.6707763671875, -1.385986328125, -1.1011962890625, -0.81640625, -0.5316162109375, -0.246826171875, 0.0379638671875, 0.32275390625, 0.6075439453125, 0.892333984375, 1.1771240234375, 1.4619140625, 1.7467041015625, 2.031494140625, 2.3162841796875, 2.60107421875, 2.8858642578125, 3.170654296875, 3.4554443359375, 3.740234375, 4.0250244140625, 4.309814453125, 4.5946044921875, 4.87939453125, 5.1641845703125, 5.448974609375, 5.7337646484375, 6.0185546875, 6.3033447265625, 6.588134765625, 6.8729248046875, 7.15771484375, 7.4425048828125, 7.727294921875, 8.0120849609375, 8.296875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 10.0, 8.0, 10.0, 15.0, 14.0, 22.0, 41.0, 51.0, 73.0, 91.0, 132.0, 201.0, 335.0, 670.0, 2216.0, 17090.0, 361152.0, 3484113.0, 309267.0, 15004.0, 2109.0, 689.0, 327.0, 190.0, 133.0, 100.0, 63.0, 44.0, 38.0, 13.0, 18.0, 15.0, 9.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.84375, -20.11181640625, -19.3798828125, -18.64794921875, -17.916015625, -17.18408203125, -16.4521484375, -15.72021484375, -14.98828125, -14.25634765625, -13.5244140625, -12.79248046875, -12.060546875, -11.32861328125, -10.5966796875, -9.86474609375, -9.1328125, -8.40087890625, -7.6689453125, -6.93701171875, -6.205078125, -5.47314453125, -4.7412109375, -4.00927734375, -3.27734375, -2.54541015625, -1.8134765625, -1.08154296875, -0.349609375, 0.38232421875, 1.1142578125, 1.84619140625, 2.578125, 3.31005859375, 4.0419921875, 4.77392578125, 5.505859375, 6.23779296875, 6.9697265625, 7.70166015625, 8.43359375, 9.16552734375, 9.8974609375, 10.62939453125, 11.361328125, 12.09326171875, 12.8251953125, 13.55712890625, 14.2890625, 15.02099609375, 15.7529296875, 16.48486328125, 17.216796875, 17.94873046875, 18.6806640625, 19.41259765625, 20.14453125, 20.87646484375, 21.6083984375, 22.34033203125, 23.072265625, 23.80419921875, 24.5361328125, 25.26806640625, 26.0]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 19.0, 57.0, 125.0, 235.0, 257.0, 181.0, 90.0, 37.0, 10.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.6572036743164, -88.17896270751953, -84.70072174072266, -81.22248077392578, -77.74423217773438, -74.2659912109375, -70.78775024414062, -67.30950927734375, -63.831268310546875, -60.35302734375, -56.874786376953125, -53.396541595458984, -49.91830062866211, -46.440059661865234, -42.961814880371094, -39.48357391357422, -36.005332946777344, -32.52709197998047, -29.04884910583496, -25.570606231689453, -22.092365264892578, -18.614124298095703, -15.135881423950195, -11.657638549804688, -8.179397583007812, -4.701155662536621, -1.2229137420654297, 2.2553281784057617, 5.733570098876953, 9.211811065673828, 12.690053939819336, 16.168296813964844, 19.64654541015625, 23.124786376953125, 26.603029251098633, 30.08127212524414, 33.559513092041016, 37.03775405883789, 40.51599884033203, 43.994239807128906, 47.47248077392578, 50.950721740722656, 54.42896270751953, 57.90720748901367, 61.38544845581055, 64.86369323730469, 68.34193420410156, 71.82017517089844, 75.29841613769531, 78.77665710449219, 82.25489807128906, 85.73313903808594, 89.21138000488281, 92.68962097167969, 96.1678695678711, 99.64611053466797, 103.12435150146484, 106.60259246826172, 110.0808334350586, 113.55907440185547, 117.03732299804688, 120.51556396484375, 123.99380493164062, 127.4720458984375, 130.95028686523438]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 6.0, 7.0, 12.0, 17.0, 3.0, 14.0, 17.0, 16.0, 20.0, 23.0, 24.0, 40.0, 27.0, 31.0, 38.0, 34.0, 35.0, 47.0, 34.0, 38.0, 52.0, 37.0, 38.0, 39.0, 34.0, 27.0, 44.0, 32.0, 31.0, 24.0, 20.0, 23.0, 30.0, 15.0, 10.0, 13.0, 11.0, 14.0, 6.0, 2.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-28.69482421875, -27.821910858154297, -26.948997497558594, -26.07608413696289, -25.203170776367188, -24.330257415771484, -23.45734405517578, -22.584430694580078, -21.711517333984375, -20.838603973388672, -19.96569061279297, -19.092777252197266, -18.219863891601562, -17.34695053100586, -16.474037170410156, -15.601123809814453, -14.72821044921875, -13.855297088623047, -12.982383728027344, -12.10947036743164, -11.236557006835938, -10.363643646240234, -9.490730285644531, -8.617816925048828, -7.744903564453125, -6.871990203857422, -5.999076843261719, -5.126163482666016, -4.2532501220703125, -3.3803367614746094, -2.5074234008789062, -1.6345100402832031, -0.7615966796875, 0.11131668090820312, 0.9842300415039062, 1.8571434020996094, 2.7300567626953125, 3.6029701232910156, 4.475883483886719, 5.348796844482422, 6.221710205078125, 7.094623565673828, 7.967536926269531, 8.840450286865234, 9.713363647460938, 10.58627700805664, 11.459190368652344, 12.332103729248047, 13.20501708984375, 14.077930450439453, 14.950843811035156, 15.82375717163086, 16.696670532226562, 17.569583892822266, 18.44249725341797, 19.315410614013672, 20.188323974609375, 21.061237335205078, 21.93415069580078, 22.807064056396484, 23.679977416992188, 24.55289077758789, 25.425804138183594, 26.298717498779297, 27.171630859375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 5.0, 9.0, 7.0, 10.0, 6.0, 13.0, 12.0, 24.0, 26.0, 14.0, 24.0, 27.0, 31.0, 22.0, 32.0, 29.0, 31.0, 36.0, 42.0, 35.0, 34.0, 49.0, 31.0, 41.0, 44.0, 40.0, 43.0, 31.0, 27.0, 20.0, 33.0, 28.0, 17.0, 28.0, 18.0, 16.0, 8.0, 5.0, 8.0, 5.0, 9.0, 4.0, 6.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.994140625, -2.900634765625, -2.80712890625, -2.713623046875, -2.6201171875, -2.526611328125, -2.43310546875, -2.339599609375, -2.24609375, -2.152587890625, -2.05908203125, -1.965576171875, -1.8720703125, -1.778564453125, -1.68505859375, -1.591552734375, -1.498046875, -1.404541015625, -1.31103515625, -1.217529296875, -1.1240234375, -1.030517578125, -0.93701171875, -0.843505859375, -0.75, -0.656494140625, -0.56298828125, -0.469482421875, -0.3759765625, -0.282470703125, -0.18896484375, -0.095458984375, -0.001953125, 0.091552734375, 0.18505859375, 0.278564453125, 0.3720703125, 0.465576171875, 0.55908203125, 0.652587890625, 0.74609375, 0.839599609375, 0.93310546875, 1.026611328125, 1.1201171875, 1.213623046875, 1.30712890625, 1.400634765625, 1.494140625, 1.587646484375, 1.68115234375, 1.774658203125, 1.8681640625, 1.961669921875, 2.05517578125, 2.148681640625, 2.2421875, 2.335693359375, 2.42919921875, 2.522705078125, 2.6162109375, 2.709716796875, 2.80322265625, 2.896728515625, 2.990234375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 6.0, 12.0, 20.0, 23.0, 46.0, 62.0, 67.0, 132.0, 192.0, 273.0, 490.0, 724.0, 1038.0, 1684.0, 2431.0, 3821.0, 5890.0, 8892.0, 13544.0, 20294.0, 30690.0, 45944.0, 67977.0, 96976.0, 129616.0, 150398.0, 136996.0, 104977.0, 74427.0, 50746.0, 33797.0, 22628.0, 14952.0, 9888.0, 6414.0, 4332.0, 2826.0, 1837.0, 1248.0, 789.0, 468.0, 339.0, 208.0, 149.0, 92.0, 59.0, 61.0, 21.0, 26.0, 12.0, 10.0, 5.0, 6.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.3056640625, -0.296295166015625, -0.28692626953125, -0.277557373046875, -0.2681884765625, -0.258819580078125, -0.24945068359375, -0.240081787109375, -0.230712890625, -0.221343994140625, -0.21197509765625, -0.202606201171875, -0.1932373046875, -0.183868408203125, -0.17449951171875, -0.165130615234375, -0.15576171875, -0.146392822265625, -0.13702392578125, -0.127655029296875, -0.1182861328125, -0.108917236328125, -0.09954833984375, -0.090179443359375, -0.080810546875, -0.071441650390625, -0.06207275390625, -0.052703857421875, -0.0433349609375, -0.033966064453125, -0.02459716796875, -0.015228271484375, -0.005859375, 0.003509521484375, 0.01287841796875, 0.022247314453125, 0.0316162109375, 0.040985107421875, 0.05035400390625, 0.059722900390625, 0.069091796875, 0.078460693359375, 0.08782958984375, 0.097198486328125, 0.1065673828125, 0.115936279296875, 0.12530517578125, 0.134674072265625, 0.14404296875, 0.153411865234375, 0.16278076171875, 0.172149658203125, 0.1815185546875, 0.190887451171875, 0.20025634765625, 0.209625244140625, 0.218994140625, 0.228363037109375, 0.23773193359375, 0.247100830078125, 0.2564697265625, 0.265838623046875, 0.27520751953125, 0.284576416015625, 0.2939453125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 11.0, 8.0, 11.0, 14.0, 17.0, 21.0, 18.0, 21.0, 28.0, 38.0, 24.0, 24.0, 30.0, 46.0, 36.0, 37.0, 46.0, 1059.0, 49.0, 45.0, 50.0, 36.0, 38.0, 39.0, 44.0, 30.0, 31.0, 25.0, 32.0, 24.0, 16.0, 14.0, 11.0, 12.0, 13.0, 10.0, 7.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.259765625, -2.1890869140625, -2.118408203125, -2.0477294921875, -1.97705078125, -1.9063720703125, -1.835693359375, -1.7650146484375, -1.6943359375, -1.6236572265625, -1.552978515625, -1.4822998046875, -1.41162109375, -1.3409423828125, -1.270263671875, -1.1995849609375, -1.12890625, -1.0582275390625, -0.987548828125, -0.9168701171875, -0.84619140625, -0.7755126953125, -0.704833984375, -0.6341552734375, -0.5634765625, -0.4927978515625, -0.422119140625, -0.3514404296875, -0.28076171875, -0.2100830078125, -0.139404296875, -0.0687255859375, 0.001953125, 0.0726318359375, 0.143310546875, 0.2139892578125, 0.28466796875, 0.3553466796875, 0.426025390625, 0.4967041015625, 0.5673828125, 0.6380615234375, 0.708740234375, 0.7794189453125, 0.85009765625, 0.9207763671875, 0.991455078125, 1.0621337890625, 1.1328125, 1.2034912109375, 1.274169921875, 1.3448486328125, 1.41552734375, 1.4862060546875, 1.556884765625, 1.6275634765625, 1.6982421875, 1.7689208984375, 1.839599609375, 1.9102783203125, 1.98095703125, 2.0516357421875, 2.122314453125, 2.1929931640625, 2.263671875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 9.0, 15.0, 23.0, 30.0, 49.0, 72.0, 112.0, 156.0, 271.0, 390.0, 508.0, 805.0, 1242.0, 1829.0, 2831.0, 4028.0, 6219.0, 9593.0, 14400.0, 21357.0, 32800.0, 48040.0, 69927.0, 98017.0, 144973.0, 1047124.0, 228669.0, 112078.0, 80563.0, 56572.0, 38609.0, 25465.0, 17156.0, 11234.0, 7413.0, 4910.0, 3303.0, 2157.0, 1381.0, 917.0, 594.0, 424.0, 301.0, 201.0, 112.0, 85.0, 65.0, 36.0, 21.0, 27.0, 8.0, 7.0, 7.0, 1.0, 2.0], "bins": [-0.1837158203125, -0.1784229278564453, -0.17313003540039062, -0.16783714294433594, -0.16254425048828125, -0.15725135803222656, -0.15195846557617188, -0.1466655731201172, -0.1413726806640625, -0.1360797882080078, -0.13078689575195312, -0.12549400329589844, -0.12020111083984375, -0.11490821838378906, -0.10961532592773438, -0.10432243347167969, -0.099029541015625, -0.09373664855957031, -0.08844375610351562, -0.08315086364746094, -0.07785797119140625, -0.07256507873535156, -0.06727218627929688, -0.06197929382324219, -0.0566864013671875, -0.05139350891113281, -0.046100616455078125, -0.04080772399902344, -0.03551483154296875, -0.030221939086914062, -0.024929046630859375, -0.019636154174804688, -0.01434326171875, -0.009050369262695312, -0.003757476806640625, 0.0015354156494140625, 0.00682830810546875, 0.012121200561523438, 0.017414093017578125, 0.022706985473632812, 0.0279998779296875, 0.03329277038574219, 0.038585662841796875, 0.04387855529785156, 0.04917144775390625, 0.05446434020996094, 0.059757232666015625, 0.06505012512207031, 0.070343017578125, 0.07563591003417969, 0.08092880249023438, 0.08622169494628906, 0.09151458740234375, 0.09680747985839844, 0.10210037231445312, 0.10739326477050781, 0.1126861572265625, 0.11797904968261719, 0.12327194213867188, 0.12856483459472656, 0.13385772705078125, 0.13915061950683594, 0.14444351196289062, 0.1497364044189453, 0.155029296875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 3.0, 4.0, 4.0, 4.0, 10.0, 7.0, 18.0, 18.0, 16.0, 19.0, 39.0, 46.0, 46.0, 71.0, 105.0, 184.0, 101.0, 63.0, 51.0, 42.0, 26.0, 26.0, 15.0, 14.0, 19.0, 8.0, 1.0, 7.0, 3.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.058624267578125, -0.057106971740722656, -0.05558967590332031, -0.05407238006591797, -0.052555084228515625, -0.05103778839111328, -0.04952049255371094, -0.048003196716308594, -0.04648590087890625, -0.044968605041503906, -0.04345130920410156, -0.04193401336669922, -0.040416717529296875, -0.03889942169189453, -0.03738212585449219, -0.035864830017089844, -0.0343475341796875, -0.032830238342285156, -0.03131294250488281, -0.02979564666748047, -0.028278350830078125, -0.02676105499267578, -0.025243759155273438, -0.023726463317871094, -0.02220916748046875, -0.020691871643066406, -0.019174575805664062, -0.01765727996826172, -0.016139984130859375, -0.014622688293457031, -0.013105392456054688, -0.011588096618652344, -0.01007080078125, -0.008553504943847656, -0.0070362091064453125, -0.005518913269042969, -0.004001617431640625, -0.0024843215942382812, -0.0009670257568359375, 0.0005502700805664062, 0.00206756591796875, 0.0035848617553710938, 0.0051021575927734375, 0.006619453430175781, 0.008136749267578125, 0.009654045104980469, 0.011171340942382812, 0.012688636779785156, 0.0142059326171875, 0.015723228454589844, 0.017240524291992188, 0.01875782012939453, 0.020275115966796875, 0.02179241180419922, 0.023309707641601562, 0.024827003479003906, 0.02634429931640625, 0.027861595153808594, 0.029378890991210938, 0.03089618682861328, 0.032413482666015625, 0.03393077850341797, 0.03544807434082031, 0.036965370178222656, 0.038482666015625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 7.0, 4.0, 5.0, 16.0, 27.0, 24.0, 51.0, 66.0, 120.0, 246.0, 922.0, 17385.0, 1017380.0, 11001.0, 731.0, 212.0, 111.0, 62.0, 46.0, 32.0, 26.0, 14.0, 12.0, 12.0, 3.0, 6.0, 6.0, 1.0, 4.0, 4.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79345703125, -0.7622756958007812, -0.7310943603515625, -0.6999130249023438, -0.668731689453125, -0.6375503540039062, -0.6063690185546875, -0.5751876831054688, -0.54400634765625, -0.5128250122070312, -0.4816436767578125, -0.45046234130859375, -0.419281005859375, -0.38809967041015625, -0.3569183349609375, -0.32573699951171875, -0.2945556640625, -0.26337432861328125, -0.2321929931640625, -0.20101165771484375, -0.169830322265625, -0.13864898681640625, -0.1074676513671875, -0.07628631591796875, -0.04510498046875, -0.01392364501953125, 0.0172576904296875, 0.04843902587890625, 0.079620361328125, 0.11080169677734375, 0.1419830322265625, 0.17316436767578125, 0.204345703125, 0.23552703857421875, 0.2667083740234375, 0.29788970947265625, 0.329071044921875, 0.36025238037109375, 0.3914337158203125, 0.42261505126953125, 0.45379638671875, 0.48497772216796875, 0.5161590576171875, 0.5473403930664062, 0.578521728515625, 0.6097030639648438, 0.6408843994140625, 0.6720657348632812, 0.7032470703125, 0.7344284057617188, 0.7656097412109375, 0.7967910766601562, 0.827972412109375, 0.8591537475585938, 0.8903350830078125, 0.9215164184570312, 0.95269775390625, 0.9838790893554688, 1.0150604248046875, 1.0462417602539062, 1.077423095703125, 1.1086044311523438, 1.1397857666015625, 1.1709671020507812, 1.2021484375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 8.0, 18.0, 25.0, 91.0, 276.0, 455.0, 104.0, 20.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5164682865142822, -0.5065786838531494, -0.4966890811920166, -0.4867994785308838, -0.476909875869751, -0.46702027320861816, -0.45713067054748535, -0.44724106788635254, -0.4373514652252197, -0.4274618625640869, -0.4175722599029541, -0.4076826572418213, -0.3977930545806885, -0.38790345191955566, -0.37801384925842285, -0.36812424659729004, -0.3582346439361572, -0.3483450412750244, -0.3384554386138916, -0.3285658359527588, -0.318676233291626, -0.30878663063049316, -0.29889702796936035, -0.28900742530822754, -0.2791178226470947, -0.2692282199859619, -0.2593386173248291, -0.2494490146636963, -0.23955941200256348, -0.22966980934143066, -0.21978020668029785, -0.20989060401916504, -0.20000098645687103, -0.19011138379573822, -0.1802217811346054, -0.1703321784734726, -0.16044257581233978, -0.15055297315120697, -0.14066337049007416, -0.13077376782894135, -0.12088416516780853, -0.11099456250667572, -0.10110495984554291, -0.0912153571844101, -0.08132575452327728, -0.07143615186214447, -0.06154654920101166, -0.051656946539878845, -0.04176734387874603, -0.03187774121761322, -0.021988138556480408, -0.012098535895347595, -0.0022089332342147827, 0.00768066942691803, 0.017570272088050842, 0.027459874749183655, 0.03734947741031647, 0.04723908007144928, 0.05712868273258209, 0.0670182853937149, 0.07690788805484772, 0.08679749071598053, 0.09668709337711334, 0.10657669603824615, 0.11646629869937897]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 3.0, 4.0, 7.0, 4.0, 6.0, 6.0, 7.0, 7.0, 12.0, 10.0, 20.0, 26.0, 20.0, 23.0, 27.0, 30.0, 31.0, 17.0, 22.0, 34.0, 36.0, 41.0, 43.0, 28.0, 47.0, 33.0, 21.0, 40.0, 44.0, 24.0, 31.0, 31.0, 31.0, 28.0, 27.0, 21.0, 24.0, 18.0, 19.0, 28.0, 13.0, 15.0, 11.0, 4.0, 10.0, 5.0, 6.0, 3.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06097853183746338, -0.058819644153118134, -0.05666075646877289, -0.054501865059137344, -0.0523429773747921, -0.050184089690446854, -0.04802519828081131, -0.045866310596466064, -0.04370742291212082, -0.041548535227775574, -0.03938964754343033, -0.037230756133794785, -0.03507186844944954, -0.032912980765104294, -0.0307540912181139, -0.028595201671123505, -0.02643631398677826, -0.024277426302433014, -0.02211853675544262, -0.019959647208452225, -0.01780075952410698, -0.015641871839761734, -0.01348298229277134, -0.01132409367710352, -0.0091652050614357, -0.0070063164457678795, -0.0048474278301000595, -0.0026885392144322395, -0.0005296505987644196, 0.0016292380169034004, 0.0037881266325712204, 0.00594701524823904, 0.00810590386390686, 0.01026479247957468, 0.0124236810952425, 0.01458256971091032, 0.01674145832657814, 0.018900346010923386, 0.02105923555791378, 0.023218125104904175, 0.02537701278924942, 0.027535900473594666, 0.02969479002058506, 0.031853679567575455, 0.0340125672519207, 0.036171454936265945, 0.03833034634590149, 0.040489234030246735, 0.04264812171459198, 0.044807009398937225, 0.04696589708328247, 0.049124788492918015, 0.05128367617726326, 0.053442563861608505, 0.05560145527124405, 0.057760342955589294, 0.05991923063993454, 0.062078118324279785, 0.06423700600862503, 0.06639589369297028, 0.06855478882789612, 0.07071367651224136, 0.07287256419658661, 0.07503145188093185, 0.0771903395652771]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 6.0, 9.0, 7.0, 10.0, 6.0, 13.0, 10.0, 24.0, 28.0, 14.0, 23.0, 28.0, 30.0, 22.0, 30.0, 32.0, 31.0, 33.0, 44.0, 33.0, 35.0, 50.0, 31.0, 42.0, 42.0, 38.0, 46.0, 31.0, 27.0, 21.0, 33.0, 28.0, 15.0, 29.0, 19.0, 16.0, 8.0, 4.0, 9.0, 5.0, 9.0, 4.0, 6.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.998046875, -2.904510498046875, -2.81097412109375, -2.717437744140625, -2.6239013671875, -2.530364990234375, -2.43682861328125, -2.343292236328125, -2.249755859375, -2.156219482421875, -2.06268310546875, -1.969146728515625, -1.8756103515625, -1.782073974609375, -1.68853759765625, -1.595001220703125, -1.50146484375, -1.407928466796875, -1.31439208984375, -1.220855712890625, -1.1273193359375, -1.033782958984375, -0.94024658203125, -0.846710205078125, -0.753173828125, -0.659637451171875, -0.56610107421875, -0.472564697265625, -0.3790283203125, -0.285491943359375, -0.19195556640625, -0.098419189453125, -0.0048828125, 0.088653564453125, 0.18218994140625, 0.275726318359375, 0.3692626953125, 0.462799072265625, 0.55633544921875, 0.649871826171875, 0.743408203125, 0.836944580078125, 0.93048095703125, 1.024017333984375, 1.1175537109375, 1.211090087890625, 1.30462646484375, 1.398162841796875, 1.49169921875, 1.585235595703125, 1.67877197265625, 1.772308349609375, 1.8658447265625, 1.959381103515625, 2.05291748046875, 2.146453857421875, 2.239990234375, 2.333526611328125, 2.42706298828125, 2.520599365234375, 2.6141357421875, 2.707672119140625, 2.80120849609375, 2.894744873046875, 2.98828125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 13.0, 20.0, 15.0, 36.0, 50.0, 62.0, 77.0, 130.0, 184.0, 268.0, 405.0, 613.0, 1002.0, 1519.0, 2400.0, 3807.0, 6093.0, 9702.0, 15754.0, 26589.0, 47522.0, 89679.0, 185123.0, 311018.0, 161502.0, 79088.0, 42665.0, 24316.0, 14463.0, 8927.0, 5644.0, 3537.0, 2223.0, 1397.0, 918.0, 572.0, 379.0, 271.0, 177.0, 129.0, 95.0, 63.0, 32.0, 24.0, 13.0, 16.0, 7.0, 10.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.171875, -2.10687255859375, -2.0418701171875, -1.97686767578125, -1.911865234375, -1.84686279296875, -1.7818603515625, -1.71685791015625, -1.65185546875, -1.58685302734375, -1.5218505859375, -1.45684814453125, -1.391845703125, -1.32684326171875, -1.2618408203125, -1.19683837890625, -1.1318359375, -1.06683349609375, -1.0018310546875, -0.93682861328125, -0.871826171875, -0.80682373046875, -0.7418212890625, -0.67681884765625, -0.61181640625, -0.54681396484375, -0.4818115234375, -0.41680908203125, -0.351806640625, -0.28680419921875, -0.2218017578125, -0.15679931640625, -0.091796875, -0.02679443359375, 0.0382080078125, 0.10321044921875, 0.168212890625, 0.23321533203125, 0.2982177734375, 0.36322021484375, 0.42822265625, 0.49322509765625, 0.5582275390625, 0.62322998046875, 0.688232421875, 0.75323486328125, 0.8182373046875, 0.88323974609375, 0.9482421875, 1.01324462890625, 1.0782470703125, 1.14324951171875, 1.208251953125, 1.27325439453125, 1.3382568359375, 1.40325927734375, 1.46826171875, 1.53326416015625, 1.5982666015625, 1.66326904296875, 1.728271484375, 1.79327392578125, 1.8582763671875, 1.92327880859375, 1.98828125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 0.0, 2.0, 2.0, 8.0, 7.0, 8.0, 10.0, 6.0, 15.0, 15.0, 16.0, 21.0, 22.0, 32.0, 26.0, 41.0, 30.0, 30.0, 56.0, 56.0, 68.0, 149.0, 1447.0, 351.0, 132.0, 81.0, 61.0, 56.0, 32.0, 36.0, 25.0, 35.0, 27.0, 19.0, 28.0, 15.0, 16.0, 12.0, 17.0, 12.0, 4.0, 9.0, 4.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.1015625, -11.7342529296875, -11.366943359375, -10.9996337890625, -10.63232421875, -10.2650146484375, -9.897705078125, -9.5303955078125, -9.1630859375, -8.7957763671875, -8.428466796875, -8.0611572265625, -7.69384765625, -7.3265380859375, -6.959228515625, -6.5919189453125, -6.224609375, -5.8572998046875, -5.489990234375, -5.1226806640625, -4.75537109375, -4.3880615234375, -4.020751953125, -3.6534423828125, -3.2861328125, -2.9188232421875, -2.551513671875, -2.1842041015625, -1.81689453125, -1.4495849609375, -1.082275390625, -0.7149658203125, -0.34765625, 0.0196533203125, 0.386962890625, 0.7542724609375, 1.12158203125, 1.4888916015625, 1.856201171875, 2.2235107421875, 2.5908203125, 2.9581298828125, 3.325439453125, 3.6927490234375, 4.06005859375, 4.4273681640625, 4.794677734375, 5.1619873046875, 5.529296875, 5.8966064453125, 6.263916015625, 6.6312255859375, 6.99853515625, 7.3658447265625, 7.733154296875, 8.1004638671875, 8.4677734375, 8.8350830078125, 9.202392578125, 9.5697021484375, 9.93701171875, 10.3043212890625, 10.671630859375, 11.0389404296875, 11.40625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 6.0, 15.0, 18.0, 24.0, 40.0, 67.0, 82.0, 155.0, 240.0, 490.0, 1435.0, 39446.0, 3091013.0, 10754.0, 983.0, 399.0, 169.0, 131.0, 77.0, 48.0, 32.0, 31.0, 11.0, 13.0, 11.0, 3.0, 1.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.84375, -48.577880859375, -47.31201171875, -46.046142578125, -44.7802734375, -43.514404296875, -42.24853515625, -40.982666015625, -39.716796875, -38.450927734375, -37.18505859375, -35.919189453125, -34.6533203125, -33.387451171875, -32.12158203125, -30.855712890625, -29.58984375, -28.323974609375, -27.05810546875, -25.792236328125, -24.5263671875, -23.260498046875, -21.99462890625, -20.728759765625, -19.462890625, -18.197021484375, -16.93115234375, -15.665283203125, -14.3994140625, -13.133544921875, -11.86767578125, -10.601806640625, -9.3359375, -8.070068359375, -6.80419921875, -5.538330078125, -4.2724609375, -3.006591796875, -1.74072265625, -0.474853515625, 0.791015625, 2.056884765625, 3.32275390625, 4.588623046875, 5.8544921875, 7.120361328125, 8.38623046875, 9.652099609375, 10.91796875, 12.183837890625, 13.44970703125, 14.715576171875, 15.9814453125, 17.247314453125, 18.51318359375, 19.779052734375, 21.044921875, 22.310791015625, 23.57666015625, 24.842529296875, 26.1083984375, 27.374267578125, 28.64013671875, 29.906005859375, 31.171875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [21.0, 233.0, 549.0, 192.0, 20.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.597906112670898, -4.626360893249512, -1.6548161506652832, 1.3167285919189453, 4.288273811340332, 7.259819030761719, 10.231363296508789, 13.202909469604492, 16.174453735351562, 19.145998001098633, 22.117544174194336, 25.089088439941406, 28.06063461303711, 31.03217887878418, 34.00372314453125, 36.97526931762695, 39.946815490722656, 42.91836166381836, 45.8899040222168, 48.8614501953125, 51.8329963684082, 54.804542541503906, 57.776084899902344, 60.74763107299805, 63.719173431396484, 66.69071960449219, 69.66226196289062, 72.63380432128906, 75.60535430908203, 78.57689666748047, 81.54844665527344, 84.51998901367188, 87.49153900146484, 90.46308135986328, 93.43463134765625, 96.40617370605469, 99.37771606445312, 102.3492660522461, 105.32080841064453, 108.2923583984375, 111.26390075683594, 114.23544311523438, 117.20699310302734, 120.17853546142578, 123.15007781982422, 126.12162780761719, 129.09317016601562, 132.06471252441406, 135.0362548828125, 138.00779724121094, 140.97933959960938, 143.95089721679688, 146.9224395751953, 149.89398193359375, 152.8655242919922, 155.83706665039062, 158.80862426757812, 161.78016662597656, 164.751708984375, 167.7232666015625, 170.69480895996094, 173.66635131835938, 176.6378936767578, 179.60943603515625, 182.5809783935547]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 6.0, 1.0, 1.0, 4.0, 7.0, 12.0, 13.0, 20.0, 17.0, 19.0, 31.0, 23.0, 36.0, 41.0, 30.0, 51.0, 49.0, 46.0, 45.0, 36.0, 42.0, 39.0, 28.0, 35.0, 44.0, 46.0, 40.0, 30.0, 39.0, 28.0, 27.0, 23.0, 11.0, 18.0, 12.0, 19.0, 9.0, 9.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.29036331176758, -33.1875114440918, -32.08466339111328, -30.9818115234375, -29.87895965576172, -28.77610969543457, -27.673259735107422, -26.57040786743164, -25.467557907104492, -24.364707946777344, -23.261856079101562, -22.159006118774414, -21.056156158447266, -19.953304290771484, -18.850454330444336, -17.747604370117188, -16.644752502441406, -15.541901588439941, -14.439050674438477, -13.336200714111328, -12.233349800109863, -11.130498886108398, -10.02764892578125, -8.924798011779785, -7.82194709777832, -6.7190961837768555, -5.616245746612549, -4.513395309448242, -3.4105443954467773, -2.3076934814453125, -1.2048430442810059, -0.10199260711669922, 1.0008621215820312, 2.103712797164917, 3.2065634727478027, 4.309413909912109, 5.412264823913574, 6.515115737915039, 7.617966175079346, 8.720816612243652, 9.823667526245117, 10.926518440246582, 12.029369354248047, 13.132219314575195, 14.23507022857666, 15.337921142578125, 16.440771102905273, 17.543621063232422, 18.646472930908203, 19.74932289123535, 20.852174758911133, 21.95502471923828, 23.057876586914062, 24.16072654724121, 25.26357650756836, 26.36642837524414, 27.46927833557129, 28.572128295898438, 29.67498016357422, 30.777830123901367, 31.880680084228516, 32.9835319519043, 34.08638381958008, 35.189231872558594, 36.292083740234375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 9.0, 10.0, 6.0, 5.0, 9.0, 13.0, 13.0, 15.0, 25.0, 16.0, 21.0, 23.0, 38.0, 29.0, 20.0, 34.0, 27.0, 31.0, 36.0, 42.0, 39.0, 43.0, 46.0, 31.0, 34.0, 43.0, 32.0, 45.0, 30.0, 26.0, 25.0, 30.0, 29.0, 21.0, 19.0, 15.0, 14.0, 10.0, 7.0, 12.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.1484375, -3.04852294921875, -2.9486083984375, -2.84869384765625, -2.748779296875, -2.64886474609375, -2.5489501953125, -2.44903564453125, -2.34912109375, -2.24920654296875, -2.1492919921875, -2.04937744140625, -1.949462890625, -1.84954833984375, -1.7496337890625, -1.64971923828125, -1.5498046875, -1.44989013671875, -1.3499755859375, -1.25006103515625, -1.150146484375, -1.05023193359375, -0.9503173828125, -0.85040283203125, -0.75048828125, -0.65057373046875, -0.5506591796875, -0.45074462890625, -0.350830078125, -0.25091552734375, -0.1510009765625, -0.05108642578125, 0.048828125, 0.14874267578125, 0.2486572265625, 0.34857177734375, 0.448486328125, 0.54840087890625, 0.6483154296875, 0.74822998046875, 0.84814453125, 0.94805908203125, 1.0479736328125, 1.14788818359375, 1.247802734375, 1.34771728515625, 1.4476318359375, 1.54754638671875, 1.6474609375, 1.74737548828125, 1.8472900390625, 1.94720458984375, 2.047119140625, 2.14703369140625, 2.2469482421875, 2.34686279296875, 2.44677734375, 2.54669189453125, 2.6466064453125, 2.74652099609375, 2.846435546875, 2.94635009765625, 3.0462646484375, 3.14617919921875, 3.24609375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 8.0, 10.0, 14.0, 16.0, 31.0, 29.0, 45.0, 58.0, 57.0, 120.0, 148.0, 233.0, 419.0, 744.0, 1485.0, 3325.0, 7742.0, 19499.0, 52308.0, 160501.0, 576022.0, 1539903.0, 1256852.0, 396082.0, 113834.0, 38895.0, 14603.0, 6027.0, 2473.0, 1196.0, 591.0, 356.0, 227.0, 115.0, 73.0, 62.0, 53.0, 34.0, 27.0, 14.0, 12.0, 8.0, 11.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-5.09375, -4.933837890625, -4.77392578125, -4.614013671875, -4.4541015625, -4.294189453125, -4.13427734375, -3.974365234375, -3.814453125, -3.654541015625, -3.49462890625, -3.334716796875, -3.1748046875, -3.014892578125, -2.85498046875, -2.695068359375, -2.53515625, -2.375244140625, -2.21533203125, -2.055419921875, -1.8955078125, -1.735595703125, -1.57568359375, -1.415771484375, -1.255859375, -1.095947265625, -0.93603515625, -0.776123046875, -0.6162109375, -0.456298828125, -0.29638671875, -0.136474609375, 0.0234375, 0.183349609375, 0.34326171875, 0.503173828125, 0.6630859375, 0.822998046875, 0.98291015625, 1.142822265625, 1.302734375, 1.462646484375, 1.62255859375, 1.782470703125, 1.9423828125, 2.102294921875, 2.26220703125, 2.422119140625, 2.58203125, 2.741943359375, 2.90185546875, 3.061767578125, 3.2216796875, 3.381591796875, 3.54150390625, 3.701416015625, 3.861328125, 4.021240234375, 4.18115234375, 4.341064453125, 4.5009765625, 4.660888671875, 4.82080078125, 4.980712890625, 5.140625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 9.0, 17.0, 18.0, 22.0, 30.0, 41.0, 51.0, 57.0, 85.0, 114.0, 138.0, 166.0, 250.0, 364.0, 364.0, 383.0, 364.0, 320.0, 291.0, 251.0, 170.0, 127.0, 98.0, 87.0, 72.0, 41.0, 34.0, 23.0, 16.0, 16.0, 10.0, 7.0, 6.0, 8.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.4140625, -7.173583984375, -6.93310546875, -6.692626953125, -6.4521484375, -6.211669921875, -5.97119140625, -5.730712890625, -5.490234375, -5.249755859375, -5.00927734375, -4.768798828125, -4.5283203125, -4.287841796875, -4.04736328125, -3.806884765625, -3.56640625, -3.325927734375, -3.08544921875, -2.844970703125, -2.6044921875, -2.364013671875, -2.12353515625, -1.883056640625, -1.642578125, -1.402099609375, -1.16162109375, -0.921142578125, -0.6806640625, -0.440185546875, -0.19970703125, 0.040771484375, 0.28125, 0.521728515625, 0.76220703125, 1.002685546875, 1.2431640625, 1.483642578125, 1.72412109375, 1.964599609375, 2.205078125, 2.445556640625, 2.68603515625, 2.926513671875, 3.1669921875, 3.407470703125, 3.64794921875, 3.888427734375, 4.12890625, 4.369384765625, 4.60986328125, 4.850341796875, 5.0908203125, 5.331298828125, 5.57177734375, 5.812255859375, 6.052734375, 6.293212890625, 6.53369140625, 6.774169921875, 7.0146484375, 7.255126953125, 7.49560546875, 7.736083984375, 7.9765625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 0.0, 0.0, 6.0, 2.0, 5.0, 10.0, 11.0, 16.0, 18.0, 16.0, 27.0, 38.0, 59.0, 32.0, 65.0, 99.0, 142.0, 218.0, 338.0, 722.0, 2426.0, 13896.0, 138137.0, 2009092.0, 1882960.0, 128962.0, 12811.0, 2309.0, 737.0, 345.0, 209.0, 139.0, 110.0, 81.0, 63.0, 38.0, 42.0, 26.0, 20.0, 16.0, 12.0, 7.0, 4.0, 4.0, 3.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.328125, -16.786376953125, -16.24462890625, -15.702880859375, -15.1611328125, -14.619384765625, -14.07763671875, -13.535888671875, -12.994140625, -12.452392578125, -11.91064453125, -11.368896484375, -10.8271484375, -10.285400390625, -9.74365234375, -9.201904296875, -8.66015625, -8.118408203125, -7.57666015625, -7.034912109375, -6.4931640625, -5.951416015625, -5.40966796875, -4.867919921875, -4.326171875, -3.784423828125, -3.24267578125, -2.700927734375, -2.1591796875, -1.617431640625, -1.07568359375, -0.533935546875, 0.0078125, 0.549560546875, 1.09130859375, 1.633056640625, 2.1748046875, 2.716552734375, 3.25830078125, 3.800048828125, 4.341796875, 4.883544921875, 5.42529296875, 5.967041015625, 6.5087890625, 7.050537109375, 7.59228515625, 8.134033203125, 8.67578125, 9.217529296875, 9.75927734375, 10.301025390625, 10.8427734375, 11.384521484375, 11.92626953125, 12.468017578125, 13.009765625, 13.551513671875, 14.09326171875, 14.635009765625, 15.1767578125, 15.718505859375, 16.26025390625, 16.802001953125, 17.34375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 15.0, 39.0, 82.0, 128.0, 188.0, 198.0, 154.0, 119.0, 48.0, 26.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.10188293457031, -103.64897155761719, -101.1960678100586, -98.74315643310547, -96.29024505615234, -93.83733367919922, -91.38442993164062, -88.9315185546875, -86.47860717773438, -84.02569580078125, -81.57279205322266, -79.11988067626953, -76.6669692993164, -74.21405792236328, -71.76115417480469, -69.30824279785156, -66.85533142089844, -64.40242004394531, -61.94951248168945, -59.496604919433594, -57.04369354248047, -54.59078598022461, -52.13787841796875, -49.684967041015625, -47.23206329345703, -44.77915573120117, -42.32624435424805, -39.87333679199219, -37.42042541503906, -34.9675178527832, -32.514610290527344, -30.06169891357422, -27.608787536621094, -25.1558780670166, -22.70296859741211, -20.25006103515625, -17.797149658203125, -15.34424114227295, -12.891332626342773, -10.438423156738281, -7.985513687133789, -5.532604217529297, -3.079695224761963, -0.6267862319946289, 1.8261232376098633, 4.2790327072143555, 6.731941223144531, 9.184850692749023, 11.637760162353516, 14.090669631958008, 16.5435791015625, 18.99648666381836, 21.449398040771484, 23.902305603027344, 26.355215072631836, 28.808124542236328, 31.26103401184082, 33.71394348144531, 36.16685104370117, 38.6197624206543, 41.072669982910156, 43.52558135986328, 45.97848892211914, 48.431396484375, 50.884307861328125]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 7.0, 3.0, 2.0, 2.0, 9.0, 15.0, 10.0, 9.0, 13.0, 13.0, 14.0, 19.0, 24.0, 29.0, 29.0, 26.0, 31.0, 35.0, 31.0, 34.0, 35.0, 34.0, 42.0, 48.0, 40.0, 46.0, 41.0, 34.0, 40.0, 26.0, 27.0, 31.0, 25.0, 26.0, 19.0, 24.0, 24.0, 19.0, 11.0, 8.0, 9.0, 11.0, 4.0, 8.0, 6.0, 7.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-24.620132446289062, -23.839879989624023, -23.059629440307617, -22.279376983642578, -21.499126434326172, -20.718873977661133, -19.938621520996094, -19.158370971679688, -18.37811851501465, -17.59786605834961, -16.817615509033203, -16.037363052368164, -15.257111549377441, -14.476860046386719, -13.69660758972168, -12.916356086730957, -12.136104583740234, -11.355853080749512, -10.575601577758789, -9.79534912109375, -9.015097618103027, -8.234846115112305, -7.454594135284424, -6.674342155456543, -5.89409065246582, -5.113839149475098, -4.333587169647217, -3.553335428237915, -2.7730836868286133, -1.9928319454193115, -1.2125802040100098, -0.4323282241821289, 0.34792327880859375, 1.1281750202178955, 1.9084267616271973, 2.688678503036499, 3.468930244445801, 4.249181747436523, 5.029433727264404, 5.809685707092285, 6.589937210083008, 7.3701887130737305, 8.150440216064453, 8.930692672729492, 9.710944175720215, 10.491195678710938, 11.271448135375977, 12.0516996383667, 12.831951141357422, 13.612202644348145, 14.392454147338867, 15.172706604003906, 15.952958106994629, 16.73320960998535, 17.51346206665039, 18.293712615966797, 19.073965072631836, 19.854217529296875, 20.63446807861328, 21.41472053527832, 22.19497299194336, 22.975223541259766, 23.755475997924805, 24.535728454589844, 25.31597900390625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 6.0, 6.0, 6.0, 11.0, 9.0, 9.0, 20.0, 17.0, 23.0, 26.0, 24.0, 23.0, 30.0, 28.0, 27.0, 34.0, 36.0, 34.0, 38.0, 30.0, 43.0, 38.0, 47.0, 52.0, 43.0, 36.0, 28.0, 29.0, 25.0, 26.0, 20.0, 31.0, 17.0, 27.0, 15.0, 16.0, 8.0, 10.0, 11.0, 11.0, 6.0, 4.0, 1.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.158203125, -3.0555419921875, -2.952880859375, -2.8502197265625, -2.74755859375, -2.6448974609375, -2.542236328125, -2.4395751953125, -2.3369140625, -2.2342529296875, -2.131591796875, -2.0289306640625, -1.92626953125, -1.8236083984375, -1.720947265625, -1.6182861328125, -1.515625, -1.4129638671875, -1.310302734375, -1.2076416015625, -1.10498046875, -1.0023193359375, -0.899658203125, -0.7969970703125, -0.6943359375, -0.5916748046875, -0.489013671875, -0.3863525390625, -0.28369140625, -0.1810302734375, -0.078369140625, 0.0242919921875, 0.126953125, 0.2296142578125, 0.332275390625, 0.4349365234375, 0.53759765625, 0.6402587890625, 0.742919921875, 0.8455810546875, 0.9482421875, 1.0509033203125, 1.153564453125, 1.2562255859375, 1.35888671875, 1.4615478515625, 1.564208984375, 1.6668701171875, 1.76953125, 1.8721923828125, 1.974853515625, 2.0775146484375, 2.18017578125, 2.2828369140625, 2.385498046875, 2.4881591796875, 2.5908203125, 2.6934814453125, 2.796142578125, 2.8988037109375, 3.00146484375, 3.1041259765625, 3.206787109375, 3.3094482421875, 3.412109375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 13.0, 16.0, 19.0, 39.0, 40.0, 78.0, 135.0, 229.0, 426.0, 700.0, 1237.0, 2271.0, 4773.0, 9334.0, 19906.0, 40820.0, 84250.0, 164669.0, 254446.0, 221316.0, 123874.0, 61522.0, 29835.0, 14226.0, 6863.0, 3541.0, 1687.0, 969.0, 514.0, 282.0, 191.0, 113.0, 75.0, 46.0, 31.0, 24.0, 19.0, 10.0, 6.0, 1.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5009765625, -0.482269287109375, -0.46356201171875, -0.444854736328125, -0.4261474609375, -0.407440185546875, -0.38873291015625, -0.370025634765625, -0.351318359375, -0.332611083984375, -0.31390380859375, -0.295196533203125, -0.2764892578125, -0.257781982421875, -0.23907470703125, -0.220367431640625, -0.20166015625, -0.182952880859375, -0.16424560546875, -0.145538330078125, -0.1268310546875, -0.108123779296875, -0.08941650390625, -0.070709228515625, -0.052001953125, -0.033294677734375, -0.01458740234375, 0.004119873046875, 0.0228271484375, 0.041534423828125, 0.06024169921875, 0.078948974609375, 0.09765625, 0.116363525390625, 0.13507080078125, 0.153778076171875, 0.1724853515625, 0.191192626953125, 0.20989990234375, 0.228607177734375, 0.247314453125, 0.266021728515625, 0.28472900390625, 0.303436279296875, 0.3221435546875, 0.340850830078125, 0.35955810546875, 0.378265380859375, 0.39697265625, 0.415679931640625, 0.43438720703125, 0.453094482421875, 0.4718017578125, 0.490509033203125, 0.50921630859375, 0.527923583984375, 0.546630859375, 0.565338134765625, 0.58404541015625, 0.602752685546875, 0.6214599609375, 0.640167236328125, 0.65887451171875, 0.677581787109375, 0.6962890625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 8.0, 7.0, 7.0, 11.0, 16.0, 15.0, 19.0, 18.0, 17.0, 27.0, 22.0, 27.0, 25.0, 34.0, 50.0, 30.0, 30.0, 53.0, 43.0, 1074.0, 37.0, 48.0, 40.0, 40.0, 36.0, 46.0, 23.0, 33.0, 28.0, 28.0, 29.0, 12.0, 12.0, 15.0, 20.0, 9.0, 8.0, 8.0, 4.0, 4.0, 7.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.45703125, -2.38250732421875, -2.3079833984375, -2.23345947265625, -2.158935546875, -2.08441162109375, -2.0098876953125, -1.93536376953125, -1.86083984375, -1.78631591796875, -1.7117919921875, -1.63726806640625, -1.562744140625, -1.48822021484375, -1.4136962890625, -1.33917236328125, -1.2646484375, -1.19012451171875, -1.1156005859375, -1.04107666015625, -0.966552734375, -0.89202880859375, -0.8175048828125, -0.74298095703125, -0.66845703125, -0.59393310546875, -0.5194091796875, -0.44488525390625, -0.370361328125, -0.29583740234375, -0.2213134765625, -0.14678955078125, -0.072265625, 0.00225830078125, 0.0767822265625, 0.15130615234375, 0.225830078125, 0.30035400390625, 0.3748779296875, 0.44940185546875, 0.52392578125, 0.59844970703125, 0.6729736328125, 0.74749755859375, 0.822021484375, 0.89654541015625, 0.9710693359375, 1.04559326171875, 1.1201171875, 1.19464111328125, 1.2691650390625, 1.34368896484375, 1.418212890625, 1.49273681640625, 1.5672607421875, 1.64178466796875, 1.71630859375, 1.79083251953125, 1.8653564453125, 1.93988037109375, 2.014404296875, 2.08892822265625, 2.1634521484375, 2.23797607421875, 2.3125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 7.0, 6.0, 9.0, 14.0, 14.0, 24.0, 33.0, 69.0, 67.0, 111.0, 166.0, 242.0, 339.0, 508.0, 765.0, 1121.0, 1662.0, 2587.0, 3800.0, 6040.0, 9266.0, 14590.0, 22394.0, 34517.0, 52204.0, 77268.0, 108359.0, 188398.0, 1108713.0, 153778.0, 100699.0, 71538.0, 48216.0, 31375.0, 20406.0, 13217.0, 8737.0, 5534.0, 3414.0, 2269.0, 1525.0, 1024.0, 658.0, 479.0, 319.0, 227.0, 133.0, 94.0, 66.0, 44.0, 33.0, 22.0, 7.0, 12.0, 9.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0], "bins": [-0.194091796875, -0.1879100799560547, -0.18172836303710938, -0.17554664611816406, -0.16936492919921875, -0.16318321228027344, -0.15700149536132812, -0.1508197784423828, -0.1446380615234375, -0.1384563446044922, -0.13227462768554688, -0.12609291076660156, -0.11991119384765625, -0.11372947692871094, -0.10754776000976562, -0.10136604309082031, -0.095184326171875, -0.08900260925292969, -0.08282089233398438, -0.07663917541503906, -0.07045745849609375, -0.06427574157714844, -0.058094024658203125, -0.05191230773925781, -0.0457305908203125, -0.03954887390136719, -0.033367156982421875, -0.027185440063476562, -0.02100372314453125, -0.014822006225585938, -0.008640289306640625, -0.0024585723876953125, 0.00372314453125, 0.009904861450195312, 0.016086578369140625, 0.022268295288085938, 0.02845001220703125, 0.03463172912597656, 0.040813446044921875, 0.04699516296386719, 0.0531768798828125, 0.05935859680175781, 0.06554031372070312, 0.07172203063964844, 0.07790374755859375, 0.08408546447753906, 0.09026718139648438, 0.09644889831542969, 0.102630615234375, 0.10881233215332031, 0.11499404907226562, 0.12117576599121094, 0.12735748291015625, 0.13353919982910156, 0.13972091674804688, 0.1459026336669922, 0.1520843505859375, 0.1582660675048828, 0.16444778442382812, 0.17062950134277344, 0.17681121826171875, 0.18299293518066406, 0.18917465209960938, 0.1953563690185547, 0.2015380859375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 7.0, 11.0, 7.0, 16.0, 19.0, 33.0, 28.0, 40.0, 42.0, 56.0, 51.0, 45.0, 83.0, 95.0, 90.0, 50.0, 43.0, 49.0, 40.0, 37.0, 24.0, 30.0, 19.0, 14.0, 11.0, 9.0, 8.0, 2.0, 6.0, 4.0, 3.0, 2.0, 1.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.045745849609375, -0.04437875747680664, -0.04301166534423828, -0.04164457321166992, -0.04027748107910156, -0.0389103889465332, -0.037543296813964844, -0.036176204681396484, -0.034809112548828125, -0.033442020416259766, -0.032074928283691406, -0.030707836151123047, -0.029340744018554688, -0.027973651885986328, -0.02660655975341797, -0.02523946762084961, -0.02387237548828125, -0.02250528335571289, -0.02113819122314453, -0.019771099090576172, -0.018404006958007812, -0.017036914825439453, -0.015669822692871094, -0.014302730560302734, -0.012935638427734375, -0.011568546295166016, -0.010201454162597656, -0.008834362030029297, -0.0074672698974609375, -0.006100177764892578, -0.004733085632324219, -0.0033659934997558594, -0.0019989013671875, -0.0006318092346191406, 0.0007352828979492188, 0.002102375030517578, 0.0034694671630859375, 0.004836559295654297, 0.006203651428222656, 0.007570743560791016, 0.008937835693359375, 0.010304927825927734, 0.011672019958496094, 0.013039112091064453, 0.014406204223632812, 0.015773296356201172, 0.01714038848876953, 0.01850748062133789, 0.01987457275390625, 0.02124166488647461, 0.02260875701904297, 0.023975849151611328, 0.025342941284179688, 0.026710033416748047, 0.028077125549316406, 0.029444217681884766, 0.030811309814453125, 0.032178401947021484, 0.033545494079589844, 0.0349125862121582, 0.03627967834472656, 0.03764677047729492, 0.03901386260986328, 0.04038095474243164, 0.041748046875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 6.0, 3.0, 3.0, 9.0, 5.0, 12.0, 18.0, 19.0, 31.0, 39.0, 51.0, 72.0, 104.0, 218.0, 730.0, 13905.0, 1020531.0, 11473.0, 690.0, 241.0, 105.0, 62.0, 56.0, 42.0, 34.0, 22.0, 16.0, 9.0, 8.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.89599609375, -0.8666000366210938, -0.8372039794921875, -0.8078079223632812, -0.778411865234375, -0.7490158081054688, -0.7196197509765625, -0.6902236938476562, -0.66082763671875, -0.6314315795898438, -0.6020355224609375, -0.5726394653320312, -0.543243408203125, -0.5138473510742188, -0.4844512939453125, -0.45505523681640625, -0.4256591796875, -0.39626312255859375, -0.3668670654296875, -0.33747100830078125, -0.308074951171875, -0.27867889404296875, -0.2492828369140625, -0.21988677978515625, -0.19049072265625, -0.16109466552734375, -0.1316986083984375, -0.10230255126953125, -0.072906494140625, -0.04351043701171875, -0.0141143798828125, 0.01528167724609375, 0.044677734375, 0.07407379150390625, 0.1034698486328125, 0.13286590576171875, 0.162261962890625, 0.19165802001953125, 0.2210540771484375, 0.25045013427734375, 0.27984619140625, 0.30924224853515625, 0.3386383056640625, 0.36803436279296875, 0.397430419921875, 0.42682647705078125, 0.4562225341796875, 0.48561859130859375, 0.5150146484375, 0.5444107055664062, 0.5738067626953125, 0.6032028198242188, 0.632598876953125, 0.6619949340820312, 0.6913909912109375, 0.7207870483398438, 0.75018310546875, 0.7795791625976562, 0.8089752197265625, 0.8383712768554688, 0.867767333984375, 0.8971633911132812, 0.9265594482421875, 0.9559555053710938, 0.9853515625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 9.0, 12.0, 44.0, 110.0, 408.0, 345.0, 56.0, 17.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47800084948539734, -0.4684353768825531, -0.45886990427970886, -0.4493044316768646, -0.4397389888763428, -0.43017351627349854, -0.4206080436706543, -0.41104257106781006, -0.4014770984649658, -0.3919116258621216, -0.38234615325927734, -0.3727806806564331, -0.36321520805358887, -0.353649765253067, -0.3440842926502228, -0.33451882004737854, -0.3249533474445343, -0.31538787484169006, -0.3058224022388458, -0.2962569296360016, -0.28669148683547974, -0.2771260142326355, -0.26756054162979126, -0.257995069026947, -0.24842959642410278, -0.23886412382125854, -0.2292986512184143, -0.21973319351673126, -0.21016772091388702, -0.20060224831104279, -0.19103679060935974, -0.1814713180065155, -0.17190583050251007, -0.16234035789966583, -0.1527749001979828, -0.14320942759513855, -0.1336439549922943, -0.12407848238945007, -0.11451301723718643, -0.10494755208492279, -0.09538207948207855, -0.08581660687923431, -0.07625114172697067, -0.06668567657470703, -0.05712020397186279, -0.04755473509430885, -0.03798926621675491, -0.028423801064491272, -0.018858328461647034, -0.009292859584093094, 0.00027260929346084595, 0.009838078171014786, 0.019403547048568726, 0.028969015926122665, 0.038534484803676605, 0.04809994995594025, 0.057665422558784485, 0.06723089516162872, 0.07679636031389236, 0.086361825466156, 0.09592729806900024, 0.10549277067184448, 0.11505823582410812, 0.12462370097637177, 0.134189173579216]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 6.0, 5.0, 4.0, 5.0, 12.0, 7.0, 11.0, 18.0, 16.0, 18.0, 27.0, 32.0, 26.0, 36.0, 39.0, 22.0, 34.0, 31.0, 33.0, 40.0, 62.0, 48.0, 38.0, 38.0, 42.0, 27.0, 26.0, 41.0, 24.0, 29.0, 29.0, 23.0, 29.0, 25.0, 20.0, 12.0, 18.0, 7.0, 13.0, 8.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.08212399482727051, -0.07944123446941376, -0.07675846666097641, -0.07407570630311966, -0.07139293849468231, -0.06871017813682556, -0.06602741777896881, -0.06334465742111206, -0.06066188961267471, -0.057979125529527664, -0.055296361446380615, -0.052613601088523865, -0.049930837005376816, -0.04724807292222977, -0.044565312564373016, -0.04188254848122597, -0.03919978439807892, -0.03651702031493187, -0.03383425623178482, -0.03115149587392807, -0.02846873179078102, -0.025785967707633972, -0.023103205487132072, -0.020420443266630173, -0.017737679183483124, -0.01505491603165865, -0.012372152879834175, -0.0096893897280097, -0.0070066265761852264, -0.004323863424360752, -0.0016411002725362778, 0.001041661947965622, 0.003724426031112671, 0.006407189182937145, 0.00908995233476162, 0.011772715486586094, 0.014455478638410568, 0.017138242721557617, 0.019821004942059517, 0.022503767162561417, 0.025186531245708466, 0.027869295328855515, 0.030552057549357414, 0.033234819769859314, 0.03591758385300636, 0.03860034793615341, 0.04128310829401016, 0.04396587237715721, 0.04664863646030426, 0.04933140054345131, 0.05201416462659836, 0.05469692498445511, 0.05737968906760216, 0.06006245315074921, 0.06274521350860596, 0.06542797386646271, 0.06811074167490005, 0.0707935020327568, 0.07347626984119415, 0.0761590301990509, 0.07884179055690765, 0.081524558365345, 0.08420731872320175, 0.0868900865316391, 0.08957284688949585]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 7.0, 5.0, 6.0, 11.0, 8.0, 10.0, 19.0, 18.0, 23.0, 25.0, 23.0, 24.0, 30.0, 28.0, 27.0, 35.0, 33.0, 36.0, 38.0, 29.0, 45.0, 36.0, 49.0, 51.0, 40.0, 41.0, 26.0, 30.0, 25.0, 26.0, 20.0, 30.0, 16.0, 27.0, 17.0, 15.0, 9.0, 10.0, 11.0, 10.0, 7.0, 4.0, 1.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.16015625, -3.057525634765625, -2.95489501953125, -2.852264404296875, -2.7496337890625, -2.647003173828125, -2.54437255859375, -2.441741943359375, -2.339111328125, -2.236480712890625, -2.13385009765625, -2.031219482421875, -1.9285888671875, -1.825958251953125, -1.72332763671875, -1.620697021484375, -1.51806640625, -1.415435791015625, -1.31280517578125, -1.210174560546875, -1.1075439453125, -1.004913330078125, -0.90228271484375, -0.799652099609375, -0.697021484375, -0.594390869140625, -0.49176025390625, -0.389129638671875, -0.2864990234375, -0.183868408203125, -0.08123779296875, 0.021392822265625, 0.1240234375, 0.226654052734375, 0.32928466796875, 0.431915283203125, 0.5345458984375, 0.637176513671875, 0.73980712890625, 0.842437744140625, 0.945068359375, 1.047698974609375, 1.15032958984375, 1.252960205078125, 1.3555908203125, 1.458221435546875, 1.56085205078125, 1.663482666015625, 1.76611328125, 1.868743896484375, 1.97137451171875, 2.074005126953125, 2.1766357421875, 2.279266357421875, 2.38189697265625, 2.484527587890625, 2.587158203125, 2.689788818359375, 2.79241943359375, 2.895050048828125, 2.9976806640625, 3.100311279296875, 3.20294189453125, 3.305572509765625, 3.408203125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 10.0, 11.0, 21.0, 20.0, 35.0, 43.0, 67.0, 96.0, 126.0, 280.0, 444.0, 736.0, 1415.0, 2559.0, 5121.0, 10948.0, 23627.0, 52903.0, 129158.0, 346402.0, 288329.0, 103623.0, 43963.0, 19869.0, 9227.0, 4354.0, 2284.0, 1149.0, 682.0, 407.0, 236.0, 154.0, 85.0, 62.0, 33.0, 24.0, 14.0, 15.0, 4.0, 6.0, 8.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.328125, -4.20751953125, -4.0869140625, -3.96630859375, -3.845703125, -3.72509765625, -3.6044921875, -3.48388671875, -3.36328125, -3.24267578125, -3.1220703125, -3.00146484375, -2.880859375, -2.76025390625, -2.6396484375, -2.51904296875, -2.3984375, -2.27783203125, -2.1572265625, -2.03662109375, -1.916015625, -1.79541015625, -1.6748046875, -1.55419921875, -1.43359375, -1.31298828125, -1.1923828125, -1.07177734375, -0.951171875, -0.83056640625, -0.7099609375, -0.58935546875, -0.46875, -0.34814453125, -0.2275390625, -0.10693359375, 0.013671875, 0.13427734375, 0.2548828125, 0.37548828125, 0.49609375, 0.61669921875, 0.7373046875, 0.85791015625, 0.978515625, 1.09912109375, 1.2197265625, 1.34033203125, 1.4609375, 1.58154296875, 1.7021484375, 1.82275390625, 1.943359375, 2.06396484375, 2.1845703125, 2.30517578125, 2.42578125, 2.54638671875, 2.6669921875, 2.78759765625, 2.908203125, 3.02880859375, 3.1494140625, 3.27001953125, 3.390625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 4.0, 9.0, 15.0, 10.0, 13.0, 13.0, 18.0, 19.0, 30.0, 29.0, 33.0, 35.0, 38.0, 43.0, 69.0, 75.0, 133.0, 316.0, 1502.0, 140.0, 97.0, 67.0, 43.0, 43.0, 43.0, 29.0, 21.0, 27.0, 33.0, 18.0, 17.0, 16.0, 10.0, 10.0, 5.0, 2.0, 7.0, 7.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.8671875, -13.4085693359375, -12.949951171875, -12.4913330078125, -12.03271484375, -11.5740966796875, -11.115478515625, -10.6568603515625, -10.1982421875, -9.7396240234375, -9.281005859375, -8.8223876953125, -8.36376953125, -7.9051513671875, -7.446533203125, -6.9879150390625, -6.529296875, -6.0706787109375, -5.612060546875, -5.1534423828125, -4.69482421875, -4.2362060546875, -3.777587890625, -3.3189697265625, -2.8603515625, -2.4017333984375, -1.943115234375, -1.4844970703125, -1.02587890625, -0.5672607421875, -0.108642578125, 0.3499755859375, 0.80859375, 1.2672119140625, 1.725830078125, 2.1844482421875, 2.64306640625, 3.1016845703125, 3.560302734375, 4.0189208984375, 4.4775390625, 4.9361572265625, 5.394775390625, 5.8533935546875, 6.31201171875, 6.7706298828125, 7.229248046875, 7.6878662109375, 8.146484375, 8.6051025390625, 9.063720703125, 9.5223388671875, 9.98095703125, 10.4395751953125, 10.898193359375, 11.3568115234375, 11.8154296875, 12.2740478515625, 12.732666015625, 13.1912841796875, 13.64990234375, 14.1085205078125, 14.567138671875, 15.0257568359375, 15.484375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 1.0, 4.0, 13.0, 9.0, 21.0, 16.0, 35.0, 42.0, 65.0, 86.0, 118.0, 221.0, 304.0, 616.0, 2973.0, 435861.0, 2698593.0, 4833.0, 797.0, 370.0, 216.0, 177.0, 93.0, 62.0, 41.0, 40.0, 24.0, 24.0, 20.0, 4.0, 5.0, 6.0, 2.0, 1.0, 1.0, 5.0, 3.0, 0.0, 1.0, 1.0], "bins": [-52.71875, -51.404052734375, -50.08935546875, -48.774658203125, -47.4599609375, -46.145263671875, -44.83056640625, -43.515869140625, -42.201171875, -40.886474609375, -39.57177734375, -38.257080078125, -36.9423828125, -35.627685546875, -34.31298828125, -32.998291015625, -31.68359375, -30.368896484375, -29.05419921875, -27.739501953125, -26.4248046875, -25.110107421875, -23.79541015625, -22.480712890625, -21.166015625, -19.851318359375, -18.53662109375, -17.221923828125, -15.9072265625, -14.592529296875, -13.27783203125, -11.963134765625, -10.6484375, -9.333740234375, -8.01904296875, -6.704345703125, -5.3896484375, -4.074951171875, -2.76025390625, -1.445556640625, -0.130859375, 1.183837890625, 2.49853515625, 3.813232421875, 5.1279296875, 6.442626953125, 7.75732421875, 9.072021484375, 10.38671875, 11.701416015625, 13.01611328125, 14.330810546875, 15.6455078125, 16.960205078125, 18.27490234375, 19.589599609375, 20.904296875, 22.218994140625, 23.53369140625, 24.848388671875, 26.1630859375, 27.477783203125, 28.79248046875, 30.107177734375, 31.421875]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 11.0, 70.0, 464.0, 410.0, 58.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.39975357055664, -19.182167053222656, -15.964580535888672, -12.746994018554688, -9.529407501220703, -6.311820983886719, -3.0942344665527344, 0.12335205078125, 3.3409385681152344, 6.558525085449219, 9.776111602783203, 12.993698120117188, 16.211284637451172, 19.428871154785156, 22.64645767211914, 25.864044189453125, 29.08163070678711, 32.299217224121094, 35.51680374145508, 38.73439025878906, 41.95197677612305, 45.16956329345703, 48.387149810791016, 51.604736328125, 54.822322845458984, 58.03990936279297, 61.25749588012695, 64.47508239746094, 67.69267272949219, 70.9102554321289, 74.12783813476562, 77.34542846679688, 80.56301879882812, 83.78060913085938, 86.9981918334961, 90.21577453613281, 93.43336486816406, 96.65095520019531, 99.86853790283203, 103.08612060546875, 106.3037109375, 109.52130126953125, 112.73888397216797, 115.95646667480469, 119.17405700683594, 122.39164733886719, 125.6092300415039, 128.82681274414062, 132.04440307617188, 135.26199340820312, 138.47958374023438, 141.69715881347656, 144.9147491455078, 148.13233947753906, 151.34991455078125, 154.5675048828125, 157.78509521484375, 161.002685546875, 164.22027587890625, 167.43785095214844, 170.6554412841797, 173.87303161621094, 177.09060668945312, 180.30819702148438, 183.52578735351562]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 11.0, 8.0, 16.0, 8.0, 19.0, 13.0, 23.0, 27.0, 32.0, 24.0, 31.0, 30.0, 44.0, 31.0, 35.0, 42.0, 39.0, 50.0, 37.0, 44.0, 43.0, 30.0, 43.0, 43.0, 28.0, 27.0, 21.0, 24.0, 34.0, 21.0, 19.0, 20.0, 14.0, 14.0, 11.0, 6.0, 9.0, 4.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.0926456451416, -27.120649337768555, -26.14865493774414, -25.176658630371094, -24.204662322998047, -23.232666015625, -22.260669708251953, -21.28867530822754, -20.316679000854492, -19.344682693481445, -18.37268829345703, -17.400691986083984, -16.428695678710938, -15.45669937133789, -14.48470401763916, -13.51270866394043, -12.540712356567383, -11.568716049194336, -10.596720695495605, -9.624725341796875, -8.652729034423828, -7.6807332038879395, -6.708737373352051, -5.736741542816162, -4.764745712280273, -3.7927498817443848, -2.820754051208496, -1.8487582206726074, -0.8767623901367188, 0.09523344039916992, 1.0672292709350586, 2.0392251014709473, 3.0112228393554688, 3.9832186698913574, 4.955214500427246, 5.927210330963135, 6.899206161499023, 7.871201992034912, 8.8431978225708, 9.815193176269531, 10.787189483642578, 11.759185791015625, 12.731181144714355, 13.703176498413086, 14.675172805786133, 15.64716911315918, 16.619163513183594, 17.59115982055664, 18.563156127929688, 19.535152435302734, 20.50714874267578, 21.479143142700195, 22.451139450073242, 23.42313575744629, 24.395130157470703, 25.36712646484375, 26.339122772216797, 27.311119079589844, 28.28311538696289, 29.255109786987305, 30.22710609436035, 31.1991024017334, 32.17109680175781, 33.14309310913086, 34.115089416503906]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 6.0, 9.0, 14.0, 12.0, 10.0, 11.0, 18.0, 13.0, 24.0, 22.0, 30.0, 34.0, 31.0, 34.0, 43.0, 34.0, 28.0, 31.0, 26.0, 43.0, 51.0, 37.0, 52.0, 34.0, 30.0, 34.0, 40.0, 27.0, 23.0, 18.0, 24.0, 18.0, 25.0, 16.0, 17.0, 12.0, 13.0, 7.0, 8.0, 9.0, 9.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.28515625, -3.178497314453125, -3.07183837890625, -2.965179443359375, -2.8585205078125, -2.751861572265625, -2.64520263671875, -2.538543701171875, -2.431884765625, -2.325225830078125, -2.21856689453125, -2.111907958984375, -2.0052490234375, -1.898590087890625, -1.79193115234375, -1.685272216796875, -1.57861328125, -1.471954345703125, -1.36529541015625, -1.258636474609375, -1.1519775390625, -1.045318603515625, -0.93865966796875, -0.832000732421875, -0.725341796875, -0.618682861328125, -0.51202392578125, -0.405364990234375, -0.2987060546875, -0.192047119140625, -0.08538818359375, 0.021270751953125, 0.1279296875, 0.234588623046875, 0.34124755859375, 0.447906494140625, 0.5545654296875, 0.661224365234375, 0.76788330078125, 0.874542236328125, 0.981201171875, 1.087860107421875, 1.19451904296875, 1.301177978515625, 1.4078369140625, 1.514495849609375, 1.62115478515625, 1.727813720703125, 1.83447265625, 1.941131591796875, 2.04779052734375, 2.154449462890625, 2.2611083984375, 2.367767333984375, 2.47442626953125, 2.581085205078125, 2.687744140625, 2.794403076171875, 2.90106201171875, 3.007720947265625, 3.1143798828125, 3.221038818359375, 3.32769775390625, 3.434356689453125, 3.541015625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 10.0, 3.0, 12.0, 10.0, 13.0, 20.0, 13.0, 13.0, 26.0, 28.0, 33.0, 36.0, 58.0, 108.0, 227.0, 810.0, 3777.0, 28203.0, 343624.0, 2891862.0, 858717.0, 58117.0, 6624.0, 1195.0, 303.0, 130.0, 58.0, 42.0, 29.0, 30.0, 19.0, 16.0, 19.0, 13.0, 17.0, 11.0, 9.0, 5.0, 14.0, 7.0, 2.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.9765625, -11.5982666015625, -11.219970703125, -10.8416748046875, -10.46337890625, -10.0850830078125, -9.706787109375, -9.3284912109375, -8.9501953125, -8.5718994140625, -8.193603515625, -7.8153076171875, -7.43701171875, -7.0587158203125, -6.680419921875, -6.3021240234375, -5.923828125, -5.5455322265625, -5.167236328125, -4.7889404296875, -4.41064453125, -4.0323486328125, -3.654052734375, -3.2757568359375, -2.8974609375, -2.5191650390625, -2.140869140625, -1.7625732421875, -1.38427734375, -1.0059814453125, -0.627685546875, -0.2493896484375, 0.12890625, 0.5072021484375, 0.885498046875, 1.2637939453125, 1.64208984375, 2.0203857421875, 2.398681640625, 2.7769775390625, 3.1552734375, 3.5335693359375, 3.911865234375, 4.2901611328125, 4.66845703125, 5.0467529296875, 5.425048828125, 5.8033447265625, 6.181640625, 6.5599365234375, 6.938232421875, 7.3165283203125, 7.69482421875, 8.0731201171875, 8.451416015625, 8.8297119140625, 9.2080078125, 9.5863037109375, 9.964599609375, 10.3428955078125, 10.72119140625, 11.0994873046875, 11.477783203125, 11.8560791015625, 12.234375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 11.0, 17.0, 18.0, 33.0, 29.0, 48.0, 96.0, 114.0, 133.0, 193.0, 281.0, 361.0, 452.0, 469.0, 477.0, 381.0, 281.0, 188.0, 133.0, 111.0, 77.0, 45.0, 41.0, 26.0, 17.0, 14.0, 11.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5703125, -9.275634765625, -8.98095703125, -8.686279296875, -8.3916015625, -8.096923828125, -7.80224609375, -7.507568359375, -7.212890625, -6.918212890625, -6.62353515625, -6.328857421875, -6.0341796875, -5.739501953125, -5.44482421875, -5.150146484375, -4.85546875, -4.560791015625, -4.26611328125, -3.971435546875, -3.6767578125, -3.382080078125, -3.08740234375, -2.792724609375, -2.498046875, -2.203369140625, -1.90869140625, -1.614013671875, -1.3193359375, -1.024658203125, -0.72998046875, -0.435302734375, -0.140625, 0.154052734375, 0.44873046875, 0.743408203125, 1.0380859375, 1.332763671875, 1.62744140625, 1.922119140625, 2.216796875, 2.511474609375, 2.80615234375, 3.100830078125, 3.3955078125, 3.690185546875, 3.98486328125, 4.279541015625, 4.57421875, 4.868896484375, 5.16357421875, 5.458251953125, 5.7529296875, 6.047607421875, 6.34228515625, 6.636962890625, 6.931640625, 7.226318359375, 7.52099609375, 7.815673828125, 8.1103515625, 8.405029296875, 8.69970703125, 8.994384765625, 9.2890625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 7.0, 8.0, 18.0, 14.0, 25.0, 26.0, 43.0, 58.0, 60.0, 91.0, 124.0, 176.0, 273.0, 533.0, 1583.0, 8882.0, 127176.0, 2706783.0, 1287052.0, 54196.0, 4783.0, 1033.0, 447.0, 240.0, 174.0, 105.0, 101.0, 49.0, 52.0, 45.0, 42.0, 24.0, 17.0, 9.0, 7.0, 11.0, 3.0, 0.0, 0.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.8125, -19.17041015625, -18.5283203125, -17.88623046875, -17.244140625, -16.60205078125, -15.9599609375, -15.31787109375, -14.67578125, -14.03369140625, -13.3916015625, -12.74951171875, -12.107421875, -11.46533203125, -10.8232421875, -10.18115234375, -9.5390625, -8.89697265625, -8.2548828125, -7.61279296875, -6.970703125, -6.32861328125, -5.6865234375, -5.04443359375, -4.40234375, -3.76025390625, -3.1181640625, -2.47607421875, -1.833984375, -1.19189453125, -0.5498046875, 0.09228515625, 0.734375, 1.37646484375, 2.0185546875, 2.66064453125, 3.302734375, 3.94482421875, 4.5869140625, 5.22900390625, 5.87109375, 6.51318359375, 7.1552734375, 7.79736328125, 8.439453125, 9.08154296875, 9.7236328125, 10.36572265625, 11.0078125, 11.64990234375, 12.2919921875, 12.93408203125, 13.576171875, 14.21826171875, 14.8603515625, 15.50244140625, 16.14453125, 16.78662109375, 17.4287109375, 18.07080078125, 18.712890625, 19.35498046875, 19.9970703125, 20.63916015625, 21.28125]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 14.0, 156.0, 459.0, 323.0, 63.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.87850189208984, -102.39380645751953, -95.90910339355469, -89.42440795898438, -82.93970489501953, -76.45500946044922, -69.97030639648438, -63.48561096191406, -57.000911712646484, -50.516212463378906, -44.03151321411133, -37.54681396484375, -31.062116622924805, -24.57741928100586, -18.09272003173828, -11.608020782470703, -5.123321533203125, 1.361377239227295, 7.846076011657715, 14.330774307250977, 20.815473556518555, 27.3001708984375, 33.78487014770508, 40.269569396972656, 46.754268646240234, 53.23896789550781, 59.72366714477539, 66.20836639404297, 72.69306182861328, 79.17776489257812, 85.66246032714844, 92.14715576171875, 98.63185119628906, 105.11654663085938, 111.60124969482422, 118.08594512939453, 124.57064819335938, 131.0553436279297, 137.5400390625, 144.02474975585938, 150.5094451904297, 156.994140625, 163.4788360595703, 169.9635467529297, 176.4482421875, 182.9329376220703, 189.41763305664062, 195.90234375, 202.38702392578125, 208.87171936035156, 215.35641479492188, 221.84112548828125, 228.32582092285156, 234.81051635742188, 241.2952117919922, 247.7799072265625, 254.26461791992188, 260.74932861328125, 267.2340087890625, 273.7187194824219, 280.2033996582031, 286.6881103515625, 293.1728210449219, 299.6575012207031, 306.1422119140625]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 8.0, 5.0, 11.0, 9.0, 9.0, 16.0, 14.0, 18.0, 19.0, 27.0, 19.0, 28.0, 36.0, 33.0, 42.0, 36.0, 45.0, 34.0, 43.0, 46.0, 33.0, 45.0, 32.0, 34.0, 36.0, 31.0, 31.0, 34.0, 22.0, 33.0, 26.0, 23.0, 16.0, 22.0, 14.0, 11.0, 9.0, 8.0, 9.0, 8.0, 9.0, 3.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.666175842285156, -24.8515567779541, -24.036937713623047, -23.22231674194336, -22.407697677612305, -21.59307861328125, -20.778459548950195, -19.96384048461914, -19.149219512939453, -18.3346004486084, -17.519981384277344, -16.705360412597656, -15.890741348266602, -15.076122283935547, -14.261503219604492, -13.446884155273438, -12.632265090942383, -11.817646026611328, -11.003026008605957, -10.188406944274902, -9.373786926269531, -8.559167861938477, -7.744548797607422, -6.929929256439209, -6.115309715270996, -5.300690174102783, -4.48607063293457, -3.6714515686035156, -2.8568320274353027, -2.04221248626709, -1.2275934219360352, -0.41297388076782227, 0.4016456604003906, 1.216265082359314, 2.0308845043182373, 2.845503807067871, 3.660123348236084, 4.474742889404297, 5.289361953735352, 6.1039814949035645, 6.918601036071777, 7.73322057723999, 8.547840118408203, 9.362459182739258, 10.177078247070312, 10.991698265075684, 11.806317329406738, 12.62093734741211, 13.435556411743164, 14.250175476074219, 15.06479549407959, 15.879414558410645, 16.694034576416016, 17.50865364074707, 18.323272705078125, 19.13789176940918, 19.952510833740234, 20.76712989807129, 21.581748962402344, 22.39636993408203, 23.210988998413086, 24.02560806274414, 24.840227127075195, 25.65484619140625, 26.469467163085938]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 5.0, 6.0, 9.0, 4.0, 16.0, 14.0, 12.0, 10.0, 14.0, 13.0, 17.0, 20.0, 34.0, 32.0, 32.0, 27.0, 29.0, 47.0, 38.0, 40.0, 32.0, 48.0, 39.0, 43.0, 41.0, 36.0, 32.0, 37.0, 31.0, 28.0, 15.0, 33.0, 24.0, 21.0, 20.0, 17.0, 18.0, 12.0, 7.0, 10.0, 12.0, 4.0, 7.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.330078125, -3.22265625, -3.115234375, -3.0078125, -2.900390625, -2.79296875, -2.685546875, -2.578125, -2.470703125, -2.36328125, -2.255859375, -2.1484375, -2.041015625, -1.93359375, -1.826171875, -1.71875, -1.611328125, -1.50390625, -1.396484375, -1.2890625, -1.181640625, -1.07421875, -0.966796875, -0.859375, -0.751953125, -0.64453125, -0.537109375, -0.4296875, -0.322265625, -0.21484375, -0.107421875, 0.0, 0.107421875, 0.21484375, 0.322265625, 0.4296875, 0.537109375, 0.64453125, 0.751953125, 0.859375, 0.966796875, 1.07421875, 1.181640625, 1.2890625, 1.396484375, 1.50390625, 1.611328125, 1.71875, 1.826171875, 1.93359375, 2.041015625, 2.1484375, 2.255859375, 2.36328125, 2.470703125, 2.578125, 2.685546875, 2.79296875, 2.900390625, 3.0078125, 3.115234375, 3.22265625, 3.330078125, 3.4375, 3.544921875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 18.0, 21.0, 47.0, 72.0, 120.0, 193.0, 353.0, 549.0, 844.0, 1424.0, 2330.0, 3800.0, 5967.0, 9498.0, 14901.0, 23871.0, 37762.0, 58503.0, 89455.0, 129899.0, 166737.0, 159267.0, 119556.0, 80355.0, 52449.0, 33432.0, 21359.0, 13429.0, 8448.0, 5297.0, 3260.0, 2128.0, 1267.0, 780.0, 463.0, 273.0, 169.0, 111.0, 64.0, 39.0, 19.0, 14.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.399169921875, -0.3866462707519531, -0.37412261962890625, -0.3615989685058594, -0.3490753173828125, -0.3365516662597656, -0.32402801513671875, -0.3115043640136719, -0.298980712890625, -0.2864570617675781, -0.27393341064453125, -0.2614097595214844, -0.2488861083984375, -0.23636245727539062, -0.22383880615234375, -0.21131515502929688, -0.19879150390625, -0.18626785278320312, -0.17374420166015625, -0.16122055053710938, -0.1486968994140625, -0.13617324829101562, -0.12364959716796875, -0.11112594604492188, -0.098602294921875, -0.08607864379882812, -0.07355499267578125, -0.061031341552734375, -0.0485076904296875, -0.035984039306640625, -0.02346038818359375, -0.010936737060546875, 0.0015869140625, 0.014110565185546875, 0.02663421630859375, 0.039157867431640625, 0.0516815185546875, 0.06420516967773438, 0.07672882080078125, 0.08925247192382812, 0.101776123046875, 0.11429977416992188, 0.12682342529296875, 0.13934707641601562, 0.1518707275390625, 0.16439437866210938, 0.17691802978515625, 0.18944168090820312, 0.20196533203125, 0.21448898315429688, 0.22701263427734375, 0.23953628540039062, 0.2520599365234375, 0.2645835876464844, 0.27710723876953125, 0.2896308898925781, 0.302154541015625, 0.3146781921386719, 0.32720184326171875, 0.3397254943847656, 0.3522491455078125, 0.3647727966308594, 0.37729644775390625, 0.3898200988769531, 0.40234375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 4.0, 6.0, 13.0, 11.0, 13.0, 13.0, 11.0, 24.0, 23.0, 18.0, 33.0, 31.0, 29.0, 41.0, 39.0, 49.0, 33.0, 42.0, 41.0, 1073.0, 38.0, 42.0, 45.0, 35.0, 30.0, 39.0, 38.0, 33.0, 23.0, 31.0, 19.0, 20.0, 11.0, 17.0, 13.0, 7.0, 13.0, 9.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.361328125, -2.284759521484375, -2.20819091796875, -2.131622314453125, -2.0550537109375, -1.978485107421875, -1.90191650390625, -1.825347900390625, -1.748779296875, -1.672210693359375, -1.59564208984375, -1.519073486328125, -1.4425048828125, -1.365936279296875, -1.28936767578125, -1.212799072265625, -1.13623046875, -1.059661865234375, -0.98309326171875, -0.906524658203125, -0.8299560546875, -0.753387451171875, -0.67681884765625, -0.600250244140625, -0.523681640625, -0.447113037109375, -0.37054443359375, -0.293975830078125, -0.2174072265625, -0.140838623046875, -0.06427001953125, 0.012298583984375, 0.0888671875, 0.165435791015625, 0.24200439453125, 0.318572998046875, 0.3951416015625, 0.471710205078125, 0.54827880859375, 0.624847412109375, 0.701416015625, 0.777984619140625, 0.85455322265625, 0.931121826171875, 1.0076904296875, 1.084259033203125, 1.16082763671875, 1.237396240234375, 1.31396484375, 1.390533447265625, 1.46710205078125, 1.543670654296875, 1.6202392578125, 1.696807861328125, 1.77337646484375, 1.849945068359375, 1.926513671875, 2.003082275390625, 2.07965087890625, 2.156219482421875, 2.2327880859375, 2.309356689453125, 2.38592529296875, 2.462493896484375, 2.5390625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 15.0, 12.0, 39.0, 47.0, 56.0, 98.0, 148.0, 244.0, 381.0, 598.0, 930.0, 1467.0, 2290.0, 3377.0, 5472.0, 8153.0, 12880.0, 19880.0, 30100.0, 46013.0, 67563.0, 95466.0, 127210.0, 1137733.0, 181939.0, 111159.0, 80438.0, 56135.0, 37328.0, 24784.0, 16076.0, 10238.0, 6554.0, 4475.0, 2778.0, 1803.0, 1208.0, 727.0, 481.0, 327.0, 181.0, 126.0, 80.0, 49.0, 27.0, 18.0, 12.0, 10.0, 3.0, 4.0, 0.0, 1.0], "bins": [-0.2313232421875, -0.224853515625, -0.2183837890625, -0.2119140625, -0.2054443359375, -0.198974609375, -0.1925048828125, -0.18603515625, -0.1795654296875, -0.173095703125, -0.1666259765625, -0.16015625, -0.1536865234375, -0.147216796875, -0.1407470703125, -0.13427734375, -0.1278076171875, -0.121337890625, -0.1148681640625, -0.1083984375, -0.1019287109375, -0.095458984375, -0.0889892578125, -0.08251953125, -0.0760498046875, -0.069580078125, -0.0631103515625, -0.056640625, -0.0501708984375, -0.043701171875, -0.0372314453125, -0.03076171875, -0.0242919921875, -0.017822265625, -0.0113525390625, -0.0048828125, 0.0015869140625, 0.008056640625, 0.0145263671875, 0.02099609375, 0.0274658203125, 0.033935546875, 0.0404052734375, 0.046875, 0.0533447265625, 0.059814453125, 0.0662841796875, 0.07275390625, 0.0792236328125, 0.085693359375, 0.0921630859375, 0.0986328125, 0.1051025390625, 0.111572265625, 0.1180419921875, 0.12451171875, 0.1309814453125, 0.137451171875, 0.1439208984375, 0.150390625, 0.1568603515625, 0.163330078125, 0.1697998046875, 0.17626953125, 0.1827392578125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 4.0, 3.0, 3.0, 7.0, 7.0, 7.0, 10.0, 11.0, 8.0, 9.0, 21.0, 30.0, 38.0, 72.0, 96.0, 78.0, 150.0, 86.0, 101.0, 64.0, 43.0, 29.0, 29.0, 16.0, 9.0, 9.0, 7.0, 16.0, 11.0, 4.0, 2.0, 4.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0303497314453125, -0.02944183349609375, -0.028533935546875, -0.02762603759765625, -0.0267181396484375, -0.02581024169921875, -0.02490234375, -0.02399444580078125, -0.0230865478515625, -0.02217864990234375, -0.021270751953125, -0.02036285400390625, -0.0194549560546875, -0.01854705810546875, -0.01763916015625, -0.01673126220703125, -0.0158233642578125, -0.01491546630859375, -0.014007568359375, -0.01309967041015625, -0.0121917724609375, -0.01128387451171875, -0.0103759765625, -0.00946807861328125, -0.0085601806640625, -0.00765228271484375, -0.006744384765625, -0.00583648681640625, -0.0049285888671875, -0.00402069091796875, -0.00311279296875, -0.00220489501953125, -0.0012969970703125, -0.00038909912109375, 0.000518798828125, 0.00142669677734375, 0.0023345947265625, 0.00324249267578125, 0.004150390625, 0.00505828857421875, 0.0059661865234375, 0.00687408447265625, 0.007781982421875, 0.00868988037109375, 0.0095977783203125, 0.01050567626953125, 0.01141357421875, 0.01232147216796875, 0.0132293701171875, 0.01413726806640625, 0.015045166015625, 0.01595306396484375, 0.0168609619140625, 0.01776885986328125, 0.0186767578125, 0.01958465576171875, 0.0204925537109375, 0.02140045166015625, 0.022308349609375, 0.02321624755859375, 0.0241241455078125, 0.02503204345703125, 0.02593994140625, 0.02684783935546875, 0.0277557373046875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 4.0, 6.0, 11.0, 14.0, 11.0, 4.0, 16.0, 15.0, 27.0, 28.0, 47.0, 77.0, 185.0, 667.0, 36556.0, 1006964.0, 3293.0, 313.0, 102.0, 56.0, 27.0, 27.0, 14.0, 12.0, 11.0, 8.0, 6.0, 12.0, 7.0, 5.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6337890625, -0.6135177612304688, -0.5932464599609375, -0.5729751586914062, -0.552703857421875, -0.5324325561523438, -0.5121612548828125, -0.49188995361328125, -0.47161865234375, -0.45134735107421875, -0.4310760498046875, -0.41080474853515625, -0.390533447265625, -0.37026214599609375, -0.3499908447265625, -0.32971954345703125, -0.3094482421875, -0.28917694091796875, -0.2689056396484375, -0.24863433837890625, -0.228363037109375, -0.20809173583984375, -0.1878204345703125, -0.16754913330078125, -0.14727783203125, -0.12700653076171875, -0.1067352294921875, -0.08646392822265625, -0.066192626953125, -0.04592132568359375, -0.0256500244140625, -0.00537872314453125, 0.014892578125, 0.03516387939453125, 0.0554351806640625, 0.07570648193359375, 0.095977783203125, 0.11624908447265625, 0.1365203857421875, 0.15679168701171875, 0.17706298828125, 0.19733428955078125, 0.2176055908203125, 0.23787689208984375, 0.258148193359375, 0.27841949462890625, 0.2986907958984375, 0.31896209716796875, 0.3392333984375, 0.35950469970703125, 0.3797760009765625, 0.40004730224609375, 0.420318603515625, 0.44058990478515625, 0.4608612060546875, 0.48113250732421875, 0.50140380859375, 0.5216751098632812, 0.5419464111328125, 0.5622177124023438, 0.582489013671875, 0.6027603149414062, 0.6230316162109375, 0.6433029174804688, 0.66357421875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 17.0, 25.0, 38.0, 62.0, 176.0, 412.0, 164.0, 67.0, 24.0, 8.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18517185747623444, -0.18128155171871185, -0.17739124596118927, -0.1735009402036667, -0.1696106344461441, -0.16572032868862152, -0.16183002293109894, -0.15793973207473755, -0.15404942631721497, -0.15015912055969238, -0.1462688148021698, -0.14237850904464722, -0.13848820328712463, -0.13459789752960205, -0.13070759177207947, -0.12681728601455688, -0.1229269802570343, -0.11903667449951172, -0.11514636874198914, -0.11125606298446655, -0.10736575722694397, -0.10347545146942139, -0.0995851531624794, -0.09569484740495682, -0.09180454164743423, -0.08791423588991165, -0.08402393013238907, -0.08013362437486649, -0.0762433260679245, -0.07235302031040192, -0.06846271455287933, -0.06457240879535675, -0.06068210303783417, -0.056791797280311584, -0.052901491522789, -0.04901118949055672, -0.045120883733034134, -0.04123057797551155, -0.037340275943279266, -0.03344997018575668, -0.0295596644282341, -0.025669358670711517, -0.021779054775834084, -0.01788875088095665, -0.013998445123434067, -0.010108139365911484, -0.00621783547103405, -0.002327531576156616, 0.0015627741813659668, 0.005453079007565975, 0.009343383833765984, 0.013233688659965992, 0.017123993486166, 0.021014299243688583, 0.024904603138566017, 0.02879490703344345, 0.032685212790966034, 0.03657551854848862, 0.0404658243060112, 0.044356126338243484, 0.04824643209576607, 0.05213673785328865, 0.056027039885520935, 0.05991734564304352, 0.0638076514005661]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 9.0, 4.0, 2.0, 9.0, 7.0, 16.0, 12.0, 16.0, 19.0, 15.0, 26.0, 23.0, 32.0, 30.0, 35.0, 27.0, 39.0, 41.0, 33.0, 44.0, 38.0, 39.0, 31.0, 44.0, 38.0, 37.0, 41.0, 34.0, 20.0, 19.0, 32.0, 25.0, 23.0, 16.0, 27.0, 17.0, 18.0, 15.0, 12.0, 8.0, 6.0, 4.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036732017993927, -0.035495974123477936, -0.03425993025302887, -0.0330238901078701, -0.031787846237421036, -0.03055180236697197, -0.029315760359168053, -0.028079718351364136, -0.02684367448091507, -0.025607630610466003, -0.024371588602662086, -0.02313554659485817, -0.021899502724409103, -0.020663458853960037, -0.01942741684615612, -0.018191374838352203, -0.016955330967903137, -0.01571928709745407, -0.014483245089650154, -0.013247202150523663, -0.012011159211397171, -0.01077511627227068, -0.009539073333144188, -0.008303030394017696, -0.007066987454891205, -0.005830944515764713, -0.004594901576638222, -0.00335885863751173, -0.0021228156983852386, -0.0008867727592587471, 0.00034927017986774445, 0.001585313118994236, 0.0028213560581207275, 0.004057398997247219, 0.005293441936373711, 0.006529484875500202, 0.007765527814626694, 0.009001570753753185, 0.010237613692879677, 0.011473656632006168, 0.01270969957113266, 0.013945742510259151, 0.015181785449385643, 0.01641782745718956, 0.017653871327638626, 0.018889915198087692, 0.02012595720589161, 0.021361999213695526, 0.022598043084144592, 0.02383408695459366, 0.025070128962397575, 0.026306170970201492, 0.02754221484065056, 0.028778258711099625, 0.03001430071890354, 0.03125034272670746, 0.032486386597156525, 0.03372243046760559, 0.03495847433805466, 0.036194514483213425, 0.03743055835366249, 0.03866660222411156, 0.039902642369270325, 0.04113868623971939, 0.04237473011016846]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 4.0, 5.0, 6.0, 9.0, 4.0, 16.0, 14.0, 11.0, 11.0, 15.0, 11.0, 18.0, 20.0, 34.0, 31.0, 33.0, 27.0, 29.0, 47.0, 38.0, 40.0, 31.0, 49.0, 39.0, 41.0, 43.0, 36.0, 32.0, 37.0, 31.0, 28.0, 15.0, 33.0, 24.0, 21.0, 19.0, 18.0, 18.0, 12.0, 7.0, 10.0, 12.0, 4.0, 7.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.330078125, -3.222686767578125, -3.11529541015625, -3.007904052734375, -2.9005126953125, -2.793121337890625, -2.68572998046875, -2.578338623046875, -2.470947265625, -2.363555908203125, -2.25616455078125, -2.148773193359375, -2.0413818359375, -1.933990478515625, -1.82659912109375, -1.719207763671875, -1.61181640625, -1.504425048828125, -1.39703369140625, -1.289642333984375, -1.1822509765625, -1.074859619140625, -0.96746826171875, -0.860076904296875, -0.752685546875, -0.645294189453125, -0.53790283203125, -0.430511474609375, -0.3231201171875, -0.215728759765625, -0.10833740234375, -0.000946044921875, 0.1064453125, 0.213836669921875, 0.32122802734375, 0.428619384765625, 0.5360107421875, 0.643402099609375, 0.75079345703125, 0.858184814453125, 0.965576171875, 1.072967529296875, 1.18035888671875, 1.287750244140625, 1.3951416015625, 1.502532958984375, 1.60992431640625, 1.717315673828125, 1.82470703125, 1.932098388671875, 2.03948974609375, 2.146881103515625, 2.2542724609375, 2.361663818359375, 2.46905517578125, 2.576446533203125, 2.683837890625, 2.791229248046875, 2.89862060546875, 3.006011962890625, 3.1134033203125, 3.220794677734375, 3.32818603515625, 3.435577392578125, 3.54296875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 5.0, 13.0, 9.0, 11.0, 20.0, 33.0, 34.0, 71.0, 123.0, 200.0, 267.0, 457.0, 677.0, 1165.0, 2017.0, 3458.0, 6011.0, 11057.0, 21813.0, 45184.0, 100755.0, 252317.0, 349702.0, 135417.0, 58506.0, 27540.0, 14101.0, 7415.0, 4133.0, 2361.0, 1415.0, 850.0, 534.0, 312.0, 217.0, 108.0, 95.0, 58.0, 35.0, 25.0, 13.0, 11.0, 6.0, 8.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98046875, -2.8665771484375, -2.752685546875, -2.6387939453125, -2.52490234375, -2.4110107421875, -2.297119140625, -2.1832275390625, -2.0693359375, -1.9554443359375, -1.841552734375, -1.7276611328125, -1.61376953125, -1.4998779296875, -1.385986328125, -1.2720947265625, -1.158203125, -1.0443115234375, -0.930419921875, -0.8165283203125, -0.70263671875, -0.5887451171875, -0.474853515625, -0.3609619140625, -0.2470703125, -0.1331787109375, -0.019287109375, 0.0946044921875, 0.20849609375, 0.3223876953125, 0.436279296875, 0.5501708984375, 0.6640625, 0.7779541015625, 0.891845703125, 1.0057373046875, 1.11962890625, 1.2335205078125, 1.347412109375, 1.4613037109375, 1.5751953125, 1.6890869140625, 1.802978515625, 1.9168701171875, 2.03076171875, 2.1446533203125, 2.258544921875, 2.3724365234375, 2.486328125, 2.6002197265625, 2.714111328125, 2.8280029296875, 2.94189453125, 3.0557861328125, 3.169677734375, 3.2835693359375, 3.3974609375, 3.5113525390625, 3.625244140625, 3.7391357421875, 3.85302734375, 3.9669189453125, 4.080810546875, 4.1947021484375, 4.30859375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 2.0, 3.0, 7.0, 8.0, 6.0, 8.0, 13.0, 21.0, 11.0, 17.0, 24.0, 30.0, 22.0, 33.0, 37.0, 38.0, 36.0, 51.0, 45.0, 63.0, 110.0, 274.0, 1461.0, 191.0, 103.0, 55.0, 50.0, 32.0, 35.0, 43.0, 25.0, 23.0, 23.0, 28.0, 19.0, 17.0, 25.0, 13.0, 17.0, 7.0, 9.0, 2.0, 5.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.28125, -11.9129638671875, -11.544677734375, -11.1763916015625, -10.80810546875, -10.4398193359375, -10.071533203125, -9.7032470703125, -9.3349609375, -8.9666748046875, -8.598388671875, -8.2301025390625, -7.86181640625, -7.4935302734375, -7.125244140625, -6.7569580078125, -6.388671875, -6.0203857421875, -5.652099609375, -5.2838134765625, -4.91552734375, -4.5472412109375, -4.178955078125, -3.8106689453125, -3.4423828125, -3.0740966796875, -2.705810546875, -2.3375244140625, -1.96923828125, -1.6009521484375, -1.232666015625, -0.8643798828125, -0.49609375, -0.1278076171875, 0.240478515625, 0.6087646484375, 0.97705078125, 1.3453369140625, 1.713623046875, 2.0819091796875, 2.4501953125, 2.8184814453125, 3.186767578125, 3.5550537109375, 3.92333984375, 4.2916259765625, 4.659912109375, 5.0281982421875, 5.396484375, 5.7647705078125, 6.133056640625, 6.5013427734375, 6.86962890625, 7.2379150390625, 7.606201171875, 7.9744873046875, 8.3427734375, 8.7110595703125, 9.079345703125, 9.4476318359375, 9.81591796875, 10.1842041015625, 10.552490234375, 10.9207763671875, 11.2890625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 8.0, 8.0, 17.0, 23.0, 38.0, 67.0, 60.0, 114.0, 164.0, 340.0, 670.0, 4433.0, 2979933.0, 156866.0, 1784.0, 487.0, 254.0, 156.0, 99.0, 57.0, 50.0, 23.0, 20.0, 15.0, 5.0, 6.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.875, -43.4189453125, -41.962890625, -40.5068359375, -39.05078125, -37.5947265625, -36.138671875, -34.6826171875, -33.2265625, -31.7705078125, -30.314453125, -28.8583984375, -27.40234375, -25.9462890625, -24.490234375, -23.0341796875, -21.578125, -20.1220703125, -18.666015625, -17.2099609375, -15.75390625, -14.2978515625, -12.841796875, -11.3857421875, -9.9296875, -8.4736328125, -7.017578125, -5.5615234375, -4.10546875, -2.6494140625, -1.193359375, 0.2626953125, 1.71875, 3.1748046875, 4.630859375, 6.0869140625, 7.54296875, 8.9990234375, 10.455078125, 11.9111328125, 13.3671875, 14.8232421875, 16.279296875, 17.7353515625, 19.19140625, 20.6474609375, 22.103515625, 23.5595703125, 25.015625, 26.4716796875, 27.927734375, 29.3837890625, 30.83984375, 32.2958984375, 33.751953125, 35.2080078125, 36.6640625, 38.1201171875, 39.576171875, 41.0322265625, 42.48828125, 43.9443359375, 45.400390625, 46.8564453125, 48.3125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 141.0, 653.0, 213.0, 6.0, 0.0, 2.0, 1.0, 1.0], "bins": [-216.15609741210938, -212.39772033691406, -208.63934326171875, -204.88096618652344, -201.12258911132812, -197.36422729492188, -193.60585021972656, -189.84747314453125, -186.08909606933594, -182.33071899414062, -178.5723419189453, -174.81396484375, -171.05560302734375, -167.29722595214844, -163.53884887695312, -159.7804718017578, -156.0220947265625, -152.2637176513672, -148.50534057617188, -144.74696350097656, -140.98858642578125, -137.230224609375, -133.4718475341797, -129.71347045898438, -125.95509338378906, -122.19671630859375, -118.43833923339844, -114.67996978759766, -110.92159271240234, -107.16321563720703, -103.40484619140625, -99.64646911621094, -95.8880844116211, -92.12970733642578, -88.371337890625, -84.61296081542969, -80.85458374023438, -77.09620666503906, -73.33782958984375, -69.57946014404297, -65.82108306884766, -62.062705993652344, -58.3043327331543, -54.54595947265625, -50.78758239746094, -47.029205322265625, -43.27083206176758, -39.51245880126953, -35.75408172607422, -31.99570655822754, -28.23733139038086, -24.47895622253418, -20.7205810546875, -16.96220588684082, -13.20383071899414, -9.445455551147461, -5.687082290649414, -1.9287071228027344, 1.8296680450439453, 5.588043212890625, 9.346418380737305, 13.104793548583984, 16.863168716430664, 20.621543884277344, 24.379919052124023]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 3.0, 10.0, 11.0, 12.0, 7.0, 18.0, 13.0, 18.0, 29.0, 19.0, 35.0, 37.0, 33.0, 34.0, 54.0, 45.0, 37.0, 35.0, 46.0, 49.0, 38.0, 48.0, 46.0, 40.0, 39.0, 30.0, 35.0, 33.0, 30.0, 15.0, 24.0, 24.0, 11.0, 10.0, 5.0, 6.0, 7.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-46.052860260009766, -44.86296463012695, -43.673072814941406, -42.483177185058594, -41.29328155517578, -40.10338592529297, -38.91349411010742, -37.72359848022461, -36.53370666503906, -35.34381103515625, -34.1539192199707, -32.96402359008789, -31.774127960205078, -30.5842342376709, -29.39434051513672, -28.204444885253906, -27.014549255371094, -25.824655532836914, -24.6347599029541, -23.444866180419922, -22.25497055053711, -21.06507682800293, -19.87518310546875, -18.685287475585938, -17.495393753051758, -16.305500030517578, -15.115604400634766, -13.925710678100586, -12.73581600189209, -11.545921325683594, -10.356027603149414, -9.166132926940918, -7.9762420654296875, -6.786347389221191, -5.5964531898498535, -4.406558990478516, -3.2166643142700195, -2.0267696380615234, -0.8368754386901855, 0.35301876068115234, 1.5429134368896484, 2.7328078746795654, 3.9227023124694824, 5.11259651184082, 6.302491188049316, 7.4923858642578125, 8.682279586791992, 9.872174263000488, 11.062068939208984, 12.25196361541748, 13.441858291625977, 14.631752014160156, 15.821646690368652, 17.01154136657715, 18.201435089111328, 19.39133071899414, 20.58122444152832, 21.7711181640625, 22.961013793945312, 24.150907516479492, 25.340801239013672, 26.530696868896484, 27.720590591430664, 28.910484313964844, 30.100379943847656]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 5.0, 1.0, 7.0, 6.0, 2.0, 7.0, 8.0, 8.0, 5.0, 11.0, 14.0, 17.0, 11.0, 27.0, 12.0, 24.0, 29.0, 26.0, 29.0, 21.0, 45.0, 34.0, 39.0, 39.0, 47.0, 35.0, 40.0, 38.0, 35.0, 38.0, 38.0, 36.0, 22.0, 28.0, 28.0, 24.0, 28.0, 20.0, 27.0, 14.0, 17.0, 8.0, 12.0, 7.0, 8.0, 3.0, 10.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.373046875, -3.260955810546875, -3.14886474609375, -3.036773681640625, -2.9246826171875, -2.812591552734375, -2.70050048828125, -2.588409423828125, -2.476318359375, -2.364227294921875, -2.25213623046875, -2.140045166015625, -2.0279541015625, -1.915863037109375, -1.80377197265625, -1.691680908203125, -1.57958984375, -1.467498779296875, -1.35540771484375, -1.243316650390625, -1.1312255859375, -1.019134521484375, -0.90704345703125, -0.794952392578125, -0.682861328125, -0.570770263671875, -0.45867919921875, -0.346588134765625, -0.2344970703125, -0.122406005859375, -0.01031494140625, 0.101776123046875, 0.2138671875, 0.325958251953125, 0.43804931640625, 0.550140380859375, 0.6622314453125, 0.774322509765625, 0.88641357421875, 0.998504638671875, 1.110595703125, 1.222686767578125, 1.33477783203125, 1.446868896484375, 1.5589599609375, 1.671051025390625, 1.78314208984375, 1.895233154296875, 2.00732421875, 2.119415283203125, 2.23150634765625, 2.343597412109375, 2.4556884765625, 2.567779541015625, 2.67987060546875, 2.791961669921875, 2.904052734375, 3.016143798828125, 3.12823486328125, 3.240325927734375, 3.3524169921875, 3.464508056640625, 3.57659912109375, 3.688690185546875, 3.80078125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 6.0, 1.0, 2.0, 6.0, 4.0, 9.0, 8.0, 4.0, 7.0, 12.0, 11.0, 15.0, 11.0, 10.0, 23.0, 31.0, 38.0, 60.0, 73.0, 119.0, 254.0, 619.0, 1830.0, 6659.0, 32857.0, 224283.0, 1662160.0, 1930900.0, 282880.0, 39969.0, 7964.0, 2052.0, 683.0, 279.0, 123.0, 79.0, 59.0, 35.0, 26.0, 21.0, 26.0, 16.0, 6.0, 11.0, 7.0, 14.0, 8.0, 7.0, 3.0, 7.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.0546875, -8.75341796875, -8.4521484375, -8.15087890625, -7.849609375, -7.54833984375, -7.2470703125, -6.94580078125, -6.64453125, -6.34326171875, -6.0419921875, -5.74072265625, -5.439453125, -5.13818359375, -4.8369140625, -4.53564453125, -4.234375, -3.93310546875, -3.6318359375, -3.33056640625, -3.029296875, -2.72802734375, -2.4267578125, -2.12548828125, -1.82421875, -1.52294921875, -1.2216796875, -0.92041015625, -0.619140625, -0.31787109375, -0.0166015625, 0.28466796875, 0.5859375, 0.88720703125, 1.1884765625, 1.48974609375, 1.791015625, 2.09228515625, 2.3935546875, 2.69482421875, 2.99609375, 3.29736328125, 3.5986328125, 3.89990234375, 4.201171875, 4.50244140625, 4.8037109375, 5.10498046875, 5.40625, 5.70751953125, 6.0087890625, 6.31005859375, 6.611328125, 6.91259765625, 7.2138671875, 7.51513671875, 7.81640625, 8.11767578125, 8.4189453125, 8.72021484375, 9.021484375, 9.32275390625, 9.6240234375, 9.92529296875, 10.2265625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 10.0, 11.0, 14.0, 5.0, 16.0, 29.0, 36.0, 39.0, 47.0, 50.0, 84.0, 102.0, 111.0, 137.0, 180.0, 236.0, 269.0, 309.0, 310.0, 341.0, 329.0, 289.0, 235.0, 175.0, 139.0, 112.0, 93.0, 73.0, 56.0, 43.0, 42.0, 24.0, 27.0, 28.0, 12.0, 15.0, 12.0, 9.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.359375, -6.14764404296875, -5.9359130859375, -5.72418212890625, -5.512451171875, -5.30072021484375, -5.0889892578125, -4.87725830078125, -4.66552734375, -4.45379638671875, -4.2420654296875, -4.03033447265625, -3.818603515625, -3.60687255859375, -3.3951416015625, -3.18341064453125, -2.9716796875, -2.75994873046875, -2.5482177734375, -2.33648681640625, -2.124755859375, -1.91302490234375, -1.7012939453125, -1.48956298828125, -1.27783203125, -1.06610107421875, -0.8543701171875, -0.64263916015625, -0.430908203125, -0.21917724609375, -0.0074462890625, 0.20428466796875, 0.416015625, 0.62774658203125, 0.8394775390625, 1.05120849609375, 1.262939453125, 1.47467041015625, 1.6864013671875, 1.89813232421875, 2.10986328125, 2.32159423828125, 2.5333251953125, 2.74505615234375, 2.956787109375, 3.16851806640625, 3.3802490234375, 3.59197998046875, 3.8037109375, 4.01544189453125, 4.2271728515625, 4.43890380859375, 4.650634765625, 4.86236572265625, 5.0740966796875, 5.28582763671875, 5.49755859375, 5.70928955078125, 5.9210205078125, 6.13275146484375, 6.344482421875, 6.55621337890625, 6.7679443359375, 6.97967529296875, 7.19140625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 5.0, 6.0, 14.0, 22.0, 22.0, 24.0, 31.0, 37.0, 39.0, 61.0, 60.0, 100.0, 97.0, 135.0, 163.0, 235.0, 332.0, 680.0, 3216.0, 42064.0, 1114182.0, 2894901.0, 127881.0, 7311.0, 1067.0, 398.0, 223.0, 188.0, 158.0, 137.0, 102.0, 77.0, 73.0, 44.0, 37.0, 37.0, 22.0, 21.0, 20.0, 16.0, 11.0, 8.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.375, -20.689453125, -20.00390625, -19.318359375, -18.6328125, -17.947265625, -17.26171875, -16.576171875, -15.890625, -15.205078125, -14.51953125, -13.833984375, -13.1484375, -12.462890625, -11.77734375, -11.091796875, -10.40625, -9.720703125, -9.03515625, -8.349609375, -7.6640625, -6.978515625, -6.29296875, -5.607421875, -4.921875, -4.236328125, -3.55078125, -2.865234375, -2.1796875, -1.494140625, -0.80859375, -0.123046875, 0.5625, 1.248046875, 1.93359375, 2.619140625, 3.3046875, 3.990234375, 4.67578125, 5.361328125, 6.046875, 6.732421875, 7.41796875, 8.103515625, 8.7890625, 9.474609375, 10.16015625, 10.845703125, 11.53125, 12.216796875, 12.90234375, 13.587890625, 14.2734375, 14.958984375, 15.64453125, 16.330078125, 17.015625, 17.701171875, 18.38671875, 19.072265625, 19.7578125, 20.443359375, 21.12890625, 21.814453125, 22.5]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 77.0, 255.0, 360.0, 237.0, 65.0, 15.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.81350708007812, -165.16014099121094, -160.50677490234375, -155.8533935546875, -151.2000274658203, -146.54666137695312, -141.89329528808594, -137.23992919921875, -132.5865478515625, -127.93318176269531, -123.2798080444336, -118.6264419555664, -113.97306823730469, -109.3197021484375, -104.66633605957031, -100.01296997070312, -95.35960388183594, -90.70623779296875, -86.05286407470703, -81.39949798583984, -76.74612426757812, -72.09275817871094, -67.43939208984375, -62.7860221862793, -58.132652282714844, -53.47928237915039, -48.82591247558594, -44.17254638671875, -39.5191764831543, -34.865806579589844, -30.212438583374023, -25.559070587158203, -20.905715942382812, -16.25234603881836, -11.598978042602539, -6.945609092712402, -2.2922401428222656, 2.3611297607421875, 7.014497756958008, 11.667865753173828, 16.32123565673828, 20.974605560302734, 25.627973556518555, 30.281341552734375, 34.93471145629883, 39.58808135986328, 44.24144744873047, 48.89481735229492, 53.548187255859375, 58.20155715942383, 62.85492706298828, 67.50829315185547, 72.16166687011719, 76.81503295898438, 81.46839904785156, 86.12176513671875, 90.77513885498047, 95.42850494384766, 100.08187866210938, 104.73524475097656, 109.38861083984375, 114.04198455810547, 118.69535064697266, 123.34872436523438, 128.00209045410156]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 4.0, 3.0, 3.0, 9.0, 12.0, 9.0, 8.0, 15.0, 18.0, 14.0, 15.0, 16.0, 32.0, 20.0, 20.0, 19.0, 33.0, 29.0, 35.0, 38.0, 32.0, 42.0, 37.0, 32.0, 35.0, 52.0, 37.0, 23.0, 34.0, 35.0, 39.0, 23.0, 26.0, 20.0, 17.0, 24.0, 20.0, 22.0, 11.0, 11.0, 10.0, 20.0, 9.0, 6.0, 9.0, 5.0, 2.0, 5.0, 1.0, 8.0, 1.0, 4.0, 0.0, 2.0], "bins": [-26.075408935546875, -25.31734275817871, -24.559276580810547, -23.801212310791016, -23.04314613342285, -22.285079956054688, -21.527015686035156, -20.768949508666992, -20.010883331298828, -19.252817153930664, -18.4947509765625, -17.73668670654297, -16.978620529174805, -16.22055435180664, -15.462489128112793, -14.704423904418945, -13.946357727050781, -13.188291549682617, -12.43022632598877, -11.672161102294922, -10.914094924926758, -10.156028747558594, -9.397963523864746, -8.639898300170898, -7.881832122802734, -7.1237664222717285, -6.365700721740723, -5.607635021209717, -4.849569320678711, -4.091503620147705, -3.333437919616699, -2.5753722190856934, -1.8173065185546875, -1.0592408180236816, -0.3011751174926758, 0.4568905830383301, 1.214956283569336, 1.9730219841003418, 2.7310876846313477, 3.4891533851623535, 4.247219085693359, 5.005284786224365, 5.763350486755371, 6.521416187286377, 7.279481887817383, 8.037548065185547, 8.795613288879395, 9.553678512573242, 10.311744689941406, 11.06981086730957, 11.827876091003418, 12.585941314697266, 13.34400749206543, 14.102073669433594, 14.860138893127441, 15.618204116821289, 16.376270294189453, 17.134336471557617, 17.89240264892578, 18.650466918945312, 19.408533096313477, 20.16659927368164, 20.924663543701172, 21.682729721069336, 22.4407958984375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 9.0, 8.0, 6.0, 7.0, 17.0, 10.0, 20.0, 17.0, 19.0, 15.0, 29.0, 27.0, 32.0, 31.0, 28.0, 37.0, 34.0, 46.0, 31.0, 36.0, 46.0, 48.0, 41.0, 41.0, 28.0, 43.0, 27.0, 31.0, 24.0, 20.0, 19.0, 24.0, 19.0, 19.0, 15.0, 19.0, 15.0, 14.0, 14.0, 7.0, 4.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.466796875, -3.35345458984375, -3.2401123046875, -3.12677001953125, -3.013427734375, -2.90008544921875, -2.7867431640625, -2.67340087890625, -2.56005859375, -2.44671630859375, -2.3333740234375, -2.22003173828125, -2.106689453125, -1.99334716796875, -1.8800048828125, -1.76666259765625, -1.6533203125, -1.53997802734375, -1.4266357421875, -1.31329345703125, -1.199951171875, -1.08660888671875, -0.9732666015625, -0.85992431640625, -0.74658203125, -0.63323974609375, -0.5198974609375, -0.40655517578125, -0.293212890625, -0.17987060546875, -0.0665283203125, 0.04681396484375, 0.16015625, 0.27349853515625, 0.3868408203125, 0.50018310546875, 0.613525390625, 0.72686767578125, 0.8402099609375, 0.95355224609375, 1.06689453125, 1.18023681640625, 1.2935791015625, 1.40692138671875, 1.520263671875, 1.63360595703125, 1.7469482421875, 1.86029052734375, 1.9736328125, 2.08697509765625, 2.2003173828125, 2.31365966796875, 2.427001953125, 2.54034423828125, 2.6536865234375, 2.76702880859375, 2.88037109375, 2.99371337890625, 3.1070556640625, 3.22039794921875, 3.333740234375, 3.44708251953125, 3.5604248046875, 3.67376708984375, 3.787109375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 4.0, 11.0, 5.0, 14.0, 18.0, 31.0, 34.0, 54.0, 80.0, 122.0, 163.0, 283.0, 460.0, 706.0, 1277.0, 2322.0, 5041.0, 10868.0, 24500.0, 57468.0, 135251.0, 273650.0, 283057.0, 143163.0, 61255.0, 26026.0, 11474.0, 5184.0, 2648.0, 1337.0, 756.0, 434.0, 294.0, 169.0, 111.0, 85.0, 59.0, 37.0, 32.0, 21.0, 15.0, 14.0, 9.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.9892578125, -0.9625473022460938, -0.9358367919921875, -0.9091262817382812, -0.882415771484375, -0.8557052612304688, -0.8289947509765625, -0.8022842407226562, -0.77557373046875, -0.7488632202148438, -0.7221527099609375, -0.6954421997070312, -0.668731689453125, -0.6420211791992188, -0.6153106689453125, -0.5886001586914062, -0.5618896484375, -0.5351791381835938, -0.5084686279296875, -0.48175811767578125, -0.455047607421875, -0.42833709716796875, -0.4016265869140625, -0.37491607666015625, -0.34820556640625, -0.32149505615234375, -0.2947845458984375, -0.26807403564453125, -0.241363525390625, -0.21465301513671875, -0.1879425048828125, -0.16123199462890625, -0.134521484375, -0.10781097412109375, -0.0811004638671875, -0.05438995361328125, -0.027679443359375, -0.00096893310546875, 0.0257415771484375, 0.05245208740234375, 0.07916259765625, 0.10587310791015625, 0.1325836181640625, 0.15929412841796875, 0.186004638671875, 0.21271514892578125, 0.2394256591796875, 0.26613616943359375, 0.2928466796875, 0.31955718994140625, 0.3462677001953125, 0.37297821044921875, 0.399688720703125, 0.42639923095703125, 0.4531097412109375, 0.47982025146484375, 0.50653076171875, 0.5332412719726562, 0.5599517822265625, 0.5866622924804688, 0.613372802734375, 0.6400833129882812, 0.6667938232421875, 0.6935043334960938, 0.72021484375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 5.0, 6.0, 8.0, 7.0, 6.0, 7.0, 13.0, 17.0, 15.0, 19.0, 21.0, 21.0, 29.0, 40.0, 35.0, 32.0, 29.0, 40.0, 39.0, 35.0, 48.0, 1064.0, 39.0, 37.0, 32.0, 38.0, 41.0, 27.0, 34.0, 32.0, 30.0, 26.0, 27.0, 15.0, 17.0, 14.0, 14.0, 9.0, 8.0, 4.0, 8.0, 8.0, 7.0, 1.0, 8.0, 1.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.162109375, -2.089019775390625, -2.01593017578125, -1.942840576171875, -1.8697509765625, -1.796661376953125, -1.72357177734375, -1.650482177734375, -1.577392578125, -1.504302978515625, -1.43121337890625, -1.358123779296875, -1.2850341796875, -1.211944580078125, -1.13885498046875, -1.065765380859375, -0.99267578125, -0.919586181640625, -0.84649658203125, -0.773406982421875, -0.7003173828125, -0.627227783203125, -0.55413818359375, -0.481048583984375, -0.407958984375, -0.334869384765625, -0.26177978515625, -0.188690185546875, -0.1156005859375, -0.042510986328125, 0.03057861328125, 0.103668212890625, 0.1767578125, 0.249847412109375, 0.32293701171875, 0.396026611328125, 0.4691162109375, 0.542205810546875, 0.61529541015625, 0.688385009765625, 0.761474609375, 0.834564208984375, 0.90765380859375, 0.980743408203125, 1.0538330078125, 1.126922607421875, 1.20001220703125, 1.273101806640625, 1.34619140625, 1.419281005859375, 1.49237060546875, 1.565460205078125, 1.6385498046875, 1.711639404296875, 1.78472900390625, 1.857818603515625, 1.930908203125, 2.003997802734375, 2.07708740234375, 2.150177001953125, 2.2232666015625, 2.296356201171875, 2.36944580078125, 2.442535400390625, 2.515625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 7.0, 6.0, 8.0, 15.0, 15.0, 22.0, 30.0, 44.0, 72.0, 91.0, 127.0, 231.0, 356.0, 612.0, 894.0, 1457.0, 2533.0, 4399.0, 7458.0, 13545.0, 24874.0, 45570.0, 81275.0, 138725.0, 556797.0, 886278.0, 142711.0, 83801.0, 46684.0, 25442.0, 14100.0, 7727.0, 4527.0, 2575.0, 1500.0, 929.0, 598.0, 371.0, 236.0, 165.0, 92.0, 64.0, 43.0, 34.0, 21.0, 20.0, 21.0, 9.0, 6.0, 5.0, 1.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.339599609375, -0.3289947509765625, -0.318389892578125, -0.3077850341796875, -0.29718017578125, -0.2865753173828125, -0.275970458984375, -0.2653656005859375, -0.2547607421875, -0.2441558837890625, -0.233551025390625, -0.2229461669921875, -0.21234130859375, -0.2017364501953125, -0.191131591796875, -0.1805267333984375, -0.169921875, -0.1593170166015625, -0.148712158203125, -0.1381072998046875, -0.12750244140625, -0.1168975830078125, -0.106292724609375, -0.0956878662109375, -0.0850830078125, -0.0744781494140625, -0.063873291015625, -0.0532684326171875, -0.04266357421875, -0.0320587158203125, -0.021453857421875, -0.0108489990234375, -0.000244140625, 0.0103607177734375, 0.020965576171875, 0.0315704345703125, 0.04217529296875, 0.0527801513671875, 0.063385009765625, 0.0739898681640625, 0.0845947265625, 0.0951995849609375, 0.105804443359375, 0.1164093017578125, 0.12701416015625, 0.1376190185546875, 0.148223876953125, 0.1588287353515625, 0.16943359375, 0.1800384521484375, 0.190643310546875, 0.2012481689453125, 0.21185302734375, 0.2224578857421875, 0.233062744140625, 0.2436676025390625, 0.2542724609375, 0.2648773193359375, 0.275482177734375, 0.2860870361328125, 0.29669189453125, 0.3072967529296875, 0.317901611328125, 0.3285064697265625, 0.339111328125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 5.0, 3.0, 5.0, 6.0, 7.0, 11.0, 10.0, 21.0, 26.0, 62.0, 88.0, 104.0, 209.0, 130.0, 84.0, 71.0, 37.0, 29.0, 28.0, 12.0, 6.0, 10.0, 5.0, 2.0, 4.0, 10.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0782470703125, -0.07611370086669922, -0.07398033142089844, -0.07184696197509766, -0.06971359252929688, -0.0675802230834961, -0.06544685363769531, -0.06331348419189453, -0.06118011474609375, -0.05904674530029297, -0.05691337585449219, -0.054780006408691406, -0.052646636962890625, -0.050513267517089844, -0.04837989807128906, -0.04624652862548828, -0.0441131591796875, -0.04197978973388672, -0.03984642028808594, -0.037713050842285156, -0.035579681396484375, -0.033446311950683594, -0.03131294250488281, -0.02917957305908203, -0.02704620361328125, -0.02491283416748047, -0.022779464721679688, -0.020646095275878906, -0.018512725830078125, -0.016379356384277344, -0.014245986938476562, -0.012112617492675781, -0.009979248046875, -0.007845878601074219, -0.0057125091552734375, -0.0035791397094726562, -0.001445770263671875, 0.0006875991821289062, 0.0028209686279296875, 0.004954338073730469, 0.00708770751953125, 0.009221076965332031, 0.011354446411132812, 0.013487815856933594, 0.015621185302734375, 0.017754554748535156, 0.019887924194335938, 0.02202129364013672, 0.0241546630859375, 0.02628803253173828, 0.028421401977539062, 0.030554771423339844, 0.032688140869140625, 0.034821510314941406, 0.03695487976074219, 0.03908824920654297, 0.04122161865234375, 0.04335498809814453, 0.04548835754394531, 0.047621726989746094, 0.049755096435546875, 0.051888465881347656, 0.05402183532714844, 0.05615520477294922, 0.05828857421875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 6.0, 6.0, 7.0, 3.0, 3.0, 10.0, 11.0, 10.0, 29.0, 42.0, 45.0, 112.0, 265.0, 1707.0, 917225.0, 127613.0, 1021.0, 209.0, 93.0, 43.0, 24.0, 20.0, 14.0, 9.0, 5.0, 5.0, 6.0, 1.0, 5.0, 1.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3037109375, -1.25701904296875, -1.2103271484375, -1.16363525390625, -1.116943359375, -1.07025146484375, -1.0235595703125, -0.97686767578125, -0.93017578125, -0.88348388671875, -0.8367919921875, -0.79010009765625, -0.743408203125, -0.69671630859375, -0.6500244140625, -0.60333251953125, -0.556640625, -0.50994873046875, -0.4632568359375, -0.41656494140625, -0.369873046875, -0.32318115234375, -0.2764892578125, -0.22979736328125, -0.18310546875, -0.13641357421875, -0.0897216796875, -0.04302978515625, 0.003662109375, 0.05035400390625, 0.0970458984375, 0.14373779296875, 0.1904296875, 0.23712158203125, 0.2838134765625, 0.33050537109375, 0.377197265625, 0.42388916015625, 0.4705810546875, 0.51727294921875, 0.56396484375, 0.61065673828125, 0.6573486328125, 0.70404052734375, 0.750732421875, 0.79742431640625, 0.8441162109375, 0.89080810546875, 0.9375, 0.98419189453125, 1.0308837890625, 1.07757568359375, 1.124267578125, 1.17095947265625, 1.2176513671875, 1.26434326171875, 1.31103515625, 1.35772705078125, 1.4044189453125, 1.45111083984375, 1.497802734375, 1.54449462890625, 1.5911865234375, 1.63787841796875, 1.6845703125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 11.0, 26.0, 81.0, 199.0, 540.0, 113.0, 30.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2866206765174866, -0.27487069368362427, -0.2631206810474396, -0.25137069821357727, -0.23962070047855377, -0.22787070274353027, -0.21612071990966797, -0.20437072217464447, -0.19262072443962097, -0.18087072670459747, -0.16912074387073517, -0.15737074613571167, -0.14562074840068817, -0.13387075066566467, -0.12212076783180237, -0.11037077009677887, -0.09862078726291656, -0.08687079697847366, -0.07512079924345016, -0.06337080895900726, -0.05162081494927406, -0.03987082093954086, -0.02812083065509796, -0.016370832920074463, -0.004620842635631561, 0.007129150442779064, 0.01887914352118969, 0.03062913566827774, 0.04237912967801094, 0.05412912368774414, 0.06587911397218704, 0.07762911170721054, 0.08937910199165344, 0.10112909227609634, 0.11287909001111984, 0.12462908029556274, 0.13637907803058624, 0.14812907576560974, 0.15987905859947205, 0.17162905633449554, 0.18337905406951904, 0.19512905180454254, 0.20687903463840485, 0.21862903237342834, 0.23037903010845184, 0.24212902784347534, 0.25387901067733765, 0.26562899351119995, 0.27737897634506226, 0.28912895917892456, 0.30087897181510925, 0.31262895464897156, 0.32437893748283386, 0.33612895011901855, 0.34787893295288086, 0.35962891578674316, 0.37137892842292786, 0.38312891125679016, 0.39487892389297485, 0.40662890672683716, 0.41837888956069946, 0.43012890219688416, 0.44187888503074646, 0.45362889766693115, 0.46537888050079346]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 11.0, 5.0, 6.0, 15.0, 12.0, 11.0, 16.0, 14.0, 25.0, 26.0, 29.0, 35.0, 26.0, 30.0, 29.0, 38.0, 32.0, 41.0, 44.0, 35.0, 34.0, 46.0, 36.0, 36.0, 36.0, 39.0, 23.0, 35.0, 23.0, 30.0, 24.0, 24.0, 22.0, 17.0, 22.0, 14.0, 15.0, 7.0, 8.0, 10.0, 6.0, 1.0, 5.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.07481110095977783, -0.07235562801361084, -0.06990016251802444, -0.06744469702243805, -0.06498922407627106, -0.06253375113010406, -0.06007828563451767, -0.057622816413640976, -0.05516734719276428, -0.05271187797188759, -0.050256408751010895, -0.0478009395301342, -0.04534547030925751, -0.042890001088380814, -0.04043453186750412, -0.037979062646627426, -0.03552359342575073, -0.03306812420487404, -0.030612654983997345, -0.02815718576312065, -0.025701716542243958, -0.023246247321367264, -0.02079077810049057, -0.018335308879613876, -0.015879839658737183, -0.013424370437860489, -0.010968901216983795, -0.008513431996107101, -0.006057962775230408, -0.003602493554353714, -0.0011470243334770203, 0.0013084448873996735, 0.003763914108276367, 0.006219383329153061, 0.008674852550029755, 0.011130321770906448, 0.013585790991783142, 0.016041260212659836, 0.01849672943353653, 0.020952198654413223, 0.023407667875289917, 0.02586313709616661, 0.028318606317043304, 0.030774075537919998, 0.03322954475879669, 0.035685013979673386, 0.03814048320055008, 0.04059595242142677, 0.04305142164230347, 0.04550689086318016, 0.047962360084056854, 0.05041782930493355, 0.05287329852581024, 0.055328767746686935, 0.05778423696756363, 0.06023970618844032, 0.06269517540931702, 0.06515064835548401, 0.0676061138510704, 0.0700615793466568, 0.07251705229282379, 0.07497252523899078, 0.07742799073457718, 0.07988345623016357, 0.08233892917633057]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 9.0, 7.0, 7.0, 7.0, 16.0, 11.0, 19.0, 18.0, 18.0, 16.0, 27.0, 29.0, 33.0, 30.0, 26.0, 39.0, 32.0, 45.0, 33.0, 34.0, 47.0, 50.0, 40.0, 41.0, 29.0, 43.0, 26.0, 32.0, 24.0, 20.0, 19.0, 23.0, 19.0, 20.0, 15.0, 19.0, 15.0, 13.0, 15.0, 7.0, 4.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.46875, -3.35540771484375, -3.2420654296875, -3.12872314453125, -3.015380859375, -2.90203857421875, -2.7886962890625, -2.67535400390625, -2.56201171875, -2.44866943359375, -2.3353271484375, -2.22198486328125, -2.108642578125, -1.99530029296875, -1.8819580078125, -1.76861572265625, -1.6552734375, -1.54193115234375, -1.4285888671875, -1.31524658203125, -1.201904296875, -1.08856201171875, -0.9752197265625, -0.86187744140625, -0.74853515625, -0.63519287109375, -0.5218505859375, -0.40850830078125, -0.295166015625, -0.18182373046875, -0.0684814453125, 0.04486083984375, 0.158203125, 0.27154541015625, 0.3848876953125, 0.49822998046875, 0.611572265625, 0.72491455078125, 0.8382568359375, 0.95159912109375, 1.06494140625, 1.17828369140625, 1.2916259765625, 1.40496826171875, 1.518310546875, 1.63165283203125, 1.7449951171875, 1.85833740234375, 1.9716796875, 2.08502197265625, 2.1983642578125, 2.31170654296875, 2.425048828125, 2.53839111328125, 2.6517333984375, 2.76507568359375, 2.87841796875, 2.99176025390625, 3.1051025390625, 3.21844482421875, 3.331787109375, 3.44512939453125, 3.5584716796875, 3.67181396484375, 3.78515625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 10.0, 19.0, 23.0, 38.0, 55.0, 97.0, 145.0, 240.0, 478.0, 763.0, 1253.0, 2007.0, 3681.0, 6613.0, 12153.0, 24083.0, 55508.0, 158083.0, 410607.0, 229194.0, 78130.0, 31273.0, 15371.0, 8054.0, 4532.0, 2497.0, 1511.0, 878.0, 476.0, 286.0, 182.0, 116.0, 73.0, 43.0, 38.0, 26.0, 9.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4453125, -3.32080078125, -3.1962890625, -3.07177734375, -2.947265625, -2.82275390625, -2.6982421875, -2.57373046875, -2.44921875, -2.32470703125, -2.2001953125, -2.07568359375, -1.951171875, -1.82666015625, -1.7021484375, -1.57763671875, -1.453125, -1.32861328125, -1.2041015625, -1.07958984375, -0.955078125, -0.83056640625, -0.7060546875, -0.58154296875, -0.45703125, -0.33251953125, -0.2080078125, -0.08349609375, 0.041015625, 0.16552734375, 0.2900390625, 0.41455078125, 0.5390625, 0.66357421875, 0.7880859375, 0.91259765625, 1.037109375, 1.16162109375, 1.2861328125, 1.41064453125, 1.53515625, 1.65966796875, 1.7841796875, 1.90869140625, 2.033203125, 2.15771484375, 2.2822265625, 2.40673828125, 2.53125, 2.65576171875, 2.7802734375, 2.90478515625, 3.029296875, 3.15380859375, 3.2783203125, 3.40283203125, 3.52734375, 3.65185546875, 3.7763671875, 3.90087890625, 4.025390625, 4.14990234375, 4.2744140625, 4.39892578125, 4.5234375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 8.0, 5.0, 5.0, 5.0, 7.0, 13.0, 13.0, 18.0, 13.0, 22.0, 18.0, 22.0, 27.0, 34.0, 36.0, 34.0, 50.0, 35.0, 74.0, 164.0, 1467.0, 355.0, 155.0, 98.0, 50.0, 42.0, 29.0, 49.0, 35.0, 22.0, 16.0, 23.0, 19.0, 15.0, 19.0, 15.0, 6.0, 6.0, 14.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.90625, -13.4844970703125, -13.062744140625, -12.6409912109375, -12.21923828125, -11.7974853515625, -11.375732421875, -10.9539794921875, -10.5322265625, -10.1104736328125, -9.688720703125, -9.2669677734375, -8.84521484375, -8.4234619140625, -8.001708984375, -7.5799560546875, -7.158203125, -6.7364501953125, -6.314697265625, -5.8929443359375, -5.47119140625, -5.0494384765625, -4.627685546875, -4.2059326171875, -3.7841796875, -3.3624267578125, -2.940673828125, -2.5189208984375, -2.09716796875, -1.6754150390625, -1.253662109375, -0.8319091796875, -0.41015625, 0.0115966796875, 0.433349609375, 0.8551025390625, 1.27685546875, 1.6986083984375, 2.120361328125, 2.5421142578125, 2.9638671875, 3.3856201171875, 3.807373046875, 4.2291259765625, 4.65087890625, 5.0726318359375, 5.494384765625, 5.9161376953125, 6.337890625, 6.7596435546875, 7.181396484375, 7.6031494140625, 8.02490234375, 8.4466552734375, 8.868408203125, 9.2901611328125, 9.7119140625, 10.1336669921875, 10.555419921875, 10.9771728515625, 11.39892578125, 11.8206787109375, 12.242431640625, 12.6641845703125, 13.0859375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 7.0, 9.0, 9.0, 17.0, 36.0, 31.0, 63.0, 89.0, 136.0, 201.0, 301.0, 547.0, 3207.0, 2755444.0, 382385.0, 1909.0, 482.0, 270.0, 188.0, 115.0, 89.0, 65.0, 44.0, 12.0, 18.0, 14.0, 9.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.5, -44.99560546875, -43.4912109375, -41.98681640625, -40.482421875, -38.97802734375, -37.4736328125, -35.96923828125, -34.46484375, -32.96044921875, -31.4560546875, -29.95166015625, -28.447265625, -26.94287109375, -25.4384765625, -23.93408203125, -22.4296875, -20.92529296875, -19.4208984375, -17.91650390625, -16.412109375, -14.90771484375, -13.4033203125, -11.89892578125, -10.39453125, -8.89013671875, -7.3857421875, -5.88134765625, -4.376953125, -2.87255859375, -1.3681640625, 0.13623046875, 1.640625, 3.14501953125, 4.6494140625, 6.15380859375, 7.658203125, 9.16259765625, 10.6669921875, 12.17138671875, 13.67578125, 15.18017578125, 16.6845703125, 18.18896484375, 19.693359375, 21.19775390625, 22.7021484375, 24.20654296875, 25.7109375, 27.21533203125, 28.7197265625, 30.22412109375, 31.728515625, 33.23291015625, 34.7373046875, 36.24169921875, 37.74609375, 39.25048828125, 40.7548828125, 42.25927734375, 43.763671875, 45.26806640625, 46.7724609375, 48.27685546875, 49.78125]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 12.0, 124.0, 528.0, 307.0, 45.0, 2.0, 1.0, 1.0], "bins": [-172.621826171875, -169.68186950683594, -166.74192810058594, -163.80197143554688, -160.86203002929688, -157.9220733642578, -154.9821319580078, -152.04217529296875, -149.10223388671875, -146.1622772216797, -143.2223358154297, -140.28237915039062, -137.34243774414062, -134.40248107910156, -131.46253967285156, -128.5225830078125, -125.5826416015625, -122.64269256591797, -119.70274353027344, -116.7627944946289, -113.82284545898438, -110.88289642333984, -107.94294738769531, -105.00299835205078, -102.06304168701172, -99.12309265136719, -96.18314361572266, -93.24319458007812, -90.3032455444336, -87.36329650878906, -84.42334747314453, -81.4833984375, -78.54344940185547, -75.60350036621094, -72.6635513305664, -69.72360229492188, -66.78365325927734, -63.84370422363281, -60.90375518798828, -57.96380615234375, -55.02385711669922, -52.08390808105469, -49.143959045410156, -46.204010009765625, -43.264060974121094, -40.32411193847656, -37.38416290283203, -34.4442138671875, -31.50426483154297, -28.564315795898438, -25.624366760253906, -22.684417724609375, -19.744468688964844, -16.804519653320312, -13.864568710327148, -10.924619674682617, -7.9846696853637695, -5.044720649719238, -2.104771137237549, 0.8351783752441406, 3.775127410888672, 6.715076446533203, 9.65502643585205, 12.594975471496582, 15.534924507141113]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 7.0, 3.0, 3.0, 8.0, 12.0, 13.0, 14.0, 12.0, 13.0, 14.0, 14.0, 19.0, 19.0, 21.0, 32.0, 34.0, 30.0, 39.0, 29.0, 34.0, 35.0, 29.0, 37.0, 40.0, 36.0, 32.0, 39.0, 27.0, 37.0, 33.0, 31.0, 29.0, 27.0, 18.0, 27.0, 26.0, 17.0, 13.0, 17.0, 13.0, 14.0, 13.0, 5.0, 4.0, 7.0, 5.0, 6.0, 5.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.529407501220703, -30.55421257019043, -29.579015731811523, -28.60382080078125, -27.628623962402344, -26.65342903137207, -25.678234100341797, -24.70303726196289, -23.727842330932617, -22.752647399902344, -21.777450561523438, -20.802255630493164, -19.82706069946289, -18.851863861083984, -17.87666893005371, -16.901473999023438, -15.926277160644531, -14.951081275939941, -13.975885391235352, -13.000690460205078, -12.025494575500488, -11.050298690795898, -10.075103759765625, -9.099907875061035, -8.124711990356445, -7.1495161056518555, -6.174320697784424, -5.199125289916992, -4.223929405212402, -3.2487335205078125, -2.273538112640381, -1.2983427047729492, -0.3231468200683594, 0.6520488262176514, 1.627244472503662, 2.602440118789673, 3.5776357650756836, 4.552831649780273, 5.528027057647705, 6.503222465515137, 7.478418350219727, 8.453614234924316, 9.428810119628906, 10.40400505065918, 11.37920093536377, 12.35439682006836, 13.329591751098633, 14.304787635803223, 15.279983520507812, 16.255178451538086, 17.230375289916992, 18.205570220947266, 19.180767059326172, 20.155961990356445, 21.13115692138672, 22.106353759765625, 23.0815486907959, 24.056743621826172, 25.031940460205078, 26.00713539123535, 26.982330322265625, 27.95752716064453, 28.932722091674805, 29.907917022705078, 30.883113861083984]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 6.0, 4.0, 5.0, 3.0, 9.0, 8.0, 10.0, 5.0, 17.0, 14.0, 17.0, 18.0, 19.0, 13.0, 31.0, 29.0, 28.0, 34.0, 31.0, 39.0, 28.0, 48.0, 34.0, 48.0, 38.0, 31.0, 46.0, 43.0, 38.0, 36.0, 31.0, 28.0, 27.0, 16.0, 21.0, 20.0, 14.0, 13.0, 18.0, 19.0, 14.0, 10.0, 14.0, 10.0, 9.0, 3.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.7109375, -3.592010498046875, -3.47308349609375, -3.354156494140625, -3.2352294921875, -3.116302490234375, -2.99737548828125, -2.878448486328125, -2.759521484375, -2.640594482421875, -2.52166748046875, -2.402740478515625, -2.2838134765625, -2.164886474609375, -2.04595947265625, -1.927032470703125, -1.80810546875, -1.689178466796875, -1.57025146484375, -1.451324462890625, -1.3323974609375, -1.213470458984375, -1.09454345703125, -0.975616455078125, -0.856689453125, -0.737762451171875, -0.61883544921875, -0.499908447265625, -0.3809814453125, -0.262054443359375, -0.14312744140625, -0.024200439453125, 0.0947265625, 0.213653564453125, 0.33258056640625, 0.451507568359375, 0.5704345703125, 0.689361572265625, 0.80828857421875, 0.927215576171875, 1.046142578125, 1.165069580078125, 1.28399658203125, 1.402923583984375, 1.5218505859375, 1.640777587890625, 1.75970458984375, 1.878631591796875, 1.99755859375, 2.116485595703125, 2.23541259765625, 2.354339599609375, 2.4732666015625, 2.592193603515625, 2.71112060546875, 2.830047607421875, 2.948974609375, 3.067901611328125, 3.18682861328125, 3.305755615234375, 3.4246826171875, 3.543609619140625, 3.66253662109375, 3.781463623046875, 3.900390625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 5.0, 5.0, 10.0, 7.0, 12.0, 25.0, 20.0, 15.0, 34.0, 32.0, 59.0, 116.0, 196.0, 321.0, 779.0, 1936.0, 5719.0, 22305.0, 103629.0, 609558.0, 2062069.0, 1134273.0, 199463.0, 38937.0, 9591.0, 2940.0, 1095.0, 455.0, 214.0, 150.0, 93.0, 43.0, 37.0, 29.0, 27.0, 13.0, 14.0, 12.0, 13.0, 7.0, 6.0, 2.0, 6.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.8359375, -7.58868408203125, -7.3414306640625, -7.09417724609375, -6.846923828125, -6.59967041015625, -6.3524169921875, -6.10516357421875, -5.85791015625, -5.61065673828125, -5.3634033203125, -5.11614990234375, -4.868896484375, -4.62164306640625, -4.3743896484375, -4.12713623046875, -3.8798828125, -3.63262939453125, -3.3853759765625, -3.13812255859375, -2.890869140625, -2.64361572265625, -2.3963623046875, -2.14910888671875, -1.90185546875, -1.65460205078125, -1.4073486328125, -1.16009521484375, -0.912841796875, -0.66558837890625, -0.4183349609375, -0.17108154296875, 0.076171875, 0.32342529296875, 0.5706787109375, 0.81793212890625, 1.065185546875, 1.31243896484375, 1.5596923828125, 1.80694580078125, 2.05419921875, 2.30145263671875, 2.5487060546875, 2.79595947265625, 3.043212890625, 3.29046630859375, 3.5377197265625, 3.78497314453125, 4.0322265625, 4.27947998046875, 4.5267333984375, 4.77398681640625, 5.021240234375, 5.26849365234375, 5.5157470703125, 5.76300048828125, 6.01025390625, 6.25750732421875, 6.5047607421875, 6.75201416015625, 6.999267578125, 7.24652099609375, 7.4937744140625, 7.74102783203125, 7.98828125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 8.0, 13.0, 9.0, 26.0, 26.0, 27.0, 55.0, 93.0, 98.0, 193.0, 222.0, 345.0, 447.0, 518.0, 466.0, 375.0, 346.0, 227.0, 165.0, 118.0, 99.0, 67.0, 42.0, 27.0, 20.0, 13.0, 12.0, 9.0, 5.0, 5.0, 0.0, 2.0, 1.0, 2.0], "bins": [-14.203125, -13.8795166015625, -13.555908203125, -13.2322998046875, -12.90869140625, -12.5850830078125, -12.261474609375, -11.9378662109375, -11.6142578125, -11.2906494140625, -10.967041015625, -10.6434326171875, -10.31982421875, -9.9962158203125, -9.672607421875, -9.3489990234375, -9.025390625, -8.7017822265625, -8.378173828125, -8.0545654296875, -7.73095703125, -7.4073486328125, -7.083740234375, -6.7601318359375, -6.4365234375, -6.1129150390625, -5.789306640625, -5.4656982421875, -5.14208984375, -4.8184814453125, -4.494873046875, -4.1712646484375, -3.84765625, -3.5240478515625, -3.200439453125, -2.8768310546875, -2.55322265625, -2.2296142578125, -1.906005859375, -1.5823974609375, -1.2587890625, -0.9351806640625, -0.611572265625, -0.2879638671875, 0.03564453125, 0.3592529296875, 0.682861328125, 1.0064697265625, 1.330078125, 1.6536865234375, 1.977294921875, 2.3009033203125, 2.62451171875, 2.9481201171875, 3.271728515625, 3.5953369140625, 3.9189453125, 4.2425537109375, 4.566162109375, 4.8897705078125, 5.21337890625, 5.5369873046875, 5.860595703125, 6.1842041015625, 6.5078125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 17.0, 23.0, 27.0, 34.0, 55.0, 87.0, 133.0, 191.0, 230.0, 357.0, 796.0, 5114.0, 583026.0, 3569030.0, 32557.0, 1233.0, 487.0, 296.0, 180.0, 139.0, 79.0, 63.0, 38.0, 28.0, 28.0, 9.0, 10.0, 8.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.046875, -20.900146484375, -19.75341796875, -18.606689453125, -17.4599609375, -16.313232421875, -15.16650390625, -14.019775390625, -12.873046875, -11.726318359375, -10.57958984375, -9.432861328125, -8.2861328125, -7.139404296875, -5.99267578125, -4.845947265625, -3.69921875, -2.552490234375, -1.40576171875, -0.259033203125, 0.8876953125, 2.034423828125, 3.18115234375, 4.327880859375, 5.474609375, 6.621337890625, 7.76806640625, 8.914794921875, 10.0615234375, 11.208251953125, 12.35498046875, 13.501708984375, 14.6484375, 15.795166015625, 16.94189453125, 18.088623046875, 19.2353515625, 20.382080078125, 21.52880859375, 22.675537109375, 23.822265625, 24.968994140625, 26.11572265625, 27.262451171875, 28.4091796875, 29.555908203125, 30.70263671875, 31.849365234375, 32.99609375, 34.142822265625, 35.28955078125, 36.436279296875, 37.5830078125, 38.729736328125, 39.87646484375, 41.023193359375, 42.169921875, 43.316650390625, 44.46337890625, 45.610107421875, 46.7568359375, 47.903564453125, 49.05029296875, 50.197021484375, 51.34375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 2.0, 12.0, 21.0, 28.0, 64.0, 62.0, 71.0, 105.0, 112.0, 103.0, 88.0, 93.0, 73.0, 46.0, 50.0, 29.0, 19.0, 7.0, 9.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.66603469848633, -48.361122131347656, -47.05621337890625, -45.75130081176758, -44.446388244628906, -43.141475677490234, -41.83656311035156, -40.531654357910156, -39.226741790771484, -37.92182922363281, -36.616920471191406, -35.312007904052734, -34.00709533691406, -32.70218276977539, -31.39727210998535, -30.092361450195312, -28.78744888305664, -27.48253631591797, -26.17762565612793, -24.87271499633789, -23.56780242919922, -22.262889862060547, -20.957979202270508, -19.65306854248047, -18.348155975341797, -17.043243408203125, -15.738332748413086, -14.43342113494873, -13.128509521484375, -11.82359790802002, -10.518686294555664, -9.213774681091309, -7.9088592529296875, -6.603947639465332, -5.299036026000977, -3.994124412536621, -2.6892127990722656, -1.3843011856079102, -0.07938957214355469, 1.2255220413208008, 2.5304336547851562, 3.8353452682495117, 5.140256881713867, 6.445168495178223, 7.750080108642578, 9.054991722106934, 10.359903335571289, 11.664814949035645, 12.9697265625, 14.274638175964355, 15.579549789428711, 16.88446044921875, 18.189373016357422, 19.494285583496094, 20.799196243286133, 22.104106903076172, 23.409019470214844, 24.713932037353516, 26.018842697143555, 27.323753356933594, 28.628665924072266, 29.933578491210938, 31.238489151000977, 32.543399810791016, 33.84831237792969]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 0.0, 0.0, 4.0, 4.0, 5.0, 3.0, 5.0, 8.0, 9.0, 8.0, 6.0, 15.0, 14.0, 23.0, 22.0, 19.0, 19.0, 27.0, 28.0, 23.0, 37.0, 27.0, 18.0, 31.0, 28.0, 40.0, 29.0, 33.0, 45.0, 41.0, 33.0, 38.0, 37.0, 37.0, 28.0, 27.0, 28.0, 31.0, 19.0, 28.0, 16.0, 16.0, 19.0, 9.0, 21.0, 11.0, 6.0, 8.0, 9.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0], "bins": [-27.349945068359375, -26.553348541259766, -25.756750106811523, -24.96015167236328, -24.163555145263672, -23.366958618164062, -22.57036018371582, -21.773761749267578, -20.97716522216797, -20.18056869506836, -19.383970260620117, -18.587371826171875, -17.790775299072266, -16.994178771972656, -16.197580337524414, -15.400982856750488, -14.604385375976562, -13.807787895202637, -13.011190414428711, -12.214592933654785, -11.41799545288086, -10.621397972106934, -9.824800491333008, -9.028203010559082, -8.231605529785156, -7.4350080490112305, -6.638410568237305, -5.841813087463379, -5.045215606689453, -4.248618125915527, -3.4520206451416016, -2.655423164367676, -1.85882568359375, -1.0622282028198242, -0.26563072204589844, 0.5309667587280273, 1.3275642395019531, 2.124161720275879, 2.9207592010498047, 3.7173566818237305, 4.513954162597656, 5.310551643371582, 6.107149124145508, 6.903746604919434, 7.700344085693359, 8.496941566467285, 9.293539047241211, 10.090136528015137, 10.886734008789062, 11.683331489562988, 12.479928970336914, 13.27652645111084, 14.073123931884766, 14.869721412658691, 15.666318893432617, 16.46291732788086, 17.25951385498047, 18.056110382080078, 18.85270881652832, 19.649307250976562, 20.445903778076172, 21.24250030517578, 22.039098739624023, 22.835697174072266, 23.632293701171875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 4.0, 5.0, 7.0, 10.0, 7.0, 11.0, 11.0, 13.0, 15.0, 18.0, 20.0, 25.0, 23.0, 30.0, 23.0, 25.0, 29.0, 38.0, 35.0, 40.0, 38.0, 37.0, 48.0, 37.0, 42.0, 32.0, 38.0, 30.0, 33.0, 32.0, 30.0, 20.0, 32.0, 21.0, 24.0, 20.0, 13.0, 11.0, 15.0, 17.0, 11.0, 11.0, 5.0, 8.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.88671875, -3.768463134765625, -3.65020751953125, -3.531951904296875, -3.4136962890625, -3.295440673828125, -3.17718505859375, -3.058929443359375, -2.940673828125, -2.822418212890625, -2.70416259765625, -2.585906982421875, -2.4676513671875, -2.349395751953125, -2.23114013671875, -2.112884521484375, -1.99462890625, -1.876373291015625, -1.75811767578125, -1.639862060546875, -1.5216064453125, -1.403350830078125, -1.28509521484375, -1.166839599609375, -1.048583984375, -0.930328369140625, -0.81207275390625, -0.693817138671875, -0.5755615234375, -0.457305908203125, -0.33905029296875, -0.220794677734375, -0.1025390625, 0.015716552734375, 0.13397216796875, 0.252227783203125, 0.3704833984375, 0.488739013671875, 0.60699462890625, 0.725250244140625, 0.843505859375, 0.961761474609375, 1.08001708984375, 1.198272705078125, 1.3165283203125, 1.434783935546875, 1.55303955078125, 1.671295166015625, 1.78955078125, 1.907806396484375, 2.02606201171875, 2.144317626953125, 2.2625732421875, 2.380828857421875, 2.49908447265625, 2.617340087890625, 2.735595703125, 2.853851318359375, 2.97210693359375, 3.090362548828125, 3.2086181640625, 3.326873779296875, 3.44512939453125, 3.563385009765625, 3.681640625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 10.0, 10.0, 19.0, 40.0, 45.0, 65.0, 97.0, 140.0, 192.0, 367.0, 485.0, 768.0, 1203.0, 1794.0, 2823.0, 4083.0, 6315.0, 9682.0, 14664.0, 22242.0, 33031.0, 50234.0, 74023.0, 106027.0, 139079.0, 152028.0, 131356.0, 97311.0, 67122.0, 45333.0, 29853.0, 19716.0, 13168.0, 8658.0, 5657.0, 3688.0, 2506.0, 1601.0, 1158.0, 632.0, 475.0, 296.0, 173.0, 134.0, 90.0, 56.0, 39.0, 29.0, 15.0, 13.0, 6.0, 3.0, 4.0, 4.0, 0.0, 2.0], "bins": [-0.425048828125, -0.4123115539550781, -0.39957427978515625, -0.3868370056152344, -0.3740997314453125, -0.3613624572753906, -0.34862518310546875, -0.3358879089355469, -0.323150634765625, -0.3104133605957031, -0.29767608642578125, -0.2849388122558594, -0.2722015380859375, -0.2594642639160156, -0.24672698974609375, -0.23398971557617188, -0.22125244140625, -0.20851516723632812, -0.19577789306640625, -0.18304061889648438, -0.1703033447265625, -0.15756607055664062, -0.14482879638671875, -0.13209152221679688, -0.119354248046875, -0.10661697387695312, -0.09387969970703125, -0.08114242553710938, -0.0684051513671875, -0.055667877197265625, -0.04293060302734375, -0.030193328857421875, -0.0174560546875, -0.004718780517578125, 0.00801849365234375, 0.020755767822265625, 0.0334930419921875, 0.046230316162109375, 0.05896759033203125, 0.07170486450195312, 0.084442138671875, 0.09717941284179688, 0.10991668701171875, 0.12265396118164062, 0.1353912353515625, 0.14812850952148438, 0.16086578369140625, 0.17360305786132812, 0.18634033203125, 0.19907760620117188, 0.21181488037109375, 0.22455215454101562, 0.2372894287109375, 0.2500267028808594, 0.26276397705078125, 0.2755012512207031, 0.288238525390625, 0.3009757995605469, 0.31371307373046875, 0.3264503479003906, 0.3391876220703125, 0.3519248962402344, 0.36466217041015625, 0.3773994445800781, 0.39013671875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 4.0, 6.0, 3.0, 3.0, 11.0, 12.0, 8.0, 11.0, 22.0, 25.0, 26.0, 35.0, 38.0, 37.0, 41.0, 47.0, 38.0, 44.0, 46.0, 1078.0, 45.0, 52.0, 45.0, 41.0, 34.0, 33.0, 34.0, 30.0, 32.0, 23.0, 24.0, 17.0, 23.0, 10.0, 11.0, 7.0, 8.0, 5.0, 7.0, 2.0, 5.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.12109375, -3.0302734375, -2.939453125, -2.8486328125, -2.7578125, -2.6669921875, -2.576171875, -2.4853515625, -2.39453125, -2.3037109375, -2.212890625, -2.1220703125, -2.03125, -1.9404296875, -1.849609375, -1.7587890625, -1.66796875, -1.5771484375, -1.486328125, -1.3955078125, -1.3046875, -1.2138671875, -1.123046875, -1.0322265625, -0.94140625, -0.8505859375, -0.759765625, -0.6689453125, -0.578125, -0.4873046875, -0.396484375, -0.3056640625, -0.21484375, -0.1240234375, -0.033203125, 0.0576171875, 0.1484375, 0.2392578125, 0.330078125, 0.4208984375, 0.51171875, 0.6025390625, 0.693359375, 0.7841796875, 0.875, 0.9658203125, 1.056640625, 1.1474609375, 1.23828125, 1.3291015625, 1.419921875, 1.5107421875, 1.6015625, 1.6923828125, 1.783203125, 1.8740234375, 1.96484375, 2.0556640625, 2.146484375, 2.2373046875, 2.328125, 2.4189453125, 2.509765625, 2.6005859375, 2.69140625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 5.0, 8.0, 7.0, 20.0, 36.0, 40.0, 74.0, 99.0, 153.0, 181.0, 370.0, 521.0, 825.0, 1233.0, 1935.0, 3094.0, 4720.0, 7783.0, 12343.0, 19309.0, 30220.0, 46341.0, 70294.0, 101726.0, 138104.0, 1176343.0, 154753.0, 108630.0, 76011.0, 50930.0, 33179.0, 21160.0, 13289.0, 8527.0, 5337.0, 3397.0, 2216.0, 1320.0, 904.0, 626.0, 372.0, 220.0, 157.0, 116.0, 74.0, 44.0, 36.0, 24.0, 11.0, 12.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2266845703125, -0.21875953674316406, -0.21083450317382812, -0.2029094696044922, -0.19498443603515625, -0.1870594024658203, -0.17913436889648438, -0.17120933532714844, -0.1632843017578125, -0.15535926818847656, -0.14743423461914062, -0.1395092010498047, -0.13158416748046875, -0.12365913391113281, -0.11573410034179688, -0.10780906677246094, -0.099884033203125, -0.09195899963378906, -0.08403396606445312, -0.07610893249511719, -0.06818389892578125, -0.06025886535644531, -0.052333831787109375, -0.04440879821777344, -0.0364837646484375, -0.028558731079101562, -0.020633697509765625, -0.012708663940429688, -0.00478363037109375, 0.0031414031982421875, 0.011066436767578125, 0.018991470336914062, 0.02691650390625, 0.03484153747558594, 0.042766571044921875, 0.05069160461425781, 0.05861663818359375, 0.06654167175292969, 0.07446670532226562, 0.08239173889160156, 0.0903167724609375, 0.09824180603027344, 0.10616683959960938, 0.11409187316894531, 0.12201690673828125, 0.1299419403076172, 0.13786697387695312, 0.14579200744628906, 0.153717041015625, 0.16164207458496094, 0.16956710815429688, 0.1774921417236328, 0.18541717529296875, 0.1933422088623047, 0.20126724243164062, 0.20919227600097656, 0.2171173095703125, 0.22504234313964844, 0.23296737670898438, 0.2408924102783203, 0.24881744384765625, 0.2567424774169922, 0.2646675109863281, 0.27259254455566406, 0.280517578125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 2.0, 5.0, 5.0, 3.0, 8.0, 8.0, 17.0, 17.0, 32.0, 42.0, 62.0, 90.0, 131.0, 177.0, 109.0, 61.0, 48.0, 45.0, 26.0, 29.0, 8.0, 18.0, 5.0, 8.0, 1.0, 9.0, 3.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.035064697265625, -0.034044504165649414, -0.03302431106567383, -0.03200411796569824, -0.030983924865722656, -0.02996373176574707, -0.028943538665771484, -0.0279233455657959, -0.026903152465820312, -0.025882959365844727, -0.02486276626586914, -0.023842573165893555, -0.02282238006591797, -0.021802186965942383, -0.020781993865966797, -0.01976180076599121, -0.018741607666015625, -0.01772141456604004, -0.016701221466064453, -0.015681028366088867, -0.014660835266113281, -0.013640642166137695, -0.01262044906616211, -0.011600255966186523, -0.010580062866210938, -0.009559869766235352, -0.008539676666259766, -0.00751948356628418, -0.006499290466308594, -0.005479097366333008, -0.004458904266357422, -0.003438711166381836, -0.00241851806640625, -0.001398324966430664, -0.0003781318664550781, 0.0006420612335205078, 0.0016622543334960938, 0.0026824474334716797, 0.0037026405334472656, 0.0047228336334228516, 0.0057430267333984375, 0.0067632198333740234, 0.007783412933349609, 0.008803606033325195, 0.009823799133300781, 0.010843992233276367, 0.011864185333251953, 0.012884378433227539, 0.013904571533203125, 0.014924764633178711, 0.015944957733154297, 0.016965150833129883, 0.01798534393310547, 0.019005537033081055, 0.02002573013305664, 0.021045923233032227, 0.022066116333007812, 0.0230863094329834, 0.024106502532958984, 0.02512669563293457, 0.026146888732910156, 0.027167081832885742, 0.028187274932861328, 0.029207468032836914, 0.0302276611328125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 10.0, 10.0, 6.0, 5.0, 16.0, 20.0, 33.0, 38.0, 72.0, 80.0, 142.0, 477.0, 9327.0, 1019694.0, 17567.0, 550.0, 170.0, 100.0, 57.0, 43.0, 33.0, 18.0, 15.0, 11.0, 11.0, 3.0, 4.0, 5.0, 7.0, 3.0, 6.0, 2.0, 1.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.642578125, -0.620849609375, -0.59912109375, -0.577392578125, -0.5556640625, -0.533935546875, -0.51220703125, -0.490478515625, -0.46875, -0.447021484375, -0.42529296875, -0.403564453125, -0.3818359375, -0.360107421875, -0.33837890625, -0.316650390625, -0.294921875, -0.273193359375, -0.25146484375, -0.229736328125, -0.2080078125, -0.186279296875, -0.16455078125, -0.142822265625, -0.12109375, -0.099365234375, -0.07763671875, -0.055908203125, -0.0341796875, -0.012451171875, 0.00927734375, 0.031005859375, 0.052734375, 0.074462890625, 0.09619140625, 0.117919921875, 0.1396484375, 0.161376953125, 0.18310546875, 0.204833984375, 0.2265625, 0.248291015625, 0.27001953125, 0.291748046875, 0.3134765625, 0.335205078125, 0.35693359375, 0.378662109375, 0.400390625, 0.422119140625, 0.44384765625, 0.465576171875, 0.4873046875, 0.509033203125, 0.53076171875, 0.552490234375, 0.57421875, 0.595947265625, 0.61767578125, 0.639404296875, 0.6611328125, 0.682861328125, 0.70458984375, 0.726318359375, 0.748046875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 11.0, 20.0, 28.0, 54.0, 83.0, 139.0, 315.0, 195.0, 73.0, 34.0, 21.0, 14.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17712287604808807, -0.17362652719020844, -0.1701301783323288, -0.16663382947444916, -0.16313748061656952, -0.15964113175868988, -0.15614478290081024, -0.1526484191417694, -0.14915207028388977, -0.14565572142601013, -0.1421593725681305, -0.13866302371025085, -0.13516667485237122, -0.13167032599449158, -0.12817397713661194, -0.1246776208281517, -0.12118127942085266, -0.11768493056297302, -0.11418858170509338, -0.11069223284721375, -0.1071958839893341, -0.10369953513145447, -0.10020317882299423, -0.0967068299651146, -0.09321048110723495, -0.08971413224935532, -0.08621778339147568, -0.08272143453359604, -0.0792250782251358, -0.07572872936725616, -0.07223238050937653, -0.06873603165149689, -0.06523968279361725, -0.06174333393573761, -0.05824698507785797, -0.054750632494688034, -0.051254283636808395, -0.04775793477892876, -0.04426158219575882, -0.04076523333787918, -0.037268880754709244, -0.033772531896829605, -0.030276181176304817, -0.02677983045578003, -0.02328348159790039, -0.019787132740020752, -0.016290782019495964, -0.012794431298971176, -0.009298082441091537, -0.005801732651889324, -0.002305382862687111, 0.0011909669265151024, 0.004687316715717316, 0.008183665573596954, 0.011680016294121742, 0.01517636701464653, 0.01867271587252617, 0.022169064730405807, 0.025665415450930595, 0.029161766171455383, 0.03265811502933502, 0.03615446388721466, 0.0396508127450943, 0.043147165328264236, 0.046643514186143875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 6.0, 10.0, 8.0, 12.0, 18.0, 20.0, 15.0, 19.0, 19.0, 30.0, 32.0, 34.0, 26.0, 33.0, 47.0, 32.0, 36.0, 47.0, 29.0, 50.0, 41.0, 43.0, 28.0, 29.0, 30.0, 35.0, 29.0, 37.0, 24.0, 26.0, 20.0, 19.0, 15.0, 18.0, 8.0, 16.0, 18.0, 8.0, 8.0, 8.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.04727530479431152, -0.045874178409576416, -0.04447305202484131, -0.0430719256401062, -0.041670799255371094, -0.040269672870635986, -0.03886854648590088, -0.03746742010116577, -0.036066293716430664, -0.03466516733169556, -0.03326404094696045, -0.03186291456222534, -0.030461788177490234, -0.029060661792755127, -0.02765953540802002, -0.026258409023284912, -0.024857282638549805, -0.023456156253814697, -0.02205502986907959, -0.020653903484344482, -0.019252777099609375, -0.017851650714874268, -0.01645052433013916, -0.015049397945404053, -0.013648271560668945, -0.012247145175933838, -0.01084601879119873, -0.009444892406463623, -0.008043766021728516, -0.006642639636993408, -0.005241513252258301, -0.0038403868675231934, -0.002439260482788086, -0.0010381340980529785, 0.0003629922866821289, 0.0017641186714172363, 0.0031652450561523438, 0.004566371440887451, 0.005967497825622559, 0.007368624210357666, 0.008769750595092773, 0.01017087697982788, 0.011572003364562988, 0.012973129749298096, 0.014374256134033203, 0.01577538251876831, 0.017176508903503418, 0.018577635288238525, 0.019978761672973633, 0.02137988805770874, 0.022781014442443848, 0.024182140827178955, 0.025583267211914062, 0.02698439359664917, 0.028385519981384277, 0.029786646366119385, 0.031187772750854492, 0.0325888991355896, 0.03399002552032471, 0.035391151905059814, 0.03679227828979492, 0.03819340467453003, 0.03959453105926514, 0.040995657444000244, 0.04239678382873535]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 4.0, 5.0, 8.0, 9.0, 6.0, 13.0, 10.0, 13.0, 16.0, 17.0, 20.0, 25.0, 23.0, 29.0, 24.0, 26.0, 28.0, 38.0, 35.0, 40.0, 38.0, 38.0, 46.0, 38.0, 43.0, 31.0, 37.0, 31.0, 33.0, 32.0, 31.0, 19.0, 32.0, 21.0, 24.0, 20.0, 14.0, 10.0, 15.0, 17.0, 11.0, 11.0, 5.0, 8.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.884765625, -3.76654052734375, -3.6483154296875, -3.53009033203125, -3.411865234375, -3.29364013671875, -3.1754150390625, -3.05718994140625, -2.93896484375, -2.82073974609375, -2.7025146484375, -2.58428955078125, -2.466064453125, -2.34783935546875, -2.2296142578125, -2.11138916015625, -1.9931640625, -1.87493896484375, -1.7567138671875, -1.63848876953125, -1.520263671875, -1.40203857421875, -1.2838134765625, -1.16558837890625, -1.04736328125, -0.92913818359375, -0.8109130859375, -0.69268798828125, -0.574462890625, -0.45623779296875, -0.3380126953125, -0.21978759765625, -0.1015625, 0.01666259765625, 0.1348876953125, 0.25311279296875, 0.371337890625, 0.48956298828125, 0.6077880859375, 0.72601318359375, 0.84423828125, 0.96246337890625, 1.0806884765625, 1.19891357421875, 1.317138671875, 1.43536376953125, 1.5535888671875, 1.67181396484375, 1.7900390625, 1.90826416015625, 2.0264892578125, 2.14471435546875, 2.262939453125, 2.38116455078125, 2.4993896484375, 2.61761474609375, 2.73583984375, 2.85406494140625, 2.9722900390625, 3.09051513671875, 3.208740234375, 3.32696533203125, 3.4451904296875, 3.56341552734375, 3.681640625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 2.0, 2.0, 6.0, 8.0, 12.0, 14.0, 19.0, 26.0, 36.0, 48.0, 69.0, 119.0, 154.0, 253.0, 446.0, 743.0, 1150.0, 1855.0, 3204.0, 5452.0, 10461.0, 21831.0, 50512.0, 134559.0, 368861.0, 275447.0, 97842.0, 38507.0, 17099.0, 8409.0, 4460.0, 2565.0, 1658.0, 976.0, 615.0, 390.0, 249.0, 169.0, 98.0, 54.0, 53.0, 39.0, 23.0, 23.0, 11.0, 9.0, 9.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.65234375, -3.5411376953125, -3.429931640625, -3.3187255859375, -3.20751953125, -3.0963134765625, -2.985107421875, -2.8739013671875, -2.7626953125, -2.6514892578125, -2.540283203125, -2.4290771484375, -2.31787109375, -2.2066650390625, -2.095458984375, -1.9842529296875, -1.873046875, -1.7618408203125, -1.650634765625, -1.5394287109375, -1.42822265625, -1.3170166015625, -1.205810546875, -1.0946044921875, -0.9833984375, -0.8721923828125, -0.760986328125, -0.6497802734375, -0.53857421875, -0.4273681640625, -0.316162109375, -0.2049560546875, -0.09375, 0.0174560546875, 0.128662109375, 0.2398681640625, 0.35107421875, 0.4622802734375, 0.573486328125, 0.6846923828125, 0.7958984375, 0.9071044921875, 1.018310546875, 1.1295166015625, 1.24072265625, 1.3519287109375, 1.463134765625, 1.5743408203125, 1.685546875, 1.7967529296875, 1.907958984375, 2.0191650390625, 2.13037109375, 2.2415771484375, 2.352783203125, 2.4639892578125, 2.5751953125, 2.6864013671875, 2.797607421875, 2.9088134765625, 3.02001953125, 3.1312255859375, 3.242431640625, 3.3536376953125, 3.46484375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 9.0, 12.0, 13.0, 9.0, 9.0, 18.0, 13.0, 35.0, 34.0, 37.0, 33.0, 44.0, 37.0, 59.0, 83.0, 199.0, 1589.0, 278.0, 93.0, 59.0, 46.0, 38.0, 45.0, 32.0, 43.0, 34.0, 21.0, 18.0, 10.0, 20.0, 12.0, 10.0, 13.0, 10.0, 3.0, 5.0, 3.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.5234375, -15.0616455078125, -14.599853515625, -14.1380615234375, -13.67626953125, -13.2144775390625, -12.752685546875, -12.2908935546875, -11.8291015625, -11.3673095703125, -10.905517578125, -10.4437255859375, -9.98193359375, -9.5201416015625, -9.058349609375, -8.5965576171875, -8.134765625, -7.6729736328125, -7.211181640625, -6.7493896484375, -6.28759765625, -5.8258056640625, -5.364013671875, -4.9022216796875, -4.4404296875, -3.9786376953125, -3.516845703125, -3.0550537109375, -2.59326171875, -2.1314697265625, -1.669677734375, -1.2078857421875, -0.74609375, -0.2843017578125, 0.177490234375, 0.6392822265625, 1.10107421875, 1.5628662109375, 2.024658203125, 2.4864501953125, 2.9482421875, 3.4100341796875, 3.871826171875, 4.3336181640625, 4.79541015625, 5.2572021484375, 5.718994140625, 6.1807861328125, 6.642578125, 7.1043701171875, 7.566162109375, 8.0279541015625, 8.48974609375, 8.9515380859375, 9.413330078125, 9.8751220703125, 10.3369140625, 10.7987060546875, 11.260498046875, 11.7222900390625, 12.18408203125, 12.6458740234375, 13.107666015625, 13.5694580078125, 14.03125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 6.0, 6.0, 4.0, 12.0, 18.0, 19.0, 24.0, 28.0, 33.0, 59.0, 90.0, 136.0, 158.0, 248.0, 358.0, 956.0, 6847.0, 2628893.0, 501566.0, 4418.0, 732.0, 311.0, 214.0, 166.0, 102.0, 82.0, 49.0, 39.0, 22.0, 21.0, 21.0, 14.0, 7.0, 10.0, 5.0, 7.0, 6.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.125, -38.00439453125, -36.8837890625, -35.76318359375, -34.642578125, -33.52197265625, -32.4013671875, -31.28076171875, -30.16015625, -29.03955078125, -27.9189453125, -26.79833984375, -25.677734375, -24.55712890625, -23.4365234375, -22.31591796875, -21.1953125, -20.07470703125, -18.9541015625, -17.83349609375, -16.712890625, -15.59228515625, -14.4716796875, -13.35107421875, -12.23046875, -11.10986328125, -9.9892578125, -8.86865234375, -7.748046875, -6.62744140625, -5.5068359375, -4.38623046875, -3.265625, -2.14501953125, -1.0244140625, 0.09619140625, 1.216796875, 2.33740234375, 3.4580078125, 4.57861328125, 5.69921875, 6.81982421875, 7.9404296875, 9.06103515625, 10.181640625, 11.30224609375, 12.4228515625, 13.54345703125, 14.6640625, 15.78466796875, 16.9052734375, 18.02587890625, 19.146484375, 20.26708984375, 21.3876953125, 22.50830078125, 23.62890625, 24.74951171875, 25.8701171875, 26.99072265625, 28.111328125, 29.23193359375, 30.3525390625, 31.47314453125, 32.59375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 74.0, 885.0, 61.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-281.42095947265625, -276.25244140625, -271.08392333984375, -265.9154052734375, -260.7468566894531, -255.57833862304688, -250.40982055664062, -245.24130249023438, -240.07278442382812, -234.90426635742188, -229.73573303222656, -224.5672149658203, -219.39869689941406, -214.23016357421875, -209.0616455078125, -203.89312744140625, -198.72459411621094, -193.5560760498047, -188.38754272460938, -183.21902465820312, -178.05050659179688, -172.88198852539062, -167.7134552001953, -162.54493713378906, -157.37640380859375, -152.2078857421875, -147.0393524169922, -141.87083435058594, -136.7023162841797, -131.53378295898438, -126.36526489257812, -121.19674682617188, -116.02821350097656, -110.85968780517578, -105.69116973876953, -100.52264404296875, -95.3541259765625, -90.18560028076172, -85.01707458496094, -79.84855651855469, -74.68003845214844, -69.51151275634766, -64.3429946899414, -59.174468994140625, -54.00594711303711, -48.837425231933594, -43.66889953613281, -38.5003776550293, -33.331851959228516, -28.163330078125, -22.99480628967285, -17.826282501220703, -12.657760620117188, -7.489238739013672, -2.3207149505615234, 2.847808837890625, 8.01633071899414, 13.184853553771973, 18.353376388549805, 23.521900177001953, 28.69042205810547, 33.858943939208984, 39.0274658203125, 44.19599151611328, 49.3645133972168]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 7.0, 4.0, 9.0, 12.0, 12.0, 7.0, 9.0, 19.0, 15.0, 17.0, 19.0, 20.0, 33.0, 26.0, 40.0, 24.0, 25.0, 35.0, 31.0, 43.0, 44.0, 54.0, 37.0, 52.0, 51.0, 40.0, 39.0, 38.0, 28.0, 28.0, 28.0, 19.0, 26.0, 20.0, 17.0, 15.0, 15.0, 9.0, 14.0, 6.0, 8.0, 6.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 0.0, 3.0], "bins": [-40.91716766357422, -39.75961685180664, -38.6020622253418, -37.44451141357422, -36.28696060180664, -35.12940979003906, -33.97185516357422, -32.81430435180664, -31.656753540039062, -30.49920082092285, -29.341650009155273, -28.184097290039062, -27.026546478271484, -25.868993759155273, -24.711441040039062, -23.553890228271484, -22.396337509155273, -21.238784790039062, -20.081233978271484, -18.923681259155273, -17.766130447387695, -16.608577728271484, -15.45102596282959, -14.293474197387695, -13.1359224319458, -11.978370666503906, -10.820818901062012, -9.663267135620117, -8.505714416503906, -7.34816312789917, -6.190610885620117, -5.033059120178223, -3.875507354736328, -2.7179555892944336, -1.56040358543396, -0.40285158157348633, 0.7547001838684082, 1.9122519493103027, 3.0698041915893555, 4.22735595703125, 5.3849077224731445, 6.542459487915039, 7.700011253356934, 8.857563018798828, 10.015115737915039, 11.172666549682617, 12.330219268798828, 13.487771034240723, 14.645322799682617, 15.802874565124512, 16.960426330566406, 18.117979049682617, 19.275529861450195, 20.433082580566406, 21.590633392333984, 22.748186111450195, 23.905738830566406, 25.063291549682617, 26.220842361450195, 27.378395080566406, 28.535945892333984, 29.693498611450195, 30.851051330566406, 32.008602142333984, 33.16615295410156]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 7.0, 6.0, 12.0, 8.0, 8.0, 7.0, 17.0, 16.0, 17.0, 20.0, 25.0, 21.0, 27.0, 24.0, 31.0, 29.0, 33.0, 34.0, 38.0, 51.0, 40.0, 45.0, 27.0, 34.0, 43.0, 22.0, 31.0, 27.0, 28.0, 29.0, 32.0, 27.0, 22.0, 23.0, 21.0, 19.0, 13.0, 23.0, 10.0, 6.0, 14.0, 11.0, 2.0, 6.0, 6.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.9453125, -3.82550048828125, -3.7056884765625, -3.58587646484375, -3.466064453125, -3.34625244140625, -3.2264404296875, -3.10662841796875, -2.98681640625, -2.86700439453125, -2.7471923828125, -2.62738037109375, -2.507568359375, -2.38775634765625, -2.2679443359375, -2.14813232421875, -2.0283203125, -1.90850830078125, -1.7886962890625, -1.66888427734375, -1.549072265625, -1.42926025390625, -1.3094482421875, -1.18963623046875, -1.06982421875, -0.95001220703125, -0.8302001953125, -0.71038818359375, -0.590576171875, -0.47076416015625, -0.3509521484375, -0.23114013671875, -0.111328125, 0.00848388671875, 0.1282958984375, 0.24810791015625, 0.367919921875, 0.48773193359375, 0.6075439453125, 0.72735595703125, 0.84716796875, 0.96697998046875, 1.0867919921875, 1.20660400390625, 1.326416015625, 1.44622802734375, 1.5660400390625, 1.68585205078125, 1.8056640625, 1.92547607421875, 2.0452880859375, 2.16510009765625, 2.284912109375, 2.40472412109375, 2.5245361328125, 2.64434814453125, 2.76416015625, 2.88397216796875, 3.0037841796875, 3.12359619140625, 3.243408203125, 3.36322021484375, 3.4830322265625, 3.60284423828125, 3.72265625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 5.0, 6.0, 7.0, 11.0, 9.0, 13.0, 21.0, 27.0, 23.0, 27.0, 37.0, 62.0, 49.0, 68.0, 114.0, 196.0, 338.0, 587.0, 1374.0, 3702.0, 11860.0, 43570.0, 200335.0, 1015223.0, 1993985.0, 735719.0, 140008.0, 32167.0, 9077.0, 2992.0, 1197.0, 553.0, 286.0, 156.0, 94.0, 73.0, 52.0, 42.0, 57.0, 35.0, 23.0, 22.0, 12.0, 21.0, 16.0, 6.0, 7.0, 6.0, 3.0, 6.0, 5.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.921875, -7.68463134765625, -7.4473876953125, -7.21014404296875, -6.972900390625, -6.73565673828125, -6.4984130859375, -6.26116943359375, -6.02392578125, -5.78668212890625, -5.5494384765625, -5.31219482421875, -5.074951171875, -4.83770751953125, -4.6004638671875, -4.36322021484375, -4.1259765625, -3.88873291015625, -3.6514892578125, -3.41424560546875, -3.177001953125, -2.93975830078125, -2.7025146484375, -2.46527099609375, -2.22802734375, -1.99078369140625, -1.7535400390625, -1.51629638671875, -1.279052734375, -1.04180908203125, -0.8045654296875, -0.56732177734375, -0.330078125, -0.09283447265625, 0.1444091796875, 0.38165283203125, 0.618896484375, 0.85614013671875, 1.0933837890625, 1.33062744140625, 1.56787109375, 1.80511474609375, 2.0423583984375, 2.27960205078125, 2.516845703125, 2.75408935546875, 2.9913330078125, 3.22857666015625, 3.4658203125, 3.70306396484375, 3.9403076171875, 4.17755126953125, 4.414794921875, 4.65203857421875, 4.8892822265625, 5.12652587890625, 5.36376953125, 5.60101318359375, 5.8382568359375, 6.07550048828125, 6.312744140625, 6.54998779296875, 6.7872314453125, 7.02447509765625, 7.26171875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 6.0, 9.0, 10.0, 7.0, 12.0, 15.0, 26.0, 37.0, 49.0, 59.0, 72.0, 110.0, 173.0, 219.0, 275.0, 369.0, 465.0, 448.0, 403.0, 346.0, 280.0, 191.0, 152.0, 96.0, 63.0, 56.0, 42.0, 19.0, 17.0, 16.0, 8.0, 8.0, 10.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.015625, -10.72039794921875, -10.4251708984375, -10.12994384765625, -9.834716796875, -9.53948974609375, -9.2442626953125, -8.94903564453125, -8.65380859375, -8.35858154296875, -8.0633544921875, -7.76812744140625, -7.472900390625, -7.17767333984375, -6.8824462890625, -6.58721923828125, -6.2919921875, -5.99676513671875, -5.7015380859375, -5.40631103515625, -5.111083984375, -4.81585693359375, -4.5206298828125, -4.22540283203125, -3.93017578125, -3.63494873046875, -3.3397216796875, -3.04449462890625, -2.749267578125, -2.45404052734375, -2.1588134765625, -1.86358642578125, -1.568359375, -1.27313232421875, -0.9779052734375, -0.68267822265625, -0.387451171875, -0.09222412109375, 0.2030029296875, 0.49822998046875, 0.79345703125, 1.08868408203125, 1.3839111328125, 1.67913818359375, 1.974365234375, 2.26959228515625, 2.5648193359375, 2.86004638671875, 3.1552734375, 3.45050048828125, 3.7457275390625, 4.04095458984375, 4.336181640625, 4.63140869140625, 4.9266357421875, 5.22186279296875, 5.51708984375, 5.81231689453125, 6.1075439453125, 6.40277099609375, 6.697998046875, 6.99322509765625, 7.2884521484375, 7.58367919921875, 7.87890625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 9.0, 8.0, 12.0, 8.0, 18.0, 27.0, 46.0, 55.0, 73.0, 137.0, 213.0, 290.0, 538.0, 1459.0, 29366.0, 3906022.0, 251286.0, 2908.0, 709.0, 354.0, 256.0, 149.0, 94.0, 80.0, 48.0, 34.0, 21.0, 16.0, 10.0, 17.0, 4.0, 10.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.6875, -40.283203125, -38.87890625, -37.474609375, -36.0703125, -34.666015625, -33.26171875, -31.857421875, -30.453125, -29.048828125, -27.64453125, -26.240234375, -24.8359375, -23.431640625, -22.02734375, -20.623046875, -19.21875, -17.814453125, -16.41015625, -15.005859375, -13.6015625, -12.197265625, -10.79296875, -9.388671875, -7.984375, -6.580078125, -5.17578125, -3.771484375, -2.3671875, -0.962890625, 0.44140625, 1.845703125, 3.25, 4.654296875, 6.05859375, 7.462890625, 8.8671875, 10.271484375, 11.67578125, 13.080078125, 14.484375, 15.888671875, 17.29296875, 18.697265625, 20.1015625, 21.505859375, 22.91015625, 24.314453125, 25.71875, 27.123046875, 28.52734375, 29.931640625, 31.3359375, 32.740234375, 34.14453125, 35.548828125, 36.953125, 38.357421875, 39.76171875, 41.166015625, 42.5703125, 43.974609375, 45.37890625, 46.783203125, 48.1875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 22.0, 117.0, 375.0, 354.0, 130.0, 18.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-277.0457763671875, -271.2831115722656, -265.5204772949219, -259.7578125, -253.9951629638672, -248.23251342773438, -242.4698486328125, -236.7071990966797, -230.94454956054688, -225.18190002441406, -219.4192352294922, -213.65658569335938, -207.89393615722656, -202.13128662109375, -196.36862182617188, -190.60597229003906, -184.8433074951172, -179.08065795898438, -173.3179931640625, -167.5553436279297, -161.79269409179688, -156.030029296875, -150.2673797607422, -144.50473022460938, -138.7420654296875, -132.9794158935547, -127.21675872802734, -121.4541015625, -115.69145202636719, -109.92879486083984, -104.1661376953125, -98.40348815917969, -92.64083862304688, -86.87818145751953, -81.11553192138672, -75.35287475585938, -69.59022521972656, -63.82756805419922, -58.064910888671875, -52.3022575378418, -46.53960418701172, -40.77695083618164, -35.01429748535156, -29.25164031982422, -23.48898696899414, -17.726333618164062, -11.963676452636719, -6.201023101806641, -0.4383697509765625, 5.324284553527832, 11.086938858032227, 16.849594116210938, 22.612247467041016, 28.374900817871094, 34.13755798339844, 39.900211334228516, 45.662864685058594, 51.42551803588867, 57.18817138671875, 62.950828552246094, 68.71348571777344, 74.47613525390625, 80.2387924194336, 86.00144958496094, 91.76409912109375]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 3.0, 3.0, 7.0, 10.0, 10.0, 14.0, 8.0, 10.0, 28.0, 8.0, 15.0, 29.0, 19.0, 38.0, 19.0, 38.0, 47.0, 38.0, 37.0, 48.0, 41.0, 38.0, 35.0, 46.0, 34.0, 49.0, 38.0, 43.0, 26.0, 42.0, 35.0, 30.0, 20.0, 14.0, 12.0, 16.0, 10.0, 10.0, 6.0, 5.0, 5.0, 3.0, 5.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.287445068359375, -30.28133773803711, -29.275232315063477, -28.26912498474121, -27.263019561767578, -26.256912231445312, -25.250804901123047, -24.24469757080078, -23.23859214782715, -22.232484817504883, -21.22637939453125, -20.220272064208984, -19.21416473388672, -18.208059310913086, -17.20195198059082, -16.195846557617188, -15.189739227294922, -14.183632850646973, -13.177526473999023, -12.171419143676758, -11.165312767028809, -10.15920639038086, -9.153099060058594, -8.146992683410645, -7.140886306762695, -6.134779930114746, -5.128673076629639, -4.122566223144531, -3.116459846496582, -2.110353469848633, -1.1042466163635254, -0.09813976287841797, 0.9079666137695312, 1.9140732288360596, 2.920179843902588, 3.926286458969116, 4.9323930740356445, 5.938499450683594, 6.944606304168701, 7.950713157653809, 8.956819534301758, 9.962925910949707, 10.969032287597656, 11.975139617919922, 12.981245994567871, 13.98735237121582, 14.993459701538086, 15.999566078186035, 17.005672454833984, 18.01177978515625, 19.017885208129883, 20.02399253845215, 21.03009796142578, 22.036205291748047, 23.042312622070312, 24.048419952392578, 25.05452537536621, 26.060632705688477, 27.06673812866211, 28.072845458984375, 29.07895278930664, 30.085058212280273, 31.09116554260254, 32.09727096557617, 33.10337829589844]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 7.0, 1.0, 3.0, 10.0, 8.0, 12.0, 10.0, 14.0, 20.0, 20.0, 18.0, 17.0, 24.0, 21.0, 22.0, 20.0, 26.0, 32.0, 37.0, 25.0, 38.0, 31.0, 30.0, 34.0, 37.0, 39.0, 30.0, 29.0, 38.0, 28.0, 33.0, 28.0, 40.0, 27.0, 24.0, 28.0, 20.0, 14.0, 13.0, 11.0, 10.0, 13.0, 8.0, 5.0, 12.0, 4.0, 5.0, 6.0, 4.0, 6.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0], "bins": [-3.60546875, -3.493804931640625, -3.38214111328125, -3.270477294921875, -3.1588134765625, -3.047149658203125, -2.93548583984375, -2.823822021484375, -2.712158203125, -2.600494384765625, -2.48883056640625, -2.377166748046875, -2.2655029296875, -2.153839111328125, -2.04217529296875, -1.930511474609375, -1.81884765625, -1.707183837890625, -1.59552001953125, -1.483856201171875, -1.3721923828125, -1.260528564453125, -1.14886474609375, -1.037200927734375, -0.925537109375, -0.813873291015625, -0.70220947265625, -0.590545654296875, -0.4788818359375, -0.367218017578125, -0.25555419921875, -0.143890380859375, -0.0322265625, 0.079437255859375, 0.19110107421875, 0.302764892578125, 0.4144287109375, 0.526092529296875, 0.63775634765625, 0.749420166015625, 0.861083984375, 0.972747802734375, 1.08441162109375, 1.196075439453125, 1.3077392578125, 1.419403076171875, 1.53106689453125, 1.642730712890625, 1.75439453125, 1.866058349609375, 1.97772216796875, 2.089385986328125, 2.2010498046875, 2.312713623046875, 2.42437744140625, 2.536041259765625, 2.647705078125, 2.759368896484375, 2.87103271484375, 2.982696533203125, 3.0943603515625, 3.206024169921875, 3.31768798828125, 3.429351806640625, 3.541015625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 8.0, 11.0, 26.0, 33.0, 61.0, 98.0, 135.0, 209.0, 308.0, 444.0, 730.0, 1125.0, 1616.0, 2604.0, 4050.0, 6291.0, 9553.0, 14970.0, 23554.0, 36533.0, 55399.0, 82775.0, 117549.0, 151257.0, 154780.0, 124122.0, 88668.0, 60674.0, 39521.0, 25257.0, 16396.0, 10657.0, 6784.0, 4326.0, 2800.0, 1806.0, 1169.0, 810.0, 478.0, 344.0, 220.0, 132.0, 108.0, 55.0, 44.0, 21.0, 13.0, 12.0, 8.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.415771484375, -0.4028167724609375, -0.389862060546875, -0.3769073486328125, -0.36395263671875, -0.3509979248046875, -0.338043212890625, -0.3250885009765625, -0.3121337890625, -0.2991790771484375, -0.286224365234375, -0.2732696533203125, -0.26031494140625, -0.2473602294921875, -0.234405517578125, -0.2214508056640625, -0.20849609375, -0.1955413818359375, -0.182586669921875, -0.1696319580078125, -0.15667724609375, -0.1437225341796875, -0.130767822265625, -0.1178131103515625, -0.1048583984375, -0.0919036865234375, -0.078948974609375, -0.0659942626953125, -0.05303955078125, -0.0400848388671875, -0.027130126953125, -0.0141754150390625, -0.001220703125, 0.0117340087890625, 0.024688720703125, 0.0376434326171875, 0.05059814453125, 0.0635528564453125, 0.076507568359375, 0.0894622802734375, 0.1024169921875, 0.1153717041015625, 0.128326416015625, 0.1412811279296875, 0.15423583984375, 0.1671905517578125, 0.180145263671875, 0.1930999755859375, 0.2060546875, 0.2190093994140625, 0.231964111328125, 0.2449188232421875, 0.25787353515625, 0.2708282470703125, 0.283782958984375, 0.2967376708984375, 0.3096923828125, 0.3226470947265625, 0.335601806640625, 0.3485565185546875, 0.36151123046875, 0.3744659423828125, 0.387420654296875, 0.4003753662109375, 0.413330078125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 8.0, 8.0, 6.0, 8.0, 9.0, 14.0, 19.0, 14.0, 23.0, 27.0, 15.0, 25.0, 27.0, 34.0, 38.0, 31.0, 29.0, 47.0, 41.0, 50.0, 1054.0, 41.0, 40.0, 45.0, 38.0, 36.0, 28.0, 39.0, 36.0, 21.0, 26.0, 22.0, 15.0, 18.0, 15.0, 20.0, 12.0, 8.0, 6.0, 9.0, 5.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.796875, -2.71136474609375, -2.6258544921875, -2.54034423828125, -2.454833984375, -2.36932373046875, -2.2838134765625, -2.19830322265625, -2.11279296875, -2.02728271484375, -1.9417724609375, -1.85626220703125, -1.770751953125, -1.68524169921875, -1.5997314453125, -1.51422119140625, -1.4287109375, -1.34320068359375, -1.2576904296875, -1.17218017578125, -1.086669921875, -1.00115966796875, -0.9156494140625, -0.83013916015625, -0.74462890625, -0.65911865234375, -0.5736083984375, -0.48809814453125, -0.402587890625, -0.31707763671875, -0.2315673828125, -0.14605712890625, -0.060546875, 0.02496337890625, 0.1104736328125, 0.19598388671875, 0.281494140625, 0.36700439453125, 0.4525146484375, 0.53802490234375, 0.62353515625, 0.70904541015625, 0.7945556640625, 0.88006591796875, 0.965576171875, 1.05108642578125, 1.1365966796875, 1.22210693359375, 1.3076171875, 1.39312744140625, 1.4786376953125, 1.56414794921875, 1.649658203125, 1.73516845703125, 1.8206787109375, 1.90618896484375, 1.99169921875, 2.07720947265625, 2.1627197265625, 2.24822998046875, 2.333740234375, 2.41925048828125, 2.5047607421875, 2.59027099609375, 2.67578125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 9.0, 6.0, 13.0, 10.0, 18.0, 25.0, 47.0, 73.0, 93.0, 175.0, 246.0, 390.0, 622.0, 959.0, 1587.0, 2425.0, 3929.0, 6503.0, 10343.0, 16933.0, 27612.0, 44191.0, 69523.0, 103879.0, 144191.0, 1200756.0, 152990.0, 110451.0, 74342.0, 47366.0, 29425.0, 18573.0, 11152.0, 6900.0, 4332.0, 2650.0, 1567.0, 1045.0, 597.0, 413.0, 250.0, 165.0, 121.0, 87.0, 56.0, 35.0, 17.0, 11.0, 16.0, 9.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.265625, -0.2569389343261719, -0.24825286865234375, -0.23956680297851562, -0.2308807373046875, -0.22219467163085938, -0.21350860595703125, -0.20482254028320312, -0.196136474609375, -0.18745040893554688, -0.17876434326171875, -0.17007827758789062, -0.1613922119140625, -0.15270614624023438, -0.14402008056640625, -0.13533401489257812, -0.12664794921875, -0.11796188354492188, -0.10927581787109375, -0.10058975219726562, -0.0919036865234375, -0.08321762084960938, -0.07453155517578125, -0.06584548950195312, -0.057159423828125, -0.048473358154296875, -0.03978729248046875, -0.031101226806640625, -0.0224151611328125, -0.013729095458984375, -0.00504302978515625, 0.003643035888671875, 0.0123291015625, 0.021015167236328125, 0.02970123291015625, 0.038387298583984375, 0.0470733642578125, 0.055759429931640625, 0.06444549560546875, 0.07313156127929688, 0.081817626953125, 0.09050369262695312, 0.09918975830078125, 0.10787582397460938, 0.1165618896484375, 0.12524795532226562, 0.13393402099609375, 0.14262008666992188, 0.15130615234375, 0.15999221801757812, 0.16867828369140625, 0.17736434936523438, 0.1860504150390625, 0.19473648071289062, 0.20342254638671875, 0.21210861206054688, 0.220794677734375, 0.22948074340820312, 0.23816680908203125, 0.24685287475585938, 0.2555389404296875, 0.2642250061035156, 0.27291107177734375, 0.2815971374511719, 0.290283203125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 8.0, 4.0, 4.0, 10.0, 10.0, 8.0, 17.0, 11.0, 13.0, 20.0, 22.0, 36.0, 31.0, 48.0, 64.0, 63.0, 89.0, 112.0, 85.0, 54.0, 45.0, 50.0, 31.0, 23.0, 18.0, 13.0, 12.0, 8.0, 10.0, 10.0, 10.0, 6.0, 10.0, 5.0, 4.0, 7.0, 5.0, 4.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0175933837890625, -0.017015457153320312, -0.016437530517578125, -0.015859603881835938, -0.01528167724609375, -0.014703750610351562, -0.014125823974609375, -0.013547897338867188, -0.012969970703125, -0.012392044067382812, -0.011814117431640625, -0.011236190795898438, -0.01065826416015625, -0.010080337524414062, -0.009502410888671875, -0.008924484252929688, -0.0083465576171875, -0.0077686309814453125, -0.007190704345703125, -0.0066127777099609375, -0.00603485107421875, -0.0054569244384765625, -0.004878997802734375, -0.0043010711669921875, -0.00372314453125, -0.0031452178955078125, -0.002567291259765625, -0.0019893646240234375, -0.00141143798828125, -0.0008335113525390625, -0.000255584716796875, 0.0003223419189453125, 0.0009002685546875, 0.0014781951904296875, 0.002056121826171875, 0.0026340484619140625, 0.00321197509765625, 0.0037899017333984375, 0.004367828369140625, 0.0049457550048828125, 0.005523681640625, 0.0061016082763671875, 0.006679534912109375, 0.0072574615478515625, 0.00783538818359375, 0.008413314819335938, 0.008991241455078125, 0.009569168090820312, 0.0101470947265625, 0.010725021362304688, 0.011302947998046875, 0.011880874633789062, 0.01245880126953125, 0.013036727905273438, 0.013614654541015625, 0.014192581176757812, 0.0147705078125, 0.015348434448242188, 0.015926361083984375, 0.016504287719726562, 0.01708221435546875, 0.017660140991210938, 0.018238067626953125, 0.018815994262695312, 0.0193939208984375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 6.0, 3.0, 6.0, 9.0, 7.0, 7.0, 9.0, 9.0, 17.0, 13.0, 16.0, 13.0, 39.0, 30.0, 60.0, 93.0, 121.0, 438.0, 5005.0, 1021423.0, 20005.0, 624.0, 194.0, 105.0, 62.0, 39.0, 31.0, 33.0, 19.0, 23.0, 13.0, 12.0, 12.0, 8.0, 7.0, 5.0, 7.0, 4.0, 4.0, 1.0, 4.0, 4.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.4560546875, -0.4424934387207031, -0.42893218994140625, -0.4153709411621094, -0.4018096923828125, -0.3882484436035156, -0.37468719482421875, -0.3611259460449219, -0.347564697265625, -0.3340034484863281, -0.32044219970703125, -0.3068809509277344, -0.2933197021484375, -0.2797584533691406, -0.26619720458984375, -0.2526359558105469, -0.23907470703125, -0.22551345825195312, -0.21195220947265625, -0.19839096069335938, -0.1848297119140625, -0.17126846313476562, -0.15770721435546875, -0.14414596557617188, -0.130584716796875, -0.11702346801757812, -0.10346221923828125, -0.08990097045898438, -0.0763397216796875, -0.06277847290039062, -0.04921722412109375, -0.035655975341796875, -0.0220947265625, -0.008533477783203125, 0.00502777099609375, 0.018589019775390625, 0.0321502685546875, 0.045711517333984375, 0.05927276611328125, 0.07283401489257812, 0.086395263671875, 0.09995651245117188, 0.11351776123046875, 0.12707901000976562, 0.1406402587890625, 0.15420150756835938, 0.16776275634765625, 0.18132400512695312, 0.19488525390625, 0.20844650268554688, 0.22200775146484375, 0.23556900024414062, 0.2491302490234375, 0.2626914978027344, 0.27625274658203125, 0.2898139953613281, 0.303375244140625, 0.3169364929199219, 0.33049774169921875, 0.3440589904785156, 0.3576202392578125, 0.3711814880371094, 0.38474273681640625, 0.3983039855957031, 0.411865234375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 12.0, 19.0, 78.0, 332.0, 475.0, 79.0, 18.0, 3.0, 3.0], "bins": [-0.25232696533203125, -0.2480594515800476, -0.24379193782806396, -0.23952442407608032, -0.23525691032409668, -0.23098939657211304, -0.2267218828201294, -0.22245436906814575, -0.2181868553161621, -0.21391934156417847, -0.20965182781219482, -0.20538431406021118, -0.20111680030822754, -0.1968492865562439, -0.19258177280426025, -0.1883142590522766, -0.18404674530029297, -0.17977923154830933, -0.17551171779632568, -0.17124420404434204, -0.1669766902923584, -0.16270917654037476, -0.1584416627883911, -0.15417414903640747, -0.14990663528442383, -0.14563912153244019, -0.14137160778045654, -0.1371040940284729, -0.13283658027648926, -0.12856906652450562, -0.12430155277252197, -0.12003403902053833, -0.11576651781797409, -0.11149900406599045, -0.1072314903140068, -0.10296397656202316, -0.09869646281003952, -0.09442894905805588, -0.09016143530607224, -0.08589392155408859, -0.08162640780210495, -0.07735889405012131, -0.07309138029813766, -0.06882386654615402, -0.06455635279417038, -0.06028883904218674, -0.056021325290203094, -0.05175381153821945, -0.04748629778623581, -0.04321878403425217, -0.038951270282268524, -0.03468375653028488, -0.03041624277830124, -0.026148729026317596, -0.021881215274333954, -0.01761370152235031, -0.01334618590772152, -0.009078672155737877, -0.004811158403754234, -0.0005436446517705917, 0.003723869100213051, 0.007991382852196693, 0.012258896604180336, 0.01652641035616398, 0.02079392410814762]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 4.0, 4.0, 10.0, 6.0, 13.0, 17.0, 15.0, 11.0, 24.0, 21.0, 26.0, 36.0, 38.0, 35.0, 38.0, 39.0, 52.0, 50.0, 39.0, 44.0, 29.0, 45.0, 51.0, 28.0, 35.0, 24.0, 21.0, 31.0, 38.0, 27.0, 28.0, 24.0, 16.0, 13.0, 16.0, 14.0, 8.0, 10.0, 6.0, 6.0, 5.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.03228342533111572, -0.03128441423177719, -0.03028540126979351, -0.02928638830780983, -0.028287377208471298, -0.027288366109132767, -0.026289353147149086, -0.025290340185165405, -0.024291329085826874, -0.023292317986488342, -0.02229330502450466, -0.02129429206252098, -0.02029528096318245, -0.019296269863843918, -0.018297256901860237, -0.017298243939876556, -0.016299232840538025, -0.015300220809876919, -0.014301208779215813, -0.013302196748554707, -0.0123031847178936, -0.011304172687232494, -0.010305160656571388, -0.009306148625910282, -0.008307136595249176, -0.00730812456458807, -0.006309112533926964, -0.005310100503265858, -0.004311088472604752, -0.0033120764419436455, -0.0023130644112825394, -0.0013140523806214333, -0.00031504034996032715, 0.000683971680700779, 0.001682983711361885, 0.002681995742022991, 0.0036810077726840973, 0.004680019803345203, 0.0056790318340063095, 0.006678043864667416, 0.007677055895328522, 0.008676067925989628, 0.009675079956650734, 0.01067409198731184, 0.011673104017972946, 0.012672116048634052, 0.013671128079295158, 0.014670140109956264, 0.01566915214061737, 0.016668163239955902, 0.017667176201939583, 0.018666189163923264, 0.019665200263261795, 0.020664211362600327, 0.021663224324584007, 0.022662237286567688, 0.02366124838590622, 0.02466025948524475, 0.02565927244722843, 0.026658285409212112, 0.027657296508550644, 0.028656307607889175, 0.029655320569872856, 0.030654333531856537, 0.03165334463119507]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 7.0, 1.0, 3.0, 10.0, 8.0, 12.0, 9.0, 15.0, 21.0, 19.0, 18.0, 18.0, 23.0, 21.0, 22.0, 19.0, 28.0, 31.0, 38.0, 24.0, 38.0, 31.0, 30.0, 34.0, 37.0, 39.0, 30.0, 29.0, 38.0, 28.0, 33.0, 28.0, 41.0, 26.0, 24.0, 28.0, 21.0, 13.0, 13.0, 10.0, 12.0, 12.0, 7.0, 6.0, 12.0, 4.0, 5.0, 6.0, 4.0, 6.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0], "bins": [-3.60546875, -3.493804931640625, -3.38214111328125, -3.270477294921875, -3.1588134765625, -3.047149658203125, -2.93548583984375, -2.823822021484375, -2.712158203125, -2.600494384765625, -2.48883056640625, -2.377166748046875, -2.2655029296875, -2.153839111328125, -2.04217529296875, -1.930511474609375, -1.81884765625, -1.707183837890625, -1.59552001953125, -1.483856201171875, -1.3721923828125, -1.260528564453125, -1.14886474609375, -1.037200927734375, -0.925537109375, -0.813873291015625, -0.70220947265625, -0.590545654296875, -0.4788818359375, -0.367218017578125, -0.25555419921875, -0.143890380859375, -0.0322265625, 0.079437255859375, 0.19110107421875, 0.302764892578125, 0.4144287109375, 0.526092529296875, 0.63775634765625, 0.749420166015625, 0.861083984375, 0.972747802734375, 1.08441162109375, 1.196075439453125, 1.3077392578125, 1.419403076171875, 1.53106689453125, 1.642730712890625, 1.75439453125, 1.866058349609375, 1.97772216796875, 2.089385986328125, 2.2010498046875, 2.312713623046875, 2.42437744140625, 2.536041259765625, 2.647705078125, 2.759368896484375, 2.87103271484375, 2.982696533203125, 3.0943603515625, 3.206024169921875, 3.31768798828125, 3.429351806640625, 3.541015625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 1.0, 8.0, 3.0, 5.0, 9.0, 20.0, 33.0, 52.0, 60.0, 85.0, 152.0, 206.0, 344.0, 540.0, 865.0, 1450.0, 2388.0, 4049.0, 7111.0, 12714.0, 23298.0, 45056.0, 94157.0, 203462.0, 334792.0, 161170.0, 75149.0, 36511.0, 19469.0, 10451.0, 6107.0, 3450.0, 2012.0, 1306.0, 757.0, 468.0, 305.0, 189.0, 114.0, 62.0, 57.0, 39.0, 21.0, 10.0, 13.0, 16.0, 6.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.826171875, -3.71478271484375, -3.6033935546875, -3.49200439453125, -3.380615234375, -3.26922607421875, -3.1578369140625, -3.04644775390625, -2.93505859375, -2.82366943359375, -2.7122802734375, -2.60089111328125, -2.489501953125, -2.37811279296875, -2.2667236328125, -2.15533447265625, -2.0439453125, -1.93255615234375, -1.8211669921875, -1.70977783203125, -1.598388671875, -1.48699951171875, -1.3756103515625, -1.26422119140625, -1.15283203125, -1.04144287109375, -0.9300537109375, -0.81866455078125, -0.707275390625, -0.59588623046875, -0.4844970703125, -0.37310791015625, -0.26171875, -0.15032958984375, -0.0389404296875, 0.07244873046875, 0.183837890625, 0.29522705078125, 0.4066162109375, 0.51800537109375, 0.62939453125, 0.74078369140625, 0.8521728515625, 0.96356201171875, 1.074951171875, 1.18634033203125, 1.2977294921875, 1.40911865234375, 1.5205078125, 1.63189697265625, 1.7432861328125, 1.85467529296875, 1.966064453125, 2.07745361328125, 2.1888427734375, 2.30023193359375, 2.41162109375, 2.52301025390625, 2.6343994140625, 2.74578857421875, 2.857177734375, 2.96856689453125, 3.0799560546875, 3.19134521484375, 3.302734375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 9.0, 9.0, 15.0, 15.0, 11.0, 26.0, 23.0, 24.0, 22.0, 37.0, 32.0, 27.0, 40.0, 50.0, 84.0, 103.0, 255.0, 1503.0, 243.0, 99.0, 55.0, 54.0, 41.0, 27.0, 41.0, 23.0, 32.0, 20.0, 17.0, 21.0, 18.0, 21.0, 7.0, 13.0, 8.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-16.875, -16.41259765625, -15.9501953125, -15.48779296875, -15.025390625, -14.56298828125, -14.1005859375, -13.63818359375, -13.17578125, -12.71337890625, -12.2509765625, -11.78857421875, -11.326171875, -10.86376953125, -10.4013671875, -9.93896484375, -9.4765625, -9.01416015625, -8.5517578125, -8.08935546875, -7.626953125, -7.16455078125, -6.7021484375, -6.23974609375, -5.77734375, -5.31494140625, -4.8525390625, -4.39013671875, -3.927734375, -3.46533203125, -3.0029296875, -2.54052734375, -2.078125, -1.61572265625, -1.1533203125, -0.69091796875, -0.228515625, 0.23388671875, 0.6962890625, 1.15869140625, 1.62109375, 2.08349609375, 2.5458984375, 3.00830078125, 3.470703125, 3.93310546875, 4.3955078125, 4.85791015625, 5.3203125, 5.78271484375, 6.2451171875, 6.70751953125, 7.169921875, 7.63232421875, 8.0947265625, 8.55712890625, 9.01953125, 9.48193359375, 9.9443359375, 10.40673828125, 10.869140625, 11.33154296875, 11.7939453125, 12.25634765625, 12.71875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 7.0, 7.0, 15.0, 10.0, 10.0, 35.0, 36.0, 35.0, 49.0, 63.0, 91.0, 115.0, 183.0, 214.0, 386.0, 1152.0, 14282.0, 2950225.0, 173896.0, 3152.0, 671.0, 299.0, 199.0, 143.0, 124.0, 82.0, 50.0, 36.0, 32.0, 21.0, 24.0, 16.0, 19.0, 10.0, 3.0, 2.0, 4.0, 3.0, 0.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.40625, -36.22802734375, -35.0498046875, -33.87158203125, -32.693359375, -31.51513671875, -30.3369140625, -29.15869140625, -27.98046875, -26.80224609375, -25.6240234375, -24.44580078125, -23.267578125, -22.08935546875, -20.9111328125, -19.73291015625, -18.5546875, -17.37646484375, -16.1982421875, -15.02001953125, -13.841796875, -12.66357421875, -11.4853515625, -10.30712890625, -9.12890625, -7.95068359375, -6.7724609375, -5.59423828125, -4.416015625, -3.23779296875, -2.0595703125, -0.88134765625, 0.296875, 1.47509765625, 2.6533203125, 3.83154296875, 5.009765625, 6.18798828125, 7.3662109375, 8.54443359375, 9.72265625, 10.90087890625, 12.0791015625, 13.25732421875, 14.435546875, 15.61376953125, 16.7919921875, 17.97021484375, 19.1484375, 20.32666015625, 21.5048828125, 22.68310546875, 23.861328125, 25.03955078125, 26.2177734375, 27.39599609375, 28.57421875, 29.75244140625, 30.9306640625, 32.10888671875, 33.287109375, 34.46533203125, 35.6435546875, 36.82177734375, 38.0]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [71.0, 606.0, 318.0, 24.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.739951133728027, -2.998826742172241, 0.7422976493835449, 4.48342227935791, 8.224546432495117, 11.965670585632324, 15.706795692443848, 19.447917938232422, 23.189044952392578, 26.9301700592041, 30.671293258666992, 34.412418365478516, 38.153541564941406, 41.89466857910156, 45.63579177856445, 49.376914978027344, 53.118038177490234, 56.859161376953125, 60.60028839111328, 64.34141540527344, 68.08253479003906, 71.82366180419922, 75.56478881835938, 79.305908203125, 83.04703521728516, 86.78816223144531, 90.52928161621094, 94.2704086303711, 98.01153564453125, 101.75265502929688, 105.49378204345703, 109.23490905761719, 112.97603607177734, 116.7171630859375, 120.45828247070312, 124.19940948486328, 127.94053649902344, 131.68165588378906, 135.42279052734375, 139.16390991210938, 142.905029296875, 146.64614868164062, 150.3872833251953, 154.12840270996094, 157.86952209472656, 161.61065673828125, 165.35177612304688, 169.0928955078125, 172.8340301513672, 176.5751495361328, 180.3162841796875, 184.05740356445312, 187.79852294921875, 191.53965759277344, 195.28077697753906, 199.0218963623047, 202.7630157470703, 206.50413513183594, 210.24526977539062, 213.98638916015625, 217.72750854492188, 221.46864318847656, 225.2097625732422, 228.9508819580078, 232.6920166015625]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 9.0, 7.0, 5.0, 11.0, 5.0, 11.0, 19.0, 17.0, 15.0, 22.0, 15.0, 30.0, 29.0, 18.0, 25.0, 32.0, 42.0, 27.0, 26.0, 37.0, 51.0, 45.0, 38.0, 29.0, 31.0, 35.0, 35.0, 38.0, 44.0, 29.0, 25.0, 20.0, 22.0, 20.0, 31.0, 20.0, 22.0, 7.0, 8.0, 13.0, 3.0, 15.0, 12.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.540550231933594, -32.49601364135742, -31.45147705078125, -30.406940460205078, -29.362403869628906, -28.317867279052734, -27.27332878112793, -26.228792190551758, -25.184255599975586, -24.139719009399414, -23.095182418823242, -22.05064582824707, -21.006107330322266, -19.961570739746094, -18.917034149169922, -17.87249755859375, -16.827960968017578, -15.783424377441406, -14.738887786865234, -13.694350242614746, -12.649813652038574, -11.605277061462402, -10.560739517211914, -9.516202926635742, -8.47166633605957, -7.427129745483398, -6.382592678070068, -5.338055610656738, -4.293519020080566, -3.2489824295043945, -2.2044453620910645, -1.1599082946777344, -0.1153717041015625, 0.9291651248931885, 1.9737019538879395, 3.0182387828826904, 4.062775611877441, 5.107312202453613, 6.151849269866943, 7.196386337280273, 8.240922927856445, 9.285459518432617, 10.329996109008789, 11.374533653259277, 12.41907024383545, 13.463606834411621, 14.50814437866211, 15.552680969238281, 16.597217559814453, 17.641754150390625, 18.686290740966797, 19.73082733154297, 20.77536392211914, 21.819900512695312, 22.864439010620117, 23.90897560119629, 24.95351219177246, 25.998048782348633, 27.042585372924805, 28.087121963500977, 29.13166046142578, 30.176197052001953, 31.220733642578125, 32.2652702331543, 33.30980682373047]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 9.0, 5.0, 9.0, 14.0, 17.0, 14.0, 17.0, 21.0, 21.0, 28.0, 20.0, 20.0, 25.0, 35.0, 35.0, 37.0, 33.0, 22.0, 35.0, 31.0, 33.0, 33.0, 39.0, 48.0, 35.0, 32.0, 32.0, 32.0, 36.0, 29.0, 21.0, 22.0, 19.0, 18.0, 21.0, 9.0, 13.0, 6.0, 12.0, 11.0, 5.0, 3.0, 14.0, 3.0, 2.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.767578125, -3.645355224609375, -3.52313232421875, -3.400909423828125, -3.2786865234375, -3.156463623046875, -3.03424072265625, -2.912017822265625, -2.789794921875, -2.667572021484375, -2.54534912109375, -2.423126220703125, -2.3009033203125, -2.178680419921875, -2.05645751953125, -1.934234619140625, -1.81201171875, -1.689788818359375, -1.56756591796875, -1.445343017578125, -1.3231201171875, -1.200897216796875, -1.07867431640625, -0.956451416015625, -0.834228515625, -0.712005615234375, -0.58978271484375, -0.467559814453125, -0.3453369140625, -0.223114013671875, -0.10089111328125, 0.021331787109375, 0.1435546875, 0.265777587890625, 0.38800048828125, 0.510223388671875, 0.6324462890625, 0.754669189453125, 0.87689208984375, 0.999114990234375, 1.121337890625, 1.243560791015625, 1.36578369140625, 1.488006591796875, 1.6102294921875, 1.732452392578125, 1.85467529296875, 1.976898193359375, 2.09912109375, 2.221343994140625, 2.34356689453125, 2.465789794921875, 2.5880126953125, 2.710235595703125, 2.83245849609375, 2.954681396484375, 3.076904296875, 3.199127197265625, 3.32135009765625, 3.443572998046875, 3.5657958984375, 3.688018798828125, 3.81024169921875, 3.932464599609375, 4.0546875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 5.0, 4.0, 4.0, 6.0, 14.0, 13.0, 11.0, 17.0, 19.0, 28.0, 35.0, 23.0, 50.0, 61.0, 104.0, 214.0, 444.0, 1047.0, 3093.0, 11055.0, 51726.0, 367535.0, 2206545.0, 1346560.0, 166870.0, 28174.0, 6825.0, 2058.0, 831.0, 363.0, 166.0, 99.0, 66.0, 36.0, 27.0, 28.0, 29.0, 17.0, 14.0, 12.0, 4.0, 8.0, 6.0, 6.0, 5.0, 4.0, 6.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0], "bins": [-11.0078125, -10.67236328125, -10.3369140625, -10.00146484375, -9.666015625, -9.33056640625, -8.9951171875, -8.65966796875, -8.32421875, -7.98876953125, -7.6533203125, -7.31787109375, -6.982421875, -6.64697265625, -6.3115234375, -5.97607421875, -5.640625, -5.30517578125, -4.9697265625, -4.63427734375, -4.298828125, -3.96337890625, -3.6279296875, -3.29248046875, -2.95703125, -2.62158203125, -2.2861328125, -1.95068359375, -1.615234375, -1.27978515625, -0.9443359375, -0.60888671875, -0.2734375, 0.06201171875, 0.3974609375, 0.73291015625, 1.068359375, 1.40380859375, 1.7392578125, 2.07470703125, 2.41015625, 2.74560546875, 3.0810546875, 3.41650390625, 3.751953125, 4.08740234375, 4.4228515625, 4.75830078125, 5.09375, 5.42919921875, 5.7646484375, 6.10009765625, 6.435546875, 6.77099609375, 7.1064453125, 7.44189453125, 7.77734375, 8.11279296875, 8.4482421875, 8.78369140625, 9.119140625, 9.45458984375, 9.7900390625, 10.12548828125, 10.4609375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 10.0, 5.0, 6.0, 7.0, 12.0, 15.0, 11.0, 17.0, 28.0, 43.0, 54.0, 50.0, 74.0, 87.0, 130.0, 189.0, 242.0, 258.0, 343.0, 418.0, 401.0, 391.0, 285.0, 215.0, 190.0, 142.0, 108.0, 86.0, 46.0, 48.0, 45.0, 30.0, 20.0, 16.0, 17.0, 6.0, 4.0, 6.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.2421875, -8.9713134765625, -8.700439453125, -8.4295654296875, -8.15869140625, -7.8878173828125, -7.616943359375, -7.3460693359375, -7.0751953125, -6.8043212890625, -6.533447265625, -6.2625732421875, -5.99169921875, -5.7208251953125, -5.449951171875, -5.1790771484375, -4.908203125, -4.6373291015625, -4.366455078125, -4.0955810546875, -3.82470703125, -3.5538330078125, -3.282958984375, -3.0120849609375, -2.7412109375, -2.4703369140625, -2.199462890625, -1.9285888671875, -1.65771484375, -1.3868408203125, -1.115966796875, -0.8450927734375, -0.57421875, -0.3033447265625, -0.032470703125, 0.2384033203125, 0.50927734375, 0.7801513671875, 1.051025390625, 1.3218994140625, 1.5927734375, 1.8636474609375, 2.134521484375, 2.4053955078125, 2.67626953125, 2.9471435546875, 3.218017578125, 3.4888916015625, 3.759765625, 4.0306396484375, 4.301513671875, 4.5723876953125, 4.84326171875, 5.1141357421875, 5.385009765625, 5.6558837890625, 5.9267578125, 6.1976318359375, 6.468505859375, 6.7393798828125, 7.01025390625, 7.2811279296875, 7.552001953125, 7.8228759765625, 8.09375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 8.0, 7.0, 8.0, 14.0, 15.0, 25.0, 31.0, 47.0, 59.0, 66.0, 111.0, 152.0, 207.0, 279.0, 542.0, 2091.0, 37821.0, 3471548.0, 669269.0, 9582.0, 1037.0, 414.0, 255.0, 168.0, 133.0, 95.0, 68.0, 62.0, 49.0, 23.0, 17.0, 19.0, 12.0, 12.0, 4.0, 7.0, 9.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-40.1875, -38.923828125, -37.66015625, -36.396484375, -35.1328125, -33.869140625, -32.60546875, -31.341796875, -30.078125, -28.814453125, -27.55078125, -26.287109375, -25.0234375, -23.759765625, -22.49609375, -21.232421875, -19.96875, -18.705078125, -17.44140625, -16.177734375, -14.9140625, -13.650390625, -12.38671875, -11.123046875, -9.859375, -8.595703125, -7.33203125, -6.068359375, -4.8046875, -3.541015625, -2.27734375, -1.013671875, 0.25, 1.513671875, 2.77734375, 4.041015625, 5.3046875, 6.568359375, 7.83203125, 9.095703125, 10.359375, 11.623046875, 12.88671875, 14.150390625, 15.4140625, 16.677734375, 17.94140625, 19.205078125, 20.46875, 21.732421875, 22.99609375, 24.259765625, 25.5234375, 26.787109375, 28.05078125, 29.314453125, 30.578125, 31.841796875, 33.10546875, 34.369140625, 35.6328125, 36.896484375, 38.16015625, 39.423828125, 40.6875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 31.0, 148.0, 377.0, 323.0, 109.0, 20.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.74324798583984, -90.66070556640625, -85.57817077636719, -80.4956283569336, -75.4130859375, -70.33055114746094, -65.24800872802734, -60.165470123291016, -55.08293151855469, -50.00039291381836, -44.91785430908203, -39.83531188964844, -34.75277328491211, -29.67023468017578, -24.58769416809082, -19.50515365600586, -14.422615051269531, -9.340075492858887, -4.257535934448242, 0.8250036239624023, 5.907543182373047, 10.990081787109375, 16.072622299194336, 21.155162811279297, 26.237701416015625, 31.320240020751953, 36.40277862548828, 41.485321044921875, 46.5678596496582, 51.65039825439453, 56.732940673828125, 61.81547927856445, 66.89801025390625, 71.98055267333984, 77.0630874633789, 82.1456298828125, 87.22816467285156, 92.31070709228516, 97.39324951171875, 102.47578430175781, 107.5583267211914, 112.640869140625, 117.72340393066406, 122.80594635009766, 127.88848876953125, 132.9710235595703, 138.05355834960938, 143.1361083984375, 148.21864318847656, 153.30117797851562, 158.38372802734375, 163.4662628173828, 168.54879760742188, 173.63134765625, 178.71388244628906, 183.79641723632812, 188.87896728515625, 193.9615020751953, 199.04405212402344, 204.1265869140625, 209.20912170410156, 214.29165649414062, 219.37420654296875, 224.4567413330078, 229.53927612304688]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 3.0, 6.0, 5.0, 8.0, 13.0, 16.0, 10.0, 15.0, 26.0, 30.0, 22.0, 32.0, 30.0, 31.0, 33.0, 38.0, 37.0, 27.0, 44.0, 44.0, 50.0, 46.0, 42.0, 36.0, 36.0, 31.0, 38.0, 22.0, 28.0, 27.0, 22.0, 31.0, 17.0, 20.0, 15.0, 17.0, 9.0, 9.0, 4.0, 9.0, 1.0, 0.0, 4.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.20622253417969, -31.215606689453125, -30.22498893737793, -29.234373092651367, -28.243755340576172, -27.25313949584961, -26.262521743774414, -25.27190589904785, -24.281288146972656, -23.290672302246094, -22.3000545501709, -21.309438705444336, -20.31882095336914, -19.328205108642578, -18.337587356567383, -17.34697151184082, -16.356353759765625, -15.365736961364746, -14.375120162963867, -13.384503364562988, -12.39388656616211, -11.403270721435547, -10.412652969360352, -9.422037124633789, -8.431421279907227, -7.440804481506348, -6.450187683105469, -5.45957088470459, -4.468954086303711, -3.4783377647399902, -2.4877209663391113, -1.4971041679382324, -0.5064868927001953, 0.4841298460960388, 1.474746584892273, 2.4653632640838623, 3.455980062484741, 4.446596622467041, 5.43721342086792, 6.427830219268799, 7.418447017669678, 8.409063339233398, 9.399680137634277, 10.390296936035156, 11.380913734436035, 12.371530532836914, 13.362147331237793, 14.352764129638672, 15.34338092803955, 16.33399772644043, 17.324613571166992, 18.315231323242188, 19.30584716796875, 20.296464920043945, 21.287080764770508, 22.277698516845703, 23.268314361572266, 24.258930206298828, 25.249547958374023, 26.240163803100586, 27.23078155517578, 28.221397399902344, 29.21201515197754, 30.2026309967041, 31.193248748779297]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 6.0, 6.0, 2.0, 4.0, 6.0, 7.0, 11.0, 17.0, 15.0, 17.0, 18.0, 26.0, 29.0, 25.0, 36.0, 34.0, 35.0, 29.0, 55.0, 40.0, 47.0, 29.0, 35.0, 44.0, 42.0, 40.0, 42.0, 48.0, 39.0, 33.0, 16.0, 23.0, 17.0, 27.0, 14.0, 20.0, 14.0, 12.0, 6.0, 10.0, 7.0, 3.0, 4.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.8046875, -4.65557861328125, -4.5064697265625, -4.35736083984375, -4.208251953125, -4.05914306640625, -3.9100341796875, -3.76092529296875, -3.61181640625, -3.46270751953125, -3.3135986328125, -3.16448974609375, -3.015380859375, -2.86627197265625, -2.7171630859375, -2.56805419921875, -2.4189453125, -2.26983642578125, -2.1207275390625, -1.97161865234375, -1.822509765625, -1.67340087890625, -1.5242919921875, -1.37518310546875, -1.22607421875, -1.07696533203125, -0.9278564453125, -0.77874755859375, -0.629638671875, -0.48052978515625, -0.3314208984375, -0.18231201171875, -0.033203125, 0.11590576171875, 0.2650146484375, 0.41412353515625, 0.563232421875, 0.71234130859375, 0.8614501953125, 1.01055908203125, 1.15966796875, 1.30877685546875, 1.4578857421875, 1.60699462890625, 1.756103515625, 1.90521240234375, 2.0543212890625, 2.20343017578125, 2.3525390625, 2.50164794921875, 2.6507568359375, 2.79986572265625, 2.948974609375, 3.09808349609375, 3.2471923828125, 3.39630126953125, 3.54541015625, 3.69451904296875, 3.8436279296875, 3.99273681640625, 4.141845703125, 4.29095458984375, 4.4400634765625, 4.58917236328125, 4.73828125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 7.0, 13.0, 17.0, 18.0, 26.0, 41.0, 78.0, 105.0, 120.0, 228.0, 326.0, 566.0, 775.0, 1160.0, 1844.0, 2862.0, 4506.0, 6840.0, 10600.0, 16438.0, 24978.0, 37814.0, 56726.0, 82466.0, 115334.0, 146051.0, 149464.0, 121888.0, 88956.0, 60569.0, 40401.0, 27256.0, 17501.0, 11579.0, 7459.0, 4801.0, 3019.0, 2003.0, 1257.0, 840.0, 535.0, 352.0, 238.0, 182.0, 102.0, 58.0, 46.0, 42.0, 20.0, 24.0, 3.0, 7.0, 11.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.463134765625, -0.4491386413574219, -0.43514251708984375, -0.4211463928222656, -0.4071502685546875, -0.3931541442871094, -0.37915802001953125, -0.3651618957519531, -0.351165771484375, -0.3371696472167969, -0.32317352294921875, -0.3091773986816406, -0.2951812744140625, -0.2811851501464844, -0.26718902587890625, -0.2531929016113281, -0.23919677734375, -0.22520065307617188, -0.21120452880859375, -0.19720840454101562, -0.1832122802734375, -0.16921615600585938, -0.15522003173828125, -0.14122390747070312, -0.127227783203125, -0.11323165893554688, -0.09923553466796875, -0.08523941040039062, -0.0712432861328125, -0.057247161865234375, -0.04325103759765625, -0.029254913330078125, -0.0152587890625, -0.001262664794921875, 0.01273345947265625, 0.026729583740234375, 0.0407257080078125, 0.054721832275390625, 0.06871795654296875, 0.08271408081054688, 0.096710205078125, 0.11070632934570312, 0.12470245361328125, 0.13869857788085938, 0.1526947021484375, 0.16669082641601562, 0.18068695068359375, 0.19468307495117188, 0.20867919921875, 0.22267532348632812, 0.23667144775390625, 0.2506675720214844, 0.2646636962890625, 0.2786598205566406, 0.29265594482421875, 0.3066520690917969, 0.320648193359375, 0.3346443176269531, 0.34864044189453125, 0.3626365661621094, 0.3766326904296875, 0.3906288146972656, 0.40462493896484375, 0.4186210632324219, 0.4326171875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 3.0, 5.0, 3.0, 4.0, 5.0, 6.0, 12.0, 8.0, 14.0, 13.0, 18.0, 24.0, 18.0, 31.0, 24.0, 35.0, 37.0, 39.0, 45.0, 41.0, 40.0, 46.0, 1076.0, 50.0, 42.0, 45.0, 32.0, 51.0, 32.0, 24.0, 34.0, 37.0, 24.0, 14.0, 17.0, 18.0, 12.0, 13.0, 9.0, 10.0, 5.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.54296875, -3.4346923828125, -3.326416015625, -3.2181396484375, -3.10986328125, -3.0015869140625, -2.893310546875, -2.7850341796875, -2.6767578125, -2.5684814453125, -2.460205078125, -2.3519287109375, -2.24365234375, -2.1353759765625, -2.027099609375, -1.9188232421875, -1.810546875, -1.7022705078125, -1.593994140625, -1.4857177734375, -1.37744140625, -1.2691650390625, -1.160888671875, -1.0526123046875, -0.9443359375, -0.8360595703125, -0.727783203125, -0.6195068359375, -0.51123046875, -0.4029541015625, -0.294677734375, -0.1864013671875, -0.078125, 0.0301513671875, 0.138427734375, 0.2467041015625, 0.35498046875, 0.4632568359375, 0.571533203125, 0.6798095703125, 0.7880859375, 0.8963623046875, 1.004638671875, 1.1129150390625, 1.22119140625, 1.3294677734375, 1.437744140625, 1.5460205078125, 1.654296875, 1.7625732421875, 1.870849609375, 1.9791259765625, 2.08740234375, 2.1956787109375, 2.303955078125, 2.4122314453125, 2.5205078125, 2.6287841796875, 2.737060546875, 2.8453369140625, 2.95361328125, 3.0618896484375, 3.170166015625, 3.2784423828125, 3.38671875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 9.0, 17.0, 22.0, 46.0, 40.0, 67.0, 124.0, 185.0, 301.0, 464.0, 743.0, 1136.0, 1825.0, 2665.0, 4127.0, 6601.0, 10426.0, 16934.0, 26664.0, 42985.0, 66797.0, 101186.0, 139062.0, 1205328.0, 152171.0, 111537.0, 75494.0, 48274.0, 30493.0, 18925.0, 11820.0, 7413.0, 4782.0, 2922.0, 1978.0, 1244.0, 835.0, 533.0, 351.0, 210.0, 131.0, 88.0, 54.0, 45.0, 23.0, 22.0, 11.0, 5.0, 7.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.319091796875, -0.3093147277832031, -0.29953765869140625, -0.2897605895996094, -0.2799835205078125, -0.2702064514160156, -0.26042938232421875, -0.2506523132324219, -0.240875244140625, -0.23109817504882812, -0.22132110595703125, -0.21154403686523438, -0.2017669677734375, -0.19198989868164062, -0.18221282958984375, -0.17243576049804688, -0.16265869140625, -0.15288162231445312, -0.14310455322265625, -0.13332748413085938, -0.1235504150390625, -0.11377334594726562, -0.10399627685546875, -0.09421920776367188, -0.084442138671875, -0.07466506958007812, -0.06488800048828125, -0.055110931396484375, -0.0453338623046875, -0.035556793212890625, -0.02577972412109375, -0.016002655029296875, -0.0062255859375, 0.003551483154296875, 0.01332855224609375, 0.023105621337890625, 0.0328826904296875, 0.042659759521484375, 0.05243682861328125, 0.062213897705078125, 0.071990966796875, 0.08176803588867188, 0.09154510498046875, 0.10132217407226562, 0.1110992431640625, 0.12087631225585938, 0.13065338134765625, 0.14043045043945312, 0.15020751953125, 0.15998458862304688, 0.16976165771484375, 0.17953872680664062, 0.1893157958984375, 0.19909286499023438, 0.20886993408203125, 0.21864700317382812, 0.228424072265625, 0.23820114135742188, 0.24797821044921875, 0.2577552795410156, 0.2675323486328125, 0.2773094177246094, 0.28708648681640625, 0.2968635559082031, 0.306640625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 2.0, 2.0, 8.0, 11.0, 10.0, 21.0, 14.0, 37.0, 44.0, 78.0, 125.0, 172.0, 157.0, 108.0, 71.0, 35.0, 29.0, 15.0, 14.0, 7.0, 11.0, 5.0, 2.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0261688232421875, -0.025418758392333984, -0.02466869354248047, -0.023918628692626953, -0.023168563842773438, -0.022418498992919922, -0.021668434143066406, -0.02091836929321289, -0.020168304443359375, -0.01941823959350586, -0.018668174743652344, -0.017918109893798828, -0.017168045043945312, -0.016417980194091797, -0.01566791534423828, -0.014917850494384766, -0.01416778564453125, -0.013417720794677734, -0.012667655944824219, -0.011917591094970703, -0.011167526245117188, -0.010417461395263672, -0.009667396545410156, -0.00891733169555664, -0.008167266845703125, -0.007417201995849609, -0.006667137145996094, -0.005917072296142578, -0.0051670074462890625, -0.004416942596435547, -0.0036668777465820312, -0.0029168128967285156, -0.002166748046875, -0.0014166831970214844, -0.0006666183471679688, 8.344650268554688e-05, 0.0008335113525390625, 0.0015835762023925781, 0.0023336410522460938, 0.0030837059020996094, 0.003833770751953125, 0.004583835601806641, 0.005333900451660156, 0.006083965301513672, 0.0068340301513671875, 0.007584095001220703, 0.008334159851074219, 0.009084224700927734, 0.00983428955078125, 0.010584354400634766, 0.011334419250488281, 0.012084484100341797, 0.012834548950195312, 0.013584613800048828, 0.014334678649902344, 0.01508474349975586, 0.015834808349609375, 0.01658487319946289, 0.017334938049316406, 0.018085002899169922, 0.018835067749023438, 0.019585132598876953, 0.02033519744873047, 0.021085262298583984, 0.0218353271484375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 2.0, 5.0, 7.0, 12.0, 7.0, 8.0, 27.0, 29.0, 43.0, 76.0, 143.0, 469.0, 47885.0, 998290.0, 1070.0, 192.0, 86.0, 66.0, 34.0, 26.0, 20.0, 12.0, 10.0, 6.0, 5.0, 1.0, 5.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4921875, -0.475311279296875, -0.45843505859375, -0.441558837890625, -0.4246826171875, -0.407806396484375, -0.39093017578125, -0.374053955078125, -0.357177734375, -0.340301513671875, -0.32342529296875, -0.306549072265625, -0.2896728515625, -0.272796630859375, -0.25592041015625, -0.239044189453125, -0.22216796875, -0.205291748046875, -0.18841552734375, -0.171539306640625, -0.1546630859375, -0.137786865234375, -0.12091064453125, -0.104034423828125, -0.087158203125, -0.070281982421875, -0.05340576171875, -0.036529541015625, -0.0196533203125, -0.002777099609375, 0.01409912109375, 0.030975341796875, 0.0478515625, 0.064727783203125, 0.08160400390625, 0.098480224609375, 0.1153564453125, 0.132232666015625, 0.14910888671875, 0.165985107421875, 0.182861328125, 0.199737548828125, 0.21661376953125, 0.233489990234375, 0.2503662109375, 0.267242431640625, 0.28411865234375, 0.300994873046875, 0.31787109375, 0.334747314453125, 0.35162353515625, 0.368499755859375, 0.3853759765625, 0.402252197265625, 0.41912841796875, 0.436004638671875, 0.452880859375, 0.469757080078125, 0.48663330078125, 0.503509521484375, 0.5203857421875, 0.537261962890625, 0.55413818359375, 0.571014404296875, 0.587890625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 9.0, 25.0, 84.0, 568.0, 297.0, 25.0, 10.0, 3.0], "bins": [-0.2608456015586853, -0.256485253572464, -0.2521249055862427, -0.24776457250118256, -0.24340422451496124, -0.23904389142990112, -0.2346835434436798, -0.2303231954574585, -0.22596284747123718, -0.22160249948501587, -0.21724216639995575, -0.21288181841373444, -0.20852147042751312, -0.204161137342453, -0.1998007893562317, -0.19544044137001038, -0.19108010828495026, -0.18671976029872894, -0.18235942721366882, -0.1779990792274475, -0.1736387312412262, -0.16927838325500488, -0.16491805016994476, -0.16055770218372345, -0.15619736909866333, -0.15183702111244202, -0.1474766880273819, -0.14311634004116058, -0.13875599205493927, -0.13439565896987915, -0.13003531098365784, -0.12567496299743652, -0.1213146224617958, -0.11695428192615509, -0.11259393393993378, -0.10823359340429306, -0.10387325286865234, -0.09951290488243103, -0.09515256434679031, -0.0907922238111496, -0.08643187582492828, -0.08207153528928757, -0.07771118730306625, -0.07335084676742554, -0.06899049878120422, -0.06463015824556351, -0.06026981770992279, -0.055909473448991776, -0.05154912918806076, -0.047188784927129745, -0.04282844066619873, -0.038468100130558014, -0.034107755869627, -0.029747411608695984, -0.025387069210410118, -0.021026726812124252, -0.016666382551193237, -0.012306039221584797, -0.007945695891976357, -0.003585352562367916, 0.0007749907672405243, 0.005135335028171539, 0.009495677426457405, 0.013856019824743271, 0.018216364085674286]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 7.0, 7.0, 9.0, 12.0, 11.0, 24.0, 25.0, 23.0, 29.0, 28.0, 38.0, 26.0, 39.0, 47.0, 42.0, 36.0, 45.0, 45.0, 37.0, 50.0, 34.0, 43.0, 37.0, 24.0, 35.0, 27.0, 32.0, 28.0, 36.0, 20.0, 13.0, 17.0, 13.0, 9.0, 9.0, 8.0, 8.0, 4.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.02130967378616333, -0.020653054118156433, -0.019996436312794685, -0.019339818507432938, -0.01868319883942604, -0.018026579171419144, -0.017369961366057396, -0.016713343560695648, -0.01605672389268875, -0.015400105156004429, -0.014743486419320107, -0.014086867682635784, -0.013430248945951462, -0.01277363020926714, -0.012117011472582817, -0.011460392735898495, -0.010803773999214172, -0.01014715526252985, -0.009490536525845528, -0.008833917789161205, -0.008177299052476883, -0.007520680315792561, -0.006864061579108238, -0.006207442842423916, -0.0055508241057395935, -0.004894205369055271, -0.004237586632370949, -0.0035809678956866264, -0.002924349159002304, -0.0022677304223179817, -0.0016111116856336594, -0.000954492948949337, -0.00029787421226501465, 0.0003587445244193077, 0.00101536326110363, 0.0016719819977879524, 0.0023286007344722748, 0.002985219471156597, 0.0036418382078409195, 0.004298456944525242, 0.004955075681209564, 0.0056116944178938866, 0.006268313154578209, 0.006924931891262531, 0.007581550627946854, 0.008238169364631176, 0.008894788101315498, 0.00955140683799982, 0.010208025574684143, 0.010864644311368465, 0.011521263048052788, 0.01217788178473711, 0.012834500521421432, 0.013491119258105755, 0.014147737994790077, 0.0148043567314744, 0.015460975468158722, 0.01611759513616562, 0.016774212941527367, 0.017430830746889114, 0.01808745041489601, 0.01874407008290291, 0.019400687888264656, 0.020057305693626404, 0.0207139253616333]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 6.0, 6.0, 2.0, 3.0, 7.0, 7.0, 11.0, 17.0, 15.0, 17.0, 18.0, 26.0, 29.0, 25.0, 36.0, 34.0, 35.0, 29.0, 54.0, 41.0, 46.0, 30.0, 35.0, 44.0, 43.0, 39.0, 42.0, 48.0, 39.0, 33.0, 16.0, 23.0, 17.0, 27.0, 14.0, 20.0, 14.0, 12.0, 6.0, 10.0, 7.0, 3.0, 4.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.8046875, -4.65557861328125, -4.5064697265625, -4.35736083984375, -4.208251953125, -4.05914306640625, -3.9100341796875, -3.76092529296875, -3.61181640625, -3.46270751953125, -3.3135986328125, -3.16448974609375, -3.015380859375, -2.86627197265625, -2.7171630859375, -2.56805419921875, -2.4189453125, -2.26983642578125, -2.1207275390625, -1.97161865234375, -1.822509765625, -1.67340087890625, -1.5242919921875, -1.37518310546875, -1.22607421875, -1.07696533203125, -0.9278564453125, -0.77874755859375, -0.629638671875, -0.48052978515625, -0.3314208984375, -0.18231201171875, -0.033203125, 0.11590576171875, 0.2650146484375, 0.41412353515625, 0.563232421875, 0.71234130859375, 0.8614501953125, 1.01055908203125, 1.15966796875, 1.30877685546875, 1.4578857421875, 1.60699462890625, 1.756103515625, 1.90521240234375, 2.0543212890625, 2.20343017578125, 2.3525390625, 2.50164794921875, 2.6507568359375, 2.79986572265625, 2.948974609375, 3.09808349609375, 3.2471923828125, 3.39630126953125, 3.54541015625, 3.69451904296875, 3.8436279296875, 3.99273681640625, 4.141845703125, 4.29095458984375, 4.4400634765625, 4.58917236328125, 4.73828125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 9.0, 5.0, 4.0, 18.0, 13.0, 12.0, 23.0, 36.0, 49.0, 63.0, 99.0, 124.0, 197.0, 349.0, 496.0, 883.0, 1597.0, 3229.0, 6294.0, 13185.0, 28164.0, 61443.0, 145171.0, 390835.0, 229705.0, 89480.0, 40107.0, 18634.0, 8948.0, 4365.0, 2103.0, 1104.0, 605.0, 402.0, 241.0, 155.0, 115.0, 86.0, 49.0, 45.0, 26.0, 16.0, 17.0, 12.0, 16.0, 9.0, 10.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.765625, -4.61541748046875, -4.4652099609375, -4.31500244140625, -4.164794921875, -4.01458740234375, -3.8643798828125, -3.71417236328125, -3.56396484375, -3.41375732421875, -3.2635498046875, -3.11334228515625, -2.963134765625, -2.81292724609375, -2.6627197265625, -2.51251220703125, -2.3623046875, -2.21209716796875, -2.0618896484375, -1.91168212890625, -1.761474609375, -1.61126708984375, -1.4610595703125, -1.31085205078125, -1.16064453125, -1.01043701171875, -0.8602294921875, -0.71002197265625, -0.559814453125, -0.40960693359375, -0.2593994140625, -0.10919189453125, 0.041015625, 0.19122314453125, 0.3414306640625, 0.49163818359375, 0.641845703125, 0.79205322265625, 0.9422607421875, 1.09246826171875, 1.24267578125, 1.39288330078125, 1.5430908203125, 1.69329833984375, 1.843505859375, 1.99371337890625, 2.1439208984375, 2.29412841796875, 2.4443359375, 2.59454345703125, 2.7447509765625, 2.89495849609375, 3.045166015625, 3.19537353515625, 3.3455810546875, 3.49578857421875, 3.64599609375, 3.79620361328125, 3.9464111328125, 4.09661865234375, 4.246826171875, 4.39703369140625, 4.5472412109375, 4.69744873046875, 4.84765625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 6.0, 7.0, 5.0, 3.0, 13.0, 9.0, 13.0, 18.0, 29.0, 33.0, 33.0, 32.0, 45.0, 62.0, 60.0, 77.0, 85.0, 317.0, 1581.0, 174.0, 77.0, 58.0, 43.0, 42.0, 32.0, 35.0, 26.0, 27.0, 27.0, 23.0, 10.0, 6.0, 10.0, 10.0, 7.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.03125, -17.488525390625, -16.94580078125, -16.403076171875, -15.8603515625, -15.317626953125, -14.77490234375, -14.232177734375, -13.689453125, -13.146728515625, -12.60400390625, -12.061279296875, -11.5185546875, -10.975830078125, -10.43310546875, -9.890380859375, -9.34765625, -8.804931640625, -8.26220703125, -7.719482421875, -7.1767578125, -6.634033203125, -6.09130859375, -5.548583984375, -5.005859375, -4.463134765625, -3.92041015625, -3.377685546875, -2.8349609375, -2.292236328125, -1.74951171875, -1.206787109375, -0.6640625, -0.121337890625, 0.42138671875, 0.964111328125, 1.5068359375, 2.049560546875, 2.59228515625, 3.135009765625, 3.677734375, 4.220458984375, 4.76318359375, 5.305908203125, 5.8486328125, 6.391357421875, 6.93408203125, 7.476806640625, 8.01953125, 8.562255859375, 9.10498046875, 9.647705078125, 10.1904296875, 10.733154296875, 11.27587890625, 11.818603515625, 12.361328125, 12.904052734375, 13.44677734375, 13.989501953125, 14.5322265625, 15.074951171875, 15.61767578125, 16.160400390625, 16.703125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 11.0, 19.0, 15.0, 19.0, 25.0, 28.0, 41.0, 57.0, 65.0, 80.0, 147.0, 176.0, 308.0, 554.0, 1866.0, 44160.0, 3057612.0, 37135.0, 1840.0, 570.0, 287.0, 192.0, 112.0, 87.0, 75.0, 53.0, 44.0, 28.0, 23.0, 19.0, 19.0, 6.0, 9.0, 10.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.4375, -43.18505859375, -41.9326171875, -40.68017578125, -39.427734375, -38.17529296875, -36.9228515625, -35.67041015625, -34.41796875, -33.16552734375, -31.9130859375, -30.66064453125, -29.408203125, -28.15576171875, -26.9033203125, -25.65087890625, -24.3984375, -23.14599609375, -21.8935546875, -20.64111328125, -19.388671875, -18.13623046875, -16.8837890625, -15.63134765625, -14.37890625, -13.12646484375, -11.8740234375, -10.62158203125, -9.369140625, -8.11669921875, -6.8642578125, -5.61181640625, -4.359375, -3.10693359375, -1.8544921875, -0.60205078125, 0.650390625, 1.90283203125, 3.1552734375, 4.40771484375, 5.66015625, 6.91259765625, 8.1650390625, 9.41748046875, 10.669921875, 11.92236328125, 13.1748046875, 14.42724609375, 15.6796875, 16.93212890625, 18.1845703125, 19.43701171875, 20.689453125, 21.94189453125, 23.1943359375, 24.44677734375, 25.69921875, 26.95166015625, 28.2041015625, 29.45654296875, 30.708984375, 31.96142578125, 33.2138671875, 34.46630859375, 35.71875]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 38.0, 120.0, 250.0, 328.0, 199.0, 60.0, 11.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.499195098876953, -20.797929763793945, -19.09666633605957, -17.395401000976562, -15.694136619567871, -13.99287223815918, -12.291606903076172, -10.59034252166748, -8.889078140258789, -7.187813758850098, -5.486548900604248, -3.7852840423583984, -2.084019660949707, -0.3827552795410156, 1.3185100555419922, 3.0197744369506836, 4.721038818359375, 6.422303199768066, 8.123567581176758, 9.824832916259766, 11.526097297668457, 13.227361679077148, 14.928627014160156, 16.62989044189453, 18.33115577697754, 20.032421112060547, 21.733684539794922, 23.43494987487793, 25.136215209960938, 26.837478637695312, 28.53874397277832, 30.240009307861328, 31.941268920898438, 33.64253234863281, 35.34379959106445, 37.04506301879883, 38.7463264465332, 40.447593688964844, 42.14885711669922, 43.850120544433594, 45.55138397216797, 47.252647399902344, 48.953914642333984, 50.65517807006836, 52.356441497802734, 54.057708740234375, 55.75897216796875, 57.460235595703125, 59.161502838134766, 60.86276626586914, 62.56403350830078, 64.26529693603516, 65.96656036376953, 67.6678237915039, 69.36909484863281, 71.07035827636719, 72.77162170410156, 74.47288513183594, 76.17414855957031, 77.87541198730469, 79.5766830444336, 81.27794647216797, 82.97920989990234, 84.68047332763672, 86.3817367553711]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 0.0, 4.0, 3.0, 12.0, 5.0, 11.0, 10.0, 10.0, 11.0, 12.0, 26.0, 18.0, 28.0, 23.0, 36.0, 33.0, 26.0, 41.0, 33.0, 39.0, 35.0, 28.0, 38.0, 28.0, 48.0, 46.0, 37.0, 37.0, 40.0, 32.0, 30.0, 36.0, 23.0, 31.0, 17.0, 24.0, 15.0, 17.0, 13.0, 10.0, 12.0, 6.0, 2.0, 6.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.065216064453125, -33.90144729614258, -32.73767852783203, -31.57390785217285, -30.410139083862305, -29.246370315551758, -28.082599639892578, -26.91883087158203, -25.755062103271484, -24.591293334960938, -23.42752456665039, -22.26375389099121, -21.099985122680664, -19.936216354370117, -18.772445678710938, -17.60867691040039, -16.444908142089844, -15.281139373779297, -14.117369651794434, -12.95359992980957, -11.789831161499023, -10.626062393188477, -9.462292671203613, -8.29852294921875, -7.134754180908203, -5.970984935760498, -4.807215690612793, -3.643446445465088, -2.479677200317383, -1.3159079551696777, -0.15213871002197266, 1.0116310119628906, 2.1753997802734375, 3.3391690254211426, 4.502938270568848, 5.666707515716553, 6.830476760864258, 7.994246006011963, 9.158015251159668, 10.321784973144531, 11.485553741455078, 12.649322509765625, 13.813092231750488, 14.976861953735352, 16.1406307220459, 17.304399490356445, 18.468170166015625, 19.631938934326172, 20.79570770263672, 21.959476470947266, 23.123245239257812, 24.287015914916992, 25.45078468322754, 26.614553451538086, 27.778324127197266, 28.942092895507812, 30.10586166381836, 31.269630432128906, 32.43339920043945, 33.59716796875, 34.76094055175781, 35.92470932006836, 37.088478088378906, 38.25224685668945, 39.416015625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 7.0, 4.0, 3.0, 5.0, 10.0, 14.0, 13.0, 17.0, 12.0, 22.0, 19.0, 25.0, 32.0, 31.0, 35.0, 34.0, 39.0, 57.0, 35.0, 38.0, 40.0, 38.0, 39.0, 36.0, 40.0, 41.0, 41.0, 31.0, 30.0, 33.0, 21.0, 25.0, 16.0, 19.0, 20.0, 18.0, 13.0, 7.0, 9.0, 5.0, 9.0, 6.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.01953125, -4.86456298828125, -4.7095947265625, -4.55462646484375, -4.399658203125, -4.24468994140625, -4.0897216796875, -3.93475341796875, -3.77978515625, -3.62481689453125, -3.4698486328125, -3.31488037109375, -3.159912109375, -3.00494384765625, -2.8499755859375, -2.69500732421875, -2.5400390625, -2.38507080078125, -2.2301025390625, -2.07513427734375, -1.920166015625, -1.76519775390625, -1.6102294921875, -1.45526123046875, -1.30029296875, -1.14532470703125, -0.9903564453125, -0.83538818359375, -0.680419921875, -0.52545166015625, -0.3704833984375, -0.21551513671875, -0.060546875, 0.09442138671875, 0.2493896484375, 0.40435791015625, 0.559326171875, 0.71429443359375, 0.8692626953125, 1.02423095703125, 1.17919921875, 1.33416748046875, 1.4891357421875, 1.64410400390625, 1.799072265625, 1.95404052734375, 2.1090087890625, 2.26397705078125, 2.4189453125, 2.57391357421875, 2.7288818359375, 2.88385009765625, 3.038818359375, 3.19378662109375, 3.3487548828125, 3.50372314453125, 3.65869140625, 3.81365966796875, 3.9686279296875, 4.12359619140625, 4.278564453125, 4.43353271484375, 4.5885009765625, 4.74346923828125, 4.8984375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 8.0, 6.0, 11.0, 4.0, 10.0, 14.0, 10.0, 20.0, 21.0, 22.0, 36.0, 63.0, 119.0, 149.0, 385.0, 947.0, 2463.0, 8043.0, 34865.0, 267495.0, 2316237.0, 1404010.0, 130073.0, 20653.0, 5366.0, 1747.0, 731.0, 303.0, 152.0, 77.0, 51.0, 32.0, 25.0, 25.0, 21.0, 18.0, 12.0, 8.0, 10.0, 7.0, 4.0, 2.0, 6.0, 5.0, 4.0, 6.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-13.078125, -12.679931640625, -12.28173828125, -11.883544921875, -11.4853515625, -11.087158203125, -10.68896484375, -10.290771484375, -9.892578125, -9.494384765625, -9.09619140625, -8.697998046875, -8.2998046875, -7.901611328125, -7.50341796875, -7.105224609375, -6.70703125, -6.308837890625, -5.91064453125, -5.512451171875, -5.1142578125, -4.716064453125, -4.31787109375, -3.919677734375, -3.521484375, -3.123291015625, -2.72509765625, -2.326904296875, -1.9287109375, -1.530517578125, -1.13232421875, -0.734130859375, -0.3359375, 0.062255859375, 0.46044921875, 0.858642578125, 1.2568359375, 1.655029296875, 2.05322265625, 2.451416015625, 2.849609375, 3.247802734375, 3.64599609375, 4.044189453125, 4.4423828125, 4.840576171875, 5.23876953125, 5.636962890625, 6.03515625, 6.433349609375, 6.83154296875, 7.229736328125, 7.6279296875, 8.026123046875, 8.42431640625, 8.822509765625, 9.220703125, 9.618896484375, 10.01708984375, 10.415283203125, 10.8134765625, 11.211669921875, 11.60986328125, 12.008056640625, 12.40625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 7.0, 2.0, 2.0, 10.0, 8.0, 15.0, 24.0, 23.0, 49.0, 63.0, 119.0, 179.0, 285.0, 455.0, 696.0, 710.0, 517.0, 341.0, 212.0, 121.0, 69.0, 58.0, 37.0, 14.0, 14.0, 22.0, 9.0, 8.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.234375, -19.7427978515625, -19.251220703125, -18.7596435546875, -18.26806640625, -17.7764892578125, -17.284912109375, -16.7933349609375, -16.3017578125, -15.8101806640625, -15.318603515625, -14.8270263671875, -14.33544921875, -13.8438720703125, -13.352294921875, -12.8607177734375, -12.369140625, -11.8775634765625, -11.385986328125, -10.8944091796875, -10.40283203125, -9.9112548828125, -9.419677734375, -8.9281005859375, -8.4365234375, -7.9449462890625, -7.453369140625, -6.9617919921875, -6.47021484375, -5.9786376953125, -5.487060546875, -4.9954833984375, -4.50390625, -4.0123291015625, -3.520751953125, -3.0291748046875, -2.53759765625, -2.0460205078125, -1.554443359375, -1.0628662109375, -0.5712890625, -0.0797119140625, 0.411865234375, 0.9034423828125, 1.39501953125, 1.8865966796875, 2.378173828125, 2.8697509765625, 3.361328125, 3.8529052734375, 4.344482421875, 4.8360595703125, 5.32763671875, 5.8192138671875, 6.310791015625, 6.8023681640625, 7.2939453125, 7.7855224609375, 8.277099609375, 8.7686767578125, 9.26025390625, 9.7518310546875, 10.243408203125, 10.7349853515625, 11.2265625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 7.0, 24.0, 15.0, 18.0, 33.0, 67.0, 87.0, 168.0, 360.0, 957.0, 5226.0, 1166267.0, 3012191.0, 6857.0, 1081.0, 406.0, 212.0, 113.0, 67.0, 32.0, 22.0, 25.0, 10.0, 8.0, 4.0, 2.0, 8.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.03125, -55.51416015625, -52.9970703125, -50.47998046875, -47.962890625, -45.44580078125, -42.9287109375, -40.41162109375, -37.89453125, -35.37744140625, -32.8603515625, -30.34326171875, -27.826171875, -25.30908203125, -22.7919921875, -20.27490234375, -17.7578125, -15.24072265625, -12.7236328125, -10.20654296875, -7.689453125, -5.17236328125, -2.6552734375, -0.13818359375, 2.37890625, 4.89599609375, 7.4130859375, 9.93017578125, 12.447265625, 14.96435546875, 17.4814453125, 19.99853515625, 22.515625, 25.03271484375, 27.5498046875, 30.06689453125, 32.583984375, 35.10107421875, 37.6181640625, 40.13525390625, 42.65234375, 45.16943359375, 47.6865234375, 50.20361328125, 52.720703125, 55.23779296875, 57.7548828125, 60.27197265625, 62.7890625, 65.30615234375, 67.8232421875, 70.34033203125, 72.857421875, 75.37451171875, 77.8916015625, 80.40869140625, 82.92578125, 85.44287109375, 87.9599609375, 90.47705078125, 92.994140625, 95.51123046875, 98.0283203125, 100.54541015625, 103.0625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 11.0, 27.0, 54.0, 100.0, 138.0, 164.0, 207.0, 139.0, 86.0, 34.0, 25.0, 15.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.94692611694336, -41.362361907958984, -38.77779769897461, -36.193233489990234, -33.60866928100586, -31.024105072021484, -28.439542770385742, -25.854978561401367, -23.270414352416992, -20.685850143432617, -18.101285934448242, -15.516722679138184, -12.932158470153809, -10.347594261169434, -7.763031005859375, -5.178466796875, -2.593902587890625, -0.009338617324829102, 2.575225353240967, 5.159789085388184, 7.744353294372559, 10.328917503356934, 12.913480758666992, 15.498044967651367, 18.082609176635742, 20.667173385620117, 23.251737594604492, 25.836299896240234, 28.42086410522461, 31.005428314208984, 33.58999252319336, 36.174556732177734, 38.759117126464844, 41.34368133544922, 43.928245544433594, 46.51280975341797, 49.097373962402344, 51.68193817138672, 54.266502380371094, 56.85106658935547, 59.435630798339844, 62.02019500732422, 64.6047592163086, 67.18932342529297, 69.77388763427734, 72.35845184326172, 74.9430160522461, 77.52758026123047, 80.11213684082031, 82.69670104980469, 85.28126525878906, 87.86582946777344, 90.45039367675781, 93.03495788574219, 95.61952209472656, 98.20408630371094, 100.78865051269531, 103.37321472167969, 105.95777893066406, 108.54234313964844, 111.12690734863281, 113.71147155761719, 116.29603576660156, 118.88059997558594, 121.46516418457031]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 3.0, 3.0, 3.0, 4.0, 7.0, 9.0, 12.0, 14.0, 13.0, 22.0, 21.0, 16.0, 34.0, 26.0, 33.0, 33.0, 41.0, 34.0, 44.0, 45.0, 37.0, 35.0, 57.0, 46.0, 45.0, 44.0, 23.0, 46.0, 30.0, 18.0, 38.0, 24.0, 19.0, 27.0, 16.0, 13.0, 10.0, 8.0, 10.0, 11.0, 8.0, 5.0, 9.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.99497985839844, -34.83114242553711, -33.667301177978516, -32.50346374511719, -31.33962631225586, -30.1757869720459, -29.011947631835938, -27.84811019897461, -26.68427085876465, -25.520431518554688, -24.35659408569336, -23.1927547454834, -22.028915405273438, -20.86507797241211, -19.70123863220215, -18.537399291992188, -17.37356185913086, -16.2097225189209, -15.04588508605957, -13.88204574584961, -12.718207359313965, -11.55436897277832, -10.39052963256836, -9.226691246032715, -8.06285285949707, -6.899014472961426, -5.735175609588623, -4.57133674621582, -3.407498359680176, -2.2436599731445312, -1.0798211097717285, 0.08401775360107422, 1.2478561401367188, 2.4116947650909424, 3.575533390045166, 4.739372253417969, 5.903210639953613, 7.067049026489258, 8.230888366699219, 9.394726753234863, 10.558565139770508, 11.722403526306152, 12.886241912841797, 14.050081253051758, 15.213919639587402, 16.377758026123047, 17.541597366333008, 18.70543670654297, 19.869274139404297, 21.033113479614258, 22.196950912475586, 23.360790252685547, 24.524627685546875, 25.688467025756836, 26.852306365966797, 28.016143798828125, 29.179983139038086, 30.343822479248047, 31.507659912109375, 32.6714973449707, 33.8353385925293, 34.999176025390625, 36.16301345825195, 37.32685470581055, 38.490692138671875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 5.0, 2.0, 6.0, 17.0, 11.0, 13.0, 12.0, 14.0, 22.0, 20.0, 20.0, 37.0, 38.0, 38.0, 30.0, 40.0, 47.0, 40.0, 42.0, 41.0, 46.0, 50.0, 35.0, 47.0, 45.0, 26.0, 18.0, 36.0, 31.0, 24.0, 24.0, 17.0, 17.0, 21.0, 11.0, 11.0, 5.0, 6.0, 4.0, 10.0, 8.0, 1.0, 2.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.3203125, -5.1534423828125, -4.986572265625, -4.8197021484375, -4.65283203125, -4.4859619140625, -4.319091796875, -4.1522216796875, -3.9853515625, -3.8184814453125, -3.651611328125, -3.4847412109375, -3.31787109375, -3.1510009765625, -2.984130859375, -2.8172607421875, -2.650390625, -2.4835205078125, -2.316650390625, -2.1497802734375, -1.98291015625, -1.8160400390625, -1.649169921875, -1.4822998046875, -1.3154296875, -1.1485595703125, -0.981689453125, -0.8148193359375, -0.64794921875, -0.4810791015625, -0.314208984375, -0.1473388671875, 0.01953125, 0.1864013671875, 0.353271484375, 0.5201416015625, 0.68701171875, 0.8538818359375, 1.020751953125, 1.1876220703125, 1.3544921875, 1.5213623046875, 1.688232421875, 1.8551025390625, 2.02197265625, 2.1888427734375, 2.355712890625, 2.5225830078125, 2.689453125, 2.8563232421875, 3.023193359375, 3.1900634765625, 3.35693359375, 3.5238037109375, 3.690673828125, 3.8575439453125, 4.0244140625, 4.1912841796875, 4.358154296875, 4.5250244140625, 4.69189453125, 4.8587646484375, 5.025634765625, 5.1925048828125, 5.359375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 11.0, 13.0, 18.0, 20.0, 27.0, 50.0, 79.0, 132.0, 232.0, 381.0, 671.0, 1185.0, 2235.0, 3826.0, 7362.0, 14598.0, 28475.0, 57530.0, 113116.0, 209025.0, 257939.0, 170932.0, 89826.0, 44623.0, 21948.0, 11223.0, 5916.0, 3204.0, 1694.0, 926.0, 518.0, 326.0, 174.0, 105.0, 75.0, 61.0, 30.0, 15.0, 10.0, 8.0, 4.0, 1.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.125, -1.0931472778320312, -1.0612945556640625, -1.0294418334960938, -0.997589111328125, -0.9657363891601562, -0.9338836669921875, -0.9020309448242188, -0.87017822265625, -0.8383255004882812, -0.8064727783203125, -0.7746200561523438, -0.742767333984375, -0.7109146118164062, -0.6790618896484375, -0.6472091674804688, -0.6153564453125, -0.5835037231445312, -0.5516510009765625, -0.5197982788085938, -0.487945556640625, -0.45609283447265625, -0.4242401123046875, -0.39238739013671875, -0.36053466796875, -0.32868194580078125, -0.2968292236328125, -0.26497650146484375, -0.233123779296875, -0.20127105712890625, -0.1694183349609375, -0.13756561279296875, -0.105712890625, -0.07386016845703125, -0.0420074462890625, -0.01015472412109375, 0.021697998046875, 0.05355072021484375, 0.0854034423828125, 0.11725616455078125, 0.14910888671875, 0.18096160888671875, 0.2128143310546875, 0.24466705322265625, 0.276519775390625, 0.30837249755859375, 0.3402252197265625, 0.37207794189453125, 0.4039306640625, 0.43578338623046875, 0.4676361083984375, 0.49948883056640625, 0.531341552734375, 0.5631942749023438, 0.5950469970703125, 0.6268997192382812, 0.65875244140625, 0.6906051635742188, 0.7224578857421875, 0.7543106079101562, 0.786163330078125, 0.8180160522460938, 0.8498687744140625, 0.8817214965820312, 0.91357421875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 1.0, 3.0, 3.0, 7.0, 4.0, 11.0, 14.0, 15.0, 14.0, 27.0, 16.0, 17.0, 17.0, 34.0, 32.0, 36.0, 43.0, 30.0, 29.0, 42.0, 37.0, 39.0, 1057.0, 58.0, 28.0, 47.0, 54.0, 41.0, 27.0, 28.0, 22.0, 37.0, 25.0, 20.0, 10.0, 18.0, 21.0, 11.0, 14.0, 10.0, 7.0, 7.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-4.06640625, -3.951995849609375, -3.83758544921875, -3.723175048828125, -3.6087646484375, -3.494354248046875, -3.37994384765625, -3.265533447265625, -3.151123046875, -3.036712646484375, -2.92230224609375, -2.807891845703125, -2.6934814453125, -2.579071044921875, -2.46466064453125, -2.350250244140625, -2.23583984375, -2.121429443359375, -2.00701904296875, -1.892608642578125, -1.7781982421875, -1.663787841796875, -1.54937744140625, -1.434967041015625, -1.320556640625, -1.206146240234375, -1.09173583984375, -0.977325439453125, -0.8629150390625, -0.748504638671875, -0.63409423828125, -0.519683837890625, -0.4052734375, -0.290863037109375, -0.17645263671875, -0.062042236328125, 0.0523681640625, 0.166778564453125, 0.28118896484375, 0.395599365234375, 0.510009765625, 0.624420166015625, 0.73883056640625, 0.853240966796875, 0.9676513671875, 1.082061767578125, 1.19647216796875, 1.310882568359375, 1.42529296875, 1.539703369140625, 1.65411376953125, 1.768524169921875, 1.8829345703125, 1.997344970703125, 2.11175537109375, 2.226165771484375, 2.340576171875, 2.454986572265625, 2.56939697265625, 2.683807373046875, 2.7982177734375, 2.912628173828125, 3.02703857421875, 3.141448974609375, 3.255859375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 4.0, 8.0, 12.0, 14.0, 25.0, 27.0, 65.0, 68.0, 105.0, 150.0, 253.0, 325.0, 560.0, 896.0, 1315.0, 2043.0, 3131.0, 4704.0, 7517.0, 11993.0, 19306.0, 31047.0, 50130.0, 78822.0, 116735.0, 183867.0, 1179256.0, 138568.0, 97062.0, 63027.0, 39509.0, 24592.0, 15246.0, 9664.0, 6108.0, 3799.0, 2541.0, 1601.0, 1003.0, 675.0, 443.0, 285.0, 213.0, 132.0, 110.0, 68.0, 36.0, 32.0, 16.0, 10.0, 12.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.380615234375, -0.36803436279296875, -0.3554534912109375, -0.34287261962890625, -0.330291748046875, -0.31771087646484375, -0.3051300048828125, -0.29254913330078125, -0.27996826171875, -0.26738739013671875, -0.2548065185546875, -0.24222564697265625, -0.229644775390625, -0.21706390380859375, -0.2044830322265625, -0.19190216064453125, -0.1793212890625, -0.16674041748046875, -0.1541595458984375, -0.14157867431640625, -0.128997802734375, -0.11641693115234375, -0.1038360595703125, -0.09125518798828125, -0.07867431640625, -0.06609344482421875, -0.0535125732421875, -0.04093170166015625, -0.028350830078125, -0.01576995849609375, -0.0031890869140625, 0.00939178466796875, 0.02197265625, 0.03455352783203125, 0.0471343994140625, 0.05971527099609375, 0.072296142578125, 0.08487701416015625, 0.0974578857421875, 0.11003875732421875, 0.12261962890625, 0.13520050048828125, 0.1477813720703125, 0.16036224365234375, 0.172943115234375, 0.18552398681640625, 0.1981048583984375, 0.21068572998046875, 0.2232666015625, 0.23584747314453125, 0.2484283447265625, 0.26100921630859375, 0.273590087890625, 0.28617095947265625, 0.2987518310546875, 0.31133270263671875, 0.32391357421875, 0.33649444580078125, 0.3490753173828125, 0.36165618896484375, 0.374237060546875, 0.38681793212890625, 0.3993988037109375, 0.41197967529296875, 0.424560546875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 3.0, 3.0, 11.0, 1.0, 9.0, 6.0, 15.0, 15.0, 24.0, 27.0, 42.0, 65.0, 82.0, 114.0, 139.0, 115.0, 90.0, 68.0, 37.0, 26.0, 25.0, 18.0, 12.0, 4.0, 5.0, 7.0, 2.0, 4.0, 4.0, 4.0, 4.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029541015625, -0.02854633331298828, -0.027551651000976562, -0.026556968688964844, -0.025562286376953125, -0.024567604064941406, -0.023572921752929688, -0.02257823944091797, -0.02158355712890625, -0.02058887481689453, -0.019594192504882812, -0.018599510192871094, -0.017604827880859375, -0.016610145568847656, -0.015615463256835938, -0.014620780944824219, -0.0136260986328125, -0.012631416320800781, -0.011636734008789062, -0.010642051696777344, -0.009647369384765625, -0.008652687072753906, -0.0076580047607421875, -0.006663322448730469, -0.00566864013671875, -0.004673957824707031, -0.0036792755126953125, -0.0026845932006835938, -0.001689910888671875, -0.0006952285766601562, 0.0002994537353515625, 0.0012941360473632812, 0.002288818359375, 0.0032835006713867188, 0.0042781829833984375, 0.005272865295410156, 0.006267547607421875, 0.007262229919433594, 0.008256912231445312, 0.009251594543457031, 0.01024627685546875, 0.011240959167480469, 0.012235641479492188, 0.013230323791503906, 0.014225006103515625, 0.015219688415527344, 0.016214370727539062, 0.01720905303955078, 0.0182037353515625, 0.01919841766357422, 0.020193099975585938, 0.021187782287597656, 0.022182464599609375, 0.023177146911621094, 0.024171829223632812, 0.02516651153564453, 0.02616119384765625, 0.02715587615966797, 0.028150558471679688, 0.029145240783691406, 0.030139923095703125, 0.031134605407714844, 0.03212928771972656, 0.03312397003173828, 0.03411865234375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 1.0, 4.0, 4.0, 6.0, 6.0, 7.0, 8.0, 12.0, 16.0, 18.0, 30.0, 45.0, 95.0, 186.0, 693.0, 4123.0, 96264.0, 931797.0, 13005.0, 1518.0, 351.0, 137.0, 65.0, 43.0, 33.0, 20.0, 12.0, 8.0, 8.0, 7.0, 7.0, 7.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.73486328125, -0.7127532958984375, -0.690643310546875, -0.6685333251953125, -0.64642333984375, -0.6243133544921875, -0.602203369140625, -0.5800933837890625, -0.5579833984375, -0.5358734130859375, -0.513763427734375, -0.4916534423828125, -0.46954345703125, -0.4474334716796875, -0.425323486328125, -0.4032135009765625, -0.381103515625, -0.3589935302734375, -0.336883544921875, -0.3147735595703125, -0.29266357421875, -0.2705535888671875, -0.248443603515625, -0.2263336181640625, -0.2042236328125, -0.1821136474609375, -0.160003662109375, -0.1378936767578125, -0.11578369140625, -0.0936737060546875, -0.071563720703125, -0.0494537353515625, -0.02734375, -0.0052337646484375, 0.016876220703125, 0.0389862060546875, 0.06109619140625, 0.0832061767578125, 0.105316162109375, 0.1274261474609375, 0.1495361328125, 0.1716461181640625, 0.193756103515625, 0.2158660888671875, 0.23797607421875, 0.2600860595703125, 0.282196044921875, 0.3043060302734375, 0.326416015625, 0.3485260009765625, 0.370635986328125, 0.3927459716796875, 0.41485595703125, 0.4369659423828125, 0.459075927734375, 0.4811859130859375, 0.5032958984375, 0.5254058837890625, 0.547515869140625, 0.5696258544921875, 0.59173583984375, 0.6138458251953125, 0.635955810546875, 0.6580657958984375, 0.68017578125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 3.0, 11.0, 13.0, 9.0, 10.0, 19.0, 20.0, 32.0, 47.0, 49.0, 65.0, 105.0, 189.0, 159.0, 77.0, 67.0, 53.0, 22.0, 12.0, 9.0, 9.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09589116275310516, -0.09267681837081909, -0.08946247398853302, -0.08624812960624695, -0.08303378522396088, -0.0798194408416748, -0.07660509645938873, -0.07339075207710266, -0.07017640769481659, -0.06696206331253052, -0.06374771893024445, -0.060533374547958374, -0.0573190301656723, -0.05410468578338623, -0.05089034140110016, -0.04767599701881409, -0.04446164891123772, -0.041247304528951645, -0.03803296014666557, -0.0348186157643795, -0.03160427138209343, -0.02838992513716221, -0.025175580754876137, -0.021961236372590065, -0.018746891990303993, -0.015532547608017921, -0.01231820322573185, -0.009103857912123203, -0.0058895135298371315, -0.002675168216228485, 0.0005391761660575867, 0.0037535205483436584, 0.00696786493062973, 0.010182209312915802, 0.013396553695201874, 0.016610898077487946, 0.019825242459774017, 0.02303958870470524, 0.02625393308699131, 0.029468277469277382, 0.032682619988918304, 0.035896964371204376, 0.03911130875349045, 0.04232565313577652, 0.04553999751806259, 0.04875434190034866, 0.051968686282634735, 0.05518303066492081, 0.05839737877249718, 0.06161172315478325, 0.06482607126235962, 0.06804041564464569, 0.07125476002693176, 0.07446910440921783, 0.0776834487915039, 0.08089779317378998, 0.08411213755607605, 0.08732648193836212, 0.0905408263206482, 0.09375517070293427, 0.09696951508522034, 0.10018385946750641, 0.10339820384979248, 0.10661254823207855, 0.10982689261436462]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 6.0, 6.0, 8.0, 10.0, 10.0, 20.0, 19.0, 24.0, 29.0, 28.0, 35.0, 44.0, 27.0, 49.0, 40.0, 41.0, 40.0, 34.0, 49.0, 39.0, 46.0, 48.0, 60.0, 41.0, 36.0, 41.0, 29.0, 18.0, 27.0, 20.0, 15.0, 10.0, 20.0, 12.0, 4.0, 5.0, 1.0, 4.0, 5.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018271148204803467, -0.01762533187866211, -0.016979515552520752, -0.016333699226379395, -0.015687882900238037, -0.01504206657409668, -0.014396250247955322, -0.013750433921813965, -0.013104617595672607, -0.01245880126953125, -0.011812984943389893, -0.011167168617248535, -0.010521352291107178, -0.00987553596496582, -0.009229719638824463, -0.008583903312683105, -0.007938086986541748, -0.007292270660400391, -0.006646454334259033, -0.006000638008117676, -0.005354821681976318, -0.004709005355834961, -0.0040631890296936035, -0.003417372703552246, -0.0027715563774108887, -0.0021257400512695312, -0.0014799237251281738, -0.0008341073989868164, -0.00018829107284545898, 0.00045752525329589844, 0.0011033415794372559, 0.0017491579055786133, 0.0023949742317199707, 0.003040790557861328, 0.0036866068840026855, 0.004332423210144043, 0.0049782395362854, 0.005624055862426758, 0.006269872188568115, 0.006915688514709473, 0.00756150484085083, 0.008207321166992188, 0.008853137493133545, 0.009498953819274902, 0.01014477014541626, 0.010790586471557617, 0.011436402797698975, 0.012082219123840332, 0.01272803544998169, 0.013373851776123047, 0.014019668102264404, 0.014665484428405762, 0.01531130075454712, 0.015957117080688477, 0.016602933406829834, 0.01724874973297119, 0.01789456605911255, 0.018540382385253906, 0.019186198711395264, 0.01983201503753662, 0.02047783136367798, 0.021123647689819336, 0.021769464015960693, 0.02241528034210205, 0.023061096668243408]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 5.0, 2.0, 6.0, 17.0, 11.0, 13.0, 12.0, 14.0, 22.0, 20.0, 20.0, 40.0, 35.0, 38.0, 30.0, 41.0, 46.0, 40.0, 44.0, 39.0, 46.0, 50.0, 35.0, 49.0, 44.0, 25.0, 18.0, 36.0, 32.0, 23.0, 24.0, 17.0, 17.0, 21.0, 11.0, 11.0, 5.0, 6.0, 4.0, 10.0, 8.0, 1.0, 2.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.31640625, -5.14959716796875, -4.9827880859375, -4.81597900390625, -4.649169921875, -4.48236083984375, -4.3155517578125, -4.14874267578125, -3.98193359375, -3.81512451171875, -3.6483154296875, -3.48150634765625, -3.314697265625, -3.14788818359375, -2.9810791015625, -2.81427001953125, -2.6474609375, -2.48065185546875, -2.3138427734375, -2.14703369140625, -1.980224609375, -1.81341552734375, -1.6466064453125, -1.47979736328125, -1.31298828125, -1.14617919921875, -0.9793701171875, -0.81256103515625, -0.645751953125, -0.47894287109375, -0.3121337890625, -0.14532470703125, 0.021484375, 0.18829345703125, 0.3551025390625, 0.52191162109375, 0.688720703125, 0.85552978515625, 1.0223388671875, 1.18914794921875, 1.35595703125, 1.52276611328125, 1.6895751953125, 1.85638427734375, 2.023193359375, 2.19000244140625, 2.3568115234375, 2.52362060546875, 2.6904296875, 2.85723876953125, 3.0240478515625, 3.19085693359375, 3.357666015625, 3.52447509765625, 3.6912841796875, 3.85809326171875, 4.02490234375, 4.19171142578125, 4.3585205078125, 4.52532958984375, 4.692138671875, 4.85894775390625, 5.0257568359375, 5.19256591796875, 5.359375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 6.0, 5.0, 11.0, 17.0, 24.0, 25.0, 27.0, 42.0, 62.0, 84.0, 119.0, 256.0, 348.0, 758.0, 1511.0, 3337.0, 8125.0, 23536.0, 96636.0, 622221.0, 226486.0, 42505.0, 12862.0, 4918.0, 2209.0, 1076.0, 513.0, 273.0, 169.0, 109.0, 72.0, 38.0, 34.0, 36.0, 20.0, 23.0, 9.0, 6.0, 10.0, 8.0, 8.0, 1.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.21875, -8.92822265625, -8.6376953125, -8.34716796875, -8.056640625, -7.76611328125, -7.4755859375, -7.18505859375, -6.89453125, -6.60400390625, -6.3134765625, -6.02294921875, -5.732421875, -5.44189453125, -5.1513671875, -4.86083984375, -4.5703125, -4.27978515625, -3.9892578125, -3.69873046875, -3.408203125, -3.11767578125, -2.8271484375, -2.53662109375, -2.24609375, -1.95556640625, -1.6650390625, -1.37451171875, -1.083984375, -0.79345703125, -0.5029296875, -0.21240234375, 0.078125, 0.36865234375, 0.6591796875, 0.94970703125, 1.240234375, 1.53076171875, 1.8212890625, 2.11181640625, 2.40234375, 2.69287109375, 2.9833984375, 3.27392578125, 3.564453125, 3.85498046875, 4.1455078125, 4.43603515625, 4.7265625, 5.01708984375, 5.3076171875, 5.59814453125, 5.888671875, 6.17919921875, 6.4697265625, 6.76025390625, 7.05078125, 7.34130859375, 7.6318359375, 7.92236328125, 8.212890625, 8.50341796875, 8.7939453125, 9.08447265625, 9.375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 12.0, 11.0, 18.0, 11.0, 10.0, 18.0, 13.0, 23.0, 30.0, 28.0, 30.0, 33.0, 33.0, 36.0, 43.0, 64.0, 93.0, 281.0, 1597.0, 147.0, 85.0, 57.0, 46.0, 34.0, 42.0, 36.0, 23.0, 26.0, 30.0, 27.0, 15.0, 17.0, 14.0, 9.0, 12.0, 11.0, 6.0, 5.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.125, -15.59228515625, -15.0595703125, -14.52685546875, -13.994140625, -13.46142578125, -12.9287109375, -12.39599609375, -11.86328125, -11.33056640625, -10.7978515625, -10.26513671875, -9.732421875, -9.19970703125, -8.6669921875, -8.13427734375, -7.6015625, -7.06884765625, -6.5361328125, -6.00341796875, -5.470703125, -4.93798828125, -4.4052734375, -3.87255859375, -3.33984375, -2.80712890625, -2.2744140625, -1.74169921875, -1.208984375, -0.67626953125, -0.1435546875, 0.38916015625, 0.921875, 1.45458984375, 1.9873046875, 2.52001953125, 3.052734375, 3.58544921875, 4.1181640625, 4.65087890625, 5.18359375, 5.71630859375, 6.2490234375, 6.78173828125, 7.314453125, 7.84716796875, 8.3798828125, 8.91259765625, 9.4453125, 9.97802734375, 10.5107421875, 11.04345703125, 11.576171875, 12.10888671875, 12.6416015625, 13.17431640625, 13.70703125, 14.23974609375, 14.7724609375, 15.30517578125, 15.837890625, 16.37060546875, 16.9033203125, 17.43603515625, 17.96875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 5.0, 4.0, 13.0, 16.0, 12.0, 13.0, 19.0, 28.0, 34.0, 35.0, 48.0, 51.0, 70.0, 120.0, 170.0, 319.0, 756.0, 5315.0, 2803224.0, 331362.0, 2712.0, 503.0, 293.0, 137.0, 98.0, 62.0, 53.0, 38.0, 31.0, 27.0, 23.0, 17.0, 16.0, 20.0, 16.0, 10.0, 10.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-55.0625, -53.48388671875, -51.9052734375, -50.32666015625, -48.748046875, -47.16943359375, -45.5908203125, -44.01220703125, -42.43359375, -40.85498046875, -39.2763671875, -37.69775390625, -36.119140625, -34.54052734375, -32.9619140625, -31.38330078125, -29.8046875, -28.22607421875, -26.6474609375, -25.06884765625, -23.490234375, -21.91162109375, -20.3330078125, -18.75439453125, -17.17578125, -15.59716796875, -14.0185546875, -12.43994140625, -10.861328125, -9.28271484375, -7.7041015625, -6.12548828125, -4.546875, -2.96826171875, -1.3896484375, 0.18896484375, 1.767578125, 3.34619140625, 4.9248046875, 6.50341796875, 8.08203125, 9.66064453125, 11.2392578125, 12.81787109375, 14.396484375, 15.97509765625, 17.5537109375, 19.13232421875, 20.7109375, 22.28955078125, 23.8681640625, 25.44677734375, 27.025390625, 28.60400390625, 30.1826171875, 31.76123046875, 33.33984375, 34.91845703125, 36.4970703125, 38.07568359375, 39.654296875, 41.23291015625, 42.8115234375, 44.39013671875, 45.96875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 120.0, 526.0, 332.0, 33.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.603519439697266, -39.50398254394531, -36.40444564819336, -33.304908752441406, -30.205373764038086, -27.105836868286133, -24.006301879882812, -20.90676498413086, -17.807228088378906, -14.707691192626953, -11.608155250549316, -8.50861930847168, -5.409082412719727, -2.3095455169677734, 0.7899894714355469, 3.8895263671875, 6.989063262939453, 10.088600158691406, 13.188136100769043, 16.28767204284668, 19.387208938598633, 22.486745834350586, 25.586280822753906, 28.68581771850586, 31.785354614257812, 34.884891510009766, 37.98442840576172, 41.083961486816406, 44.183502197265625, 47.28303527832031, 50.382572174072266, 53.48210906982422, 56.58164978027344, 59.68118667602539, 62.780723571777344, 65.88025665283203, 68.97979736328125, 72.07933044433594, 75.17886352539062, 78.27840423583984, 81.37794494628906, 84.47747802734375, 87.57701873779297, 90.67655181884766, 93.77609252929688, 96.87562561035156, 99.97515869140625, 103.07469940185547, 106.17423248291016, 109.27376556396484, 112.37330627441406, 115.47283935546875, 118.57238006591797, 121.67191314697266, 124.77145385742188, 127.87098693847656, 130.97052001953125, 134.07005310058594, 137.16958618164062, 140.26913452148438, 143.36866760253906, 146.46820068359375, 149.56773376464844, 152.66726684570312, 155.76681518554688]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 6.0, 10.0, 12.0, 9.0, 10.0, 22.0, 21.0, 16.0, 21.0, 24.0, 28.0, 42.0, 33.0, 33.0, 36.0, 59.0, 44.0, 50.0, 43.0, 41.0, 56.0, 39.0, 45.0, 41.0, 36.0, 30.0, 29.0, 31.0, 33.0, 19.0, 14.0, 17.0, 10.0, 12.0, 4.0, 4.0, 8.0, 3.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-63.52619934082031, -61.83320999145508, -60.140220642089844, -58.44723129272461, -56.754241943359375, -55.061248779296875, -53.368263244628906, -51.675270080566406, -49.98228073120117, -48.28929138183594, -46.5963020324707, -44.90331268310547, -43.210323333740234, -41.517333984375, -39.8243408203125, -38.131351470947266, -36.43836212158203, -34.7453727722168, -33.05238342285156, -31.359394073486328, -29.66640281677246, -27.973413467407227, -26.280424118041992, -24.587432861328125, -22.894447326660156, -21.201457977294922, -19.508468627929688, -17.815479278564453, -16.122488021850586, -14.429498672485352, -12.736509323120117, -11.043519020080566, -9.350528717041016, -7.657538890838623, -5.9645490646362305, -4.271559715270996, -2.5785698890686035, -0.8855800628662109, 0.8074092864990234, 2.500399589538574, 4.193388938903809, 5.886378765106201, 7.579368591308594, 9.272357940673828, 10.965347290039062, 12.658337593078613, 14.351326942443848, 16.0443172454834, 17.737306594848633, 19.430295944213867, 21.1232852935791, 22.81627655029297, 24.509265899658203, 26.202255249023438, 27.895244598388672, 29.588233947753906, 31.28122329711914, 32.974212646484375, 34.66720199584961, 36.360191345214844, 38.05318069458008, 39.74617004394531, 41.43916320800781, 43.13215255737305, 44.82514190673828]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 2.0, 5.0, 4.0, 7.0, 6.0, 12.0, 8.0, 12.0, 16.0, 19.0, 21.0, 27.0, 26.0, 36.0, 32.0, 28.0, 30.0, 38.0, 50.0, 37.0, 50.0, 48.0, 42.0, 38.0, 33.0, 38.0, 41.0, 41.0, 25.0, 25.0, 22.0, 29.0, 21.0, 23.0, 14.0, 14.0, 17.0, 14.0, 6.0, 9.0, 8.0, 7.0, 6.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.1875, -5.01373291015625, -4.8399658203125, -4.66619873046875, -4.492431640625, -4.31866455078125, -4.1448974609375, -3.97113037109375, -3.79736328125, -3.62359619140625, -3.4498291015625, -3.27606201171875, -3.102294921875, -2.92852783203125, -2.7547607421875, -2.58099365234375, -2.4072265625, -2.23345947265625, -2.0596923828125, -1.88592529296875, -1.712158203125, -1.53839111328125, -1.3646240234375, -1.19085693359375, -1.01708984375, -0.84332275390625, -0.6695556640625, -0.49578857421875, -0.322021484375, -0.14825439453125, 0.0255126953125, 0.19927978515625, 0.373046875, 0.54681396484375, 0.7205810546875, 0.89434814453125, 1.068115234375, 1.24188232421875, 1.4156494140625, 1.58941650390625, 1.76318359375, 1.93695068359375, 2.1107177734375, 2.28448486328125, 2.458251953125, 2.63201904296875, 2.8057861328125, 2.97955322265625, 3.1533203125, 3.32708740234375, 3.5008544921875, 3.67462158203125, 3.848388671875, 4.02215576171875, 4.1959228515625, 4.36968994140625, 4.54345703125, 4.71722412109375, 4.8909912109375, 5.06475830078125, 5.238525390625, 5.41229248046875, 5.5860595703125, 5.75982666015625, 5.93359375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 7.0, 10.0, 9.0, 15.0, 18.0, 25.0, 38.0, 47.0, 104.0, 126.0, 183.0, 288.0, 415.0, 713.0, 1067.0, 1657.0, 2893.0, 5194.0, 10179.0, 24013.0, 66877.0, 227836.0, 767043.0, 1557455.0, 1037866.0, 334213.0, 96681.0, 31892.0, 12711.0, 6239.0, 3280.0, 1877.0, 1169.0, 703.0, 435.0, 326.0, 225.0, 121.0, 99.0, 65.0, 55.0, 34.0, 18.0, 18.0, 19.0, 7.0, 5.0, 3.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.26171875, -7.03228759765625, -6.8028564453125, -6.57342529296875, -6.343994140625, -6.11456298828125, -5.8851318359375, -5.65570068359375, -5.42626953125, -5.19683837890625, -4.9674072265625, -4.73797607421875, -4.508544921875, -4.27911376953125, -4.0496826171875, -3.82025146484375, -3.5908203125, -3.36138916015625, -3.1319580078125, -2.90252685546875, -2.673095703125, -2.44366455078125, -2.2142333984375, -1.98480224609375, -1.75537109375, -1.52593994140625, -1.2965087890625, -1.06707763671875, -0.837646484375, -0.60821533203125, -0.3787841796875, -0.14935302734375, 0.080078125, 0.30950927734375, 0.5389404296875, 0.76837158203125, 0.997802734375, 1.22723388671875, 1.4566650390625, 1.68609619140625, 1.91552734375, 2.14495849609375, 2.3743896484375, 2.60382080078125, 2.833251953125, 3.06268310546875, 3.2921142578125, 3.52154541015625, 3.7509765625, 3.98040771484375, 4.2098388671875, 4.43927001953125, 4.668701171875, 4.89813232421875, 5.1275634765625, 5.35699462890625, 5.58642578125, 5.81585693359375, 6.0452880859375, 6.27471923828125, 6.504150390625, 6.73358154296875, 6.9630126953125, 7.19244384765625, 7.421875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 8.0, 11.0, 17.0, 14.0, 20.0, 34.0, 56.0, 62.0, 99.0, 139.0, 219.0, 263.0, 408.0, 489.0, 530.0, 466.0, 344.0, 248.0, 200.0, 123.0, 78.0, 73.0, 47.0, 31.0, 27.0, 20.0, 15.0, 10.0, 5.0, 3.0, 0.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-14.015625, -13.5958251953125, -13.176025390625, -12.7562255859375, -12.33642578125, -11.9166259765625, -11.496826171875, -11.0770263671875, -10.6572265625, -10.2374267578125, -9.817626953125, -9.3978271484375, -8.97802734375, -8.5582275390625, -8.138427734375, -7.7186279296875, -7.298828125, -6.8790283203125, -6.459228515625, -6.0394287109375, -5.61962890625, -5.1998291015625, -4.780029296875, -4.3602294921875, -3.9404296875, -3.5206298828125, -3.100830078125, -2.6810302734375, -2.26123046875, -1.8414306640625, -1.421630859375, -1.0018310546875, -0.58203125, -0.1622314453125, 0.257568359375, 0.6773681640625, 1.09716796875, 1.5169677734375, 1.936767578125, 2.3565673828125, 2.7763671875, 3.1961669921875, 3.615966796875, 4.0357666015625, 4.45556640625, 4.8753662109375, 5.295166015625, 5.7149658203125, 6.134765625, 6.5545654296875, 6.974365234375, 7.3941650390625, 7.81396484375, 8.2337646484375, 8.653564453125, 9.0733642578125, 9.4931640625, 9.9129638671875, 10.332763671875, 10.7525634765625, 11.17236328125, 11.5921630859375, 12.011962890625, 12.4317626953125, 12.8515625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 14.0, 14.0, 22.0, 26.0, 30.0, 48.0, 78.0, 127.0, 189.0, 379.0, 691.0, 1932.0, 8918.0, 150747.0, 3874168.0, 144520.0, 8885.0, 1851.0, 722.0, 381.0, 183.0, 110.0, 75.0, 55.0, 39.0, 17.0, 15.0, 14.0, 9.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-43.0625, -41.650390625, -40.23828125, -38.826171875, -37.4140625, -36.001953125, -34.58984375, -33.177734375, -31.765625, -30.353515625, -28.94140625, -27.529296875, -26.1171875, -24.705078125, -23.29296875, -21.880859375, -20.46875, -19.056640625, -17.64453125, -16.232421875, -14.8203125, -13.408203125, -11.99609375, -10.583984375, -9.171875, -7.759765625, -6.34765625, -4.935546875, -3.5234375, -2.111328125, -0.69921875, 0.712890625, 2.125, 3.537109375, 4.94921875, 6.361328125, 7.7734375, 9.185546875, 10.59765625, 12.009765625, 13.421875, 14.833984375, 16.24609375, 17.658203125, 19.0703125, 20.482421875, 21.89453125, 23.306640625, 24.71875, 26.130859375, 27.54296875, 28.955078125, 30.3671875, 31.779296875, 33.19140625, 34.603515625, 36.015625, 37.427734375, 38.83984375, 40.251953125, 41.6640625, 43.076171875, 44.48828125, 45.900390625, 47.3125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 38.0, 310.0, 547.0, 117.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.59405517578125, -96.21231079101562, -86.83056640625, -77.4488296508789, -68.06708526611328, -58.685340881347656, -49.3036003112793, -39.92185974121094, -30.540115356445312, -21.15837287902832, -11.776630401611328, -2.394887924194336, 6.986854553222656, 16.36859893798828, 25.75033950805664, 35.132080078125, 44.513824462890625, 53.89556884765625, 63.27730941772461, 72.65904998779297, 82.0407943725586, 91.42253875732422, 100.80427551269531, 110.18601989746094, 119.56776428222656, 128.9495086669922, 138.3312530517578, 147.71299743652344, 157.0947265625, 166.47647094726562, 175.85821533203125, 185.23995971679688, 194.6217041015625, 204.00344848632812, 213.38519287109375, 222.76693725585938, 232.148681640625, 241.53042602539062, 250.9121551513672, 260.29388427734375, 269.6756591796875, 279.0574035644531, 288.43914794921875, 297.8208923339844, 307.20263671875, 316.5843811035156, 325.96612548828125, 335.34783935546875, 344.7295837402344, 354.111328125, 363.4930725097656, 372.87481689453125, 382.2565612792969, 391.6383056640625, 401.0200500488281, 410.40179443359375, 419.78350830078125, 429.1652526855469, 438.5469970703125, 447.9287414550781, 457.31048583984375, 466.6922302246094, 476.073974609375, 485.4556884765625, 494.83746337890625]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 7.0, 9.0, 13.0, 10.0, 19.0, 16.0, 25.0, 24.0, 22.0, 27.0, 37.0, 31.0, 34.0, 40.0, 33.0, 41.0, 46.0, 47.0, 47.0, 43.0, 38.0, 38.0, 44.0, 41.0, 22.0, 37.0, 27.0, 29.0, 25.0, 22.0, 22.0, 18.0, 16.0, 14.0, 9.0, 3.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.166351318359375, -39.82866287231445, -38.4909782409668, -37.153289794921875, -35.81560134887695, -34.4779167175293, -33.140228271484375, -31.802541732788086, -30.464855194091797, -29.127168655395508, -27.789480209350586, -26.451793670654297, -25.114107131958008, -23.77642059326172, -22.438732147216797, -21.101045608520508, -19.763357162475586, -18.425670623779297, -17.087982177734375, -15.750295639038086, -14.412609100341797, -13.074921607971191, -11.737234115600586, -10.399547576904297, -9.061860084533691, -7.724173069000244, -6.386486053466797, -5.048798561096191, -3.711111545562744, -2.373424530029297, -1.0357370376586914, 0.30194950103759766, 1.6396369934082031, 2.9773240089416504, 4.315011024475098, 5.652698516845703, 6.99038553237915, 8.328072547912598, 9.665760040283203, 11.003446578979492, 12.341134071350098, 13.678821563720703, 15.016508102416992, 16.35419464111328, 17.691883087158203, 19.029569625854492, 20.36725616455078, 21.704944610595703, 23.042631149291992, 24.38031768798828, 25.718006134033203, 27.055692672729492, 28.39337921142578, 29.731067657470703, 31.068754196166992, 32.40644073486328, 33.7441291809082, 35.081817626953125, 36.41950225830078, 37.7571907043457, 39.094879150390625, 40.43256378173828, 41.7702522277832, 43.107940673828125, 44.44562530517578]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 3.0, 6.0, 5.0, 12.0, 10.0, 23.0, 21.0, 14.0, 18.0, 22.0, 26.0, 38.0, 31.0, 32.0, 43.0, 46.0, 38.0, 44.0, 50.0, 45.0, 49.0, 38.0, 38.0, 48.0, 42.0, 26.0, 34.0, 28.0, 19.0, 23.0, 22.0, 15.0, 19.0, 14.0, 17.0, 9.0, 6.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0], "bins": [-6.734375, -6.54443359375, -6.3544921875, -6.16455078125, -5.974609375, -5.78466796875, -5.5947265625, -5.40478515625, -5.21484375, -5.02490234375, -4.8349609375, -4.64501953125, -4.455078125, -4.26513671875, -4.0751953125, -3.88525390625, -3.6953125, -3.50537109375, -3.3154296875, -3.12548828125, -2.935546875, -2.74560546875, -2.5556640625, -2.36572265625, -2.17578125, -1.98583984375, -1.7958984375, -1.60595703125, -1.416015625, -1.22607421875, -1.0361328125, -0.84619140625, -0.65625, -0.46630859375, -0.2763671875, -0.08642578125, 0.103515625, 0.29345703125, 0.4833984375, 0.67333984375, 0.86328125, 1.05322265625, 1.2431640625, 1.43310546875, 1.623046875, 1.81298828125, 2.0029296875, 2.19287109375, 2.3828125, 2.57275390625, 2.7626953125, 2.95263671875, 3.142578125, 3.33251953125, 3.5224609375, 3.71240234375, 3.90234375, 4.09228515625, 4.2822265625, 4.47216796875, 4.662109375, 4.85205078125, 5.0419921875, 5.23193359375, 5.421875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 10.0, 7.0, 6.0, 18.0, 21.0, 34.0, 45.0, 50.0, 79.0, 130.0, 174.0, 277.0, 435.0, 621.0, 981.0, 1460.0, 2142.0, 3474.0, 5599.0, 8698.0, 13577.0, 21176.0, 33140.0, 52077.0, 81856.0, 125067.0, 173279.0, 173211.0, 124606.0, 81700.0, 52261.0, 33300.0, 21141.0, 13684.0, 8595.0, 5456.0, 3493.0, 2337.0, 1544.0, 921.0, 615.0, 402.0, 279.0, 183.0, 140.0, 91.0, 51.0, 28.0, 34.0, 23.0, 12.0, 8.0, 12.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.64453125, -0.6243896484375, -0.604248046875, -0.5841064453125, -0.56396484375, -0.5438232421875, -0.523681640625, -0.5035400390625, -0.4833984375, -0.4632568359375, -0.443115234375, -0.4229736328125, -0.40283203125, -0.3826904296875, -0.362548828125, -0.3424072265625, -0.322265625, -0.3021240234375, -0.281982421875, -0.2618408203125, -0.24169921875, -0.2215576171875, -0.201416015625, -0.1812744140625, -0.1611328125, -0.1409912109375, -0.120849609375, -0.1007080078125, -0.08056640625, -0.0604248046875, -0.040283203125, -0.0201416015625, 0.0, 0.0201416015625, 0.040283203125, 0.0604248046875, 0.08056640625, 0.1007080078125, 0.120849609375, 0.1409912109375, 0.1611328125, 0.1812744140625, 0.201416015625, 0.2215576171875, 0.24169921875, 0.2618408203125, 0.281982421875, 0.3021240234375, 0.322265625, 0.3424072265625, 0.362548828125, 0.3826904296875, 0.40283203125, 0.4229736328125, 0.443115234375, 0.4632568359375, 0.4833984375, 0.5035400390625, 0.523681640625, 0.5438232421875, 0.56396484375, 0.5841064453125, 0.604248046875, 0.6243896484375, 0.64453125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 0.0, 3.0, 6.0, 6.0, 5.0, 12.0, 12.0, 13.0, 9.0, 7.0, 18.0, 24.0, 18.0, 21.0, 22.0, 27.0, 28.0, 37.0, 34.0, 39.0, 44.0, 30.0, 33.0, 41.0, 1064.0, 42.0, 40.0, 43.0, 33.0, 25.0, 31.0, 25.0, 34.0, 29.0, 25.0, 26.0, 21.0, 14.0, 16.0, 7.0, 9.0, 22.0, 6.0, 11.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.390625, -3.28131103515625, -3.1719970703125, -3.06268310546875, -2.953369140625, -2.84405517578125, -2.7347412109375, -2.62542724609375, -2.51611328125, -2.40679931640625, -2.2974853515625, -2.18817138671875, -2.078857421875, -1.96954345703125, -1.8602294921875, -1.75091552734375, -1.6416015625, -1.53228759765625, -1.4229736328125, -1.31365966796875, -1.204345703125, -1.09503173828125, -0.9857177734375, -0.87640380859375, -0.76708984375, -0.65777587890625, -0.5484619140625, -0.43914794921875, -0.329833984375, -0.22052001953125, -0.1112060546875, -0.00189208984375, 0.107421875, 0.21673583984375, 0.3260498046875, 0.43536376953125, 0.544677734375, 0.65399169921875, 0.7633056640625, 0.87261962890625, 0.98193359375, 1.09124755859375, 1.2005615234375, 1.30987548828125, 1.419189453125, 1.52850341796875, 1.6378173828125, 1.74713134765625, 1.8564453125, 1.96575927734375, 2.0750732421875, 2.18438720703125, 2.293701171875, 2.40301513671875, 2.5123291015625, 2.62164306640625, 2.73095703125, 2.84027099609375, 2.9495849609375, 3.05889892578125, 3.168212890625, 3.27752685546875, 3.3868408203125, 3.49615478515625, 3.60546875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 7.0, 6.0, 8.0, 17.0, 30.0, 32.0, 57.0, 76.0, 115.0, 137.0, 235.0, 303.0, 432.0, 651.0, 923.0, 1408.0, 1984.0, 2822.0, 3994.0, 5783.0, 8443.0, 12044.0, 17219.0, 24957.0, 35766.0, 51274.0, 72816.0, 100057.0, 128898.0, 1179376.0, 122491.0, 95698.0, 69544.0, 48684.0, 34068.0, 23312.0, 16105.0, 11439.0, 7942.0, 5561.0, 3669.0, 2685.0, 1913.0, 1268.0, 924.0, 617.0, 457.0, 300.0, 200.0, 129.0, 93.0, 65.0, 31.0, 28.0, 26.0, 13.0, 9.0, 5.0, 2.0, 0.0, 1.0], "bins": [-0.326904296875, -0.3168220520019531, -0.30673980712890625, -0.2966575622558594, -0.2865753173828125, -0.2764930725097656, -0.26641082763671875, -0.2563285827636719, -0.246246337890625, -0.23616409301757812, -0.22608184814453125, -0.21599960327148438, -0.2059173583984375, -0.19583511352539062, -0.18575286865234375, -0.17567062377929688, -0.16558837890625, -0.15550613403320312, -0.14542388916015625, -0.13534164428710938, -0.1252593994140625, -0.11517715454101562, -0.10509490966796875, -0.09501266479492188, -0.084930419921875, -0.07484817504882812, -0.06476593017578125, -0.054683685302734375, -0.0446014404296875, -0.034519195556640625, -0.02443695068359375, -0.014354705810546875, -0.0042724609375, 0.005809783935546875, 0.01589202880859375, 0.025974273681640625, 0.0360565185546875, 0.046138763427734375, 0.05622100830078125, 0.06630325317382812, 0.076385498046875, 0.08646774291992188, 0.09654998779296875, 0.10663223266601562, 0.1167144775390625, 0.12679672241210938, 0.13687896728515625, 0.14696121215820312, 0.15704345703125, 0.16712570190429688, 0.17720794677734375, 0.18729019165039062, 0.1973724365234375, 0.20745468139648438, 0.21753692626953125, 0.22761917114257812, 0.237701416015625, 0.24778366088867188, 0.25786590576171875, 0.2679481506347656, 0.2780303955078125, 0.2881126403808594, 0.29819488525390625, 0.3082771301269531, 0.318359375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 11.0, 5.0, 5.0, 8.0, 11.0, 16.0, 13.0, 19.0, 24.0, 19.0, 22.0, 35.0, 45.0, 35.0, 41.0, 47.0, 52.0, 41.0, 50.0, 62.0, 59.0, 41.0, 36.0, 36.0, 34.0, 32.0, 30.0, 23.0, 28.0, 19.0, 15.0, 14.0, 16.0, 6.0, 6.0, 9.0, 4.0, 6.0, 3.0, 6.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.016754150390625, -0.0162808895111084, -0.015807628631591797, -0.015334367752075195, -0.014861106872558594, -0.014387845993041992, -0.01391458511352539, -0.013441324234008789, -0.012968063354492188, -0.012494802474975586, -0.012021541595458984, -0.011548280715942383, -0.011075019836425781, -0.01060175895690918, -0.010128498077392578, -0.009655237197875977, -0.009181976318359375, -0.008708715438842773, -0.008235454559326172, -0.00776219367980957, -0.007288932800292969, -0.006815671920776367, -0.006342411041259766, -0.005869150161743164, -0.0053958892822265625, -0.004922628402709961, -0.004449367523193359, -0.003976106643676758, -0.0035028457641601562, -0.0030295848846435547, -0.002556324005126953, -0.0020830631256103516, -0.00160980224609375, -0.0011365413665771484, -0.0006632804870605469, -0.0001900196075439453, 0.00028324127197265625, 0.0007565021514892578, 0.0012297630310058594, 0.001703023910522461, 0.0021762847900390625, 0.002649545669555664, 0.0031228065490722656, 0.003596067428588867, 0.004069328308105469, 0.00454258918762207, 0.005015850067138672, 0.0054891109466552734, 0.005962371826171875, 0.0064356327056884766, 0.006908893585205078, 0.00738215446472168, 0.007855415344238281, 0.008328676223754883, 0.008801937103271484, 0.009275197982788086, 0.009748458862304688, 0.010221719741821289, 0.01069498062133789, 0.011168241500854492, 0.011641502380371094, 0.012114763259887695, 0.012588024139404297, 0.013061285018920898, 0.0135345458984375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 7.0, 6.0, 15.0, 17.0, 11.0, 26.0, 21.0, 25.0, 30.0, 27.0, 41.0, 63.0, 91.0, 134.0, 278.0, 925.0, 5817.0, 102645.0, 917552.0, 17579.0, 2071.0, 517.0, 186.0, 108.0, 81.0, 53.0, 40.0, 30.0, 34.0, 22.0, 17.0, 17.0, 9.0, 10.0, 7.0, 6.0, 2.0, 2.0, 6.0, 7.0, 3.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.334228515625, -0.3227996826171875, -0.311370849609375, -0.2999420166015625, -0.28851318359375, -0.2770843505859375, -0.265655517578125, -0.2542266845703125, -0.2427978515625, -0.2313690185546875, -0.219940185546875, -0.2085113525390625, -0.19708251953125, -0.1856536865234375, -0.174224853515625, -0.1627960205078125, -0.1513671875, -0.1399383544921875, -0.128509521484375, -0.1170806884765625, -0.10565185546875, -0.0942230224609375, -0.082794189453125, -0.0713653564453125, -0.0599365234375, -0.0485076904296875, -0.037078857421875, -0.0256500244140625, -0.01422119140625, -0.0027923583984375, 0.008636474609375, 0.0200653076171875, 0.031494140625, 0.0429229736328125, 0.054351806640625, 0.0657806396484375, 0.07720947265625, 0.0886383056640625, 0.100067138671875, 0.1114959716796875, 0.1229248046875, 0.1343536376953125, 0.145782470703125, 0.1572113037109375, 0.16864013671875, 0.1800689697265625, 0.191497802734375, 0.2029266357421875, 0.21435546875, 0.2257843017578125, 0.237213134765625, 0.2486419677734375, 0.26007080078125, 0.2714996337890625, 0.282928466796875, 0.2943572998046875, 0.3057861328125, 0.3172149658203125, 0.328643798828125, 0.3400726318359375, 0.35150146484375, 0.3629302978515625, 0.374359130859375, 0.3857879638671875, 0.397216796875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 10.0, 10.0, 19.0, 14.0, 16.0, 31.0, 29.0, 40.0, 66.0, 111.0, 155.0, 154.0, 111.0, 72.0, 47.0, 30.0, 17.0, 17.0, 12.0, 11.0, 8.0, 7.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.03648126870393753, -0.034911785274744034, -0.03334230184555054, -0.03177281841635704, -0.030203333124518394, -0.028633849695324898, -0.027064364403486252, -0.025494880974292755, -0.02392539754509926, -0.02235591411590576, -0.020786430686712265, -0.01921694539487362, -0.017647461965680122, -0.016077978536486626, -0.014508494175970554, -0.012939009815454483, -0.011369526386260986, -0.00980004295706749, -0.008230558596551418, -0.006661074701696634, -0.00509159080684185, -0.0035221073776483536, -0.0019526230171322823, -0.00038313865661621094, 0.0011863447725772858, 0.0027558286674320698, 0.004325312562286854, 0.005894796457141638, 0.007464280351996422, 0.009033763781189919, 0.01060324814170599, 0.012172732502222061, 0.013742215931415558, 0.015311699360609055, 0.01688118278980255, 0.018450668081641197, 0.020020151510834694, 0.02158963494002819, 0.023159120231866837, 0.024728603661060333, 0.02629808709025383, 0.027867570519447327, 0.029437053948640823, 0.03100653924047947, 0.032576024532318115, 0.034145504236221313, 0.03571499139070511, 0.037284474819898605, 0.0388539582490921, 0.0404234416782856, 0.041992925107479095, 0.04356240853667259, 0.04513189196586609, 0.046701379120349884, 0.04827086254954338, 0.04984034597873688, 0.051409829407930374, 0.05297931283712387, 0.05454879626631737, 0.056118279695510864, 0.05768776684999466, 0.05925724655389786, 0.06082673370838165, 0.06239621713757515, 0.06396570056676865]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 8.0, 3.0, 5.0, 5.0, 10.0, 18.0, 16.0, 16.0, 15.0, 16.0, 23.0, 26.0, 28.0, 30.0, 34.0, 29.0, 42.0, 42.0, 34.0, 43.0, 42.0, 38.0, 44.0, 46.0, 41.0, 34.0, 34.0, 35.0, 31.0, 27.0, 25.0, 30.0, 19.0, 18.0, 18.0, 11.0, 11.0, 18.0, 7.0, 4.0, 4.0, 7.0, 2.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.010998070240020752, -0.010667339898645878, -0.010336609557271004, -0.01000587921589613, -0.009675148874521255, -0.009344418533146381, -0.009013688191771507, -0.008682957850396633, -0.008352227509021759, -0.008021497167646885, -0.007690766826272011, -0.007360036484897137, -0.007029306143522263, -0.0066985758021473885, -0.006367845460772514, -0.00603711511939764, -0.005706384778022766, -0.005375654436647892, -0.005044924095273018, -0.004714193753898144, -0.00438346341252327, -0.0040527330711483955, -0.0037220027297735214, -0.0033912723883986473, -0.003060542047023773, -0.002729811705648899, -0.002399081364274025, -0.002068351022899151, -0.0017376206815242767, -0.0014068903401494026, -0.0010761599987745285, -0.0007454296573996544, -0.0004146993160247803, -8.396897464990616e-05, 0.00024676136672496796, 0.0005774917080998421, 0.0009082220494747162, 0.0012389523908495903, 0.0015696827322244644, 0.0019004130735993385, 0.0022311434149742126, 0.0025618737563490868, 0.002892604097723961, 0.003223334439098835, 0.003554064780473709, 0.0038847951218485832, 0.004215525463223457, 0.0045462558045983315, 0.004876986145973206, 0.00520771648734808, 0.005538446828722954, 0.005869177170097828, 0.006199907511472702, 0.006530637852847576, 0.00686136819422245, 0.007192098535597324, 0.0075228288769721985, 0.007853559218347073, 0.008184289559721947, 0.00851501990109682, 0.008845750242471695, 0.009176480583846569, 0.009507210925221443, 0.009837941266596317, 0.010168671607971191]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 3.0, 6.0, 5.0, 12.0, 10.0, 23.0, 21.0, 14.0, 19.0, 21.0, 26.0, 38.0, 31.0, 32.0, 43.0, 46.0, 38.0, 43.0, 51.0, 45.0, 49.0, 38.0, 38.0, 48.0, 42.0, 26.0, 34.0, 27.0, 20.0, 23.0, 22.0, 15.0, 19.0, 14.0, 17.0, 9.0, 6.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0], "bins": [-6.734375, -6.54443359375, -6.3544921875, -6.16455078125, -5.974609375, -5.78466796875, -5.5947265625, -5.40478515625, -5.21484375, -5.02490234375, -4.8349609375, -4.64501953125, -4.455078125, -4.26513671875, -4.0751953125, -3.88525390625, -3.6953125, -3.50537109375, -3.3154296875, -3.12548828125, -2.935546875, -2.74560546875, -2.5556640625, -2.36572265625, -2.17578125, -1.98583984375, -1.7958984375, -1.60595703125, -1.416015625, -1.22607421875, -1.0361328125, -0.84619140625, -0.65625, -0.46630859375, -0.2763671875, -0.08642578125, 0.103515625, 0.29345703125, 0.4833984375, 0.67333984375, 0.86328125, 1.05322265625, 1.2431640625, 1.43310546875, 1.623046875, 1.81298828125, 2.0029296875, 2.19287109375, 2.3828125, 2.57275390625, 2.7626953125, 2.95263671875, 3.142578125, 3.33251953125, 3.5224609375, 3.71240234375, 3.90234375, 4.09228515625, 4.2822265625, 4.47216796875, 4.662109375, 4.85205078125, 5.0419921875, 5.23193359375, 5.421875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 3.0, 14.0, 9.0, 20.0, 26.0, 49.0, 56.0, 77.0, 129.0, 180.0, 322.0, 478.0, 724.0, 1225.0, 2102.0, 3737.0, 7003.0, 13446.0, 28163.0, 64271.0, 175537.0, 405369.0, 208446.0, 72995.0, 31441.0, 15135.0, 7766.0, 4103.0, 2198.0, 1274.0, 858.0, 455.0, 301.0, 210.0, 139.0, 104.0, 55.0, 45.0, 34.0, 14.0, 17.0, 9.0, 7.0, 6.0, 2.0, 0.0, 4.0, 0.0, 2.0, 3.0], "bins": [-6.62890625, -6.44256591796875, -6.2562255859375, -6.06988525390625, -5.883544921875, -5.69720458984375, -5.5108642578125, -5.32452392578125, -5.13818359375, -4.95184326171875, -4.7655029296875, -4.57916259765625, -4.392822265625, -4.20648193359375, -4.0201416015625, -3.83380126953125, -3.6474609375, -3.46112060546875, -3.2747802734375, -3.08843994140625, -2.902099609375, -2.71575927734375, -2.5294189453125, -2.34307861328125, -2.15673828125, -1.97039794921875, -1.7840576171875, -1.59771728515625, -1.411376953125, -1.22503662109375, -1.0386962890625, -0.85235595703125, -0.666015625, -0.47967529296875, -0.2933349609375, -0.10699462890625, 0.079345703125, 0.26568603515625, 0.4520263671875, 0.63836669921875, 0.82470703125, 1.01104736328125, 1.1973876953125, 1.38372802734375, 1.570068359375, 1.75640869140625, 1.9427490234375, 2.12908935546875, 2.3154296875, 2.50177001953125, 2.6881103515625, 2.87445068359375, 3.060791015625, 3.24713134765625, 3.4334716796875, 3.61981201171875, 3.80615234375, 3.99249267578125, 4.1788330078125, 4.36517333984375, 4.551513671875, 4.73785400390625, 4.9241943359375, 5.11053466796875, 5.296875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 4.0, 4.0, 7.0, 4.0, 7.0, 11.0, 13.0, 16.0, 17.0, 21.0, 25.0, 24.0, 30.0, 28.0, 27.0, 34.0, 35.0, 55.0, 58.0, 85.0, 153.0, 1401.0, 381.0, 121.0, 86.0, 52.0, 47.0, 49.0, 25.0, 39.0, 24.0, 23.0, 19.0, 17.0, 22.0, 14.0, 15.0, 9.0, 8.0, 11.0, 8.0, 8.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.875, -17.29833984375, -16.7216796875, -16.14501953125, -15.568359375, -14.99169921875, -14.4150390625, -13.83837890625, -13.26171875, -12.68505859375, -12.1083984375, -11.53173828125, -10.955078125, -10.37841796875, -9.8017578125, -9.22509765625, -8.6484375, -8.07177734375, -7.4951171875, -6.91845703125, -6.341796875, -5.76513671875, -5.1884765625, -4.61181640625, -4.03515625, -3.45849609375, -2.8818359375, -2.30517578125, -1.728515625, -1.15185546875, -0.5751953125, 0.00146484375, 0.578125, 1.15478515625, 1.7314453125, 2.30810546875, 2.884765625, 3.46142578125, 4.0380859375, 4.61474609375, 5.19140625, 5.76806640625, 6.3447265625, 6.92138671875, 7.498046875, 8.07470703125, 8.6513671875, 9.22802734375, 9.8046875, 10.38134765625, 10.9580078125, 11.53466796875, 12.111328125, 12.68798828125, 13.2646484375, 13.84130859375, 14.41796875, 14.99462890625, 15.5712890625, 16.14794921875, 16.724609375, 17.30126953125, 17.8779296875, 18.45458984375, 19.03125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 8.0, 7.0, 13.0, 23.0, 18.0, 25.0, 43.0, 69.0, 76.0, 150.0, 213.0, 349.0, 725.0, 3456.0, 123108.0, 2992328.0, 21913.0, 1747.0, 534.0, 298.0, 204.0, 140.0, 78.0, 49.0, 38.0, 28.0, 20.0, 13.0, 11.0, 8.0, 5.0, 2.0, 4.0, 0.0, 1.0, 4.0], "bins": [-63.46875, -62.00341796875, -60.5380859375, -59.07275390625, -57.607421875, -56.14208984375, -54.6767578125, -53.21142578125, -51.74609375, -50.28076171875, -48.8154296875, -47.35009765625, -45.884765625, -44.41943359375, -42.9541015625, -41.48876953125, -40.0234375, -38.55810546875, -37.0927734375, -35.62744140625, -34.162109375, -32.69677734375, -31.2314453125, -29.76611328125, -28.30078125, -26.83544921875, -25.3701171875, -23.90478515625, -22.439453125, -20.97412109375, -19.5087890625, -18.04345703125, -16.578125, -15.11279296875, -13.6474609375, -12.18212890625, -10.716796875, -9.25146484375, -7.7861328125, -6.32080078125, -4.85546875, -3.39013671875, -1.9248046875, -0.45947265625, 1.005859375, 2.47119140625, 3.9365234375, 5.40185546875, 6.8671875, 8.33251953125, 9.7978515625, 11.26318359375, 12.728515625, 14.19384765625, 15.6591796875, 17.12451171875, 18.58984375, 20.05517578125, 21.5205078125, 22.98583984375, 24.451171875, 25.91650390625, 27.3818359375, 28.84716796875, 30.3125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 48.0, 841.0, 127.0], "bins": [-551.3821411132812, -542.5691528320312, -533.7561645507812, -524.9431762695312, -516.1301879882812, -507.31719970703125, -498.50421142578125, -489.69122314453125, -480.87823486328125, -472.06524658203125, -463.25225830078125, -454.43927001953125, -445.62628173828125, -436.81329345703125, -428.00030517578125, -419.18731689453125, -410.37432861328125, -401.56134033203125, -392.74835205078125, -383.93536376953125, -375.12237548828125, -366.30938720703125, -357.49639892578125, -348.68341064453125, -339.8704528808594, -331.0574645996094, -322.2444763183594, -313.4314880371094, -304.6184997558594, -295.8055114746094, -286.9925231933594, -278.1795349121094, -269.3665771484375, -260.5535888671875, -251.7406005859375, -242.9276123046875, -234.1146240234375, -225.3016357421875, -216.4886474609375, -207.6756591796875, -198.8626708984375, -190.0496826171875, -181.2366943359375, -172.4237060546875, -163.6107177734375, -154.7977294921875, -145.9847412109375, -137.1717529296875, -128.35877990722656, -119.54579162597656, -110.73280334472656, -101.91981506347656, -93.10682678222656, -84.29383850097656, -75.4808578491211, -66.6678695678711, -57.85487747192383, -49.04188919067383, -40.228904724121094, -31.415916442871094, -22.602928161621094, -13.789939880371094, -4.976955413818359, 3.8360328674316406, 12.64902114868164]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 8.0, 7.0, 9.0, 9.0, 13.0, 16.0, 21.0, 22.0, 20.0, 15.0, 28.0, 18.0, 32.0, 34.0, 37.0, 35.0, 40.0, 46.0, 36.0, 37.0, 47.0, 34.0, 32.0, 43.0, 34.0, 34.0, 29.0, 27.0, 34.0, 21.0, 30.0, 20.0, 20.0, 20.0, 13.0, 11.0, 12.0, 12.0, 7.0, 6.0, 12.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-48.853546142578125, -47.29233932495117, -45.73113250732422, -44.169921875, -42.60871505737305, -41.047508239746094, -39.48630142211914, -37.92509460449219, -36.36388397216797, -34.802677154541016, -33.24147033691406, -31.680261611938477, -30.11905288696289, -28.557846069335938, -26.996639251708984, -25.4354305267334, -23.874223709106445, -22.313016891479492, -20.751808166503906, -19.190601348876953, -17.629392623901367, -16.068185806274414, -14.506978034973145, -12.945770263671875, -11.384562492370605, -9.823354721069336, -8.262146949768066, -6.700939655303955, -5.1397318840026855, -3.578524112701416, -2.0173168182373047, -0.45610904693603516, 1.1050987243652344, 2.666306495666504, 4.227514266967773, 5.788721561431885, 7.349929332733154, 8.911136627197266, 10.472344398498535, 12.033552169799805, 13.594759941101074, 15.155967712402344, 16.717174530029297, 18.278383255004883, 19.839590072631836, 21.400798797607422, 22.962005615234375, 24.523212432861328, 26.084421157836914, 27.645627975463867, 29.206836700439453, 30.768043518066406, 32.32925033569336, 33.89046096801758, 35.45166778564453, 37.012874603271484, 38.57408142089844, 40.13528823852539, 41.696495056152344, 43.25770568847656, 44.818912506103516, 46.38011932373047, 47.94132614135742, 49.502532958984375, 51.063743591308594]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 0.0, 2.0, 5.0, 3.0, 9.0, 14.0, 14.0, 18.0, 17.0, 22.0, 26.0, 23.0, 27.0, 42.0, 32.0, 37.0, 39.0, 44.0, 43.0, 46.0, 50.0, 49.0, 39.0, 52.0, 34.0, 47.0, 33.0, 27.0, 37.0, 21.0, 24.0, 24.0, 23.0, 18.0, 10.0, 11.0, 5.0, 9.0, 4.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-7.07421875, -6.8712158203125, -6.668212890625, -6.4652099609375, -6.26220703125, -6.0592041015625, -5.856201171875, -5.6531982421875, -5.4501953125, -5.2471923828125, -5.044189453125, -4.8411865234375, -4.63818359375, -4.4351806640625, -4.232177734375, -4.0291748046875, -3.826171875, -3.6231689453125, -3.420166015625, -3.2171630859375, -3.01416015625, -2.8111572265625, -2.608154296875, -2.4051513671875, -2.2021484375, -1.9991455078125, -1.796142578125, -1.5931396484375, -1.39013671875, -1.1871337890625, -0.984130859375, -0.7811279296875, -0.578125, -0.3751220703125, -0.172119140625, 0.0308837890625, 0.23388671875, 0.4368896484375, 0.639892578125, 0.8428955078125, 1.0458984375, 1.2489013671875, 1.451904296875, 1.6549072265625, 1.85791015625, 2.0609130859375, 2.263916015625, 2.4669189453125, 2.669921875, 2.8729248046875, 3.075927734375, 3.2789306640625, 3.48193359375, 3.6849365234375, 3.887939453125, 4.0909423828125, 4.2939453125, 4.4969482421875, 4.699951171875, 4.9029541015625, 5.10595703125, 5.3089599609375, 5.511962890625, 5.7149658203125, 5.91796875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 7.0, 10.0, 9.0, 19.0, 23.0, 38.0, 58.0, 91.0, 117.0, 222.0, 327.0, 567.0, 929.0, 1626.0, 3043.0, 6836.0, 20956.0, 105475.0, 902560.0, 2570780.0, 491274.0, 62719.0, 14800.0, 5481.0, 2671.0, 1420.0, 836.0, 492.0, 309.0, 200.0, 118.0, 86.0, 52.0, 34.0, 20.0, 24.0, 9.0, 12.0, 10.0, 7.0, 1.0, 9.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.3984375, -11.9761962890625, -11.553955078125, -11.1317138671875, -10.70947265625, -10.2872314453125, -9.864990234375, -9.4427490234375, -9.0205078125, -8.5982666015625, -8.176025390625, -7.7537841796875, -7.33154296875, -6.9093017578125, -6.487060546875, -6.0648193359375, -5.642578125, -5.2203369140625, -4.798095703125, -4.3758544921875, -3.95361328125, -3.5313720703125, -3.109130859375, -2.6868896484375, -2.2646484375, -1.8424072265625, -1.420166015625, -0.9979248046875, -0.57568359375, -0.1534423828125, 0.268798828125, 0.6910400390625, 1.11328125, 1.5355224609375, 1.957763671875, 2.3800048828125, 2.80224609375, 3.2244873046875, 3.646728515625, 4.0689697265625, 4.4912109375, 4.9134521484375, 5.335693359375, 5.7579345703125, 6.18017578125, 6.6024169921875, 7.024658203125, 7.4468994140625, 7.869140625, 8.2913818359375, 8.713623046875, 9.1358642578125, 9.55810546875, 9.9803466796875, 10.402587890625, 10.8248291015625, 11.2470703125, 11.6693115234375, 12.091552734375, 12.5137939453125, 12.93603515625, 13.3582763671875, 13.780517578125, 14.2027587890625, 14.625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 6.0, 5.0, 6.0, 6.0, 15.0, 16.0, 25.0, 24.0, 52.0, 67.0, 125.0, 167.0, 280.0, 451.0, 669.0, 699.0, 548.0, 328.0, 204.0, 143.0, 77.0, 41.0, 27.0, 18.0, 18.0, 15.0, 10.0, 6.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.5625, -18.02001953125, -17.4775390625, -16.93505859375, -16.392578125, -15.85009765625, -15.3076171875, -14.76513671875, -14.22265625, -13.68017578125, -13.1376953125, -12.59521484375, -12.052734375, -11.51025390625, -10.9677734375, -10.42529296875, -9.8828125, -9.34033203125, -8.7978515625, -8.25537109375, -7.712890625, -7.17041015625, -6.6279296875, -6.08544921875, -5.54296875, -5.00048828125, -4.4580078125, -3.91552734375, -3.373046875, -2.83056640625, -2.2880859375, -1.74560546875, -1.203125, -0.66064453125, -0.1181640625, 0.42431640625, 0.966796875, 1.50927734375, 2.0517578125, 2.59423828125, 3.13671875, 3.67919921875, 4.2216796875, 4.76416015625, 5.306640625, 5.84912109375, 6.3916015625, 6.93408203125, 7.4765625, 8.01904296875, 8.5615234375, 9.10400390625, 9.646484375, 10.18896484375, 10.7314453125, 11.27392578125, 11.81640625, 12.35888671875, 12.9013671875, 13.44384765625, 13.986328125, 14.52880859375, 15.0712890625, 15.61376953125, 16.15625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 3.0, 4.0, 5.0, 8.0, 5.0, 5.0, 19.0, 37.0, 41.0, 75.0, 151.0, 321.0, 754.0, 2014.0, 7354.0, 53530.0, 3747822.0, 360809.0, 15579.0, 3571.0, 1181.0, 496.0, 224.0, 104.0, 70.0, 33.0, 23.0, 14.0, 7.0, 6.0, 5.0, 2.0, 6.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.46875, -48.64892578125, -46.8291015625, -45.00927734375, -43.189453125, -41.36962890625, -39.5498046875, -37.72998046875, -35.91015625, -34.09033203125, -32.2705078125, -30.45068359375, -28.630859375, -26.81103515625, -24.9912109375, -23.17138671875, -21.3515625, -19.53173828125, -17.7119140625, -15.89208984375, -14.072265625, -12.25244140625, -10.4326171875, -8.61279296875, -6.79296875, -4.97314453125, -3.1533203125, -1.33349609375, 0.486328125, 2.30615234375, 4.1259765625, 5.94580078125, 7.765625, 9.58544921875, 11.4052734375, 13.22509765625, 15.044921875, 16.86474609375, 18.6845703125, 20.50439453125, 22.32421875, 24.14404296875, 25.9638671875, 27.78369140625, 29.603515625, 31.42333984375, 33.2431640625, 35.06298828125, 36.8828125, 38.70263671875, 40.5224609375, 42.34228515625, 44.162109375, 45.98193359375, 47.8017578125, 49.62158203125, 51.44140625, 53.26123046875, 55.0810546875, 56.90087890625, 58.720703125, 60.54052734375, 62.3603515625, 64.18017578125, 66.0]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 10.0, 20.0, 62.0, 182.0, 336.0, 248.0, 100.0, 33.0, 9.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.34639739990234, -77.09847259521484, -71.85054779052734, -66.60263061523438, -61.354705810546875, -56.106781005859375, -50.858856201171875, -45.61093521118164, -40.36301040649414, -35.11508560180664, -29.867164611816406, -24.619239807128906, -19.37131690979004, -14.123394012451172, -8.875469207763672, -3.6275482177734375, 1.6203765869140625, 6.868299961090088, 12.116223335266113, 17.364147186279297, 22.612070083618164, 27.85999298095703, 33.10791778564453, 38.355838775634766, 43.603763580322266, 48.851688385009766, 54.099609375, 59.3475341796875, 64.595458984375, 69.8433837890625, 75.09130859375, 80.33922576904297, 85.587158203125, 90.8350830078125, 96.0830078125, 101.3309326171875, 106.57884979248047, 111.82677459716797, 117.07469940185547, 122.32261657714844, 127.57054138183594, 132.81846618652344, 138.06639099121094, 143.31431579589844, 148.56224060058594, 153.81015014648438, 159.05807495117188, 164.30599975585938, 169.55392456054688, 174.80184936523438, 180.04977416992188, 185.29769897460938, 190.54562377929688, 195.79354858398438, 201.04147338867188, 206.2893829345703, 211.53732299804688, 216.78524780273438, 222.03317260742188, 227.28109741210938, 232.52902221679688, 237.77694702148438, 243.02487182617188, 248.2727813720703, 253.5207061767578]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 6.0, 3.0, 4.0, 3.0, 7.0, 2.0, 8.0, 9.0, 5.0, 10.0, 12.0, 11.0, 10.0, 23.0, 20.0, 16.0, 19.0, 22.0, 24.0, 32.0, 33.0, 28.0, 36.0, 30.0, 35.0, 43.0, 33.0, 30.0, 40.0, 34.0, 26.0, 30.0, 23.0, 36.0, 31.0, 35.0, 34.0, 24.0, 19.0, 19.0, 15.0, 9.0, 13.0, 19.0, 17.0, 18.0, 8.0, 11.0, 9.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0], "bins": [-37.57875061035156, -36.38471984863281, -35.19068908691406, -33.99665832519531, -32.80262756347656, -31.608596801757812, -30.41456413269043, -29.22053337097168, -28.02650260925293, -26.83247184753418, -25.63844108581543, -24.44441032409668, -23.250377655029297, -22.056346893310547, -20.862316131591797, -19.668285369873047, -18.474254608154297, -17.280223846435547, -16.086193084716797, -14.89216136932373, -13.69813060760498, -12.50409984588623, -11.310068130493164, -10.116037368774414, -8.922006607055664, -7.727975845336914, -6.533944606781006, -5.339913368225098, -4.145882606506348, -2.9518518447875977, -1.7578206062316895, -0.5637893676757812, 0.6302413940429688, 1.8242723941802979, 3.018303394317627, 4.212334632873535, 5.406365394592285, 6.600396156311035, 7.794427394866943, 8.988458633422852, 10.182489395141602, 11.376520156860352, 12.570550918579102, 13.764582633972168, 14.958613395690918, 16.152645111083984, 17.346675872802734, 18.540706634521484, 19.734737396240234, 20.928768157958984, 22.122798919677734, 23.316829681396484, 24.510860443115234, 25.704891204833984, 26.898923873901367, 28.092954635620117, 29.286985397338867, 30.481016159057617, 31.675046920776367, 32.86907958984375, 34.0631103515625, 35.25714111328125, 36.451171875, 37.64520263671875, 38.8392333984375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 5.0, 4.0, 3.0, 4.0, 10.0, 10.0, 8.0, 8.0, 13.0, 24.0, 10.0, 27.0, 26.0, 35.0, 36.0, 32.0, 40.0, 47.0, 55.0, 34.0, 40.0, 50.0, 42.0, 36.0, 52.0, 36.0, 39.0, 27.0, 35.0, 32.0, 27.0, 21.0, 19.0, 23.0, 14.0, 13.0, 16.0, 16.0, 4.0, 7.0, 7.0, 3.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.375, -6.1685791015625, -5.962158203125, -5.7557373046875, -5.54931640625, -5.3428955078125, -5.136474609375, -4.9300537109375, -4.7236328125, -4.5172119140625, -4.310791015625, -4.1043701171875, -3.89794921875, -3.6915283203125, -3.485107421875, -3.2786865234375, -3.072265625, -2.8658447265625, -2.659423828125, -2.4530029296875, -2.24658203125, -2.0401611328125, -1.833740234375, -1.6273193359375, -1.4208984375, -1.2144775390625, -1.008056640625, -0.8016357421875, -0.59521484375, -0.3887939453125, -0.182373046875, 0.0240478515625, 0.23046875, 0.4368896484375, 0.643310546875, 0.8497314453125, 1.05615234375, 1.2625732421875, 1.468994140625, 1.6754150390625, 1.8818359375, 2.0882568359375, 2.294677734375, 2.5010986328125, 2.70751953125, 2.9139404296875, 3.120361328125, 3.3267822265625, 3.533203125, 3.7396240234375, 3.946044921875, 4.1524658203125, 4.35888671875, 4.5653076171875, 4.771728515625, 4.9781494140625, 5.1845703125, 5.3909912109375, 5.597412109375, 5.8038330078125, 6.01025390625, 6.2166748046875, 6.423095703125, 6.6295166015625, 6.8359375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 9.0, 9.0, 16.0, 25.0, 31.0, 39.0, 62.0, 98.0, 148.0, 219.0, 341.0, 515.0, 839.0, 1332.0, 2235.0, 3481.0, 5843.0, 9987.0, 16518.0, 28248.0, 48116.0, 80827.0, 131476.0, 191619.0, 192569.0, 133090.0, 81553.0, 48358.0, 28493.0, 16923.0, 9944.0, 5975.0, 3592.0, 2282.0, 1384.0, 858.0, 518.0, 335.0, 229.0, 135.0, 83.0, 66.0, 51.0, 34.0, 22.0, 11.0, 5.0, 11.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7578125, -0.7333755493164062, -0.7089385986328125, -0.6845016479492188, -0.660064697265625, -0.6356277465820312, -0.6111907958984375, -0.5867538452148438, -0.56231689453125, -0.5378799438476562, -0.5134429931640625, -0.48900604248046875, -0.464569091796875, -0.44013214111328125, -0.4156951904296875, -0.39125823974609375, -0.3668212890625, -0.34238433837890625, -0.3179473876953125, -0.29351043701171875, -0.269073486328125, -0.24463653564453125, -0.2201995849609375, -0.19576263427734375, -0.17132568359375, -0.14688873291015625, -0.1224517822265625, -0.09801483154296875, -0.073577880859375, -0.04914093017578125, -0.0247039794921875, -0.00026702880859375, 0.024169921875, 0.04860687255859375, 0.0730438232421875, 0.09748077392578125, 0.121917724609375, 0.14635467529296875, 0.1707916259765625, 0.19522857666015625, 0.21966552734375, 0.24410247802734375, 0.2685394287109375, 0.29297637939453125, 0.317413330078125, 0.34185028076171875, 0.3662872314453125, 0.39072418212890625, 0.4151611328125, 0.43959808349609375, 0.4640350341796875, 0.48847198486328125, 0.512908935546875, 0.5373458862304688, 0.5617828369140625, 0.5862197875976562, 0.61065673828125, 0.6350936889648438, 0.6595306396484375, 0.6839675903320312, 0.708404541015625, 0.7328414916992188, 0.7572784423828125, 0.7817153930664062, 0.80615234375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 6.0, 7.0, 11.0, 10.0, 16.0, 18.0, 19.0, 15.0, 24.0, 24.0, 36.0, 35.0, 43.0, 42.0, 28.0, 48.0, 45.0, 55.0, 1055.0, 43.0, 36.0, 43.0, 37.0, 44.0, 36.0, 27.0, 39.0, 28.0, 27.0, 21.0, 13.0, 15.0, 8.0, 13.0, 11.0, 13.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.29296875, -4.15185546875, -4.0107421875, -3.86962890625, -3.728515625, -3.58740234375, -3.4462890625, -3.30517578125, -3.1640625, -3.02294921875, -2.8818359375, -2.74072265625, -2.599609375, -2.45849609375, -2.3173828125, -2.17626953125, -2.03515625, -1.89404296875, -1.7529296875, -1.61181640625, -1.470703125, -1.32958984375, -1.1884765625, -1.04736328125, -0.90625, -0.76513671875, -0.6240234375, -0.48291015625, -0.341796875, -0.20068359375, -0.0595703125, 0.08154296875, 0.22265625, 0.36376953125, 0.5048828125, 0.64599609375, 0.787109375, 0.92822265625, 1.0693359375, 1.21044921875, 1.3515625, 1.49267578125, 1.6337890625, 1.77490234375, 1.916015625, 2.05712890625, 2.1982421875, 2.33935546875, 2.48046875, 2.62158203125, 2.7626953125, 2.90380859375, 3.044921875, 3.18603515625, 3.3271484375, 3.46826171875, 3.609375, 3.75048828125, 3.8916015625, 4.03271484375, 4.173828125, 4.31494140625, 4.4560546875, 4.59716796875, 4.73828125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 8.0, 15.0, 18.0, 39.0, 43.0, 81.0, 114.0, 161.0, 284.0, 397.0, 628.0, 937.0, 1477.0, 2131.0, 3487.0, 5251.0, 8044.0, 12445.0, 19322.0, 30527.0, 48548.0, 76974.0, 118374.0, 176523.0, 1203420.0, 136713.0, 91460.0, 57972.0, 36571.0, 22926.0, 14870.0, 9521.0, 6249.0, 3984.0, 2717.0, 1665.0, 1128.0, 731.0, 455.0, 307.0, 192.0, 145.0, 90.0, 64.0, 37.0, 28.0, 16.0, 16.0, 10.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.453125, -0.4385986328125, -0.424072265625, -0.4095458984375, -0.39501953125, -0.3804931640625, -0.365966796875, -0.3514404296875, -0.3369140625, -0.3223876953125, -0.307861328125, -0.2933349609375, -0.27880859375, -0.2642822265625, -0.249755859375, -0.2352294921875, -0.220703125, -0.2061767578125, -0.191650390625, -0.1771240234375, -0.16259765625, -0.1480712890625, -0.133544921875, -0.1190185546875, -0.1044921875, -0.0899658203125, -0.075439453125, -0.0609130859375, -0.04638671875, -0.0318603515625, -0.017333984375, -0.0028076171875, 0.01171875, 0.0262451171875, 0.040771484375, 0.0552978515625, 0.06982421875, 0.0843505859375, 0.098876953125, 0.1134033203125, 0.1279296875, 0.1424560546875, 0.156982421875, 0.1715087890625, 0.18603515625, 0.2005615234375, 0.215087890625, 0.2296142578125, 0.244140625, 0.2586669921875, 0.273193359375, 0.2877197265625, 0.30224609375, 0.3167724609375, 0.331298828125, 0.3458251953125, 0.3603515625, 0.3748779296875, 0.389404296875, 0.4039306640625, 0.41845703125, 0.4329833984375, 0.447509765625, 0.4620361328125, 0.4765625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 13.0, 15.0, 16.0, 48.0, 139.0, 441.0, 188.0, 60.0, 27.0, 14.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.07061767578125, -0.06857967376708984, -0.06654167175292969, -0.06450366973876953, -0.062465667724609375, -0.06042766571044922, -0.05838966369628906, -0.056351661682128906, -0.05431365966796875, -0.052275657653808594, -0.05023765563964844, -0.04819965362548828, -0.046161651611328125, -0.04412364959716797, -0.04208564758300781, -0.040047645568847656, -0.0380096435546875, -0.035971641540527344, -0.03393363952636719, -0.03189563751220703, -0.029857635498046875, -0.02781963348388672, -0.025781631469726562, -0.023743629455566406, -0.02170562744140625, -0.019667625427246094, -0.017629623413085938, -0.015591621398925781, -0.013553619384765625, -0.011515617370605469, -0.009477615356445312, -0.007439613342285156, -0.005401611328125, -0.0033636093139648438, -0.0013256072998046875, 0.0007123947143554688, 0.002750396728515625, 0.004788398742675781, 0.0068264007568359375, 0.008864402770996094, 0.01090240478515625, 0.012940406799316406, 0.014978408813476562, 0.01701641082763672, 0.019054412841796875, 0.02109241485595703, 0.023130416870117188, 0.025168418884277344, 0.0272064208984375, 0.029244422912597656, 0.03128242492675781, 0.03332042694091797, 0.035358428955078125, 0.03739643096923828, 0.03943443298339844, 0.041472434997558594, 0.04351043701171875, 0.045548439025878906, 0.04758644104003906, 0.04962444305419922, 0.051662445068359375, 0.05370044708251953, 0.05573844909667969, 0.057776451110839844, 0.059814453125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 3.0, 4.0, 6.0, 11.0, 21.0, 26.0, 38.0, 83.0, 160.0, 2977.0, 1043846.0, 974.0, 173.0, 71.0, 32.0, 18.0, 20.0, 16.0, 17.0, 8.0, 5.0, 6.0, 5.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1787109375, -1.1385955810546875, -1.098480224609375, -1.0583648681640625, -1.01824951171875, -0.9781341552734375, -0.938018798828125, -0.8979034423828125, -0.8577880859375, -0.8176727294921875, -0.777557373046875, -0.7374420166015625, -0.69732666015625, -0.6572113037109375, -0.617095947265625, -0.5769805908203125, -0.536865234375, -0.4967498779296875, -0.456634521484375, -0.4165191650390625, -0.37640380859375, -0.3362884521484375, -0.296173095703125, -0.2560577392578125, -0.2159423828125, -0.1758270263671875, -0.135711669921875, -0.0955963134765625, -0.05548095703125, -0.0153656005859375, 0.024749755859375, 0.0648651123046875, 0.10498046875, 0.1450958251953125, 0.185211181640625, 0.2253265380859375, 0.26544189453125, 0.3055572509765625, 0.345672607421875, 0.3857879638671875, 0.4259033203125, 0.4660186767578125, 0.506134033203125, 0.5462493896484375, 0.58636474609375, 0.6264801025390625, 0.666595458984375, 0.7067108154296875, 0.746826171875, 0.7869415283203125, 0.827056884765625, 0.8671722412109375, 0.90728759765625, 0.9474029541015625, 0.987518310546875, 1.0276336669921875, 1.0677490234375, 1.1078643798828125, 1.147979736328125, 1.1880950927734375, 1.22821044921875, 1.2683258056640625, 1.308441162109375, 1.3485565185546875, 1.388671875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 40.0, 720.0, 240.0, 12.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4045638144016266, -0.39690497517585754, -0.3892461061477661, -0.38158726692199707, -0.37392839789390564, -0.3662695586681366, -0.35861068964004517, -0.3509518504142761, -0.3432930111885071, -0.33563417196273804, -0.3279753029346466, -0.32031646370887756, -0.31265759468078613, -0.3049987554550171, -0.29733988642692566, -0.2896810472011566, -0.2820221781730652, -0.27436333894729614, -0.2667044699192047, -0.25904563069343567, -0.25138676166534424, -0.2437279224395752, -0.23606906831264496, -0.22841021418571472, -0.22075136005878448, -0.21309250593185425, -0.205433651804924, -0.19777479767799377, -0.19011595845222473, -0.1824570894241333, -0.17479825019836426, -0.16713939607143402, -0.15948054194450378, -0.15182168781757355, -0.1441628336906433, -0.13650397956371307, -0.12884512543678284, -0.1211862787604332, -0.11352743208408356, -0.10586857795715332, -0.09820971637964249, -0.09055086225271225, -0.08289201557636261, -0.07523316144943237, -0.06757430732250214, -0.0599154531955719, -0.05225660279393196, -0.04459775239229202, -0.036938898265361786, -0.0292800460010767, -0.02162119373679161, -0.013962341472506523, -0.0063034892082214355, 0.0013553649187088013, 0.00901421532034874, 0.016673065721988678, 0.024331919848918915, 0.03199077397584915, 0.03964962437748909, 0.04730847477912903, 0.054967328906059265, 0.0626261830329895, 0.07028503715991974, 0.07794388383626938, 0.08560273796319962]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 2.0, 3.0, 7.0, 8.0, 4.0, 16.0, 12.0, 12.0, 13.0, 15.0, 16.0, 21.0, 30.0, 29.0, 36.0, 32.0, 32.0, 46.0, 38.0, 42.0, 50.0, 34.0, 44.0, 43.0, 40.0, 34.0, 44.0, 27.0, 37.0, 30.0, 21.0, 34.0, 29.0, 24.0, 14.0, 22.0, 17.0, 5.0, 6.0, 7.0, 5.0, 7.0, 4.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023527026176452637, -0.022762481123209, -0.021997936069965363, -0.021233391016721725, -0.02046884596347809, -0.01970430091023445, -0.018939755856990814, -0.018175210803747177, -0.01741066575050354, -0.016646120697259903, -0.015881575644016266, -0.015117030590772629, -0.014352485537528992, -0.013587940484285355, -0.012823395431041718, -0.01205885037779808, -0.011294305324554443, -0.010529760271310806, -0.00976521521806717, -0.009000670164823532, -0.008236125111579895, -0.007471580058336258, -0.006707035005092621, -0.005942489951848984, -0.005177944898605347, -0.00441339984536171, -0.0036488547921180725, -0.0028843097388744354, -0.0021197646856307983, -0.0013552196323871613, -0.0005906745791435242, 0.00017387047410011292, 0.00093841552734375, 0.001702960580587387, 0.002467505633831024, 0.0032320506870746613, 0.003996595740318298, 0.004761140793561935, 0.0055256858468055725, 0.00629023090004921, 0.007054775953292847, 0.007819321006536484, 0.00858386605978012, 0.009348411113023758, 0.010112956166267395, 0.010877501219511032, 0.01164204627275467, 0.012406591325998306, 0.013171136379241943, 0.01393568143248558, 0.014700226485729218, 0.015464771538972855, 0.01622931659221649, 0.01699386164546013, 0.017758406698703766, 0.018522951751947403, 0.01928749680519104, 0.020052041858434677, 0.020816586911678314, 0.02158113196492195, 0.02234567701816559, 0.023110222071409225, 0.023874767124652863, 0.0246393121778965, 0.025403857231140137]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 5.0, 4.0, 3.0, 4.0, 10.0, 10.0, 9.0, 7.0, 13.0, 24.0, 10.0, 27.0, 26.0, 35.0, 36.0, 32.0, 40.0, 47.0, 55.0, 34.0, 40.0, 49.0, 43.0, 36.0, 52.0, 36.0, 39.0, 27.0, 35.0, 32.0, 27.0, 21.0, 19.0, 23.0, 14.0, 13.0, 16.0, 16.0, 4.0, 7.0, 7.0, 3.0, 7.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.375, -6.1685791015625, -5.962158203125, -5.7557373046875, -5.54931640625, -5.3428955078125, -5.136474609375, -4.9300537109375, -4.7236328125, -4.5172119140625, -4.310791015625, -4.1043701171875, -3.89794921875, -3.6915283203125, -3.485107421875, -3.2786865234375, -3.072265625, -2.8658447265625, -2.659423828125, -2.4530029296875, -2.24658203125, -2.0401611328125, -1.833740234375, -1.6273193359375, -1.4208984375, -1.2144775390625, -1.008056640625, -0.8016357421875, -0.59521484375, -0.3887939453125, -0.182373046875, 0.0240478515625, 0.23046875, 0.4368896484375, 0.643310546875, 0.8497314453125, 1.05615234375, 1.2625732421875, 1.468994140625, 1.6754150390625, 1.8818359375, 2.0882568359375, 2.294677734375, 2.5010986328125, 2.70751953125, 2.9139404296875, 3.120361328125, 3.3267822265625, 3.533203125, 3.7396240234375, 3.946044921875, 4.1524658203125, 4.35888671875, 4.5653076171875, 4.771728515625, 4.9781494140625, 5.1845703125, 5.3909912109375, 5.597412109375, 5.8038330078125, 6.01025390625, 6.2166748046875, 6.423095703125, 6.6295166015625, 6.8359375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 4.0, 6.0, 6.0, 9.0, 13.0, 12.0, 13.0, 29.0, 38.0, 31.0, 59.0, 60.0, 96.0, 158.0, 195.0, 406.0, 977.0, 3426.0, 13887.0, 67762.0, 543113.0, 352774.0, 50007.0, 10936.0, 2694.0, 817.0, 313.0, 212.0, 116.0, 88.0, 71.0, 48.0, 38.0, 29.0, 21.0, 22.0, 20.0, 9.0, 8.0, 8.0, 4.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.640625, -12.231689453125, -11.82275390625, -11.413818359375, -11.0048828125, -10.595947265625, -10.18701171875, -9.778076171875, -9.369140625, -8.960205078125, -8.55126953125, -8.142333984375, -7.7333984375, -7.324462890625, -6.91552734375, -6.506591796875, -6.09765625, -5.688720703125, -5.27978515625, -4.870849609375, -4.4619140625, -4.052978515625, -3.64404296875, -3.235107421875, -2.826171875, -2.417236328125, -2.00830078125, -1.599365234375, -1.1904296875, -0.781494140625, -0.37255859375, 0.036376953125, 0.4453125, 0.854248046875, 1.26318359375, 1.672119140625, 2.0810546875, 2.489990234375, 2.89892578125, 3.307861328125, 3.716796875, 4.125732421875, 4.53466796875, 4.943603515625, 5.3525390625, 5.761474609375, 6.17041015625, 6.579345703125, 6.98828125, 7.397216796875, 7.80615234375, 8.215087890625, 8.6240234375, 9.032958984375, 9.44189453125, 9.850830078125, 10.259765625, 10.668701171875, 11.07763671875, 11.486572265625, 11.8955078125, 12.304443359375, 12.71337890625, 13.122314453125, 13.53125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 6.0, 8.0, 10.0, 13.0, 18.0, 10.0, 19.0, 21.0, 28.0, 24.0, 29.0, 34.0, 28.0, 37.0, 42.0, 46.0, 61.0, 97.0, 345.0, 1540.0, 149.0, 57.0, 71.0, 52.0, 32.0, 30.0, 46.0, 36.0, 23.0, 16.0, 17.0, 15.0, 20.0, 9.0, 10.0, 13.0, 6.0, 6.0, 6.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-21.15625, -20.537109375, -19.91796875, -19.298828125, -18.6796875, -18.060546875, -17.44140625, -16.822265625, -16.203125, -15.583984375, -14.96484375, -14.345703125, -13.7265625, -13.107421875, -12.48828125, -11.869140625, -11.25, -10.630859375, -10.01171875, -9.392578125, -8.7734375, -8.154296875, -7.53515625, -6.916015625, -6.296875, -5.677734375, -5.05859375, -4.439453125, -3.8203125, -3.201171875, -2.58203125, -1.962890625, -1.34375, -0.724609375, -0.10546875, 0.513671875, 1.1328125, 1.751953125, 2.37109375, 2.990234375, 3.609375, 4.228515625, 4.84765625, 5.466796875, 6.0859375, 6.705078125, 7.32421875, 7.943359375, 8.5625, 9.181640625, 9.80078125, 10.419921875, 11.0390625, 11.658203125, 12.27734375, 12.896484375, 13.515625, 14.134765625, 14.75390625, 15.373046875, 15.9921875, 16.611328125, 17.23046875, 17.849609375, 18.46875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 10.0, 5.0, 9.0, 6.0, 11.0, 13.0, 14.0, 14.0, 23.0, 19.0, 23.0, 39.0, 56.0, 84.0, 61.0, 139.0, 194.0, 357.0, 848.0, 6936.0, 2121656.0, 1007680.0, 5616.0, 857.0, 341.0, 165.0, 128.0, 90.0, 66.0, 64.0, 33.0, 30.0, 21.0, 21.0, 20.0, 16.0, 16.0, 7.0, 6.0, 7.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.5625, -41.14208984375, -39.7216796875, -38.30126953125, -36.880859375, -35.46044921875, -34.0400390625, -32.61962890625, -31.19921875, -29.77880859375, -28.3583984375, -26.93798828125, -25.517578125, -24.09716796875, -22.6767578125, -21.25634765625, -19.8359375, -18.41552734375, -16.9951171875, -15.57470703125, -14.154296875, -12.73388671875, -11.3134765625, -9.89306640625, -8.47265625, -7.05224609375, -5.6318359375, -4.21142578125, -2.791015625, -1.37060546875, 0.0498046875, 1.47021484375, 2.890625, 4.31103515625, 5.7314453125, 7.15185546875, 8.572265625, 9.99267578125, 11.4130859375, 12.83349609375, 14.25390625, 15.67431640625, 17.0947265625, 18.51513671875, 19.935546875, 21.35595703125, 22.7763671875, 24.19677734375, 25.6171875, 27.03759765625, 28.4580078125, 29.87841796875, 31.298828125, 32.71923828125, 34.1396484375, 35.56005859375, 36.98046875, 38.40087890625, 39.8212890625, 41.24169921875, 42.662109375, 44.08251953125, 45.5029296875, 46.92333984375, 48.34375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 25.0, 331.0, 533.0, 117.0, 9.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-239.1573486328125, -234.90525817871094, -230.6531524658203, -226.40106201171875, -222.1489715576172, -217.89686584472656, -213.644775390625, -209.39268493652344, -205.1405792236328, -200.88848876953125, -196.63638305664062, -192.38429260253906, -188.1322021484375, -183.88009643554688, -179.6280059814453, -175.37591552734375, -171.12380981445312, -166.87171936035156, -162.61961364746094, -158.36752319335938, -154.1154327392578, -149.8633270263672, -145.61123657226562, -141.35914611816406, -137.1070556640625, -132.85496520996094, -128.6028594970703, -124.35076904296875, -120.09867095947266, -115.84657287597656, -111.594482421875, -107.3423843383789, -103.09027099609375, -98.83817291259766, -94.5860824584961, -90.333984375, -86.0818862915039, -81.82978820800781, -77.57769775390625, -73.32559967041016, -69.0735092163086, -64.8214111328125, -60.56931686401367, -56.317222595214844, -52.06512451171875, -47.81303024291992, -43.560935974121094, -39.308837890625, -35.05674362182617, -30.80464744567871, -26.55255126953125, -22.300457000732422, -18.04836082458496, -13.7962646484375, -9.544170379638672, -5.292074203491211, -1.03997802734375, 3.2121176719665527, 7.4642133712768555, 11.71630859375, 15.968404769897461, 20.220500946044922, 24.47259521484375, 28.72469139099121, 32.97678756713867]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 6.0, 4.0, 10.0, 11.0, 8.0, 9.0, 17.0, 18.0, 21.0, 28.0, 27.0, 39.0, 31.0, 41.0, 39.0, 43.0, 51.0, 41.0, 44.0, 56.0, 61.0, 53.0, 54.0, 41.0, 31.0, 37.0, 25.0, 30.0, 30.0, 15.0, 19.0, 10.0, 12.0, 13.0, 14.0, 9.0, 4.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.69481658935547, -46.60063171386719, -44.506446838378906, -42.41226577758789, -40.31808090209961, -38.22389602661133, -36.12971496582031, -34.03553009033203, -31.94134521484375, -29.84716033935547, -27.75297737121582, -25.658794403076172, -23.56460952758789, -21.47042465209961, -19.37624168395996, -17.282058715820312, -15.187873840332031, -13.093689918518066, -10.999505996704102, -8.905322074890137, -6.811138153076172, -4.716954231262207, -2.622770309448242, -0.5285863876342773, 1.5655975341796875, 3.6597814559936523, 5.753965377807617, 7.848149299621582, 9.942333221435547, 12.036517143249512, 14.130701065063477, 16.224884033203125, 18.319076538085938, 20.41326141357422, 22.507444381713867, 24.601627349853516, 26.695812225341797, 28.789997100830078, 30.884180068969727, 32.978363037109375, 35.072547912597656, 37.16673278808594, 39.26091766357422, 41.355098724365234, 43.449283599853516, 45.5434684753418, 47.63764953613281, 49.731834411621094, 51.826019287109375, 53.920204162597656, 56.01438903808594, 58.10857009887695, 60.202754974365234, 62.296939849853516, 64.39112091064453, 66.48530578613281, 68.5794906616211, 70.67367553710938, 72.76786041259766, 74.86204528808594, 76.95622253417969, 79.05040740966797, 81.14459228515625, 83.23877716064453, 85.33296203613281]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 8.0, 1.0, 5.0, 3.0, 6.0, 6.0, 10.0, 18.0, 13.0, 13.0, 17.0, 17.0, 30.0, 18.0, 30.0, 32.0, 36.0, 36.0, 53.0, 41.0, 47.0, 41.0, 51.0, 36.0, 43.0, 35.0, 38.0, 36.0, 41.0, 35.0, 32.0, 20.0, 24.0, 19.0, 14.0, 21.0, 18.0, 13.0, 13.0, 7.0, 8.0, 7.0, 3.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.13671875, -6.92486572265625, -6.7130126953125, -6.50115966796875, -6.289306640625, -6.07745361328125, -5.8656005859375, -5.65374755859375, -5.44189453125, -5.23004150390625, -5.0181884765625, -4.80633544921875, -4.594482421875, -4.38262939453125, -4.1707763671875, -3.95892333984375, -3.7470703125, -3.53521728515625, -3.3233642578125, -3.11151123046875, -2.899658203125, -2.68780517578125, -2.4759521484375, -2.26409912109375, -2.05224609375, -1.84039306640625, -1.6285400390625, -1.41668701171875, -1.204833984375, -0.99298095703125, -0.7811279296875, -0.56927490234375, -0.357421875, -0.14556884765625, 0.0662841796875, 0.27813720703125, 0.489990234375, 0.70184326171875, 0.9136962890625, 1.12554931640625, 1.33740234375, 1.54925537109375, 1.7611083984375, 1.97296142578125, 2.184814453125, 2.39666748046875, 2.6085205078125, 2.82037353515625, 3.0322265625, 3.24407958984375, 3.4559326171875, 3.66778564453125, 3.879638671875, 4.09149169921875, 4.3033447265625, 4.51519775390625, 4.72705078125, 4.93890380859375, 5.1507568359375, 5.36260986328125, 5.574462890625, 5.78631591796875, 5.9981689453125, 6.21002197265625, 6.421875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 9.0, 7.0, 6.0, 17.0, 15.0, 28.0, 26.0, 29.0, 49.0, 82.0, 87.0, 108.0, 190.0, 211.0, 320.0, 382.0, 609.0, 855.0, 1372.0, 2119.0, 3556.0, 6219.0, 12506.0, 33851.0, 151680.0, 997155.0, 2302295.0, 543787.0, 89606.0, 23829.0, 9841.0, 5130.0, 2852.0, 1745.0, 1156.0, 760.0, 500.0, 330.0, 228.0, 180.0, 158.0, 94.0, 79.0, 51.0, 43.0, 39.0, 25.0, 19.0, 17.0, 8.0, 4.0, 9.0, 7.0, 1.0, 3.0, 4.0], "bins": [-13.5859375, -13.1903076171875, -12.794677734375, -12.3990478515625, -12.00341796875, -11.6077880859375, -11.212158203125, -10.8165283203125, -10.4208984375, -10.0252685546875, -9.629638671875, -9.2340087890625, -8.83837890625, -8.4427490234375, -8.047119140625, -7.6514892578125, -7.255859375, -6.8602294921875, -6.464599609375, -6.0689697265625, -5.67333984375, -5.2777099609375, -4.882080078125, -4.4864501953125, -4.0908203125, -3.6951904296875, -3.299560546875, -2.9039306640625, -2.50830078125, -2.1126708984375, -1.717041015625, -1.3214111328125, -0.92578125, -0.5301513671875, -0.134521484375, 0.2611083984375, 0.65673828125, 1.0523681640625, 1.447998046875, 1.8436279296875, 2.2392578125, 2.6348876953125, 3.030517578125, 3.4261474609375, 3.82177734375, 4.2174072265625, 4.613037109375, 5.0086669921875, 5.404296875, 5.7999267578125, 6.195556640625, 6.5911865234375, 6.98681640625, 7.3824462890625, 7.778076171875, 8.1737060546875, 8.5693359375, 8.9649658203125, 9.360595703125, 9.7562255859375, 10.15185546875, 10.5474853515625, 10.943115234375, 11.3387451171875, 11.734375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 0.0, 6.0, 8.0, 10.0, 11.0, 14.0, 18.0, 23.0, 52.0, 59.0, 84.0, 119.0, 218.0, 308.0, 519.0, 648.0, 703.0, 492.0, 259.0, 187.0, 98.0, 70.0, 45.0, 32.0, 24.0, 18.0, 15.0, 4.0, 7.0, 7.0, 2.0, 5.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-18.046875, -17.529296875, -17.01171875, -16.494140625, -15.9765625, -15.458984375, -14.94140625, -14.423828125, -13.90625, -13.388671875, -12.87109375, -12.353515625, -11.8359375, -11.318359375, -10.80078125, -10.283203125, -9.765625, -9.248046875, -8.73046875, -8.212890625, -7.6953125, -7.177734375, -6.66015625, -6.142578125, -5.625, -5.107421875, -4.58984375, -4.072265625, -3.5546875, -3.037109375, -2.51953125, -2.001953125, -1.484375, -0.966796875, -0.44921875, 0.068359375, 0.5859375, 1.103515625, 1.62109375, 2.138671875, 2.65625, 3.173828125, 3.69140625, 4.208984375, 4.7265625, 5.244140625, 5.76171875, 6.279296875, 6.796875, 7.314453125, 7.83203125, 8.349609375, 8.8671875, 9.384765625, 9.90234375, 10.419921875, 10.9375, 11.455078125, 11.97265625, 12.490234375, 13.0078125, 13.525390625, 14.04296875, 14.560546875, 15.078125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 5.0, 6.0, 6.0, 15.0, 17.0, 37.0, 49.0, 69.0, 132.0, 214.0, 355.0, 714.0, 1272.0, 3022.0, 7725.0, 28297.0, 282565.0, 3575966.0, 253451.0, 27117.0, 7482.0, 2866.0, 1334.0, 623.0, 386.0, 216.0, 122.0, 79.0, 49.0, 20.0, 28.0, 14.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.9375, -32.82421875, -31.7109375, -30.59765625, -29.484375, -28.37109375, -27.2578125, -26.14453125, -25.03125, -23.91796875, -22.8046875, -21.69140625, -20.578125, -19.46484375, -18.3515625, -17.23828125, -16.125, -15.01171875, -13.8984375, -12.78515625, -11.671875, -10.55859375, -9.4453125, -8.33203125, -7.21875, -6.10546875, -4.9921875, -3.87890625, -2.765625, -1.65234375, -0.5390625, 0.57421875, 1.6875, 2.80078125, 3.9140625, 5.02734375, 6.140625, 7.25390625, 8.3671875, 9.48046875, 10.59375, 11.70703125, 12.8203125, 13.93359375, 15.046875, 16.16015625, 17.2734375, 18.38671875, 19.5, 20.61328125, 21.7265625, 22.83984375, 23.953125, 25.06640625, 26.1796875, 27.29296875, 28.40625, 29.51953125, 30.6328125, 31.74609375, 32.859375, 33.97265625, 35.0859375, 36.19921875, 37.3125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 10.0, 29.0, 59.0, 121.0, 196.0, 234.0, 165.0, 100.0, 45.0, 24.0, 13.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.83023071289062, -130.26339721679688, -126.6965560913086, -123.12972259521484, -119.56288146972656, -115.99604797363281, -112.42921447753906, -108.86237335205078, -105.29553985595703, -101.72870635986328, -98.161865234375, -94.59503173828125, -91.02819061279297, -87.46135711669922, -83.89451599121094, -80.32768249511719, -76.76084899902344, -73.19401550292969, -69.6271743774414, -66.06034088134766, -62.49350357055664, -58.926666259765625, -55.35982894897461, -51.792991638183594, -48.22615051269531, -44.6593132019043, -41.09247589111328, -37.52564239501953, -33.958805084228516, -30.3919677734375, -26.825130462646484, -23.2582950592041, -19.69145965576172, -16.124622344970703, -12.55778694152832, -8.990949630737305, -5.4241132736206055, -1.8572769165039062, 1.7095603942871094, 5.276395797729492, 8.843233108520508, 12.410069465637207, 15.976905822753906, 19.543743133544922, 23.110580444335938, 26.67741584777832, 30.244253158569336, 33.81108856201172, 37.377925872802734, 40.94476318359375, 44.511600494384766, 48.07843780517578, 51.64527130126953, 55.21210861206055, 58.77894592285156, 62.34577941894531, 65.9126205444336, 69.47945404052734, 73.04629516601562, 76.61312866210938, 80.17996978759766, 83.7468032836914, 87.31364440917969, 90.88047790527344, 94.44731140136719]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 3.0, 4.0, 10.0, 3.0, 9.0, 7.0, 14.0, 9.0, 13.0, 23.0, 19.0, 14.0, 22.0, 24.0, 20.0, 25.0, 32.0, 23.0, 41.0, 40.0, 38.0, 40.0, 46.0, 32.0, 46.0, 45.0, 38.0, 32.0, 42.0, 23.0, 30.0, 17.0, 31.0, 24.0, 24.0, 26.0, 22.0, 15.0, 10.0, 10.0, 4.0, 9.0, 13.0, 7.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-39.722686767578125, -38.48804473876953, -37.25340270996094, -36.01875686645508, -34.784114837646484, -33.54947280883789, -32.31482696533203, -31.080184936523438, -29.845542907714844, -28.61090087890625, -27.376256942749023, -26.141613006591797, -24.906970977783203, -23.67232894897461, -22.437685012817383, -21.203041076660156, -19.968399047851562, -18.73375701904297, -17.499113082885742, -16.264469146728516, -15.029827117919922, -13.795184135437012, -12.560541152954102, -11.325898170471191, -10.091255187988281, -8.856612205505371, -7.621969223022461, -6.387326240539551, -5.152683258056641, -3.9180402755737305, -2.6833972930908203, -1.4487543106079102, -0.214111328125, 1.0205316543579102, 2.2551746368408203, 3.4898176193237305, 4.724460601806641, 5.959103584289551, 7.193746566772461, 8.428389549255371, 9.663032531738281, 10.897675514221191, 12.132318496704102, 13.366961479187012, 14.601604461669922, 15.836247444152832, 17.070890426635742, 18.30553436279297, 19.540176391601562, 20.774818420410156, 22.009462356567383, 23.24410629272461, 24.478748321533203, 25.713390350341797, 26.948034286499023, 28.18267822265625, 29.417320251464844, 30.651962280273438, 31.886606216430664, 33.12125015258789, 34.355892181396484, 35.59053421020508, 36.82518005371094, 38.05982208251953, 39.294464111328125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 5.0, 4.0, 3.0, 3.0, 2.0, 4.0, 8.0, 4.0, 5.0, 14.0, 11.0, 7.0, 24.0, 24.0, 23.0, 17.0, 27.0, 22.0, 34.0, 32.0, 24.0, 38.0, 27.0, 39.0, 41.0, 47.0, 40.0, 46.0, 35.0, 28.0, 33.0, 42.0, 34.0, 23.0, 15.0, 23.0, 22.0, 19.0, 18.0, 21.0, 15.0, 24.0, 15.0, 14.0, 6.0, 5.0, 14.0, 5.0, 7.0, 11.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.078125, -5.8751220703125, -5.672119140625, -5.4691162109375, -5.26611328125, -5.0631103515625, -4.860107421875, -4.6571044921875, -4.4541015625, -4.2510986328125, -4.048095703125, -3.8450927734375, -3.64208984375, -3.4390869140625, -3.236083984375, -3.0330810546875, -2.830078125, -2.6270751953125, -2.424072265625, -2.2210693359375, -2.01806640625, -1.8150634765625, -1.612060546875, -1.4090576171875, -1.2060546875, -1.0030517578125, -0.800048828125, -0.5970458984375, -0.39404296875, -0.1910400390625, 0.011962890625, 0.2149658203125, 0.41796875, 0.6209716796875, 0.823974609375, 1.0269775390625, 1.22998046875, 1.4329833984375, 1.635986328125, 1.8389892578125, 2.0419921875, 2.2449951171875, 2.447998046875, 2.6510009765625, 2.85400390625, 3.0570068359375, 3.260009765625, 3.4630126953125, 3.666015625, 3.8690185546875, 4.072021484375, 4.2750244140625, 4.47802734375, 4.6810302734375, 4.884033203125, 5.0870361328125, 5.2900390625, 5.4930419921875, 5.696044921875, 5.8990478515625, 6.10205078125, 6.3050537109375, 6.508056640625, 6.7110595703125, 6.9140625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 2.0, 6.0, 9.0, 13.0, 25.0, 34.0, 56.0, 63.0, 101.0, 142.0, 229.0, 286.0, 476.0, 725.0, 1053.0, 1577.0, 2522.0, 3869.0, 5892.0, 9153.0, 14729.0, 24007.0, 40120.0, 68397.0, 115122.0, 182344.0, 209642.0, 146072.0, 88147.0, 51893.0, 30632.0, 18549.0, 11410.0, 7337.0, 4809.0, 3095.0, 2022.0, 1375.0, 859.0, 597.0, 384.0, 253.0, 175.0, 115.0, 76.0, 50.0, 40.0, 27.0, 16.0, 16.0, 7.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.80859375, -0.7835159301757812, -0.7584381103515625, -0.7333602905273438, -0.708282470703125, -0.6832046508789062, -0.6581268310546875, -0.6330490112304688, -0.60797119140625, -0.5828933715820312, -0.5578155517578125, -0.5327377319335938, -0.507659912109375, -0.48258209228515625, -0.4575042724609375, -0.43242645263671875, -0.4073486328125, -0.38227081298828125, -0.3571929931640625, -0.33211517333984375, -0.307037353515625, -0.28195953369140625, -0.2568817138671875, -0.23180389404296875, -0.20672607421875, -0.18164825439453125, -0.1565704345703125, -0.13149261474609375, -0.106414794921875, -0.08133697509765625, -0.0562591552734375, -0.03118133544921875, -0.006103515625, 0.01897430419921875, 0.0440521240234375, 0.06912994384765625, 0.094207763671875, 0.11928558349609375, 0.1443634033203125, 0.16944122314453125, 0.19451904296875, 0.21959686279296875, 0.2446746826171875, 0.26975250244140625, 0.294830322265625, 0.31990814208984375, 0.3449859619140625, 0.37006378173828125, 0.3951416015625, 0.42021942138671875, 0.4452972412109375, 0.47037506103515625, 0.495452880859375, 0.5205307006835938, 0.5456085205078125, 0.5706863403320312, 0.59576416015625, 0.6208419799804688, 0.6459197998046875, 0.6709976196289062, 0.696075439453125, 0.7211532592773438, 0.7462310791015625, 0.7713088989257812, 0.79638671875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 3.0, 8.0, 6.0, 6.0, 10.0, 7.0, 20.0, 10.0, 19.0, 22.0, 25.0, 32.0, 29.0, 20.0, 38.0, 33.0, 40.0, 36.0, 40.0, 46.0, 1073.0, 43.0, 57.0, 46.0, 37.0, 28.0, 31.0, 27.0, 34.0, 19.0, 27.0, 18.0, 28.0, 15.0, 16.0, 13.0, 16.0, 6.0, 5.0, 7.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0], "bins": [-4.8203125, -4.676513671875, -4.53271484375, -4.388916015625, -4.2451171875, -4.101318359375, -3.95751953125, -3.813720703125, -3.669921875, -3.526123046875, -3.38232421875, -3.238525390625, -3.0947265625, -2.950927734375, -2.80712890625, -2.663330078125, -2.51953125, -2.375732421875, -2.23193359375, -2.088134765625, -1.9443359375, -1.800537109375, -1.65673828125, -1.512939453125, -1.369140625, -1.225341796875, -1.08154296875, -0.937744140625, -0.7939453125, -0.650146484375, -0.50634765625, -0.362548828125, -0.21875, -0.074951171875, 0.06884765625, 0.212646484375, 0.3564453125, 0.500244140625, 0.64404296875, 0.787841796875, 0.931640625, 1.075439453125, 1.21923828125, 1.363037109375, 1.5068359375, 1.650634765625, 1.79443359375, 1.938232421875, 2.08203125, 2.225830078125, 2.36962890625, 2.513427734375, 2.6572265625, 2.801025390625, 2.94482421875, 3.088623046875, 3.232421875, 3.376220703125, 3.52001953125, 3.663818359375, 3.8076171875, 3.951416015625, 4.09521484375, 4.239013671875, 4.3828125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 12.0, 19.0, 32.0, 46.0, 72.0, 96.0, 139.0, 230.0, 332.0, 458.0, 680.0, 1007.0, 1634.0, 2283.0, 3452.0, 5124.0, 7802.0, 12004.0, 18593.0, 29037.0, 46586.0, 75402.0, 119507.0, 175190.0, 1220083.0, 136765.0, 88683.0, 55096.0, 34167.0, 21564.0, 13988.0, 9156.0, 5915.0, 3891.0, 2721.0, 1719.0, 1154.0, 824.0, 530.0, 362.0, 261.0, 162.0, 120.0, 71.0, 57.0, 35.0, 16.0, 19.0, 8.0, 7.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0], "bins": [-0.501953125, -0.48635101318359375, -0.4707489013671875, -0.45514678955078125, -0.439544677734375, -0.42394256591796875, -0.4083404541015625, -0.39273834228515625, -0.37713623046875, -0.36153411865234375, -0.3459320068359375, -0.33032989501953125, -0.314727783203125, -0.29912567138671875, -0.2835235595703125, -0.26792144775390625, -0.2523193359375, -0.23671722412109375, -0.2211151123046875, -0.20551300048828125, -0.189910888671875, -0.17430877685546875, -0.1587066650390625, -0.14310455322265625, -0.12750244140625, -0.11190032958984375, -0.0962982177734375, -0.08069610595703125, -0.065093994140625, -0.04949188232421875, -0.0338897705078125, -0.01828765869140625, -0.002685546875, 0.01291656494140625, 0.0285186767578125, 0.04412078857421875, 0.059722900390625, 0.07532501220703125, 0.0909271240234375, 0.10652923583984375, 0.12213134765625, 0.13773345947265625, 0.1533355712890625, 0.16893768310546875, 0.184539794921875, 0.20014190673828125, 0.2157440185546875, 0.23134613037109375, 0.2469482421875, 0.26255035400390625, 0.2781524658203125, 0.29375457763671875, 0.309356689453125, 0.32495880126953125, 0.3405609130859375, 0.35616302490234375, 0.37176513671875, 0.38736724853515625, 0.4029693603515625, 0.41857147216796875, 0.434173583984375, 0.44977569580078125, 0.4653778076171875, 0.48097991943359375, 0.49658203125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 7.0, 10.0, 9.0, 9.0, 11.0, 14.0, 21.0, 25.0, 22.0, 33.0, 50.0, 50.0, 56.0, 45.0, 78.0, 98.0, 58.0, 61.0, 50.0, 43.0, 47.0, 41.0, 30.0, 23.0, 18.0, 14.0, 8.0, 10.0, 11.0, 6.0, 6.0, 3.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0159912109375, -0.015482664108276367, -0.014974117279052734, -0.014465570449829102, -0.013957023620605469, -0.013448476791381836, -0.012939929962158203, -0.01243138313293457, -0.011922836303710938, -0.011414289474487305, -0.010905742645263672, -0.010397195816040039, -0.009888648986816406, -0.009380102157592773, -0.00887155532836914, -0.008363008499145508, -0.007854461669921875, -0.007345914840698242, -0.006837368011474609, -0.0063288211822509766, -0.005820274353027344, -0.005311727523803711, -0.004803180694580078, -0.004294633865356445, -0.0037860870361328125, -0.0032775402069091797, -0.002768993377685547, -0.002260446548461914, -0.0017518997192382812, -0.0012433528900146484, -0.0007348060607910156, -0.0002262592315673828, 0.00028228759765625, 0.0007908344268798828, 0.0012993812561035156, 0.0018079280853271484, 0.0023164749145507812, 0.002825021743774414, 0.003333568572998047, 0.0038421154022216797, 0.0043506622314453125, 0.004859209060668945, 0.005367755889892578, 0.005876302719116211, 0.006384849548339844, 0.0068933963775634766, 0.007401943206787109, 0.007910490036010742, 0.008419036865234375, 0.008927583694458008, 0.00943613052368164, 0.009944677352905273, 0.010453224182128906, 0.010961771011352539, 0.011470317840576172, 0.011978864669799805, 0.012487411499023438, 0.01299595832824707, 0.013504505157470703, 0.014013051986694336, 0.014521598815917969, 0.015030145645141602, 0.015538692474365234, 0.016047239303588867, 0.0165557861328125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 4.0, 4.0, 7.0, 8.0, 9.0, 10.0, 22.0, 18.0, 21.0, 35.0, 37.0, 52.0, 79.0, 107.0, 187.0, 255.0, 516.0, 5494.0, 1034362.0, 5912.0, 537.0, 281.0, 176.0, 101.0, 69.0, 44.0, 42.0, 38.0, 22.0, 23.0, 11.0, 19.0, 11.0, 18.0, 8.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.366943359375, -0.3556556701660156, -0.34436798095703125, -0.3330802917480469, -0.3217926025390625, -0.3105049133300781, -0.29921722412109375, -0.2879295349121094, -0.276641845703125, -0.2653541564941406, -0.25406646728515625, -0.24277877807617188, -0.2314910888671875, -0.22020339965820312, -0.20891571044921875, -0.19762802124023438, -0.18634033203125, -0.17505264282226562, -0.16376495361328125, -0.15247726440429688, -0.1411895751953125, -0.12990188598632812, -0.11861419677734375, -0.10732650756835938, -0.096038818359375, -0.08475112915039062, -0.07346343994140625, -0.062175750732421875, -0.0508880615234375, -0.039600372314453125, -0.02831268310546875, -0.017024993896484375, -0.0057373046875, 0.005550384521484375, 0.01683807373046875, 0.028125762939453125, 0.0394134521484375, 0.050701141357421875, 0.06198883056640625, 0.07327651977539062, 0.084564208984375, 0.09585189819335938, 0.10713958740234375, 0.11842727661132812, 0.1297149658203125, 0.14100265502929688, 0.15229034423828125, 0.16357803344726562, 0.17486572265625, 0.18615341186523438, 0.19744110107421875, 0.20872879028320312, 0.2200164794921875, 0.23130416870117188, 0.24259185791015625, 0.2538795471191406, 0.265167236328125, 0.2764549255371094, 0.28774261474609375, 0.2990303039550781, 0.3103179931640625, 0.3216056823730469, 0.33289337158203125, 0.3441810607910156, 0.35546875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 16.0, 793.0, 203.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034030091017484665, -0.025136243551969528, -0.01624239608645439, -0.007348548620939255, 0.001545298844575882, 0.010439146310091019, 0.019332993775606155, 0.028226841241121292, 0.03712068870663643, 0.046014536172151566, 0.0549083836376667, 0.06380222737789154, 0.07269607484340668, 0.08158992230892181, 0.09048376977443695, 0.09937761723995209, 0.10827146470546722, 0.11716531217098236, 0.1260591596364975, 0.13495300710201263, 0.14384685456752777, 0.1527407020330429, 0.16163454949855804, 0.17052839696407318, 0.17942224442958832, 0.18831609189510345, 0.1972099393606186, 0.20610378682613373, 0.21499763429164886, 0.223891481757164, 0.23278532922267914, 0.24167917668819427, 0.2505730390548706, 0.25946688652038574, 0.2683607339859009, 0.277254581451416, 0.28614842891693115, 0.2950422763824463, 0.3039361238479614, 0.31282997131347656, 0.3217238187789917, 0.33061766624450684, 0.339511513710022, 0.3484053611755371, 0.35729920864105225, 0.3661930561065674, 0.3750869035720825, 0.38398075103759766, 0.3928745985031128, 0.40176844596862793, 0.41066229343414307, 0.4195561408996582, 0.42844998836517334, 0.4373438358306885, 0.4462376832962036, 0.45513153076171875, 0.4640253782272339, 0.472919225692749, 0.48181307315826416, 0.4907069206237793, 0.49960076808929443, 0.5084946155548096, 0.5173884630203247, 0.5262823104858398, 0.535176157951355]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 5.0, 7.0, 7.0, 11.0, 10.0, 15.0, 29.0, 19.0, 30.0, 35.0, 40.0, 35.0, 36.0, 38.0, 62.0, 56.0, 54.0, 46.0, 52.0, 50.0, 43.0, 35.0, 52.0, 45.0, 35.0, 25.0, 16.0, 20.0, 23.0, 19.0, 20.0, 10.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03338998556137085, -0.0324234813451767, -0.03145698085427284, -0.03049047850072384, -0.029523976147174835, -0.02855747379362583, -0.027590971440076828, -0.026624469086527824, -0.02565796673297882, -0.024691464379429817, -0.023724962025880814, -0.02275845967233181, -0.021791957318782806, -0.020825454965233803, -0.0198589526116848, -0.018892450258135796, -0.017925947904586792, -0.01695944555103779, -0.015992943197488785, -0.015026440843939781, -0.014059938490390778, -0.013093436136841774, -0.01212693378329277, -0.011160431429743767, -0.010193929076194763, -0.00922742672264576, -0.008260924369096756, -0.007294422015547752, -0.006327919661998749, -0.005361417308449745, -0.004394914954900742, -0.003428412601351738, -0.0024619102478027344, -0.0014954078942537308, -0.0005289055407047272, 0.00043759681284427643, 0.00140409916639328, 0.0023706015199422836, 0.0033371038734912872, 0.004303606227040291, 0.005270108580589294, 0.006236610934138298, 0.007203113287687302, 0.008169615641236305, 0.009136117994785309, 0.010102620348334312, 0.011069122701883316, 0.01203562505543232, 0.013002127408981323, 0.013968629762530327, 0.01493513211607933, 0.015901634469628334, 0.016868136823177338, 0.01783463917672634, 0.018801141530275345, 0.01976764388382435, 0.020734146237373352, 0.021700648590922356, 0.02266715094447136, 0.023633653298020363, 0.024600155651569366, 0.02556665800511837, 0.026533160358667374, 0.027499662712216377, 0.02846616506576538]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 9.0, 3.0, 6.0, 13.0, 12.0, 7.0, 24.0, 23.0, 24.0, 16.0, 28.0, 21.0, 33.0, 33.0, 25.0, 38.0, 27.0, 39.0, 41.0, 46.0, 41.0, 46.0, 35.0, 28.0, 32.0, 43.0, 34.0, 23.0, 15.0, 22.0, 23.0, 19.0, 18.0, 21.0, 15.0, 24.0, 15.0, 14.0, 6.0, 5.0, 14.0, 5.0, 7.0, 11.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.08203125, -5.87896728515625, -5.6759033203125, -5.47283935546875, -5.269775390625, -5.06671142578125, -4.8636474609375, -4.66058349609375, -4.45751953125, -4.25445556640625, -4.0513916015625, -3.84832763671875, -3.645263671875, -3.44219970703125, -3.2391357421875, -3.03607177734375, -2.8330078125, -2.62994384765625, -2.4268798828125, -2.22381591796875, -2.020751953125, -1.81768798828125, -1.6146240234375, -1.41156005859375, -1.20849609375, -1.00543212890625, -0.8023681640625, -0.59930419921875, -0.396240234375, -0.19317626953125, 0.0098876953125, 0.21295166015625, 0.416015625, 0.61907958984375, 0.8221435546875, 1.02520751953125, 1.228271484375, 1.43133544921875, 1.6343994140625, 1.83746337890625, 2.04052734375, 2.24359130859375, 2.4466552734375, 2.64971923828125, 2.852783203125, 3.05584716796875, 3.2589111328125, 3.46197509765625, 3.6650390625, 3.86810302734375, 4.0711669921875, 4.27423095703125, 4.477294921875, 4.68035888671875, 4.8834228515625, 5.08648681640625, 5.28955078125, 5.49261474609375, 5.6956787109375, 5.89874267578125, 6.101806640625, 6.30487060546875, 6.5079345703125, 6.71099853515625, 6.9140625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 5.0, 7.0, 8.0, 9.0, 7.0, 11.0, 12.0, 18.0, 28.0, 34.0, 49.0, 45.0, 75.0, 120.0, 163.0, 201.0, 293.0, 367.0, 536.0, 833.0, 1274.0, 2008.0, 3497.0, 6582.0, 14962.0, 47287.0, 523660.0, 374970.0, 42151.0, 13963.0, 6234.0, 3267.0, 2002.0, 1209.0, 798.0, 493.0, 365.0, 256.0, 167.0, 144.0, 90.0, 94.0, 64.0, 48.0, 32.0, 26.0, 28.0, 11.0, 16.0, 21.0, 6.0, 5.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-14.5625, -14.076416015625, -13.59033203125, -13.104248046875, -12.6181640625, -12.132080078125, -11.64599609375, -11.159912109375, -10.673828125, -10.187744140625, -9.70166015625, -9.215576171875, -8.7294921875, -8.243408203125, -7.75732421875, -7.271240234375, -6.78515625, -6.299072265625, -5.81298828125, -5.326904296875, -4.8408203125, -4.354736328125, -3.86865234375, -3.382568359375, -2.896484375, -2.410400390625, -1.92431640625, -1.438232421875, -0.9521484375, -0.466064453125, 0.02001953125, 0.506103515625, 0.9921875, 1.478271484375, 1.96435546875, 2.450439453125, 2.9365234375, 3.422607421875, 3.90869140625, 4.394775390625, 4.880859375, 5.366943359375, 5.85302734375, 6.339111328125, 6.8251953125, 7.311279296875, 7.79736328125, 8.283447265625, 8.76953125, 9.255615234375, 9.74169921875, 10.227783203125, 10.7138671875, 11.199951171875, 11.68603515625, 12.172119140625, 12.658203125, 13.144287109375, 13.63037109375, 14.116455078125, 14.6025390625, 15.088623046875, 15.57470703125, 16.060791015625, 16.546875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 10.0, 10.0, 13.0, 6.0, 7.0, 18.0, 20.0, 23.0, 21.0, 19.0, 27.0, 26.0, 25.0, 35.0, 50.0, 53.0, 66.0, 89.0, 180.0, 1620.0, 159.0, 87.0, 53.0, 60.0, 48.0, 34.0, 37.0, 35.0, 22.0, 34.0, 25.0, 24.0, 13.0, 22.0, 12.0, 13.0, 7.0, 4.0, 8.0, 7.0, 6.0, 9.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.890625, -19.258056640625, -18.62548828125, -17.992919921875, -17.3603515625, -16.727783203125, -16.09521484375, -15.462646484375, -14.830078125, -14.197509765625, -13.56494140625, -12.932373046875, -12.2998046875, -11.667236328125, -11.03466796875, -10.402099609375, -9.76953125, -9.136962890625, -8.50439453125, -7.871826171875, -7.2392578125, -6.606689453125, -5.97412109375, -5.341552734375, -4.708984375, -4.076416015625, -3.44384765625, -2.811279296875, -2.1787109375, -1.546142578125, -0.91357421875, -0.281005859375, 0.3515625, 0.984130859375, 1.61669921875, 2.249267578125, 2.8818359375, 3.514404296875, 4.14697265625, 4.779541015625, 5.412109375, 6.044677734375, 6.67724609375, 7.309814453125, 7.9423828125, 8.574951171875, 9.20751953125, 9.840087890625, 10.47265625, 11.105224609375, 11.73779296875, 12.370361328125, 13.0029296875, 13.635498046875, 14.26806640625, 14.900634765625, 15.533203125, 16.165771484375, 16.79833984375, 17.430908203125, 18.0634765625, 18.696044921875, 19.32861328125, 19.961181640625, 20.59375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 4.0, 14.0, 9.0, 10.0, 13.0, 14.0, 19.0, 29.0, 37.0, 40.0, 61.0, 59.0, 100.0, 129.0, 286.0, 700.0, 3466.0, 62026.0, 3047148.0, 28086.0, 2261.0, 518.0, 215.0, 112.0, 69.0, 72.0, 46.0, 29.0, 26.0, 22.0, 17.0, 13.0, 19.0, 12.0, 5.0, 4.0, 2.0, 2.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-66.1875, -64.0791015625, -61.970703125, -59.8623046875, -57.75390625, -55.6455078125, -53.537109375, -51.4287109375, -49.3203125, -47.2119140625, -45.103515625, -42.9951171875, -40.88671875, -38.7783203125, -36.669921875, -34.5615234375, -32.453125, -30.3447265625, -28.236328125, -26.1279296875, -24.01953125, -21.9111328125, -19.802734375, -17.6943359375, -15.5859375, -13.4775390625, -11.369140625, -9.2607421875, -7.15234375, -5.0439453125, -2.935546875, -0.8271484375, 1.28125, 3.3896484375, 5.498046875, 7.6064453125, 9.71484375, 11.8232421875, 13.931640625, 16.0400390625, 18.1484375, 20.2568359375, 22.365234375, 24.4736328125, 26.58203125, 28.6904296875, 30.798828125, 32.9072265625, 35.015625, 37.1240234375, 39.232421875, 41.3408203125, 43.44921875, 45.5576171875, 47.666015625, 49.7744140625, 51.8828125, 53.9912109375, 56.099609375, 58.2080078125, 60.31640625, 62.4248046875, 64.533203125, 66.6416015625, 68.75]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 12.0, 52.0, 277.0, 425.0, 184.0, 49.0, 7.0, 4.0, 1.0, 0.0, 1.0], "bins": [-212.79273986816406, -209.0165557861328, -205.24038696289062, -201.46420288085938, -197.68801879882812, -193.91183471679688, -190.1356658935547, -186.35948181152344, -182.58331298828125, -178.80712890625, -175.0309600830078, -171.25477600097656, -167.4785919189453, -163.70242309570312, -159.92623901367188, -156.15005493164062, -152.37387084960938, -148.59768676757812, -144.82151794433594, -141.0453338623047, -137.26914978027344, -133.49298095703125, -129.716796875, -125.94061279296875, -122.16443634033203, -118.38825988769531, -114.61207580566406, -110.83589935302734, -107.05972290039062, -103.28353881835938, -99.50736236572266, -95.73118591308594, -91.95499420166016, -88.17881774902344, -84.40263366699219, -80.62645721435547, -76.85028076171875, -73.0740966796875, -69.29792022705078, -65.52174377441406, -61.74555969238281, -57.96937942504883, -54.193199157714844, -50.417022705078125, -46.64084243774414, -42.864662170410156, -39.08848571777344, -35.31230545043945, -31.5361270904541, -27.75994873046875, -23.983768463134766, -20.20758819580078, -16.43140983581543, -12.655229568481445, -8.879051208496094, -5.102872848510742, -1.3266925811767578, 2.44948673248291, 6.225666046142578, 10.001845359802246, 13.778024673461914, 17.5542049407959, 21.33038330078125, 25.1065616607666, 28.882741928100586]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 10.0, 6.0, 15.0, 15.0, 15.0, 12.0, 13.0, 30.0, 35.0, 25.0, 43.0, 40.0, 34.0, 44.0, 43.0, 50.0, 51.0, 39.0, 43.0, 53.0, 36.0, 41.0, 44.0, 36.0, 25.0, 31.0, 27.0, 19.0, 20.0, 17.0, 21.0, 13.0, 8.0, 13.0, 6.0, 4.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-61.248661041259766, -59.386024475097656, -57.52338409423828, -55.660743713378906, -53.7981071472168, -51.93547058105469, -50.07283020019531, -48.21018981933594, -46.34755325317383, -44.48491668701172, -42.622276306152344, -40.75963592529297, -38.89699935913086, -37.03436279296875, -35.171722412109375, -33.30908203125, -31.44644546508789, -29.58380699157715, -27.721168518066406, -25.858530044555664, -23.995891571044922, -22.13325309753418, -20.270614624023438, -18.407976150512695, -16.545337677001953, -14.682699203491211, -12.820060729980469, -10.957422256469727, -9.094783782958984, -7.232145309448242, -5.3695068359375, -3.506868362426758, -1.6442298889160156, 0.21840858459472656, 2.0810470581054688, 3.943685531616211, 5.806324005126953, 7.668962478637695, 9.531600952148438, 11.39423942565918, 13.256877899169922, 15.119516372680664, 16.982154846191406, 18.84479331970215, 20.70743179321289, 22.570070266723633, 24.432708740234375, 26.295347213745117, 28.15798568725586, 30.0206241607666, 31.883262634277344, 33.74590301513672, 35.60853958129883, 37.47117614746094, 39.33381652832031, 41.19645690917969, 43.0590934753418, 44.921730041503906, 46.78437042236328, 48.647010803222656, 50.509647369384766, 52.372283935546875, 54.23492431640625, 56.097564697265625, 57.960201263427734]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 0.0, 4.0, 6.0, 8.0, 4.0, 6.0, 10.0, 18.0, 13.0, 11.0, 18.0, 27.0, 23.0, 36.0, 22.0, 30.0, 31.0, 34.0, 38.0, 39.0, 42.0, 47.0, 34.0, 41.0, 39.0, 44.0, 32.0, 27.0, 36.0, 30.0, 20.0, 24.0, 17.0, 30.0, 24.0, 21.0, 13.0, 19.0, 12.0, 16.0, 11.0, 8.0, 9.0, 5.0, 5.0, 5.0, 3.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.34765625, -6.1312255859375, -5.914794921875, -5.6983642578125, -5.48193359375, -5.2655029296875, -5.049072265625, -4.8326416015625, -4.6162109375, -4.3997802734375, -4.183349609375, -3.9669189453125, -3.75048828125, -3.5340576171875, -3.317626953125, -3.1011962890625, -2.884765625, -2.6683349609375, -2.451904296875, -2.2354736328125, -2.01904296875, -1.8026123046875, -1.586181640625, -1.3697509765625, -1.1533203125, -0.9368896484375, -0.720458984375, -0.5040283203125, -0.28759765625, -0.0711669921875, 0.145263671875, 0.3616943359375, 0.578125, 0.7945556640625, 1.010986328125, 1.2274169921875, 1.44384765625, 1.6602783203125, 1.876708984375, 2.0931396484375, 2.3095703125, 2.5260009765625, 2.742431640625, 2.9588623046875, 3.17529296875, 3.3917236328125, 3.608154296875, 3.8245849609375, 4.041015625, 4.2574462890625, 4.473876953125, 4.6903076171875, 4.90673828125, 5.1231689453125, 5.339599609375, 5.5560302734375, 5.7724609375, 5.9888916015625, 6.205322265625, 6.4217529296875, 6.63818359375, 6.8546142578125, 7.071044921875, 7.2874755859375, 7.50390625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 8.0, 9.0, 9.0, 10.0, 17.0, 18.0, 28.0, 41.0, 64.0, 83.0, 119.0, 201.0, 307.0, 458.0, 723.0, 1160.0, 1830.0, 3121.0, 5360.0, 10535.0, 25562.0, 146566.0, 1980356.0, 1841724.0, 127645.0, 24304.0, 10176.0, 5425.0, 3079.0, 1871.0, 1186.0, 769.0, 494.0, 334.0, 214.0, 148.0, 93.0, 59.0, 45.0, 35.0, 22.0, 21.0, 14.0, 11.0, 12.0, 8.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-20.53125, -19.90869140625, -19.2861328125, -18.66357421875, -18.041015625, -17.41845703125, -16.7958984375, -16.17333984375, -15.55078125, -14.92822265625, -14.3056640625, -13.68310546875, -13.060546875, -12.43798828125, -11.8154296875, -11.19287109375, -10.5703125, -9.94775390625, -9.3251953125, -8.70263671875, -8.080078125, -7.45751953125, -6.8349609375, -6.21240234375, -5.58984375, -4.96728515625, -4.3447265625, -3.72216796875, -3.099609375, -2.47705078125, -1.8544921875, -1.23193359375, -0.609375, 0.01318359375, 0.6357421875, 1.25830078125, 1.880859375, 2.50341796875, 3.1259765625, 3.74853515625, 4.37109375, 4.99365234375, 5.6162109375, 6.23876953125, 6.861328125, 7.48388671875, 8.1064453125, 8.72900390625, 9.3515625, 9.97412109375, 10.5966796875, 11.21923828125, 11.841796875, 12.46435546875, 13.0869140625, 13.70947265625, 14.33203125, 14.95458984375, 15.5771484375, 16.19970703125, 16.822265625, 17.44482421875, 18.0673828125, 18.68994140625, 19.3125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 5.0, 3.0, 9.0, 11.0, 17.0, 16.0, 19.0, 33.0, 32.0, 74.0, 79.0, 127.0, 237.0, 375.0, 560.0, 731.0, 588.0, 407.0, 229.0, 145.0, 113.0, 64.0, 47.0, 34.0, 26.0, 14.0, 17.0, 11.0, 14.0, 6.0, 7.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.359375, -14.839599609375, -14.31982421875, -13.800048828125, -13.2802734375, -12.760498046875, -12.24072265625, -11.720947265625, -11.201171875, -10.681396484375, -10.16162109375, -9.641845703125, -9.1220703125, -8.602294921875, -8.08251953125, -7.562744140625, -7.04296875, -6.523193359375, -6.00341796875, -5.483642578125, -4.9638671875, -4.444091796875, -3.92431640625, -3.404541015625, -2.884765625, -2.364990234375, -1.84521484375, -1.325439453125, -0.8056640625, -0.285888671875, 0.23388671875, 0.753662109375, 1.2734375, 1.793212890625, 2.31298828125, 2.832763671875, 3.3525390625, 3.872314453125, 4.39208984375, 4.911865234375, 5.431640625, 5.951416015625, 6.47119140625, 6.990966796875, 7.5107421875, 8.030517578125, 8.55029296875, 9.070068359375, 9.58984375, 10.109619140625, 10.62939453125, 11.149169921875, 11.6689453125, 12.188720703125, 12.70849609375, 13.228271484375, 13.748046875, 14.267822265625, 14.78759765625, 15.307373046875, 15.8271484375, 16.346923828125, 16.86669921875, 17.386474609375, 17.90625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 8.0, 12.0, 13.0, 25.0, 27.0, 45.0, 52.0, 91.0, 150.0, 301.0, 509.0, 856.0, 1707.0, 3482.0, 8430.0, 23887.0, 120388.0, 3075996.0, 874112.0, 57190.0, 15466.0, 5876.0, 2707.0, 1342.0, 657.0, 378.0, 209.0, 128.0, 73.0, 55.0, 33.0, 24.0, 20.0, 10.0, 5.0, 4.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-39.5, -38.39697265625, -37.2939453125, -36.19091796875, -35.087890625, -33.98486328125, -32.8818359375, -31.77880859375, -30.67578125, -29.57275390625, -28.4697265625, -27.36669921875, -26.263671875, -25.16064453125, -24.0576171875, -22.95458984375, -21.8515625, -20.74853515625, -19.6455078125, -18.54248046875, -17.439453125, -16.33642578125, -15.2333984375, -14.13037109375, -13.02734375, -11.92431640625, -10.8212890625, -9.71826171875, -8.615234375, -7.51220703125, -6.4091796875, -5.30615234375, -4.203125, -3.10009765625, -1.9970703125, -0.89404296875, 0.208984375, 1.31201171875, 2.4150390625, 3.51806640625, 4.62109375, 5.72412109375, 6.8271484375, 7.93017578125, 9.033203125, 10.13623046875, 11.2392578125, 12.34228515625, 13.4453125, 14.54833984375, 15.6513671875, 16.75439453125, 17.857421875, 18.96044921875, 20.0634765625, 21.16650390625, 22.26953125, 23.37255859375, 24.4755859375, 25.57861328125, 26.681640625, 27.78466796875, 28.8876953125, 29.99072265625, 31.09375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 51.0, 601.0, 347.0, 17.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-474.36749267578125, -457.90960693359375, -441.4517517089844, -424.993896484375, -408.5360107421875, -392.078125, -375.6202697753906, -359.16241455078125, -342.70452880859375, -326.24664306640625, -309.7887878417969, -293.3309326171875, -276.873046875, -260.4151611328125, -243.95730590820312, -227.4994354248047, -211.04156494140625, -194.5836944580078, -178.12582397460938, -161.66795349121094, -145.2100830078125, -128.75221252441406, -112.29434204101562, -95.83647155761719, -79.37860107421875, -62.92073059082031, -46.462860107421875, -30.004989624023438, -13.547119140625, 2.9107513427734375, 19.368621826171875, 35.82649230957031, 52.284423828125, 68.74229431152344, 85.20016479492188, 101.65803527832031, 118.11590576171875, 134.5737762451172, 151.03164672851562, 167.48951721191406, 183.9473876953125, 200.40525817871094, 216.86312866210938, 233.3209991455078, 249.77886962890625, 266.23675537109375, 282.6946105957031, 299.1524658203125, 315.6103515625, 332.0682373046875, 348.5260925292969, 364.98394775390625, 381.44183349609375, 397.89971923828125, 414.3575744628906, 430.8154296875, 447.2733154296875, 463.731201171875, 480.1890563964844, 496.64691162109375, 513.1047973632812, 529.5626831054688, 546.0205078125, 562.4783935546875, 578.936279296875]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 9.0, 2.0, 4.0, 5.0, 7.0, 6.0, 12.0, 16.0, 21.0, 14.0, 18.0, 25.0, 26.0, 32.0, 20.0, 27.0, 32.0, 35.0, 40.0, 35.0, 33.0, 40.0, 38.0, 36.0, 36.0, 36.0, 31.0, 37.0, 29.0, 32.0, 28.0, 25.0, 22.0, 27.0, 28.0, 27.0, 22.0, 20.0, 9.0, 11.0, 10.0, 12.0, 6.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-44.56242370605469, -43.203861236572266, -41.845298767089844, -40.48674011230469, -39.128177642822266, -37.769615173339844, -36.41105270385742, -35.052490234375, -33.693931579589844, -32.33536911010742, -30.976808547973633, -29.61824607849121, -28.259685516357422, -26.901123046875, -25.542560577392578, -24.183998107910156, -22.825435638427734, -21.466873168945312, -20.108312606811523, -18.7497501373291, -17.391189575195312, -16.03262710571289, -14.674064636230469, -13.315503120422363, -11.956941604614258, -10.598380088806152, -9.239818572998047, -7.881256103515625, -6.5226945877075195, -5.164133071899414, -3.805570602416992, -2.4470090866088867, -1.0884513854980469, 0.2701103687286377, 1.6286721229553223, 2.987234115600586, 4.345795631408691, 5.704357147216797, 7.062919616699219, 8.421481132507324, 9.78004264831543, 11.138604164123535, 12.49716567993164, 13.855728149414062, 15.214289665222168, 16.572851181030273, 17.931413650512695, 19.289974212646484, 20.648536682128906, 22.007099151611328, 23.365659713745117, 24.72422218322754, 26.082782745361328, 27.44134521484375, 28.799907684326172, 30.158470153808594, 31.517030715942383, 32.87559127807617, 34.234153747558594, 35.592716217041016, 36.95127868652344, 38.309837341308594, 39.66840362548828, 41.02696228027344, 42.38552474975586]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 8.0, 7.0, 13.0, 12.0, 15.0, 15.0, 14.0, 22.0, 23.0, 30.0, 48.0, 27.0, 30.0, 29.0, 30.0, 38.0, 34.0, 43.0, 32.0, 44.0, 39.0, 43.0, 38.0, 42.0, 39.0, 30.0, 31.0, 29.0, 17.0, 23.0, 27.0, 17.0, 11.0, 12.0, 15.0, 14.0, 5.0, 6.0, 9.0, 5.0, 1.0, 9.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0], "bins": [-8.09375, -7.85595703125, -7.6181640625, -7.38037109375, -7.142578125, -6.90478515625, -6.6669921875, -6.42919921875, -6.19140625, -5.95361328125, -5.7158203125, -5.47802734375, -5.240234375, -5.00244140625, -4.7646484375, -4.52685546875, -4.2890625, -4.05126953125, -3.8134765625, -3.57568359375, -3.337890625, -3.10009765625, -2.8623046875, -2.62451171875, -2.38671875, -2.14892578125, -1.9111328125, -1.67333984375, -1.435546875, -1.19775390625, -0.9599609375, -0.72216796875, -0.484375, -0.24658203125, -0.0087890625, 0.22900390625, 0.466796875, 0.70458984375, 0.9423828125, 1.18017578125, 1.41796875, 1.65576171875, 1.8935546875, 2.13134765625, 2.369140625, 2.60693359375, 2.8447265625, 3.08251953125, 3.3203125, 3.55810546875, 3.7958984375, 4.03369140625, 4.271484375, 4.50927734375, 4.7470703125, 4.98486328125, 5.22265625, 5.46044921875, 5.6982421875, 5.93603515625, 6.173828125, 6.41162109375, 6.6494140625, 6.88720703125, 7.125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 5.0, 5.0, 5.0, 18.0, 24.0, 32.0, 50.0, 83.0, 104.0, 139.0, 235.0, 273.0, 452.0, 615.0, 925.0, 1346.0, 1996.0, 2825.0, 4116.0, 5930.0, 8840.0, 13058.0, 19632.0, 30480.0, 47018.0, 72825.0, 111332.0, 160452.0, 176452.0, 132756.0, 88836.0, 57535.0, 36998.0, 24132.0, 15899.0, 10493.0, 7139.0, 4813.0, 3269.0, 2327.0, 1540.0, 1112.0, 733.0, 532.0, 377.0, 252.0, 184.0, 135.0, 77.0, 64.0, 32.0, 15.0, 18.0, 12.0, 11.0, 4.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.76171875, -0.7380828857421875, -0.714447021484375, -0.6908111572265625, -0.66717529296875, -0.6435394287109375, -0.619903564453125, -0.5962677001953125, -0.5726318359375, -0.5489959716796875, -0.525360107421875, -0.5017242431640625, -0.47808837890625, -0.4544525146484375, -0.430816650390625, -0.4071807861328125, -0.383544921875, -0.3599090576171875, -0.336273193359375, -0.3126373291015625, -0.28900146484375, -0.2653656005859375, -0.241729736328125, -0.2180938720703125, -0.1944580078125, -0.1708221435546875, -0.147186279296875, -0.1235504150390625, -0.09991455078125, -0.0762786865234375, -0.052642822265625, -0.0290069580078125, -0.00537109375, 0.0182647705078125, 0.041900634765625, 0.0655364990234375, 0.08917236328125, 0.1128082275390625, 0.136444091796875, 0.1600799560546875, 0.1837158203125, 0.2073516845703125, 0.230987548828125, 0.2546234130859375, 0.27825927734375, 0.3018951416015625, 0.325531005859375, 0.3491668701171875, 0.372802734375, 0.3964385986328125, 0.420074462890625, 0.4437103271484375, 0.46734619140625, 0.4909820556640625, 0.514617919921875, 0.5382537841796875, 0.5618896484375, 0.5855255126953125, 0.609161376953125, 0.6327972412109375, 0.65643310546875, 0.6800689697265625, 0.703704833984375, 0.7273406982421875, 0.7509765625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 5.0, 9.0, 11.0, 4.0, 10.0, 19.0, 27.0, 21.0, 26.0, 29.0, 29.0, 32.0, 39.0, 37.0, 24.0, 31.0, 44.0, 54.0, 1061.0, 38.0, 57.0, 40.0, 42.0, 42.0, 37.0, 29.0, 28.0, 31.0, 33.0, 26.0, 19.0, 11.0, 16.0, 10.0, 11.0, 9.0, 5.0, 11.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.4609375, -5.2918701171875, -5.122802734375, -4.9537353515625, -4.78466796875, -4.6156005859375, -4.446533203125, -4.2774658203125, -4.1083984375, -3.9393310546875, -3.770263671875, -3.6011962890625, -3.43212890625, -3.2630615234375, -3.093994140625, -2.9249267578125, -2.755859375, -2.5867919921875, -2.417724609375, -2.2486572265625, -2.07958984375, -1.9105224609375, -1.741455078125, -1.5723876953125, -1.4033203125, -1.2342529296875, -1.065185546875, -0.8961181640625, -0.72705078125, -0.5579833984375, -0.388916015625, -0.2198486328125, -0.05078125, 0.1182861328125, 0.287353515625, 0.4564208984375, 0.62548828125, 0.7945556640625, 0.963623046875, 1.1326904296875, 1.3017578125, 1.4708251953125, 1.639892578125, 1.8089599609375, 1.97802734375, 2.1470947265625, 2.316162109375, 2.4852294921875, 2.654296875, 2.8233642578125, 2.992431640625, 3.1614990234375, 3.33056640625, 3.4996337890625, 3.668701171875, 3.8377685546875, 4.0068359375, 4.1759033203125, 4.344970703125, 4.5140380859375, 4.68310546875, 4.8521728515625, 5.021240234375, 5.1903076171875, 5.359375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 13.0, 13.0, 27.0, 36.0, 52.0, 75.0, 117.0, 188.0, 292.0, 364.0, 554.0, 788.0, 1188.0, 1711.0, 2536.0, 3675.0, 5498.0, 8106.0, 11951.0, 17836.0, 26951.0, 40900.0, 64203.0, 97516.0, 139494.0, 1214596.0, 148370.0, 105729.0, 69951.0, 45217.0, 29492.0, 19232.0, 12999.0, 8740.0, 5855.0, 4079.0, 2743.0, 1876.0, 1314.0, 884.0, 641.0, 442.0, 302.0, 199.0, 129.0, 95.0, 65.0, 37.0, 27.0, 18.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.55224609375, -0.5358123779296875, -0.519378662109375, -0.5029449462890625, -0.48651123046875, -0.4700775146484375, -0.453643798828125, -0.4372100830078125, -0.4207763671875, -0.4043426513671875, -0.387908935546875, -0.3714752197265625, -0.35504150390625, -0.3386077880859375, -0.322174072265625, -0.3057403564453125, -0.289306640625, -0.2728729248046875, -0.256439208984375, -0.2400054931640625, -0.22357177734375, -0.2071380615234375, -0.190704345703125, -0.1742706298828125, -0.1578369140625, -0.1414031982421875, -0.124969482421875, -0.1085357666015625, -0.09210205078125, -0.0756683349609375, -0.059234619140625, -0.0428009033203125, -0.0263671875, -0.0099334716796875, 0.006500244140625, 0.0229339599609375, 0.03936767578125, 0.0558013916015625, 0.072235107421875, 0.0886688232421875, 0.1051025390625, 0.1215362548828125, 0.137969970703125, 0.1544036865234375, 0.17083740234375, 0.1872711181640625, 0.203704833984375, 0.2201385498046875, 0.236572265625, 0.2530059814453125, 0.269439697265625, 0.2858734130859375, 0.30230712890625, 0.3187408447265625, 0.335174560546875, 0.3516082763671875, 0.3680419921875, 0.3844757080078125, 0.400909423828125, 0.4173431396484375, 0.43377685546875, 0.4502105712890625, 0.466644287109375, 0.4830780029296875, 0.49951171875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 3.0, 13.0, 5.0, 11.0, 33.0, 45.0, 43.0, 51.0, 77.0, 123.0, 158.0, 120.0, 57.0, 60.0, 40.0, 34.0, 19.0, 20.0, 14.0, 5.0, 12.0, 8.0, 8.0, 8.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.019805908203125, -0.019127368927001953, -0.018448829650878906, -0.01777029037475586, -0.017091751098632812, -0.016413211822509766, -0.01573467254638672, -0.015056133270263672, -0.014377593994140625, -0.013699054718017578, -0.013020515441894531, -0.012341976165771484, -0.011663436889648438, -0.01098489761352539, -0.010306358337402344, -0.009627819061279297, -0.00894927978515625, -0.008270740509033203, -0.007592201232910156, -0.006913661956787109, -0.0062351226806640625, -0.005556583404541016, -0.004878044128417969, -0.004199504852294922, -0.003520965576171875, -0.002842426300048828, -0.0021638870239257812, -0.0014853477478027344, -0.0008068084716796875, -0.00012826919555664062, 0.0005502700805664062, 0.0012288093566894531, 0.0019073486328125, 0.002585887908935547, 0.0032644271850585938, 0.003942966461181641, 0.0046215057373046875, 0.005300045013427734, 0.005978584289550781, 0.006657123565673828, 0.007335662841796875, 0.008014202117919922, 0.008692741394042969, 0.009371280670166016, 0.010049819946289062, 0.01072835922241211, 0.011406898498535156, 0.012085437774658203, 0.01276397705078125, 0.013442516326904297, 0.014121055603027344, 0.01479959487915039, 0.015478134155273438, 0.016156673431396484, 0.01683521270751953, 0.017513751983642578, 0.018192291259765625, 0.018870830535888672, 0.01954936981201172, 0.020227909088134766, 0.020906448364257812, 0.02158498764038086, 0.022263526916503906, 0.022942066192626953, 0.02362060546875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 10.0, 6.0, 6.0, 12.0, 10.0, 10.0, 11.0, 25.0, 28.0, 43.0, 58.0, 113.0, 123.0, 256.0, 1261.0, 991342.0, 54168.0, 569.0, 175.0, 94.0, 86.0, 50.0, 24.0, 9.0, 14.0, 6.0, 10.0, 13.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5380859375, -0.52264404296875, -0.5072021484375, -0.49176025390625, -0.476318359375, -0.46087646484375, -0.4454345703125, -0.42999267578125, -0.41455078125, -0.39910888671875, -0.3836669921875, -0.36822509765625, -0.352783203125, -0.33734130859375, -0.3218994140625, -0.30645751953125, -0.291015625, -0.27557373046875, -0.2601318359375, -0.24468994140625, -0.229248046875, -0.21380615234375, -0.1983642578125, -0.18292236328125, -0.16748046875, -0.15203857421875, -0.1365966796875, -0.12115478515625, -0.105712890625, -0.09027099609375, -0.0748291015625, -0.05938720703125, -0.0439453125, -0.02850341796875, -0.0130615234375, 0.00238037109375, 0.017822265625, 0.03326416015625, 0.0487060546875, 0.06414794921875, 0.07958984375, 0.09503173828125, 0.1104736328125, 0.12591552734375, 0.141357421875, 0.15679931640625, 0.1722412109375, 0.18768310546875, 0.203125, 0.21856689453125, 0.2340087890625, 0.24945068359375, 0.264892578125, 0.28033447265625, 0.2957763671875, 0.31121826171875, 0.32666015625, 0.34210205078125, 0.3575439453125, 0.37298583984375, 0.388427734375, 0.40386962890625, 0.4193115234375, 0.43475341796875, 0.4501953125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 8.0, 18.0, 32.0, 106.0, 285.0, 384.0, 117.0, 36.0, 20.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07168031483888626, -0.06975238770246506, -0.06782446056604385, -0.06589654088020325, -0.06396861374378204, -0.06204068660736084, -0.060112759470939636, -0.05818483605980873, -0.056256912648677826, -0.05432898551225662, -0.05240106210112572, -0.050473134964704514, -0.04854521155357361, -0.046617284417152405, -0.0446893572807312, -0.042761433869600296, -0.04083350673317909, -0.03890557959675789, -0.036977656185626984, -0.03504972904920578, -0.033121805638074875, -0.03119387850165367, -0.029265953227877617, -0.027338027954101562, -0.025410102680325508, -0.023482177406549454, -0.0215542521327734, -0.019626326858997345, -0.01769839972257614, -0.015770476311445236, -0.013842549175024033, -0.011914623901247978, -0.009986694902181625, -0.008058769628405571, -0.006130843888968229, -0.004202918149530888, -0.0022749928757548332, -0.00034706760197877884, 0.0015808586031198502, 0.0035087838768959045, 0.005436709150671959, 0.007364634424448013, 0.009292559698224068, 0.011220485903322697, 0.013148411177098751, 0.015076336450874805, 0.017004262655973434, 0.01893218792974949, 0.020860113203525543, 0.022788038477301598, 0.024715963751077652, 0.026643890887498856, 0.02857181429862976, 0.030499741435050964, 0.03242766857147217, 0.03435559198260307, 0.03628351539373398, 0.03821144253015518, 0.04013936594128609, 0.04206729307770729, 0.043995216488838196, 0.0459231436252594, 0.0478510707616806, 0.04977899417281151, 0.05170692130923271]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 14.0, 16.0, 21.0, 21.0, 30.0, 20.0, 27.0, 31.0, 40.0, 46.0, 45.0, 49.0, 47.0, 46.0, 56.0, 55.0, 39.0, 45.0, 49.0, 47.0, 42.0, 26.0, 37.0, 24.0, 20.0, 23.0, 18.0, 10.0, 19.0, 8.0, 4.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.02317988872528076, -0.022519852966070175, -0.02185981720685959, -0.021199781447649002, -0.020539745688438416, -0.01987970992922783, -0.019219674170017242, -0.018559638410806656, -0.01789960265159607, -0.017239566892385483, -0.016579531133174896, -0.01591949537396431, -0.015259459614753723, -0.014599423855543137, -0.01393938809633255, -0.013279352337121964, -0.012619316577911377, -0.01195928081870079, -0.011299245059490204, -0.010639209300279617, -0.00997917354106903, -0.009319137781858444, -0.008659102022647858, -0.007999066263437271, -0.007339030504226685, -0.006678994745016098, -0.0060189589858055115, -0.005358923226594925, -0.004698887467384338, -0.004038851708173752, -0.0033788159489631653, -0.0027187801897525787, -0.002058744430541992, -0.0013987086713314056, -0.0007386729121208191, -7.863715291023254e-05, 0.000581398606300354, 0.0012414343655109406, 0.001901470124721527, 0.0025615058839321136, 0.0032215416431427, 0.0038815774023532867, 0.004541613161563873, 0.00520164892077446, 0.005861684679985046, 0.006521720439195633, 0.0071817561984062195, 0.007841791957616806, 0.008501827716827393, 0.009161863476037979, 0.009821899235248566, 0.010481934994459152, 0.011141970753669739, 0.011802006512880325, 0.012462042272090912, 0.013122078031301498, 0.013782113790512085, 0.014442149549722672, 0.015102185308933258, 0.015762221068143845, 0.01642225682735443, 0.017082292586565018, 0.017742328345775604, 0.01840236410498619, 0.019062399864196777]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 8.0, 7.0, 13.0, 12.0, 15.0, 15.0, 14.0, 22.0, 23.0, 30.0, 48.0, 27.0, 30.0, 29.0, 30.0, 38.0, 34.0, 42.0, 33.0, 44.0, 39.0, 43.0, 38.0, 42.0, 39.0, 30.0, 31.0, 29.0, 17.0, 23.0, 26.0, 18.0, 11.0, 12.0, 15.0, 14.0, 5.0, 6.0, 9.0, 5.0, 1.0, 9.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0], "bins": [-8.09375, -7.85595703125, -7.6181640625, -7.38037109375, -7.142578125, -6.90478515625, -6.6669921875, -6.42919921875, -6.19140625, -5.95361328125, -5.7158203125, -5.47802734375, -5.240234375, -5.00244140625, -4.7646484375, -4.52685546875, -4.2890625, -4.05126953125, -3.8134765625, -3.57568359375, -3.337890625, -3.10009765625, -2.8623046875, -2.62451171875, -2.38671875, -2.14892578125, -1.9111328125, -1.67333984375, -1.435546875, -1.19775390625, -0.9599609375, -0.72216796875, -0.484375, -0.24658203125, -0.0087890625, 0.22900390625, 0.466796875, 0.70458984375, 0.9423828125, 1.18017578125, 1.41796875, 1.65576171875, 1.8935546875, 2.13134765625, 2.369140625, 2.60693359375, 2.8447265625, 3.08251953125, 3.3203125, 3.55810546875, 3.7958984375, 4.03369140625, 4.271484375, 4.50927734375, 4.7470703125, 4.98486328125, 5.22265625, 5.46044921875, 5.6982421875, 5.93603515625, 6.173828125, 6.41162109375, 6.6494140625, 6.88720703125, 7.125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 9.0, 22.0, 17.0, 34.0, 34.0, 43.0, 61.0, 98.0, 130.0, 168.0, 261.0, 347.0, 528.0, 758.0, 1167.0, 1771.0, 2981.0, 5403.0, 10876.0, 26273.0, 75408.0, 301095.0, 450361.0, 105978.0, 34754.0, 13785.0, 6487.0, 3536.0, 2025.0, 1311.0, 800.0, 608.0, 398.0, 286.0, 212.0, 153.0, 100.0, 78.0, 58.0, 34.0, 30.0, 22.0, 16.0, 16.0, 8.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.390625, -10.999755859375, -10.60888671875, -10.218017578125, -9.8271484375, -9.436279296875, -9.04541015625, -8.654541015625, -8.263671875, -7.872802734375, -7.48193359375, -7.091064453125, -6.7001953125, -6.309326171875, -5.91845703125, -5.527587890625, -5.13671875, -4.745849609375, -4.35498046875, -3.964111328125, -3.5732421875, -3.182373046875, -2.79150390625, -2.400634765625, -2.009765625, -1.618896484375, -1.22802734375, -0.837158203125, -0.4462890625, -0.055419921875, 0.33544921875, 0.726318359375, 1.1171875, 1.508056640625, 1.89892578125, 2.289794921875, 2.6806640625, 3.071533203125, 3.46240234375, 3.853271484375, 4.244140625, 4.635009765625, 5.02587890625, 5.416748046875, 5.8076171875, 6.198486328125, 6.58935546875, 6.980224609375, 7.37109375, 7.761962890625, 8.15283203125, 8.543701171875, 8.9345703125, 9.325439453125, 9.71630859375, 10.107177734375, 10.498046875, 10.888916015625, 11.27978515625, 11.670654296875, 12.0615234375, 12.452392578125, 12.84326171875, 13.234130859375, 13.625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 4.0, 3.0, 5.0, 7.0, 4.0, 9.0, 9.0, 15.0, 14.0, 10.0, 11.0, 17.0, 19.0, 32.0, 35.0, 27.0, 40.0, 43.0, 47.0, 45.0, 85.0, 154.0, 1458.0, 322.0, 129.0, 76.0, 50.0, 51.0, 40.0, 38.0, 37.0, 29.0, 34.0, 24.0, 19.0, 19.0, 10.0, 14.0, 12.0, 8.0, 9.0, 6.0, 7.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-21.234375, -20.54833984375, -19.8623046875, -19.17626953125, -18.490234375, -17.80419921875, -17.1181640625, -16.43212890625, -15.74609375, -15.06005859375, -14.3740234375, -13.68798828125, -13.001953125, -12.31591796875, -11.6298828125, -10.94384765625, -10.2578125, -9.57177734375, -8.8857421875, -8.19970703125, -7.513671875, -6.82763671875, -6.1416015625, -5.45556640625, -4.76953125, -4.08349609375, -3.3974609375, -2.71142578125, -2.025390625, -1.33935546875, -0.6533203125, 0.03271484375, 0.71875, 1.40478515625, 2.0908203125, 2.77685546875, 3.462890625, 4.14892578125, 4.8349609375, 5.52099609375, 6.20703125, 6.89306640625, 7.5791015625, 8.26513671875, 8.951171875, 9.63720703125, 10.3232421875, 11.00927734375, 11.6953125, 12.38134765625, 13.0673828125, 13.75341796875, 14.439453125, 15.12548828125, 15.8115234375, 16.49755859375, 17.18359375, 17.86962890625, 18.5556640625, 19.24169921875, 19.927734375, 20.61376953125, 21.2998046875, 21.98583984375, 22.671875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 16.0, 10.0, 15.0, 29.0, 41.0, 56.0, 93.0, 164.0, 356.0, 884.0, 3921.0, 59456.0, 3000631.0, 74052.0, 4266.0, 897.0, 371.0, 149.0, 97.0, 68.0, 43.0, 19.0, 29.0, 11.0, 10.0, 4.0, 5.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-58.9375, -57.23046875, -55.5234375, -53.81640625, -52.109375, -50.40234375, -48.6953125, -46.98828125, -45.28125, -43.57421875, -41.8671875, -40.16015625, -38.453125, -36.74609375, -35.0390625, -33.33203125, -31.625, -29.91796875, -28.2109375, -26.50390625, -24.796875, -23.08984375, -21.3828125, -19.67578125, -17.96875, -16.26171875, -14.5546875, -12.84765625, -11.140625, -9.43359375, -7.7265625, -6.01953125, -4.3125, -2.60546875, -0.8984375, 0.80859375, 2.515625, 4.22265625, 5.9296875, 7.63671875, 9.34375, 11.05078125, 12.7578125, 14.46484375, 16.171875, 17.87890625, 19.5859375, 21.29296875, 23.0, 24.70703125, 26.4140625, 28.12109375, 29.828125, 31.53515625, 33.2421875, 34.94921875, 36.65625, 38.36328125, 40.0703125, 41.77734375, 43.484375, 45.19140625, 46.8984375, 48.60546875, 50.3125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 249.0, 640.0, 109.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.90864562988281, -50.050357818603516, -43.19207000732422, -36.33378219604492, -29.475494384765625, -22.617206573486328, -15.758918762207031, -8.900630950927734, -2.0423431396484375, 4.815944671630859, 11.674232482910156, 18.532520294189453, 25.39080810546875, 32.24909591674805, 39.107383728027344, 45.96567153930664, 52.82395935058594, 59.682247161865234, 66.54053497314453, 73.39881896972656, 80.25711059570312, 87.11540222167969, 93.97368621826172, 100.83197021484375, 107.69026184082031, 114.54855346679688, 121.4068374633789, 128.26512145996094, 135.1234130859375, 141.98170471191406, 148.83999633789062, 155.69827270507812, 162.55654907226562, 169.4148406982422, 176.27313232421875, 183.13140869140625, 189.9897003173828, 196.84799194335938, 203.70626831054688, 210.56455993652344, 217.4228515625, 224.28114318847656, 231.13943481445312, 237.99771118164062, 244.8560028076172, 251.71429443359375, 258.57257080078125, 265.4308776855469, 272.2891540527344, 279.1474304199219, 286.0057373046875, 292.864013671875, 299.7222900390625, 306.5805969238281, 313.4388732910156, 320.29718017578125, 327.15545654296875, 334.01373291015625, 340.8720397949219, 347.7303161621094, 354.588623046875, 361.4468994140625, 368.30517578125, 375.1634826660156, 382.0217590332031]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 9.0, 5.0, 9.0, 5.0, 12.0, 18.0, 19.0, 15.0, 18.0, 33.0, 27.0, 48.0, 31.0, 39.0, 47.0, 54.0, 46.0, 45.0, 38.0, 51.0, 43.0, 53.0, 38.0, 31.0, 32.0, 35.0, 32.0, 24.0, 25.0, 17.0, 24.0, 16.0, 11.0, 11.0, 7.0, 9.0, 6.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.00137710571289, -51.068233489990234, -49.13508987426758, -47.20195007324219, -45.26880645751953, -43.335662841796875, -41.40251922607422, -39.46937561035156, -37.536231994628906, -35.60308837890625, -33.669944763183594, -31.73680305480957, -29.803661346435547, -27.87051773071289, -25.937374114990234, -24.004230499267578, -22.071090698242188, -20.13794708251953, -18.204805374145508, -16.27166175842285, -14.338519096374512, -12.405376434326172, -10.472232818603516, -8.539090156555176, -6.605947494506836, -4.672804832458496, -2.739661693572998, -0.8065185546875, 1.1266241073608398, 3.0597667694091797, 4.992910385131836, 6.926053047180176, 8.85919189453125, 10.79233455657959, 12.72547721862793, 14.658620834350586, 16.59176254272461, 18.524906158447266, 20.458049774169922, 22.391193389892578, 24.3243350982666, 26.257478713989258, 28.19062042236328, 30.123764038085938, 32.056907653808594, 33.99005126953125, 35.923194885253906, 37.8563346862793, 39.78947830200195, 41.72262191772461, 43.655765533447266, 45.588905334472656, 47.52204895019531, 49.45519256591797, 51.388336181640625, 53.32147979736328, 55.25462341308594, 57.187767028808594, 59.12091064453125, 61.054054260253906, 62.9871940612793, 64.92033386230469, 66.85348510742188, 68.78662109375, 70.71976470947266]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 3.0, 6.0, 10.0, 4.0, 6.0, 13.0, 10.0, 10.0, 15.0, 13.0, 26.0, 22.0, 27.0, 23.0, 36.0, 30.0, 33.0, 36.0, 36.0, 33.0, 38.0, 32.0, 34.0, 34.0, 39.0, 43.0, 39.0, 38.0, 42.0, 30.0, 32.0, 26.0, 21.0, 20.0, 13.0, 17.0, 15.0, 15.0, 7.0, 14.0, 11.0, 10.0, 5.0, 3.0, 3.0, 9.0, 3.0, 2.0, 3.0, 1.0, 6.0, 0.0, 1.0, 3.0], "bins": [-7.56640625, -7.3345947265625, -7.102783203125, -6.8709716796875, -6.63916015625, -6.4073486328125, -6.175537109375, -5.9437255859375, -5.7119140625, -5.4801025390625, -5.248291015625, -5.0164794921875, -4.78466796875, -4.5528564453125, -4.321044921875, -4.0892333984375, -3.857421875, -3.6256103515625, -3.393798828125, -3.1619873046875, -2.93017578125, -2.6983642578125, -2.466552734375, -2.2347412109375, -2.0029296875, -1.7711181640625, -1.539306640625, -1.3074951171875, -1.07568359375, -0.8438720703125, -0.612060546875, -0.3802490234375, -0.1484375, 0.0833740234375, 0.315185546875, 0.5469970703125, 0.77880859375, 1.0106201171875, 1.242431640625, 1.4742431640625, 1.7060546875, 1.9378662109375, 2.169677734375, 2.4014892578125, 2.63330078125, 2.8651123046875, 3.096923828125, 3.3287353515625, 3.560546875, 3.7923583984375, 4.024169921875, 4.2559814453125, 4.48779296875, 4.7196044921875, 4.951416015625, 5.1832275390625, 5.4150390625, 5.6468505859375, 5.878662109375, 6.1104736328125, 6.34228515625, 6.5740966796875, 6.805908203125, 7.0377197265625, 7.26953125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 14.0, 5.0, 14.0, 29.0, 38.0, 58.0, 65.0, 107.0, 144.0, 194.0, 230.0, 351.0, 518.0, 750.0, 1201.0, 1737.0, 2614.0, 4209.0, 7273.0, 14554.0, 43590.0, 320458.0, 2506664.0, 1123498.0, 116027.0, 24461.0, 10410.0, 5635.0, 3239.0, 1958.0, 1338.0, 897.0, 611.0, 418.0, 282.0, 182.0, 134.0, 105.0, 67.0, 56.0, 47.0, 27.0, 20.0, 20.0, 18.0, 7.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.109375, -14.565185546875, -14.02099609375, -13.476806640625, -12.9326171875, -12.388427734375, -11.84423828125, -11.300048828125, -10.755859375, -10.211669921875, -9.66748046875, -9.123291015625, -8.5791015625, -8.034912109375, -7.49072265625, -6.946533203125, -6.40234375, -5.858154296875, -5.31396484375, -4.769775390625, -4.2255859375, -3.681396484375, -3.13720703125, -2.593017578125, -2.048828125, -1.504638671875, -0.96044921875, -0.416259765625, 0.1279296875, 0.672119140625, 1.21630859375, 1.760498046875, 2.3046875, 2.848876953125, 3.39306640625, 3.937255859375, 4.4814453125, 5.025634765625, 5.56982421875, 6.114013671875, 6.658203125, 7.202392578125, 7.74658203125, 8.290771484375, 8.8349609375, 9.379150390625, 9.92333984375, 10.467529296875, 11.01171875, 11.555908203125, 12.10009765625, 12.644287109375, 13.1884765625, 13.732666015625, 14.27685546875, 14.821044921875, 15.365234375, 15.909423828125, 16.45361328125, 16.997802734375, 17.5419921875, 18.086181640625, 18.63037109375, 19.174560546875, 19.71875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 1.0, 5.0, 12.0, 6.0, 12.0, 4.0, 16.0, 8.0, 15.0, 26.0, 28.0, 30.0, 33.0, 71.0, 94.0, 129.0, 235.0, 367.0, 625.0, 700.0, 590.0, 394.0, 224.0, 148.0, 78.0, 48.0, 42.0, 34.0, 29.0, 10.0, 6.0, 11.0, 4.0, 6.0, 9.0, 2.0, 4.0, 4.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.65625, -15.1591796875, -14.662109375, -14.1650390625, -13.66796875, -13.1708984375, -12.673828125, -12.1767578125, -11.6796875, -11.1826171875, -10.685546875, -10.1884765625, -9.69140625, -9.1943359375, -8.697265625, -8.2001953125, -7.703125, -7.2060546875, -6.708984375, -6.2119140625, -5.71484375, -5.2177734375, -4.720703125, -4.2236328125, -3.7265625, -3.2294921875, -2.732421875, -2.2353515625, -1.73828125, -1.2412109375, -0.744140625, -0.2470703125, 0.25, 0.7470703125, 1.244140625, 1.7412109375, 2.23828125, 2.7353515625, 3.232421875, 3.7294921875, 4.2265625, 4.7236328125, 5.220703125, 5.7177734375, 6.21484375, 6.7119140625, 7.208984375, 7.7060546875, 8.203125, 8.7001953125, 9.197265625, 9.6943359375, 10.19140625, 10.6884765625, 11.185546875, 11.6826171875, 12.1796875, 12.6767578125, 13.173828125, 13.6708984375, 14.16796875, 14.6650390625, 15.162109375, 15.6591796875, 16.15625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 5.0, 12.0, 9.0, 19.0, 18.0, 22.0, 40.0, 56.0, 81.0, 93.0, 134.0, 189.0, 304.0, 412.0, 540.0, 857.0, 1332.0, 1923.0, 3000.0, 4633.0, 7712.0, 13368.0, 26342.0, 67700.0, 300590.0, 2483759.0, 1049262.0, 143220.0, 42768.0, 18761.0, 9863.0, 6054.0, 3778.0, 2434.0, 1585.0, 1012.0, 719.0, 487.0, 348.0, 231.0, 179.0, 117.0, 72.0, 76.0, 51.0, 29.0, 26.0, 16.0, 15.0, 8.0, 4.0, 11.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-18.3125, -17.736328125, -17.16015625, -16.583984375, -16.0078125, -15.431640625, -14.85546875, -14.279296875, -13.703125, -13.126953125, -12.55078125, -11.974609375, -11.3984375, -10.822265625, -10.24609375, -9.669921875, -9.09375, -8.517578125, -7.94140625, -7.365234375, -6.7890625, -6.212890625, -5.63671875, -5.060546875, -4.484375, -3.908203125, -3.33203125, -2.755859375, -2.1796875, -1.603515625, -1.02734375, -0.451171875, 0.125, 0.701171875, 1.27734375, 1.853515625, 2.4296875, 3.005859375, 3.58203125, 4.158203125, 4.734375, 5.310546875, 5.88671875, 6.462890625, 7.0390625, 7.615234375, 8.19140625, 8.767578125, 9.34375, 9.919921875, 10.49609375, 11.072265625, 11.6484375, 12.224609375, 12.80078125, 13.376953125, 13.953125, 14.529296875, 15.10546875, 15.681640625, 16.2578125, 16.833984375, 17.41015625, 17.986328125, 18.5625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 11.0, 18.0, 44.0, 168.0, 374.0, 257.0, 94.0, 26.0, 10.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-202.83030700683594, -196.44622802734375, -190.0621337890625, -183.6780548095703, -177.29397583007812, -170.90988159179688, -164.5258026123047, -158.1417236328125, -151.75762939453125, -145.37355041503906, -138.9894561767578, -132.60537719726562, -126.2212905883789, -119.83720397949219, -113.453125, -107.06903839111328, -100.6849594116211, -94.30087280273438, -87.91679382324219, -81.53270721435547, -75.14862060546875, -68.76454162597656, -62.380455017089844, -55.996368408203125, -49.61228561401367, -43.22820281982422, -36.8441162109375, -30.460033416748047, -24.07594871520996, -17.691864013671875, -11.307781219482422, -4.923694610595703, 1.46038818359375, 7.844472408294678, 14.228556632995605, 20.612640380859375, 26.99672508239746, 33.38080978393555, 39.764892578125, 46.14897918701172, 52.53306198120117, 58.917144775390625, 65.30123138427734, 71.68531799316406, 78.06939697265625, 84.45348358154297, 90.83757019042969, 97.22164916992188, 103.6057357788086, 109.98982238769531, 116.3739013671875, 122.75798797607422, 129.14207458496094, 135.52615356445312, 141.91024780273438, 148.29432678222656, 154.67840576171875, 161.06248474121094, 167.4465789794922, 173.83065795898438, 180.21473693847656, 186.5988311767578, 192.98291015625, 199.36700439453125, 205.75108337402344]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 4.0, 6.0, 6.0, 8.0, 14.0, 9.0, 12.0, 17.0, 14.0, 23.0, 25.0, 26.0, 26.0, 29.0, 33.0, 33.0, 46.0, 40.0, 34.0, 55.0, 37.0, 36.0, 43.0, 40.0, 46.0, 35.0, 40.0, 34.0, 28.0, 36.0, 18.0, 24.0, 25.0, 21.0, 11.0, 13.0, 10.0, 7.0, 5.0, 8.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-58.242889404296875, -56.551963806152344, -54.86104202270508, -53.17011642456055, -51.479190826416016, -49.78826904296875, -48.09734344482422, -46.40641784667969, -44.715492248535156, -43.024566650390625, -41.33364486694336, -39.64271926879883, -37.9517936706543, -36.26087188720703, -34.5699462890625, -32.87902069091797, -31.188098907470703, -29.497175216674805, -27.806249618530273, -26.115325927734375, -24.424400329589844, -22.733476638793945, -21.042552947998047, -19.351627349853516, -17.660703659057617, -15.969779014587402, -14.278854370117188, -12.587930679321289, -10.897006034851074, -9.20608139038086, -7.515157699584961, -5.824233055114746, -4.133308410644531, -2.4423840045928955, -0.7514595985412598, 0.9394645690917969, 2.6303892135620117, 4.321313858032227, 6.012237548828125, 7.70316219329834, 9.394086837768555, 11.08501148223877, 12.775936126708984, 14.466859817504883, 16.15778350830078, 17.848709106445312, 19.53963279724121, 21.23055648803711, 22.92148208618164, 24.61240577697754, 26.30333137512207, 27.99425506591797, 29.6851806640625, 31.3761043548584, 33.0670280456543, 34.75795364379883, 36.448875427246094, 38.139801025390625, 39.83072280883789, 41.52164840698242, 43.21257400512695, 44.90349578857422, 46.59442138671875, 48.28534698486328, 49.97627258300781]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 1.0, 4.0, 7.0, 6.0, 5.0, 4.0, 13.0, 11.0, 14.0, 15.0, 24.0, 30.0, 22.0, 26.0, 18.0, 20.0, 29.0, 43.0, 32.0, 37.0, 43.0, 36.0, 42.0, 32.0, 41.0, 38.0, 39.0, 35.0, 32.0, 37.0, 32.0, 31.0, 22.0, 18.0, 32.0, 23.0, 14.0, 14.0, 12.0, 16.0, 10.0, 7.0, 11.0, 5.0, 4.0, 8.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.0, -7.73876953125, -7.4775390625, -7.21630859375, -6.955078125, -6.69384765625, -6.4326171875, -6.17138671875, -5.91015625, -5.64892578125, -5.3876953125, -5.12646484375, -4.865234375, -4.60400390625, -4.3427734375, -4.08154296875, -3.8203125, -3.55908203125, -3.2978515625, -3.03662109375, -2.775390625, -2.51416015625, -2.2529296875, -1.99169921875, -1.73046875, -1.46923828125, -1.2080078125, -0.94677734375, -0.685546875, -0.42431640625, -0.1630859375, 0.09814453125, 0.359375, 0.62060546875, 0.8818359375, 1.14306640625, 1.404296875, 1.66552734375, 1.9267578125, 2.18798828125, 2.44921875, 2.71044921875, 2.9716796875, 3.23291015625, 3.494140625, 3.75537109375, 4.0166015625, 4.27783203125, 4.5390625, 4.80029296875, 5.0615234375, 5.32275390625, 5.583984375, 5.84521484375, 6.1064453125, 6.36767578125, 6.62890625, 6.89013671875, 7.1513671875, 7.41259765625, 7.673828125, 7.93505859375, 8.1962890625, 8.45751953125, 8.71875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 17.0, 35.0, 23.0, 37.0, 60.0, 88.0, 141.0, 222.0, 295.0, 461.0, 705.0, 1022.0, 1571.0, 2418.0, 3492.0, 5059.0, 7827.0, 12034.0, 18059.0, 27853.0, 43539.0, 68164.0, 107490.0, 163204.0, 188080.0, 141310.0, 91236.0, 57510.0, 36736.0, 23747.0, 15430.0, 10277.0, 6643.0, 4600.0, 2993.0, 2015.0, 1414.0, 905.0, 583.0, 404.0, 265.0, 197.0, 136.0, 76.0, 69.0, 42.0, 23.0, 12.0, 15.0, 7.0, 2.0, 8.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.849609375, -0.822479248046875, -0.79534912109375, -0.768218994140625, -0.7410888671875, -0.713958740234375, -0.68682861328125, -0.659698486328125, -0.632568359375, -0.605438232421875, -0.57830810546875, -0.551177978515625, -0.5240478515625, -0.496917724609375, -0.46978759765625, -0.442657470703125, -0.41552734375, -0.388397216796875, -0.36126708984375, -0.334136962890625, -0.3070068359375, -0.279876708984375, -0.25274658203125, -0.225616455078125, -0.198486328125, -0.171356201171875, -0.14422607421875, -0.117095947265625, -0.0899658203125, -0.062835693359375, -0.03570556640625, -0.008575439453125, 0.0185546875, 0.045684814453125, 0.07281494140625, 0.099945068359375, 0.1270751953125, 0.154205322265625, 0.18133544921875, 0.208465576171875, 0.235595703125, 0.262725830078125, 0.28985595703125, 0.316986083984375, 0.3441162109375, 0.371246337890625, 0.39837646484375, 0.425506591796875, 0.45263671875, 0.479766845703125, 0.50689697265625, 0.534027099609375, 0.5611572265625, 0.588287353515625, 0.61541748046875, 0.642547607421875, 0.669677734375, 0.696807861328125, 0.72393798828125, 0.751068115234375, 0.7781982421875, 0.805328369140625, 0.83245849609375, 0.859588623046875, 0.88671875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 7.0, 6.0, 8.0, 15.0, 11.0, 13.0, 5.0, 26.0, 25.0, 19.0, 29.0, 25.0, 27.0, 41.0, 44.0, 50.0, 44.0, 50.0, 45.0, 1061.0, 42.0, 48.0, 51.0, 40.0, 36.0, 27.0, 33.0, 30.0, 27.0, 28.0, 22.0, 16.0, 20.0, 10.0, 10.0, 8.0, 8.0, 4.0, 12.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.53125, -6.34295654296875, -6.1546630859375, -5.96636962890625, -5.778076171875, -5.58978271484375, -5.4014892578125, -5.21319580078125, -5.02490234375, -4.83660888671875, -4.6483154296875, -4.46002197265625, -4.271728515625, -4.08343505859375, -3.8951416015625, -3.70684814453125, -3.5185546875, -3.33026123046875, -3.1419677734375, -2.95367431640625, -2.765380859375, -2.57708740234375, -2.3887939453125, -2.20050048828125, -2.01220703125, -1.82391357421875, -1.6356201171875, -1.44732666015625, -1.259033203125, -1.07073974609375, -0.8824462890625, -0.69415283203125, -0.505859375, -0.31756591796875, -0.1292724609375, 0.05902099609375, 0.247314453125, 0.43560791015625, 0.6239013671875, 0.81219482421875, 1.00048828125, 1.18878173828125, 1.3770751953125, 1.56536865234375, 1.753662109375, 1.94195556640625, 2.1302490234375, 2.31854248046875, 2.5068359375, 2.69512939453125, 2.8834228515625, 3.07171630859375, 3.260009765625, 3.44830322265625, 3.6365966796875, 3.82489013671875, 4.01318359375, 4.20147705078125, 4.3897705078125, 4.57806396484375, 4.766357421875, 4.95465087890625, 5.1429443359375, 5.33123779296875, 5.51953125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 7.0, 4.0, 9.0, 20.0, 23.0, 24.0, 39.0, 51.0, 97.0, 149.0, 204.0, 286.0, 398.0, 499.0, 768.0, 1144.0, 1574.0, 2222.0, 3226.0, 4671.0, 6692.0, 9835.0, 14111.0, 21842.0, 33019.0, 51477.0, 82716.0, 128446.0, 1092886.0, 293341.0, 123222.0, 78757.0, 48826.0, 31606.0, 20623.0, 13895.0, 9386.0, 6394.0, 4391.0, 3062.0, 2117.0, 1501.0, 1072.0, 784.0, 545.0, 371.0, 225.0, 194.0, 136.0, 81.0, 64.0, 40.0, 26.0, 14.0, 10.0, 13.0, 4.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.583984375, -0.565704345703125, -0.54742431640625, -0.529144287109375, -0.5108642578125, -0.492584228515625, -0.47430419921875, -0.456024169921875, -0.437744140625, -0.419464111328125, -0.40118408203125, -0.382904052734375, -0.3646240234375, -0.346343994140625, -0.32806396484375, -0.309783935546875, -0.29150390625, -0.273223876953125, -0.25494384765625, -0.236663818359375, -0.2183837890625, -0.200103759765625, -0.18182373046875, -0.163543701171875, -0.145263671875, -0.126983642578125, -0.10870361328125, -0.090423583984375, -0.0721435546875, -0.053863525390625, -0.03558349609375, -0.017303466796875, 0.0009765625, 0.019256591796875, 0.03753662109375, 0.055816650390625, 0.0740966796875, 0.092376708984375, 0.11065673828125, 0.128936767578125, 0.147216796875, 0.165496826171875, 0.18377685546875, 0.202056884765625, 0.2203369140625, 0.238616943359375, 0.25689697265625, 0.275177001953125, 0.29345703125, 0.311737060546875, 0.33001708984375, 0.348297119140625, 0.3665771484375, 0.384857177734375, 0.40313720703125, 0.421417236328125, 0.439697265625, 0.457977294921875, 0.47625732421875, 0.494537353515625, 0.5128173828125, 0.531097412109375, 0.54937744140625, 0.567657470703125, 0.5859375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 5.0, 5.0, 6.0, 8.0, 17.0, 11.0, 21.0, 41.0, 45.0, 74.0, 145.0, 230.0, 136.0, 83.0, 43.0, 35.0, 13.0, 16.0, 11.0, 7.0, 8.0, 5.0, 5.0, 4.0, 2.0, 6.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.038970947265625, -0.0378718376159668, -0.036772727966308594, -0.03567361831665039, -0.03457450866699219, -0.033475399017333984, -0.03237628936767578, -0.03127717971801758, -0.030178070068359375, -0.029078960418701172, -0.02797985076904297, -0.026880741119384766, -0.025781631469726562, -0.02468252182006836, -0.023583412170410156, -0.022484302520751953, -0.02138519287109375, -0.020286083221435547, -0.019186973571777344, -0.01808786392211914, -0.016988754272460938, -0.015889644622802734, -0.014790534973144531, -0.013691425323486328, -0.012592315673828125, -0.011493206024169922, -0.010394096374511719, -0.009294986724853516, -0.008195877075195312, -0.007096767425537109, -0.005997657775878906, -0.004898548126220703, -0.0037994384765625, -0.002700328826904297, -0.0016012191772460938, -0.0005021095275878906, 0.0005970001220703125, 0.0016961097717285156, 0.0027952194213867188, 0.003894329071044922, 0.004993438720703125, 0.006092548370361328, 0.007191658020019531, 0.008290767669677734, 0.009389877319335938, 0.01048898696899414, 0.011588096618652344, 0.012687206268310547, 0.01378631591796875, 0.014885425567626953, 0.015984535217285156, 0.01708364486694336, 0.018182754516601562, 0.019281864166259766, 0.02038097381591797, 0.021480083465576172, 0.022579193115234375, 0.023678302764892578, 0.02477741241455078, 0.025876522064208984, 0.026975631713867188, 0.02807474136352539, 0.029173851013183594, 0.030272960662841797, 0.0313720703125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 4.0, 9.0, 6.0, 9.0, 8.0, 13.0, 10.0, 10.0, 23.0, 29.0, 56.0, 70.0, 115.0, 167.0, 587.0, 32995.0, 1010690.0, 3036.0, 286.0, 135.0, 98.0, 65.0, 31.0, 20.0, 20.0, 10.0, 13.0, 9.0, 5.0, 5.0, 0.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.625, -0.6028900146484375, -0.580780029296875, -0.5586700439453125, -0.53656005859375, -0.5144500732421875, -0.492340087890625, -0.4702301025390625, -0.4481201171875, -0.4260101318359375, -0.403900146484375, -0.3817901611328125, -0.35968017578125, -0.3375701904296875, -0.315460205078125, -0.2933502197265625, -0.271240234375, -0.2491302490234375, -0.227020263671875, -0.2049102783203125, -0.18280029296875, -0.1606903076171875, -0.138580322265625, -0.1164703369140625, -0.0943603515625, -0.0722503662109375, -0.050140380859375, -0.0280303955078125, -0.00592041015625, 0.0161895751953125, 0.038299560546875, 0.0604095458984375, 0.08251953125, 0.1046295166015625, 0.126739501953125, 0.1488494873046875, 0.17095947265625, 0.1930694580078125, 0.215179443359375, 0.2372894287109375, 0.2593994140625, 0.2815093994140625, 0.303619384765625, 0.3257293701171875, 0.34783935546875, 0.3699493408203125, 0.392059326171875, 0.4141693115234375, 0.436279296875, 0.4583892822265625, 0.480499267578125, 0.5026092529296875, 0.52471923828125, 0.5468292236328125, 0.568939208984375, 0.5910491943359375, 0.6131591796875, 0.6352691650390625, 0.657379150390625, 0.6794891357421875, 0.70159912109375, 0.7237091064453125, 0.745819091796875, 0.7679290771484375, 0.7900390625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 8.0, 31.0, 93.0, 583.0, 262.0, 33.0, 7.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.272876501083374, -0.2660271227359772, -0.2591777443885803, -0.25232839584350586, -0.24547900259494781, -0.23862963914871216, -0.2317802608013153, -0.22493088245391846, -0.2180815041065216, -0.21123212575912476, -0.2043827623128891, -0.19753338396549225, -0.1906840056180954, -0.18383464217185974, -0.1769852638244629, -0.17013588547706604, -0.16328652203083038, -0.15643714368343353, -0.14958778023719788, -0.14273840188980103, -0.13588902354240417, -0.12903964519500732, -0.12219028174877167, -0.11534090340137482, -0.10849153250455856, -0.10164216160774231, -0.09479278326034546, -0.0879434123635292, -0.08109404146671295, -0.0742446631193161, -0.06739529222249985, -0.060545917600393295, -0.05369654297828674, -0.04684716835618019, -0.03999779373407364, -0.033148422837257385, -0.026299048215150833, -0.01944967359304428, -0.012600302696228027, -0.005750928074121475, 0.001098446547985077, 0.007947820238769054, 0.014797193929553032, 0.021646566689014435, 0.028495941311120987, 0.03534531593322754, 0.04219468683004379, 0.049044061452150345, 0.0558934360742569, 0.06274280697107315, 0.06959218531847, 0.07644155621528625, 0.0832909345626831, 0.09014030545949936, 0.09698967635631561, 0.10383905470371246, 0.11068842560052872, 0.11753779649734497, 0.12438717484474182, 0.13123655319213867, 0.13808591663837433, 0.14493529498577118, 0.15178465843200684, 0.1586340367794037, 0.16548341512680054]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 5.0, 5.0, 7.0, 7.0, 13.0, 19.0, 11.0, 15.0, 22.0, 24.0, 17.0, 20.0, 19.0, 39.0, 28.0, 28.0, 37.0, 44.0, 35.0, 44.0, 40.0, 46.0, 37.0, 41.0, 45.0, 34.0, 32.0, 34.0, 31.0, 42.0, 26.0, 25.0, 19.0, 22.0, 15.0, 16.0, 9.0, 14.0, 8.0, 7.0, 5.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.022802889347076416, -0.022143829613924026, -0.021484771743416786, -0.020825713872909546, -0.020166654139757156, -0.019507594406604767, -0.018848536536097527, -0.018189478665590286, -0.017530418932437897, -0.016871359199285507, -0.016212301328778267, -0.015553242526948452, -0.014894183725118637, -0.014235124923288822, -0.013576066121459007, -0.012917007319629192, -0.012257948517799377, -0.011598889715969563, -0.010939830914139748, -0.010280772112309933, -0.009621713310480118, -0.008962654508650303, -0.008303595706820488, -0.007644536904990673, -0.006985478103160858, -0.006326419301331043, -0.005667360499501228, -0.005008301697671413, -0.0043492428958415985, -0.0036901840940117836, -0.0030311252921819687, -0.0023720664903521538, -0.0017130076885223389, -0.001053948886692524, -0.00039489008486270905, 0.00026416871696710587, 0.0009232275187969208, 0.0015822863206267357, 0.0022413451224565506, 0.0029004039242863655, 0.0035594627261161804, 0.004218521527945995, 0.00487758032977581, 0.005536639131605625, 0.00619569793343544, 0.006854756735265255, 0.00751381553709507, 0.008172874338924885, 0.0088319331407547, 0.009490991942584515, 0.01015005074441433, 0.010809109546244144, 0.01146816834807396, 0.012127227149903774, 0.01278628595173359, 0.013445344753563404, 0.014104403555393219, 0.014763462357223034, 0.015422521159052849, 0.01608157902956009, 0.01674063876271248, 0.017399698495864868, 0.01805875636637211, 0.01871781423687935, 0.01937687397003174]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 1.0, 4.0, 7.0, 6.0, 5.0, 4.0, 13.0, 11.0, 14.0, 15.0, 24.0, 30.0, 22.0, 26.0, 18.0, 20.0, 28.0, 45.0, 31.0, 38.0, 42.0, 37.0, 41.0, 32.0, 41.0, 38.0, 39.0, 35.0, 32.0, 37.0, 32.0, 31.0, 22.0, 18.0, 32.0, 23.0, 14.0, 14.0, 11.0, 17.0, 10.0, 7.0, 11.0, 5.0, 4.0, 8.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.0, -7.73876953125, -7.4775390625, -7.21630859375, -6.955078125, -6.69384765625, -6.4326171875, -6.17138671875, -5.91015625, -5.64892578125, -5.3876953125, -5.12646484375, -4.865234375, -4.60400390625, -4.3427734375, -4.08154296875, -3.8203125, -3.55908203125, -3.2978515625, -3.03662109375, -2.775390625, -2.51416015625, -2.2529296875, -1.99169921875, -1.73046875, -1.46923828125, -1.2080078125, -0.94677734375, -0.685546875, -0.42431640625, -0.1630859375, 0.09814453125, 0.359375, 0.62060546875, 0.8818359375, 1.14306640625, 1.404296875, 1.66552734375, 1.9267578125, 2.18798828125, 2.44921875, 2.71044921875, 2.9716796875, 3.23291015625, 3.494140625, 3.75537109375, 4.0166015625, 4.27783203125, 4.5390625, 4.80029296875, 5.0615234375, 5.32275390625, 5.583984375, 5.84521484375, 6.1064453125, 6.36767578125, 6.62890625, 6.89013671875, 7.1513671875, 7.41259765625, 7.673828125, 7.93505859375, 8.1962890625, 8.45751953125, 8.71875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 8.0, 16.0, 8.0, 20.0, 19.0, 33.0, 49.0, 61.0, 95.0, 112.0, 158.0, 236.0, 360.0, 546.0, 807.0, 1190.0, 1837.0, 2899.0, 4572.0, 8297.0, 15497.0, 31646.0, 73524.0, 242450.0, 433318.0, 132096.0, 48214.0, 22233.0, 11319.0, 6390.0, 3747.0, 2265.0, 1436.0, 976.0, 671.0, 436.0, 300.0, 189.0, 161.0, 113.0, 68.0, 42.0, 42.0, 30.0, 22.0, 9.0, 16.0, 6.0, 5.0, 9.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.109375, -10.7423095703125, -10.375244140625, -10.0081787109375, -9.64111328125, -9.2740478515625, -8.906982421875, -8.5399169921875, -8.1728515625, -7.8057861328125, -7.438720703125, -7.0716552734375, -6.70458984375, -6.3375244140625, -5.970458984375, -5.6033935546875, -5.236328125, -4.8692626953125, -4.502197265625, -4.1351318359375, -3.76806640625, -3.4010009765625, -3.033935546875, -2.6668701171875, -2.2998046875, -1.9327392578125, -1.565673828125, -1.1986083984375, -0.83154296875, -0.4644775390625, -0.097412109375, 0.2696533203125, 0.63671875, 1.0037841796875, 1.370849609375, 1.7379150390625, 2.10498046875, 2.4720458984375, 2.839111328125, 3.2061767578125, 3.5732421875, 3.9403076171875, 4.307373046875, 4.6744384765625, 5.04150390625, 5.4085693359375, 5.775634765625, 6.1427001953125, 6.509765625, 6.8768310546875, 7.243896484375, 7.6109619140625, 7.97802734375, 8.3450927734375, 8.712158203125, 9.0792236328125, 9.4462890625, 9.8133544921875, 10.180419921875, 10.5474853515625, 10.91455078125, 11.2816162109375, 11.648681640625, 12.0157470703125, 12.3828125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 0.0, 5.0, 3.0, 7.0, 10.0, 11.0, 14.0, 7.0, 10.0, 16.0, 17.0, 28.0, 19.0, 26.0, 24.0, 32.0, 26.0, 41.0, 45.0, 67.0, 80.0, 102.0, 216.0, 1388.0, 248.0, 120.0, 94.0, 54.0, 38.0, 47.0, 27.0, 24.0, 27.0, 18.0, 24.0, 20.0, 10.0, 20.0, 21.0, 9.0, 14.0, 10.0, 11.0, 7.0, 6.0, 2.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-21.78125, -21.15185546875, -20.5224609375, -19.89306640625, -19.263671875, -18.63427734375, -18.0048828125, -17.37548828125, -16.74609375, -16.11669921875, -15.4873046875, -14.85791015625, -14.228515625, -13.59912109375, -12.9697265625, -12.34033203125, -11.7109375, -11.08154296875, -10.4521484375, -9.82275390625, -9.193359375, -8.56396484375, -7.9345703125, -7.30517578125, -6.67578125, -6.04638671875, -5.4169921875, -4.78759765625, -4.158203125, -3.52880859375, -2.8994140625, -2.27001953125, -1.640625, -1.01123046875, -0.3818359375, 0.24755859375, 0.876953125, 1.50634765625, 2.1357421875, 2.76513671875, 3.39453125, 4.02392578125, 4.6533203125, 5.28271484375, 5.912109375, 6.54150390625, 7.1708984375, 7.80029296875, 8.4296875, 9.05908203125, 9.6884765625, 10.31787109375, 10.947265625, 11.57666015625, 12.2060546875, 12.83544921875, 13.46484375, 14.09423828125, 14.7236328125, 15.35302734375, 15.982421875, 16.61181640625, 17.2412109375, 17.87060546875, 18.5]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 4.0, 5.0, 5.0, 4.0, 11.0, 7.0, 11.0, 24.0, 20.0, 39.0, 60.0, 74.0, 118.0, 235.0, 501.0, 1783.0, 15571.0, 2630840.0, 485383.0, 8741.0, 1297.0, 405.0, 193.0, 122.0, 70.0, 48.0, 34.0, 20.0, 27.0, 10.0, 8.0, 12.0, 6.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-61.0, -59.1455078125, -57.291015625, -55.4365234375, -53.58203125, -51.7275390625, -49.873046875, -48.0185546875, -46.1640625, -44.3095703125, -42.455078125, -40.6005859375, -38.74609375, -36.8916015625, -35.037109375, -33.1826171875, -31.328125, -29.4736328125, -27.619140625, -25.7646484375, -23.91015625, -22.0556640625, -20.201171875, -18.3466796875, -16.4921875, -14.6376953125, -12.783203125, -10.9287109375, -9.07421875, -7.2197265625, -5.365234375, -3.5107421875, -1.65625, 0.1982421875, 2.052734375, 3.9072265625, 5.76171875, 7.6162109375, 9.470703125, 11.3251953125, 13.1796875, 15.0341796875, 16.888671875, 18.7431640625, 20.59765625, 22.4521484375, 24.306640625, 26.1611328125, 28.015625, 29.8701171875, 31.724609375, 33.5791015625, 35.43359375, 37.2880859375, 39.142578125, 40.9970703125, 42.8515625, 44.7060546875, 46.560546875, 48.4150390625, 50.26953125, 52.1240234375, 53.978515625, 55.8330078125, 57.6875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 24.0, 522.0, 459.0, 12.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-464.90570068359375, -455.78759765625, -446.66949462890625, -437.5513610839844, -428.4332580566406, -419.3151550292969, -410.1970520019531, -401.0789489746094, -391.9608154296875, -382.84271240234375, -373.724609375, -364.6064758300781, -355.4883728027344, -346.3702697753906, -337.2521667480469, -328.1340637207031, -319.0159606933594, -309.8978576660156, -300.7797546386719, -291.66162109375, -282.54351806640625, -273.4254150390625, -264.30731201171875, -255.189208984375, -246.0710906982422, -236.95298767089844, -227.83486938476562, -218.71676635742188, -209.59866333007812, -200.4805450439453, -191.36244201660156, -182.24432373046875, -173.126220703125, -164.00811767578125, -154.88999938964844, -145.7718963623047, -136.65377807617188, -127.53567504882812, -118.41757202148438, -109.2994613647461, -100.18134307861328, -91.063232421875, -81.94512939453125, -72.82701873779297, -63.70890808105469, -54.590797424316406, -45.47269058227539, -36.354583740234375, -27.236473083496094, -18.118364334106445, -9.000255584716797, 0.11785316467285156, 9.2359619140625, 18.35407257080078, 27.472179412841797, 36.59028625488281, 45.708396911621094, 54.826507568359375, 63.94461441040039, 73.0627212524414, 82.18083190917969, 91.29894256591797, 100.41705322265625, 109.53515625, 118.65326690673828]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 9.0, 14.0, 8.0, 9.0, 15.0, 10.0, 24.0, 25.0, 17.0, 37.0, 26.0, 45.0, 31.0, 21.0, 37.0, 33.0, 47.0, 45.0, 47.0, 49.0, 50.0, 40.0, 48.0, 23.0, 37.0, 29.0, 30.0, 32.0, 24.0, 15.0, 18.0, 14.0, 20.0, 15.0, 12.0, 7.0, 8.0, 8.0, 3.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-50.259281158447266, -48.63461685180664, -47.009952545166016, -45.38528823852539, -43.760623931884766, -42.13595962524414, -40.51129150390625, -38.886627197265625, -37.261962890625, -35.637298583984375, -34.01263427734375, -32.387969970703125, -30.7633056640625, -29.138641357421875, -27.513975143432617, -25.889310836791992, -24.2646484375, -22.639984130859375, -21.01531982421875, -19.390655517578125, -17.7659912109375, -16.141326904296875, -14.516660690307617, -12.891996383666992, -11.267332077026367, -9.642667770385742, -8.018003463745117, -6.393338203430176, -4.768673896789551, -3.144009590148926, -1.5193443298339844, 0.10531997680664062, 1.7299880981445312, 3.3546526432037354, 4.9793171882629395, 6.603981971740723, 8.228646278381348, 9.853310585021973, 11.477975845336914, 13.102640151977539, 14.727304458618164, 16.35196876525879, 17.976633071899414, 19.601299285888672, 21.225963592529297, 22.850627899169922, 24.475292205810547, 26.099956512451172, 27.724620819091797, 29.349285125732422, 30.973949432373047, 32.59861373901367, 34.2232780456543, 35.84794235229492, 37.47261047363281, 39.09727478027344, 40.72193908691406, 42.34660339355469, 43.97126770019531, 45.59593200683594, 47.22059631347656, 48.84526062011719, 50.46992492675781, 52.09458923339844, 53.71925354003906]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 3.0, 8.0, 6.0, 7.0, 12.0, 8.0, 16.0, 21.0, 18.0, 16.0, 23.0, 22.0, 22.0, 24.0, 27.0, 40.0, 46.0, 39.0, 46.0, 34.0, 31.0, 45.0, 40.0, 36.0, 27.0, 36.0, 36.0, 28.0, 29.0, 39.0, 31.0, 22.0, 20.0, 13.0, 18.0, 18.0, 13.0, 11.0, 11.0, 13.0, 15.0, 5.0, 8.0, 7.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-8.3203125, -8.0587158203125, -7.797119140625, -7.5355224609375, -7.27392578125, -7.0123291015625, -6.750732421875, -6.4891357421875, -6.2275390625, -5.9659423828125, -5.704345703125, -5.4427490234375, -5.18115234375, -4.9195556640625, -4.657958984375, -4.3963623046875, -4.134765625, -3.8731689453125, -3.611572265625, -3.3499755859375, -3.08837890625, -2.8267822265625, -2.565185546875, -2.3035888671875, -2.0419921875, -1.7803955078125, -1.518798828125, -1.2572021484375, -0.99560546875, -0.7340087890625, -0.472412109375, -0.2108154296875, 0.05078125, 0.3123779296875, 0.573974609375, 0.8355712890625, 1.09716796875, 1.3587646484375, 1.620361328125, 1.8819580078125, 2.1435546875, 2.4051513671875, 2.666748046875, 2.9283447265625, 3.18994140625, 3.4515380859375, 3.713134765625, 3.9747314453125, 4.236328125, 4.4979248046875, 4.759521484375, 5.0211181640625, 5.28271484375, 5.5443115234375, 5.805908203125, 6.0675048828125, 6.3291015625, 6.5906982421875, 6.852294921875, 7.1138916015625, 7.37548828125, 7.6370849609375, 7.898681640625, 8.1602783203125, 8.421875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 4.0, 4.0, 10.0, 7.0, 10.0, 15.0, 15.0, 27.0, 30.0, 21.0, 31.0, 47.0, 48.0, 80.0, 105.0, 130.0, 211.0, 352.0, 661.0, 1601.0, 7606.0, 2301515.0, 1871348.0, 7077.0, 1513.0, 655.0, 348.0, 218.0, 147.0, 105.0, 61.0, 53.0, 52.0, 31.0, 22.0, 26.0, 17.0, 14.0, 16.0, 13.0, 8.0, 8.0, 1.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-78.875, -76.4091796875, -73.943359375, -71.4775390625, -69.01171875, -66.5458984375, -64.080078125, -61.6142578125, -59.1484375, -56.6826171875, -54.216796875, -51.7509765625, -49.28515625, -46.8193359375, -44.353515625, -41.8876953125, -39.421875, -36.9560546875, -34.490234375, -32.0244140625, -29.55859375, -27.0927734375, -24.626953125, -22.1611328125, -19.6953125, -17.2294921875, -14.763671875, -12.2978515625, -9.83203125, -7.3662109375, -4.900390625, -2.4345703125, 0.03125, 2.4970703125, 4.962890625, 7.4287109375, 9.89453125, 12.3603515625, 14.826171875, 17.2919921875, 19.7578125, 22.2236328125, 24.689453125, 27.1552734375, 29.62109375, 32.0869140625, 34.552734375, 37.0185546875, 39.484375, 41.9501953125, 44.416015625, 46.8818359375, 49.34765625, 51.8134765625, 54.279296875, 56.7451171875, 59.2109375, 61.6767578125, 64.142578125, 66.6083984375, 69.07421875, 71.5400390625, 74.005859375, 76.4716796875, 78.9375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 4.0, 2.0, 7.0, 4.0, 4.0, 5.0, 4.0, 9.0, 11.0, 14.0, 17.0, 29.0, 32.0, 52.0, 69.0, 69.0, 114.0, 180.0, 315.0, 515.0, 720.0, 667.0, 432.0, 256.0, 168.0, 108.0, 57.0, 48.0, 38.0, 25.0, 27.0, 20.0, 11.0, 11.0, 9.0, 9.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9140625, -12.4500732421875, -11.986083984375, -11.5220947265625, -11.05810546875, -10.5941162109375, -10.130126953125, -9.6661376953125, -9.2021484375, -8.7381591796875, -8.274169921875, -7.8101806640625, -7.34619140625, -6.8822021484375, -6.418212890625, -5.9542236328125, -5.490234375, -5.0262451171875, -4.562255859375, -4.0982666015625, -3.63427734375, -3.1702880859375, -2.706298828125, -2.2423095703125, -1.7783203125, -1.3143310546875, -0.850341796875, -0.3863525390625, 0.07763671875, 0.5416259765625, 1.005615234375, 1.4696044921875, 1.93359375, 2.3975830078125, 2.861572265625, 3.3255615234375, 3.78955078125, 4.2535400390625, 4.717529296875, 5.1815185546875, 5.6455078125, 6.1094970703125, 6.573486328125, 7.0374755859375, 7.50146484375, 7.9654541015625, 8.429443359375, 8.8934326171875, 9.357421875, 9.8214111328125, 10.285400390625, 10.7493896484375, 11.21337890625, 11.6773681640625, 12.141357421875, 12.6053466796875, 13.0693359375, 13.5333251953125, 13.997314453125, 14.4613037109375, 14.92529296875, 15.3892822265625, 15.853271484375, 16.3172607421875, 16.78125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 7.0, 3.0, 7.0, 11.0, 7.0, 9.0, 12.0, 17.0, 29.0, 28.0, 39.0, 47.0, 97.0, 143.0, 281.0, 578.0, 1362.0, 3750.0, 12159.0, 70420.0, 2531681.0, 1502151.0, 55510.0, 10341.0, 3185.0, 1200.0, 497.0, 280.0, 132.0, 79.0, 54.0, 35.0, 20.0, 27.0, 26.0, 13.0, 13.0, 5.0, 6.0, 4.0, 3.0, 3.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.03125, -34.9033203125, -33.775390625, -32.6474609375, -31.51953125, -30.3916015625, -29.263671875, -28.1357421875, -27.0078125, -25.8798828125, -24.751953125, -23.6240234375, -22.49609375, -21.3681640625, -20.240234375, -19.1123046875, -17.984375, -16.8564453125, -15.728515625, -14.6005859375, -13.47265625, -12.3447265625, -11.216796875, -10.0888671875, -8.9609375, -7.8330078125, -6.705078125, -5.5771484375, -4.44921875, -3.3212890625, -2.193359375, -1.0654296875, 0.0625, 1.1904296875, 2.318359375, 3.4462890625, 4.57421875, 5.7021484375, 6.830078125, 7.9580078125, 9.0859375, 10.2138671875, 11.341796875, 12.4697265625, 13.59765625, 14.7255859375, 15.853515625, 16.9814453125, 18.109375, 19.2373046875, 20.365234375, 21.4931640625, 22.62109375, 23.7490234375, 24.876953125, 26.0048828125, 27.1328125, 28.2607421875, 29.388671875, 30.5166015625, 31.64453125, 32.7724609375, 33.900390625, 35.0283203125, 36.15625]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 16.0, 23.0, 30.0, 59.0, 108.0, 151.0, 186.0, 161.0, 106.0, 71.0, 44.0, 30.0, 11.0, 7.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.5049991607666, -24.248519897460938, -21.99203872680664, -19.735557556152344, -17.47907829284668, -15.2225980758667, -12.966117858886719, -10.709637641906738, -8.453157424926758, -6.196677207946777, -3.940196990966797, -1.6837167739868164, 0.5727634429931641, 2.8292436599731445, 5.085723876953125, 7.3422040939331055, 9.598684310913086, 11.855164527893066, 14.111644744873047, 16.368125915527344, 18.624605178833008, 20.881084442138672, 23.13756561279297, 25.394046783447266, 27.65052604675293, 29.907005310058594, 32.16348648071289, 34.41996765136719, 36.67644500732422, 38.932926177978516, 41.18940734863281, 43.44588851928711, 45.702362060546875, 47.95884323120117, 50.21532440185547, 52.4718017578125, 54.7282829284668, 56.984764099121094, 59.241241455078125, 61.49772262573242, 63.75420379638672, 66.01068115234375, 68.26716613769531, 70.52364349365234, 72.78012084960938, 75.03660583496094, 77.29308319091797, 79.54956817626953, 81.80604553222656, 84.0625228881836, 86.31900787353516, 88.57548522949219, 90.83197021484375, 93.08844757080078, 95.34492492675781, 97.60140991210938, 99.8578872680664, 102.11436462402344, 104.370849609375, 106.62732696533203, 108.88380432128906, 111.14028930664062, 113.39676666259766, 115.65325164794922, 117.90972900390625]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 3.0, 1.0, 7.0, 4.0, 4.0, 10.0, 9.0, 15.0, 8.0, 14.0, 12.0, 24.0, 31.0, 21.0, 26.0, 29.0, 25.0, 33.0, 31.0, 32.0, 35.0, 35.0, 43.0, 40.0, 55.0, 39.0, 38.0, 30.0, 30.0, 30.0, 31.0, 29.0, 21.0, 28.0, 29.0, 19.0, 23.0, 16.0, 16.0, 13.0, 15.0, 11.0, 6.0, 9.0, 7.0, 2.0, 1.0, 6.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-41.1014404296875, -39.82278823852539, -38.54413604736328, -37.26548767089844, -35.98683547973633, -34.70818328857422, -33.429534912109375, -32.150882720947266, -30.872230529785156, -29.593578338623047, -28.31492805480957, -27.036277770996094, -25.757625579833984, -24.478973388671875, -23.2003231048584, -21.921672821044922, -20.643020629882812, -19.364368438720703, -18.085718154907227, -16.80706787109375, -15.52841567993164, -14.249764442443848, -12.971113204956055, -11.692461967468262, -10.413810729980469, -9.135159492492676, -7.856508255004883, -6.57785701751709, -5.299205780029297, -4.020554542541504, -2.741903305053711, -1.463252067565918, -0.184600830078125, 1.094050407409668, 2.372701644897461, 3.651352882385254, 4.930004119873047, 6.20865535736084, 7.487306594848633, 8.765957832336426, 10.044609069824219, 11.323260307312012, 12.601911544799805, 13.880562782287598, 15.15921401977539, 16.4378662109375, 17.716516494750977, 18.995166778564453, 20.273818969726562, 21.552471160888672, 22.83112144470215, 24.109771728515625, 25.388423919677734, 26.667076110839844, 27.94572639465332, 29.224376678466797, 30.503028869628906, 31.781681060791016, 33.060333251953125, 34.33898162841797, 35.61763381958008, 36.89628601074219, 38.17493438720703, 39.45358657836914, 40.73223876953125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 7.0, 8.0, 5.0, 7.0, 7.0, 8.0, 20.0, 11.0, 13.0, 12.0, 18.0, 22.0, 30.0, 28.0, 36.0, 37.0, 37.0, 48.0, 32.0, 49.0, 38.0, 42.0, 40.0, 42.0, 39.0, 30.0, 37.0, 27.0, 32.0, 22.0, 34.0, 28.0, 18.0, 10.0, 18.0, 17.0, 13.0, 10.0, 12.0, 13.0, 10.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.84375, -7.58544921875, -7.3271484375, -7.06884765625, -6.810546875, -6.55224609375, -6.2939453125, -6.03564453125, -5.77734375, -5.51904296875, -5.2607421875, -5.00244140625, -4.744140625, -4.48583984375, -4.2275390625, -3.96923828125, -3.7109375, -3.45263671875, -3.1943359375, -2.93603515625, -2.677734375, -2.41943359375, -2.1611328125, -1.90283203125, -1.64453125, -1.38623046875, -1.1279296875, -0.86962890625, -0.611328125, -0.35302734375, -0.0947265625, 0.16357421875, 0.421875, 0.68017578125, 0.9384765625, 1.19677734375, 1.455078125, 1.71337890625, 1.9716796875, 2.22998046875, 2.48828125, 2.74658203125, 3.0048828125, 3.26318359375, 3.521484375, 3.77978515625, 4.0380859375, 4.29638671875, 4.5546875, 4.81298828125, 5.0712890625, 5.32958984375, 5.587890625, 5.84619140625, 6.1044921875, 6.36279296875, 6.62109375, 6.87939453125, 7.1376953125, 7.39599609375, 7.654296875, 7.91259765625, 8.1708984375, 8.42919921875, 8.6875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 10.0, 22.0, 24.0, 47.0, 63.0, 103.0, 153.0, 225.0, 388.0, 607.0, 927.0, 1455.0, 2293.0, 3528.0, 5694.0, 9145.0, 14662.0, 23310.0, 37649.0, 61668.0, 101214.0, 161099.0, 208675.0, 158345.0, 98531.0, 60469.0, 37088.0, 22760.0, 14129.0, 8856.0, 5656.0, 3544.0, 2187.0, 1496.0, 927.0, 582.0, 361.0, 238.0, 162.0, 101.0, 57.0, 45.0, 17.0, 19.0, 12.0, 3.0, 9.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.029296875, -0.9976043701171875, -0.965911865234375, -0.9342193603515625, -0.90252685546875, -0.8708343505859375, -0.839141845703125, -0.8074493408203125, -0.7757568359375, -0.7440643310546875, -0.712371826171875, -0.6806793212890625, -0.64898681640625, -0.6172943115234375, -0.585601806640625, -0.5539093017578125, -0.522216796875, -0.4905242919921875, -0.458831787109375, -0.4271392822265625, -0.39544677734375, -0.3637542724609375, -0.332061767578125, -0.3003692626953125, -0.2686767578125, -0.2369842529296875, -0.205291748046875, -0.1735992431640625, -0.14190673828125, -0.1102142333984375, -0.078521728515625, -0.0468292236328125, -0.01513671875, 0.0165557861328125, 0.048248291015625, 0.0799407958984375, 0.11163330078125, 0.1433258056640625, 0.175018310546875, 0.2067108154296875, 0.2384033203125, 0.2700958251953125, 0.301788330078125, 0.3334808349609375, 0.36517333984375, 0.3968658447265625, 0.428558349609375, 0.4602508544921875, 0.491943359375, 0.5236358642578125, 0.555328369140625, 0.5870208740234375, 0.61871337890625, 0.6504058837890625, 0.682098388671875, 0.7137908935546875, 0.7454833984375, 0.7771759033203125, 0.808868408203125, 0.8405609130859375, 0.87225341796875, 0.9039459228515625, 0.935638427734375, 0.9673309326171875, 0.9990234375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 10.0, 9.0, 3.0, 6.0, 13.0, 14.0, 21.0, 24.0, 17.0, 25.0, 33.0, 37.0, 28.0, 33.0, 34.0, 36.0, 36.0, 36.0, 56.0, 1063.0, 46.0, 35.0, 45.0, 38.0, 45.0, 43.0, 37.0, 28.0, 23.0, 21.0, 17.0, 17.0, 16.0, 21.0, 9.0, 4.0, 7.0, 2.0, 11.0, 7.0, 4.0, 2.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.484375, -5.30426025390625, -5.1241455078125, -4.94403076171875, -4.763916015625, -4.58380126953125, -4.4036865234375, -4.22357177734375, -4.04345703125, -3.86334228515625, -3.6832275390625, -3.50311279296875, -3.322998046875, -3.14288330078125, -2.9627685546875, -2.78265380859375, -2.6025390625, -2.42242431640625, -2.2423095703125, -2.06219482421875, -1.882080078125, -1.70196533203125, -1.5218505859375, -1.34173583984375, -1.16162109375, -0.98150634765625, -0.8013916015625, -0.62127685546875, -0.441162109375, -0.26104736328125, -0.0809326171875, 0.09918212890625, 0.279296875, 0.45941162109375, 0.6395263671875, 0.81964111328125, 0.999755859375, 1.17987060546875, 1.3599853515625, 1.54010009765625, 1.72021484375, 1.90032958984375, 2.0804443359375, 2.26055908203125, 2.440673828125, 2.62078857421875, 2.8009033203125, 2.98101806640625, 3.1611328125, 3.34124755859375, 3.5213623046875, 3.70147705078125, 3.881591796875, 4.06170654296875, 4.2418212890625, 4.42193603515625, 4.60205078125, 4.78216552734375, 4.9622802734375, 5.14239501953125, 5.322509765625, 5.50262451171875, 5.6827392578125, 5.86285400390625, 6.04296875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 5.0, 10.0, 20.0, 43.0, 44.0, 67.0, 110.0, 138.0, 198.0, 269.0, 403.0, 621.0, 828.0, 1303.0, 1753.0, 2774.0, 3862.0, 5704.0, 8489.0, 12535.0, 18882.0, 28446.0, 44173.0, 68705.0, 107683.0, 157598.0, 1214421.0, 142399.0, 96536.0, 61696.0, 39130.0, 25773.0, 16889.0, 11339.0, 7594.0, 5228.0, 3638.0, 2444.0, 1679.0, 1159.0, 796.0, 525.0, 378.0, 250.0, 194.0, 137.0, 78.0, 65.0, 55.0, 22.0, 21.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 4.0], "bins": [-0.61767578125, -0.5985946655273438, -0.5795135498046875, -0.5604324340820312, -0.541351318359375, -0.5222702026367188, -0.5031890869140625, -0.48410797119140625, -0.46502685546875, -0.44594573974609375, -0.4268646240234375, -0.40778350830078125, -0.388702392578125, -0.36962127685546875, -0.3505401611328125, -0.33145904541015625, -0.3123779296875, -0.29329681396484375, -0.2742156982421875, -0.25513458251953125, -0.236053466796875, -0.21697235107421875, -0.1978912353515625, -0.17881011962890625, -0.15972900390625, -0.14064788818359375, -0.1215667724609375, -0.10248565673828125, -0.083404541015625, -0.06432342529296875, -0.0452423095703125, -0.02616119384765625, -0.007080078125, 0.01200103759765625, 0.0310821533203125, 0.05016326904296875, 0.069244384765625, 0.08832550048828125, 0.1074066162109375, 0.12648773193359375, 0.14556884765625, 0.16464996337890625, 0.1837310791015625, 0.20281219482421875, 0.221893310546875, 0.24097442626953125, 0.2600555419921875, 0.27913665771484375, 0.2982177734375, 0.31729888916015625, 0.3363800048828125, 0.35546112060546875, 0.374542236328125, 0.39362335205078125, 0.4127044677734375, 0.43178558349609375, 0.45086669921875, 0.46994781494140625, 0.4890289306640625, 0.5081100463867188, 0.527191162109375, 0.5462722778320312, 0.5653533935546875, 0.5844345092773438, 0.603515625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 1.0, 11.0, 7.0, 12.0, 21.0, 23.0, 32.0, 39.0, 80.0, 157.0, 210.0, 124.0, 70.0, 54.0, 34.0, 26.0, 22.0, 11.0, 5.0, 8.0, 3.0, 6.0, 5.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.053466796875, -0.05195426940917969, -0.050441741943359375, -0.04892921447753906, -0.04741668701171875, -0.04590415954589844, -0.044391632080078125, -0.04287910461425781, -0.0413665771484375, -0.03985404968261719, -0.038341522216796875, -0.03682899475097656, -0.03531646728515625, -0.03380393981933594, -0.032291412353515625, -0.030778884887695312, -0.029266357421875, -0.027753829956054688, -0.026241302490234375, -0.024728775024414062, -0.02321624755859375, -0.021703720092773438, -0.020191192626953125, -0.018678665161132812, -0.0171661376953125, -0.015653610229492188, -0.014141082763671875, -0.012628555297851562, -0.01111602783203125, -0.009603500366210938, -0.008090972900390625, -0.0065784454345703125, -0.00506591796875, -0.0035533905029296875, -0.002040863037109375, -0.0005283355712890625, 0.00098419189453125, 0.0024967193603515625, 0.004009246826171875, 0.0055217742919921875, 0.0070343017578125, 0.008546829223632812, 0.010059356689453125, 0.011571884155273438, 0.01308441162109375, 0.014596939086914062, 0.016109466552734375, 0.017621994018554688, 0.019134521484375, 0.020647048950195312, 0.022159576416015625, 0.023672103881835938, 0.02518463134765625, 0.026697158813476562, 0.028209686279296875, 0.029722213745117188, 0.0312347412109375, 0.03274726867675781, 0.034259796142578125, 0.03577232360839844, 0.03728485107421875, 0.03879737854003906, 0.040309906005859375, 0.04182243347167969, 0.0433349609375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 2.0, 6.0, 4.0, 3.0, 13.0, 13.0, 20.0, 19.0, 28.0, 47.0, 70.0, 113.0, 170.0, 576.0, 5841.0, 1023166.0, 17090.0, 747.0, 208.0, 103.0, 92.0, 42.0, 39.0, 26.0, 23.0, 12.0, 10.0, 11.0, 8.0, 8.0, 3.0, 3.0, 7.0, 2.0, 4.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85595703125, -0.8260574340820312, -0.7961578369140625, -0.7662582397460938, -0.736358642578125, -0.7064590454101562, -0.6765594482421875, -0.6466598510742188, -0.61676025390625, -0.5868606567382812, -0.5569610595703125, -0.5270614624023438, -0.497161865234375, -0.46726226806640625, -0.4373626708984375, -0.40746307373046875, -0.3775634765625, -0.34766387939453125, -0.3177642822265625, -0.28786468505859375, -0.257965087890625, -0.22806549072265625, -0.1981658935546875, -0.16826629638671875, -0.13836669921875, -0.10846710205078125, -0.0785675048828125, -0.04866790771484375, -0.018768310546875, 0.01113128662109375, 0.0410308837890625, 0.07093048095703125, 0.100830078125, 0.13072967529296875, 0.1606292724609375, 0.19052886962890625, 0.220428466796875, 0.25032806396484375, 0.2802276611328125, 0.31012725830078125, 0.34002685546875, 0.36992645263671875, 0.3998260498046875, 0.42972564697265625, 0.459625244140625, 0.48952484130859375, 0.5194244384765625, 0.5493240356445312, 0.5792236328125, 0.6091232299804688, 0.6390228271484375, 0.6689224243164062, 0.698822021484375, 0.7287216186523438, 0.7586212158203125, 0.7885208129882812, 0.81842041015625, 0.8483200073242188, 0.8782196044921875, 0.9081192016601562, 0.938018798828125, 0.9679183959960938, 0.9978179931640625, 1.0277175903320312, 1.0576171875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 3.0, 4.0, 6.0, 9.0, 9.0, 15.0, 17.0, 20.0, 29.0, 51.0, 83.0, 100.0, 140.0, 176.0, 112.0, 75.0, 49.0, 26.0, 21.0, 13.0, 15.0, 5.0, 6.0, 5.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05558837205171585, -0.05386858060956001, -0.052148789167404175, -0.05042899772524834, -0.0487092062830925, -0.04698941484093666, -0.04526962339878082, -0.043549828231334686, -0.04183004051446915, -0.04011024907231331, -0.03839045763015747, -0.03667066618800163, -0.034950874745845795, -0.03323108330368996, -0.03151129186153412, -0.02979149855673313, -0.028071705251932144, -0.026351913809776306, -0.024632122367620468, -0.02291233092546463, -0.021192539483308792, -0.019472748041152954, -0.017752954736351967, -0.01603316329419613, -0.01431337185204029, -0.012593580409884453, -0.010873788967728615, -0.009153996594250202, -0.007434205152094364, -0.005714413709938526, -0.0039946213364601135, -0.0022748298943042755, -0.000555034726858139, 0.0011647569481283426, 0.0028845486231148243, 0.00460434053093195, 0.006324131973087788, 0.008043923415243626, 0.009763715788722038, 0.011483507230877876, 0.013203298673033714, 0.014923090115189552, 0.01664288155734539, 0.018362674862146378, 0.020082466304302216, 0.021802257746458054, 0.02352204918861389, 0.02524184063076973, 0.026961632072925568, 0.028681423515081406, 0.030401214957237244, 0.03212100639939308, 0.03384079784154892, 0.03556058928370476, 0.037280380725860596, 0.03900017589330673, 0.04071996361017227, 0.04243975505232811, 0.04415954649448395, 0.045879337936639786, 0.047599129378795624, 0.04931892082095146, 0.0510387122631073, 0.052758507430553436, 0.054478298872709274]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 9.0, 9.0, 7.0, 11.0, 15.0, 11.0, 13.0, 21.0, 17.0, 27.0, 24.0, 33.0, 23.0, 25.0, 37.0, 41.0, 37.0, 61.0, 36.0, 44.0, 43.0, 52.0, 48.0, 33.0, 51.0, 25.0, 40.0, 35.0, 28.0, 22.0, 19.0, 18.0, 16.0, 22.0, 13.0, 8.0, 8.0, 8.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.023683011531829834, -0.022920023649930954, -0.022157037630677223, -0.021394051611423492, -0.020631063729524612, -0.019868075847625732, -0.019105089828372, -0.01834210380911827, -0.01757911592721939, -0.01681612804532051, -0.01605314202606678, -0.015290155075490475, -0.01452716812491417, -0.013764181174337864, -0.013001194223761559, -0.012238207273185253, -0.011475220322608948, -0.010712233372032642, -0.009949246421456337, -0.009186259470880032, -0.008423272520303726, -0.007660285569727421, -0.006897298619151115, -0.00613431166857481, -0.005371324717998505, -0.004608337767422199, -0.003845350816845894, -0.0030823638662695885, -0.002319376915693283, -0.0015563899651169777, -0.0007934030145406723, -3.0416063964366913e-05, 0.0007325708866119385, 0.0014955578371882439, 0.0022585447877645493, 0.0030215317383408546, 0.00378451868891716, 0.004547505639493465, 0.005310492590069771, 0.006073479540646076, 0.006836466491222382, 0.007599453441798687, 0.008362440392374992, 0.009125427342951298, 0.009888414293527603, 0.010651401244103909, 0.011414388194680214, 0.01217737514525652, 0.012940362095832825, 0.01370334904640913, 0.014466335996985435, 0.015229322947561741, 0.015992309898138046, 0.016755297780036926, 0.017518283799290657, 0.018281269818544388, 0.019044257700443268, 0.019807245582342148, 0.02057023160159588, 0.02133321762084961, 0.02209620550274849, 0.02285919338464737, 0.0236221794039011, 0.02438516542315483, 0.02514815330505371]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 7.0, 7.0, 6.0, 7.0, 7.0, 8.0, 19.0, 12.0, 13.0, 12.0, 17.0, 23.0, 30.0, 28.0, 36.0, 37.0, 37.0, 49.0, 31.0, 49.0, 37.0, 43.0, 40.0, 43.0, 37.0, 31.0, 37.0, 28.0, 31.0, 22.0, 34.0, 28.0, 18.0, 10.0, 17.0, 18.0, 13.0, 10.0, 12.0, 13.0, 10.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.84375, -7.58544921875, -7.3271484375, -7.06884765625, -6.810546875, -6.55224609375, -6.2939453125, -6.03564453125, -5.77734375, -5.51904296875, -5.2607421875, -5.00244140625, -4.744140625, -4.48583984375, -4.2275390625, -3.96923828125, -3.7109375, -3.45263671875, -3.1943359375, -2.93603515625, -2.677734375, -2.41943359375, -2.1611328125, -1.90283203125, -1.64453125, -1.38623046875, -1.1279296875, -0.86962890625, -0.611328125, -0.35302734375, -0.0947265625, 0.16357421875, 0.421875, 0.68017578125, 0.9384765625, 1.19677734375, 1.455078125, 1.71337890625, 1.9716796875, 2.22998046875, 2.48828125, 2.74658203125, 3.0048828125, 3.26318359375, 3.521484375, 3.77978515625, 4.0380859375, 4.29638671875, 4.5546875, 4.81298828125, 5.0712890625, 5.32958984375, 5.587890625, 5.84619140625, 6.1044921875, 6.36279296875, 6.62109375, 6.87939453125, 7.1376953125, 7.39599609375, 7.654296875, 7.91259765625, 8.1708984375, 8.42919921875, 8.6875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 7.0, 3.0, 7.0, 9.0, 13.0, 19.0, 27.0, 27.0, 35.0, 37.0, 56.0, 72.0, 110.0, 145.0, 190.0, 252.0, 364.0, 483.0, 613.0, 866.0, 1162.0, 1851.0, 2975.0, 5495.0, 13590.0, 44036.0, 178886.0, 524879.0, 195624.0, 47099.0, 14398.0, 5887.0, 2970.0, 1773.0, 1202.0, 867.0, 634.0, 516.0, 320.0, 265.0, 190.0, 155.0, 110.0, 91.0, 65.0, 45.0, 47.0, 29.0, 18.0, 9.0, 12.0, 9.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-13.359375, -12.9217529296875, -12.484130859375, -12.0465087890625, -11.60888671875, -11.1712646484375, -10.733642578125, -10.2960205078125, -9.8583984375, -9.4207763671875, -8.983154296875, -8.5455322265625, -8.10791015625, -7.6702880859375, -7.232666015625, -6.7950439453125, -6.357421875, -5.9197998046875, -5.482177734375, -5.0445556640625, -4.60693359375, -4.1693115234375, -3.731689453125, -3.2940673828125, -2.8564453125, -2.4188232421875, -1.981201171875, -1.5435791015625, -1.10595703125, -0.6683349609375, -0.230712890625, 0.2069091796875, 0.64453125, 1.0821533203125, 1.519775390625, 1.9573974609375, 2.39501953125, 2.8326416015625, 3.270263671875, 3.7078857421875, 4.1455078125, 4.5831298828125, 5.020751953125, 5.4583740234375, 5.89599609375, 6.3336181640625, 6.771240234375, 7.2088623046875, 7.646484375, 8.0841064453125, 8.521728515625, 8.9593505859375, 9.39697265625, 9.8345947265625, 10.272216796875, 10.7098388671875, 11.1474609375, 11.5850830078125, 12.022705078125, 12.4603271484375, 12.89794921875, 13.3355712890625, 13.773193359375, 14.2108154296875, 14.6484375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 11.0, 7.0, 13.0, 15.0, 25.0, 23.0, 30.0, 43.0, 47.0, 42.0, 52.0, 39.0, 81.0, 204.0, 1532.0, 339.0, 126.0, 69.0, 52.0, 51.0, 49.0, 35.0, 29.0, 29.0, 14.0, 16.0, 20.0, 9.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.421875, -25.66162109375, -24.9013671875, -24.14111328125, -23.380859375, -22.62060546875, -21.8603515625, -21.10009765625, -20.33984375, -19.57958984375, -18.8193359375, -18.05908203125, -17.298828125, -16.53857421875, -15.7783203125, -15.01806640625, -14.2578125, -13.49755859375, -12.7373046875, -11.97705078125, -11.216796875, -10.45654296875, -9.6962890625, -8.93603515625, -8.17578125, -7.41552734375, -6.6552734375, -5.89501953125, -5.134765625, -4.37451171875, -3.6142578125, -2.85400390625, -2.09375, -1.33349609375, -0.5732421875, 0.18701171875, 0.947265625, 1.70751953125, 2.4677734375, 3.22802734375, 3.98828125, 4.74853515625, 5.5087890625, 6.26904296875, 7.029296875, 7.78955078125, 8.5498046875, 9.31005859375, 10.0703125, 10.83056640625, 11.5908203125, 12.35107421875, 13.111328125, 13.87158203125, 14.6318359375, 15.39208984375, 16.15234375, 16.91259765625, 17.6728515625, 18.43310546875, 19.193359375, 19.95361328125, 20.7138671875, 21.47412109375, 22.234375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 6.0, 4.0, 12.0, 11.0, 17.0, 24.0, 39.0, 50.0, 78.0, 143.0, 365.0, 1107.0, 32127.0, 3108021.0, 2555.0, 591.0, 207.0, 114.0, 69.0, 37.0, 36.0, 24.0, 20.0, 9.0, 13.0, 5.0, 8.0, 2.0, 2.0, 1.0, 7.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.875, -73.25390625, -69.6328125, -66.01171875, -62.390625, -58.76953125, -55.1484375, -51.52734375, -47.90625, -44.28515625, -40.6640625, -37.04296875, -33.421875, -29.80078125, -26.1796875, -22.55859375, -18.9375, -15.31640625, -11.6953125, -8.07421875, -4.453125, -0.83203125, 2.7890625, 6.41015625, 10.03125, 13.65234375, 17.2734375, 20.89453125, 24.515625, 28.13671875, 31.7578125, 35.37890625, 39.0, 42.62109375, 46.2421875, 49.86328125, 53.484375, 57.10546875, 60.7265625, 64.34765625, 67.96875, 71.58984375, 75.2109375, 78.83203125, 82.453125, 86.07421875, 89.6953125, 93.31640625, 96.9375, 100.55859375, 104.1796875, 107.80078125, 111.421875, 115.04296875, 118.6640625, 122.28515625, 125.90625, 129.52734375, 133.1484375, 136.76953125, 140.390625, 144.01171875, 147.6328125, 151.25390625, 154.875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 11.0, 53.0, 297.0, 463.0, 170.0, 21.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.4927215576172, -147.7690887451172, -143.04547119140625, -138.32183837890625, -133.59820556640625, -128.87457275390625, -124.15095520019531, -119.42732238769531, -114.70369720458984, -109.98007202148438, -105.25643920898438, -100.5328140258789, -95.80918884277344, -91.08555603027344, -86.36193084716797, -81.6383056640625, -76.9146728515625, -72.19104766845703, -67.46741485595703, -62.74378967285156, -58.02016067504883, -53.296531677246094, -48.572906494140625, -43.84927749633789, -39.125648498535156, -34.40201950073242, -29.67839241027832, -24.95476531982422, -20.231136322021484, -15.50750732421875, -10.783880233764648, -6.060253143310547, -1.336639404296875, 3.386988639831543, 8.110616683959961, 12.834244728088379, 17.557872772216797, 22.28150177001953, 27.005128860473633, 31.728755950927734, 36.45238494873047, 41.1760139465332, 45.89964294433594, 50.623268127441406, 55.34689712524414, 60.070526123046875, 64.79415130615234, 69.51777648925781, 74.24140930175781, 78.96503448486328, 83.68866729736328, 88.41229248046875, 93.13592529296875, 97.85955047607422, 102.58317565917969, 107.30680847167969, 112.03043365478516, 116.75405883789062, 121.47769165039062, 126.2013168334961, 130.92494201660156, 135.64857482910156, 140.37220764160156, 145.0958251953125, 149.8194580078125]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 10.0, 5.0, 7.0, 14.0, 13.0, 23.0, 15.0, 21.0, 18.0, 35.0, 41.0, 37.0, 36.0, 42.0, 44.0, 33.0, 51.0, 48.0, 47.0, 47.0, 41.0, 40.0, 34.0, 35.0, 29.0, 31.0, 33.0, 32.0, 20.0, 23.0, 26.0, 12.0, 10.0, 15.0, 9.0, 5.0, 7.0, 5.0, 2.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-63.8980712890625, -62.054901123046875, -60.211727142333984, -58.36855697631836, -56.52538299560547, -54.682212829589844, -52.83904266357422, -50.99586868286133, -49.15269470214844, -47.30952453613281, -45.46635055541992, -43.6231803894043, -41.780006408691406, -39.93683624267578, -38.093666076660156, -36.250492095947266, -34.40732192993164, -32.564151763916016, -30.720977783203125, -28.8778076171875, -27.03463363647461, -25.191463470458984, -23.348291397094727, -21.50511932373047, -19.66194725036621, -17.818775177001953, -15.975603103637695, -14.132431983947754, -12.289259910583496, -10.446087837219238, -8.602916717529297, -6.759744644165039, -4.916576385498047, -3.073404550552368, -1.2302327156066895, 0.6129388809204102, 2.456110954284668, 4.299283027648926, 6.142454147338867, 7.985626220703125, 9.828798294067383, 11.67197036743164, 13.515142440795898, 15.35831356048584, 17.20148468017578, 19.044658660888672, 20.887828826904297, 22.731000900268555, 24.574172973632812, 26.41734504699707, 28.260517120361328, 30.103687286376953, 31.946861267089844, 33.79003143310547, 35.633201599121094, 37.476375579833984, 39.319549560546875, 41.1627197265625, 43.00589370727539, 44.849063873291016, 46.692237854003906, 48.53540802001953, 50.378578186035156, 52.22175216674805, 54.06492233276367]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 6.0, 9.0, 9.0, 4.0, 5.0, 5.0, 5.0, 11.0, 14.0, 12.0, 26.0, 25.0, 21.0, 34.0, 35.0, 24.0, 48.0, 36.0, 41.0, 44.0, 36.0, 39.0, 52.0, 38.0, 42.0, 40.0, 32.0, 34.0, 35.0, 21.0, 31.0, 29.0, 30.0, 20.0, 17.0, 26.0, 10.0, 11.0, 6.0, 9.0, 6.0, 6.0, 4.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-9.59375, -9.32025146484375, -9.0467529296875, -8.77325439453125, -8.499755859375, -8.22625732421875, -7.9527587890625, -7.67926025390625, -7.40576171875, -7.13226318359375, -6.8587646484375, -6.58526611328125, -6.311767578125, -6.03826904296875, -5.7647705078125, -5.49127197265625, -5.2177734375, -4.94427490234375, -4.6707763671875, -4.39727783203125, -4.123779296875, -3.85028076171875, -3.5767822265625, -3.30328369140625, -3.02978515625, -2.75628662109375, -2.4827880859375, -2.20928955078125, -1.935791015625, -1.66229248046875, -1.3887939453125, -1.11529541015625, -0.841796875, -0.56829833984375, -0.2947998046875, -0.02130126953125, 0.252197265625, 0.52569580078125, 0.7991943359375, 1.07269287109375, 1.34619140625, 1.61968994140625, 1.8931884765625, 2.16668701171875, 2.440185546875, 2.71368408203125, 2.9871826171875, 3.26068115234375, 3.5341796875, 3.80767822265625, 4.0811767578125, 4.35467529296875, 4.628173828125, 4.90167236328125, 5.1751708984375, 5.44866943359375, 5.72216796875, 5.99566650390625, 6.2691650390625, 6.54266357421875, 6.816162109375, 7.08966064453125, 7.3631591796875, 7.63665771484375, 7.91015625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 7.0, 6.0, 4.0, 21.0, 23.0, 24.0, 28.0, 63.0, 47.0, 122.0, 149.0, 227.0, 311.0, 539.0, 885.0, 1641.0, 3434.0, 8617.0, 33162.0, 369875.0, 2881233.0, 812165.0, 60564.0, 11930.0, 4371.0, 2018.0, 1064.0, 613.0, 338.0, 270.0, 152.0, 118.0, 70.0, 57.0, 33.0, 33.0, 28.0, 10.0, 9.0, 8.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-24.046875, -23.310302734375, -22.57373046875, -21.837158203125, -21.1005859375, -20.364013671875, -19.62744140625, -18.890869140625, -18.154296875, -17.417724609375, -16.68115234375, -15.944580078125, -15.2080078125, -14.471435546875, -13.73486328125, -12.998291015625, -12.26171875, -11.525146484375, -10.78857421875, -10.052001953125, -9.3154296875, -8.578857421875, -7.84228515625, -7.105712890625, -6.369140625, -5.632568359375, -4.89599609375, -4.159423828125, -3.4228515625, -2.686279296875, -1.94970703125, -1.213134765625, -0.4765625, 0.260009765625, 0.99658203125, 1.733154296875, 2.4697265625, 3.206298828125, 3.94287109375, 4.679443359375, 5.416015625, 6.152587890625, 6.88916015625, 7.625732421875, 8.3623046875, 9.098876953125, 9.83544921875, 10.572021484375, 11.30859375, 12.045166015625, 12.78173828125, 13.518310546875, 14.2548828125, 14.991455078125, 15.72802734375, 16.464599609375, 17.201171875, 17.937744140625, 18.67431640625, 19.410888671875, 20.1474609375, 20.884033203125, 21.62060546875, 22.357177734375, 23.09375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 8.0, 8.0, 2.0, 7.0, 18.0, 22.0, 32.0, 38.0, 65.0, 88.0, 136.0, 222.0, 398.0, 585.0, 784.0, 598.0, 372.0, 226.0, 144.0, 118.0, 64.0, 50.0, 33.0, 21.0, 12.0, 9.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.609375, -23.934814453125, -23.26025390625, -22.585693359375, -21.9111328125, -21.236572265625, -20.56201171875, -19.887451171875, -19.212890625, -18.538330078125, -17.86376953125, -17.189208984375, -16.5146484375, -15.840087890625, -15.16552734375, -14.490966796875, -13.81640625, -13.141845703125, -12.46728515625, -11.792724609375, -11.1181640625, -10.443603515625, -9.76904296875, -9.094482421875, -8.419921875, -7.745361328125, -7.07080078125, -6.396240234375, -5.7216796875, -5.047119140625, -4.37255859375, -3.697998046875, -3.0234375, -2.348876953125, -1.67431640625, -0.999755859375, -0.3251953125, 0.349365234375, 1.02392578125, 1.698486328125, 2.373046875, 3.047607421875, 3.72216796875, 4.396728515625, 5.0712890625, 5.745849609375, 6.42041015625, 7.094970703125, 7.76953125, 8.444091796875, 9.11865234375, 9.793212890625, 10.4677734375, 11.142333984375, 11.81689453125, 12.491455078125, 13.166015625, 13.840576171875, 14.51513671875, 15.189697265625, 15.8642578125, 16.538818359375, 17.21337890625, 17.887939453125, 18.5625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 8.0, 5.0, 14.0, 23.0, 26.0, 44.0, 70.0, 128.0, 231.0, 409.0, 871.0, 2167.0, 5995.0, 23773.0, 212179.0, 3480890.0, 420453.0, 34416.0, 7911.0, 2554.0, 1010.0, 472.0, 233.0, 161.0, 91.0, 55.0, 28.0, 15.0, 16.0, 13.0, 8.0, 4.0, 0.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.609375, -28.536865234375, -27.46435546875, -26.391845703125, -25.3193359375, -24.246826171875, -23.17431640625, -22.101806640625, -21.029296875, -19.956787109375, -18.88427734375, -17.811767578125, -16.7392578125, -15.666748046875, -14.59423828125, -13.521728515625, -12.44921875, -11.376708984375, -10.30419921875, -9.231689453125, -8.1591796875, -7.086669921875, -6.01416015625, -4.941650390625, -3.869140625, -2.796630859375, -1.72412109375, -0.651611328125, 0.4208984375, 1.493408203125, 2.56591796875, 3.638427734375, 4.7109375, 5.783447265625, 6.85595703125, 7.928466796875, 9.0009765625, 10.073486328125, 11.14599609375, 12.218505859375, 13.291015625, 14.363525390625, 15.43603515625, 16.508544921875, 17.5810546875, 18.653564453125, 19.72607421875, 20.798583984375, 21.87109375, 22.943603515625, 24.01611328125, 25.088623046875, 26.1611328125, 27.233642578125, 28.30615234375, 29.378662109375, 30.451171875, 31.523681640625, 32.59619140625, 33.668701171875, 34.7412109375, 35.813720703125, 36.88623046875, 37.958740234375, 39.03125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 25.0, 46.0, 106.0, 224.0, 286.0, 205.0, 76.0, 22.0, 11.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.05123901367188, -134.13015747070312, -129.2090606689453, -124.28797149658203, -119.36688232421875, -114.44580078125, -109.52471160888672, -104.60362243652344, -99.68253326416016, -94.76144409179688, -89.8403549194336, -84.91926574707031, -79.99818420410156, -75.07708740234375, -70.156005859375, -65.23491668701172, -60.31382751464844, -55.392738342285156, -50.471649169921875, -45.55056381225586, -40.62947463989258, -35.7083854675293, -30.78729820251465, -25.8662109375, -20.94512176513672, -16.024032592773438, -11.102945327758789, -6.181857109069824, -1.2607688903808594, 3.660320281982422, 8.58140754699707, 13.502494812011719, 18.423599243164062, 23.344688415527344, 28.265775680541992, 33.18686294555664, 38.10795211791992, 43.0290412902832, 47.95012664794922, 52.8712158203125, 57.79230499267578, 62.71339416503906, 67.63448333740234, 72.55557250976562, 77.47665405273438, 82.39775085449219, 87.31883239746094, 92.23992156982422, 97.1610107421875, 102.08209991455078, 107.00318908691406, 111.92427825927734, 116.84536743164062, 121.76644897460938, 126.68753814697266, 131.60862731933594, 136.52972412109375, 141.4508056640625, 146.3719024658203, 151.29298400878906, 156.21408081054688, 161.13516235351562, 166.05625915527344, 170.9773406982422, 175.89842224121094]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 8.0, 7.0, 11.0, 14.0, 11.0, 20.0, 29.0, 20.0, 22.0, 29.0, 22.0, 38.0, 34.0, 38.0, 44.0, 46.0, 27.0, 47.0, 57.0, 42.0, 41.0, 43.0, 31.0, 35.0, 30.0, 30.0, 38.0, 32.0, 22.0, 30.0, 15.0, 14.0, 8.0, 8.0, 9.0, 4.0, 5.0, 11.0, 2.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-51.902488708496094, -50.216556549072266, -48.53062438964844, -46.844688415527344, -45.158756256103516, -43.47282409667969, -41.786888122558594, -40.100955963134766, -38.41502380371094, -36.72909164428711, -35.04315948486328, -33.35722351074219, -31.67129135131836, -29.98535919189453, -28.29942512512207, -26.61349105834961, -24.92755889892578, -23.241626739501953, -21.555692672729492, -19.86975860595703, -18.183826446533203, -16.497894287109375, -14.811960220336914, -13.12602710723877, -11.440093994140625, -9.75416088104248, -8.068227767944336, -6.382294654846191, -4.696361541748047, -3.0104284286499023, -1.3244953155517578, 0.3614377975463867, 2.0473709106445312, 3.733304023742676, 5.41923713684082, 7.105170249938965, 8.79110336303711, 10.477036476135254, 12.162969589233398, 13.848902702331543, 15.534835815429688, 17.220767974853516, 18.906702041625977, 20.592636108398438, 22.278568267822266, 23.964500427246094, 25.650434494018555, 27.336368560791016, 29.022300720214844, 30.708232879638672, 32.3941650390625, 34.080101013183594, 35.76603317260742, 37.45196533203125, 39.137901306152344, 40.82383346557617, 42.509765625, 44.19569778442383, 45.881629943847656, 47.56756591796875, 49.25349807739258, 50.939430236816406, 52.6253662109375, 54.31129837036133, 55.997230529785156]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 3.0, 3.0, 3.0, 8.0, 9.0, 9.0, 16.0, 6.0, 20.0, 14.0, 12.0, 20.0, 24.0, 34.0, 30.0, 36.0, 33.0, 36.0, 36.0, 36.0, 43.0, 50.0, 40.0, 48.0, 43.0, 31.0, 28.0, 44.0, 27.0, 29.0, 26.0, 31.0, 19.0, 19.0, 27.0, 19.0, 12.0, 15.0, 14.0, 7.0, 11.0, 4.0, 2.0, 4.0, 4.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.83203125, -7.6029052734375, -7.373779296875, -7.1446533203125, -6.91552734375, -6.6864013671875, -6.457275390625, -6.2281494140625, -5.9990234375, -5.7698974609375, -5.540771484375, -5.3116455078125, -5.08251953125, -4.8533935546875, -4.624267578125, -4.3951416015625, -4.166015625, -3.9368896484375, -3.707763671875, -3.4786376953125, -3.24951171875, -3.0203857421875, -2.791259765625, -2.5621337890625, -2.3330078125, -2.1038818359375, -1.874755859375, -1.6456298828125, -1.41650390625, -1.1873779296875, -0.958251953125, -0.7291259765625, -0.5, -0.2708740234375, -0.041748046875, 0.1873779296875, 0.41650390625, 0.6456298828125, 0.874755859375, 1.1038818359375, 1.3330078125, 1.5621337890625, 1.791259765625, 2.0203857421875, 2.24951171875, 2.4786376953125, 2.707763671875, 2.9368896484375, 3.166015625, 3.3951416015625, 3.624267578125, 3.8533935546875, 4.08251953125, 4.3116455078125, 4.540771484375, 4.7698974609375, 4.9990234375, 5.2281494140625, 5.457275390625, 5.6864013671875, 5.91552734375, 6.1446533203125, 6.373779296875, 6.6029052734375, 6.83203125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 8.0, 6.0, 8.0, 16.0, 19.0, 31.0, 48.0, 71.0, 127.0, 149.0, 223.0, 362.0, 501.0, 739.0, 1062.0, 1669.0, 2408.0, 3340.0, 4972.0, 7164.0, 10550.0, 15550.0, 23211.0, 35116.0, 53681.0, 83694.0, 133664.0, 185920.0, 168059.0, 110537.0, 69967.0, 44921.0, 29312.0, 19712.0, 13193.0, 9068.0, 6117.0, 4168.0, 2852.0, 2021.0, 1401.0, 913.0, 650.0, 433.0, 306.0, 184.0, 142.0, 96.0, 75.0, 43.0, 27.0, 20.0, 13.0, 10.0, 8.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.7412109375, -0.7171401977539062, -0.6930694580078125, -0.6689987182617188, -0.644927978515625, -0.6208572387695312, -0.5967864990234375, -0.5727157592773438, -0.54864501953125, -0.5245742797851562, -0.5005035400390625, -0.47643280029296875, -0.452362060546875, -0.42829132080078125, -0.4042205810546875, -0.38014984130859375, -0.3560791015625, -0.33200836181640625, -0.3079376220703125, -0.28386688232421875, -0.259796142578125, -0.23572540283203125, -0.2116546630859375, -0.18758392333984375, -0.16351318359375, -0.13944244384765625, -0.1153717041015625, -0.09130096435546875, -0.067230224609375, -0.04315948486328125, -0.0190887451171875, 0.00498199462890625, 0.029052734375, 0.05312347412109375, 0.0771942138671875, 0.10126495361328125, 0.125335693359375, 0.14940643310546875, 0.1734771728515625, 0.19754791259765625, 0.22161865234375, 0.24568939208984375, 0.2697601318359375, 0.29383087158203125, 0.317901611328125, 0.34197235107421875, 0.3660430908203125, 0.39011383056640625, 0.4141845703125, 0.43825531005859375, 0.4623260498046875, 0.48639678955078125, 0.510467529296875, 0.5345382690429688, 0.5586090087890625, 0.5826797485351562, 0.60675048828125, 0.6308212280273438, 0.6548919677734375, 0.6789627075195312, 0.703033447265625, 0.7271041870117188, 0.7511749267578125, 0.7752456665039062, 0.79931640625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 7.0, 5.0, 7.0, 5.0, 7.0, 7.0, 10.0, 8.0, 14.0, 19.0, 20.0, 19.0, 26.0, 39.0, 27.0, 31.0, 33.0, 33.0, 40.0, 30.0, 46.0, 40.0, 1061.0, 47.0, 41.0, 34.0, 31.0, 36.0, 32.0, 32.0, 36.0, 36.0, 26.0, 22.0, 19.0, 14.0, 20.0, 10.0, 10.0, 14.0, 10.0, 9.0, 2.0, 5.0, 6.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.00390625, -4.85333251953125, -4.7027587890625, -4.55218505859375, -4.401611328125, -4.25103759765625, -4.1004638671875, -3.94989013671875, -3.79931640625, -3.64874267578125, -3.4981689453125, -3.34759521484375, -3.197021484375, -3.04644775390625, -2.8958740234375, -2.74530029296875, -2.5947265625, -2.44415283203125, -2.2935791015625, -2.14300537109375, -1.992431640625, -1.84185791015625, -1.6912841796875, -1.54071044921875, -1.39013671875, -1.23956298828125, -1.0889892578125, -0.93841552734375, -0.787841796875, -0.63726806640625, -0.4866943359375, -0.33612060546875, -0.185546875, -0.03497314453125, 0.1156005859375, 0.26617431640625, 0.416748046875, 0.56732177734375, 0.7178955078125, 0.86846923828125, 1.01904296875, 1.16961669921875, 1.3201904296875, 1.47076416015625, 1.621337890625, 1.77191162109375, 1.9224853515625, 2.07305908203125, 2.2236328125, 2.37420654296875, 2.5247802734375, 2.67535400390625, 2.825927734375, 2.97650146484375, 3.1270751953125, 3.27764892578125, 3.42822265625, 3.57879638671875, 3.7293701171875, 3.87994384765625, 4.030517578125, 4.18109130859375, 4.3316650390625, 4.48223876953125, 4.6328125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 7.0, 8.0, 9.0, 21.0, 28.0, 39.0, 66.0, 94.0, 149.0, 229.0, 342.0, 532.0, 780.0, 1129.0, 1533.0, 2227.0, 3190.0, 4656.0, 6548.0, 9252.0, 13262.0, 19194.0, 28491.0, 41829.0, 64505.0, 98093.0, 143036.0, 1211729.0, 144790.0, 99639.0, 65578.0, 43056.0, 28802.0, 19666.0, 13378.0, 9360.0, 6648.0, 4654.0, 3235.0, 2245.0, 1633.0, 1068.0, 721.0, 568.0, 376.0, 254.0, 165.0, 112.0, 67.0, 51.0, 32.0, 25.0, 14.0, 15.0, 8.0, 3.0], "bins": [-0.58056640625, -0.5642204284667969, -0.5478744506835938, -0.5315284729003906, -0.5151824951171875, -0.4988365173339844, -0.48249053955078125, -0.4661445617675781, -0.449798583984375, -0.4334526062011719, -0.41710662841796875, -0.4007606506347656, -0.3844146728515625, -0.3680686950683594, -0.35172271728515625, -0.3353767395019531, -0.31903076171875, -0.3026847839355469, -0.28633880615234375, -0.2699928283691406, -0.2536468505859375, -0.23730087280273438, -0.22095489501953125, -0.20460891723632812, -0.188262939453125, -0.17191696166992188, -0.15557098388671875, -0.13922500610351562, -0.1228790283203125, -0.10653305053710938, -0.09018707275390625, -0.07384109497070312, -0.0574951171875, -0.041149139404296875, -0.02480316162109375, -0.008457183837890625, 0.0078887939453125, 0.024234771728515625, 0.04058074951171875, 0.056926727294921875, 0.073272705078125, 0.08961868286132812, 0.10596466064453125, 0.12231063842773438, 0.1386566162109375, 0.15500259399414062, 0.17134857177734375, 0.18769454956054688, 0.20404052734375, 0.22038650512695312, 0.23673248291015625, 0.2530784606933594, 0.2694244384765625, 0.2857704162597656, 0.30211639404296875, 0.3184623718261719, 0.334808349609375, 0.3511543273925781, 0.36750030517578125, 0.3838462829589844, 0.4001922607421875, 0.4165382385253906, 0.43288421630859375, 0.4492301940917969, 0.465576171875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 6.0, 4.0, 4.0, 5.0, 8.0, 6.0, 14.0, 15.0, 12.0, 26.0, 22.0, 26.0, 29.0, 35.0, 57.0, 78.0, 92.0, 111.0, 78.0, 77.0, 61.0, 52.0, 28.0, 18.0, 21.0, 13.0, 12.0, 14.0, 11.0, 12.0, 9.0, 14.0, 11.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0236053466796875, -0.022921323776245117, -0.022237300872802734, -0.02155327796936035, -0.02086925506591797, -0.020185232162475586, -0.019501209259033203, -0.01881718635559082, -0.018133163452148438, -0.017449140548706055, -0.016765117645263672, -0.01608109474182129, -0.015397071838378906, -0.014713048934936523, -0.01402902603149414, -0.013345003128051758, -0.012660980224609375, -0.011976957321166992, -0.01129293441772461, -0.010608911514282227, -0.009924888610839844, -0.009240865707397461, -0.008556842803955078, -0.007872819900512695, -0.0071887969970703125, -0.00650477409362793, -0.005820751190185547, -0.005136728286743164, -0.004452705383300781, -0.0037686824798583984, -0.0030846595764160156, -0.002400636672973633, -0.00171661376953125, -0.0010325908660888672, -0.0003485679626464844, 0.00033545494079589844, 0.0010194778442382812, 0.001703500747680664, 0.002387523651123047, 0.0030715465545654297, 0.0037555694580078125, 0.004439592361450195, 0.005123615264892578, 0.005807638168334961, 0.006491661071777344, 0.0071756839752197266, 0.00785970687866211, 0.008543729782104492, 0.009227752685546875, 0.009911775588989258, 0.01059579849243164, 0.011279821395874023, 0.011963844299316406, 0.012647867202758789, 0.013331890106201172, 0.014015913009643555, 0.014699935913085938, 0.01538395881652832, 0.016067981719970703, 0.016752004623413086, 0.01743602752685547, 0.01812005043029785, 0.018804073333740234, 0.019488096237182617, 0.020172119140625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 11.0, 8.0, 17.0, 21.0, 26.0, 28.0, 27.0, 31.0, 37.0, 48.0, 65.0, 103.0, 157.0, 242.0, 384.0, 1223.0, 30799.0, 990903.0, 22285.0, 1015.0, 366.0, 202.0, 137.0, 99.0, 58.0, 55.0, 37.0, 40.0, 34.0, 14.0, 14.0, 13.0, 7.0, 7.0, 7.0, 6.0, 3.0, 2.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.359619140625, -0.347412109375, -0.335205078125, -0.322998046875, -0.310791015625, -0.298583984375, -0.286376953125, -0.274169921875, -0.261962890625, -0.249755859375, -0.237548828125, -0.225341796875, -0.213134765625, -0.200927734375, -0.188720703125, -0.176513671875, -0.164306640625, -0.152099609375, -0.139892578125, -0.127685546875, -0.115478515625, -0.103271484375, -0.091064453125, -0.078857421875, -0.066650390625, -0.054443359375, -0.042236328125, -0.030029296875, -0.017822265625, -0.005615234375, 0.006591796875, 0.018798828125, 0.031005859375, 0.043212890625, 0.055419921875, 0.067626953125, 0.079833984375, 0.092041015625, 0.104248046875, 0.116455078125, 0.128662109375, 0.140869140625, 0.153076171875, 0.165283203125, 0.177490234375, 0.189697265625, 0.201904296875, 0.214111328125, 0.226318359375, 0.238525390625, 0.250732421875, 0.262939453125, 0.275146484375, 0.287353515625, 0.299560546875, 0.311767578125, 0.323974609375, 0.336181640625, 0.348388671875, 0.360595703125, 0.372802734375, 0.385009765625, 0.397216796875, 0.409423828125, 0.421630859375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 52.0, 406.0, 491.0, 49.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1614478975534439, -0.15295201539993286, -0.14445611834526062, -0.13596022129058838, -0.12746433913707733, -0.11896844953298569, -0.11047255992889404, -0.1019766703248024, -0.09348078072071075, -0.08498489111661911, -0.07648900151252747, -0.06799311190843582, -0.05949722230434418, -0.05100133270025253, -0.04250544309616089, -0.034009553492069244, -0.0255136638879776, -0.017017774283885956, -0.008521884679794312, -2.5995075702667236e-05, 0.008469894528388977, 0.01696578413248062, 0.025461673736572266, 0.03395756334066391, 0.042453452944755554, 0.0509493425488472, 0.05944523215293884, 0.06794112175703049, 0.07643701136112213, 0.08493290096521378, 0.09342879056930542, 0.10192468017339706, 0.1104205846786499, 0.11891647428274155, 0.1274123638868332, 0.13590824604034424, 0.14440414309501648, 0.15290004014968872, 0.16139592230319977, 0.16989180445671082, 0.17838770151138306, 0.1868835985660553, 0.19537948071956635, 0.2038753628730774, 0.21237125992774963, 0.22086715698242188, 0.22936303913593292, 0.23785892128944397, 0.2463548183441162, 0.25485071539878845, 0.2633466124534607, 0.27184247970581055, 0.2803383767604828, 0.28883427381515503, 0.2973301410675049, 0.3058260381221771, 0.31432193517684937, 0.3228178322315216, 0.33131372928619385, 0.3398095965385437, 0.34830549359321594, 0.3568013906478882, 0.36529725790023804, 0.3737931549549103, 0.3822890520095825]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 7.0, 2.0, 10.0, 7.0, 15.0, 12.0, 25.0, 16.0, 31.0, 40.0, 34.0, 38.0, 38.0, 39.0, 39.0, 54.0, 39.0, 45.0, 46.0, 46.0, 37.0, 39.0, 41.0, 40.0, 38.0, 37.0, 25.0, 31.0, 29.0, 24.0, 13.0, 11.0, 14.0, 9.0, 8.0, 4.0, 9.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033541202545166016, -0.032430168241262436, -0.031319133937358856, -0.030208095908164978, -0.0290970616042614, -0.02798602730035782, -0.02687499113380909, -0.02576395496726036, -0.02465292066335678, -0.0235418863594532, -0.022430850192904472, -0.021319814026355743, -0.020208779722452164, -0.019097745418548584, -0.017986709251999855, -0.016875673085451126, -0.015764638781547546, -0.014653603546321392, -0.013542568311095238, -0.012431533075869083, -0.011320497840642929, -0.010209462605416775, -0.00909842737019062, -0.007987392134964466, -0.006876356899738312, -0.0057653216645121574, -0.004654286429286003, -0.003543251194059849, -0.0024322159588336945, -0.0013211807236075401, -0.0002101454883813858, 0.0009008897468447685, 0.002011924982070923, 0.003122960217297077, 0.0042339954525232315, 0.005345030687749386, 0.00645606592297554, 0.0075671011582016945, 0.008678136393427849, 0.009789171628654003, 0.010900206863880157, 0.012011242099106312, 0.013122277334332466, 0.01423331256955862, 0.015344347804784775, 0.016455382108688354, 0.017566418275237083, 0.018677454441785812, 0.019788488745689392, 0.020899523049592972, 0.0220105592161417, 0.02312159538269043, 0.02423262968659401, 0.02534366399049759, 0.026454700157046318, 0.027565736323595047, 0.028676770627498627, 0.029787804931402206, 0.030898841097950935, 0.032009877264499664, 0.033120911568403244, 0.034231945872306824, 0.0353429839015007, 0.03645401820540428, 0.03756505250930786]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 2.0, 3.0, 3.0, 9.0, 8.0, 10.0, 15.0, 6.0, 20.0, 14.0, 12.0, 20.0, 25.0, 33.0, 30.0, 37.0, 31.0, 38.0, 34.0, 38.0, 42.0, 51.0, 39.0, 48.0, 43.0, 31.0, 28.0, 44.0, 27.0, 29.0, 26.0, 31.0, 19.0, 19.0, 27.0, 19.0, 12.0, 15.0, 14.0, 7.0, 11.0, 4.0, 2.0, 4.0, 4.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.82421875, -7.59527587890625, -7.3663330078125, -7.13739013671875, -6.908447265625, -6.67950439453125, -6.4505615234375, -6.22161865234375, -5.99267578125, -5.76373291015625, -5.5347900390625, -5.30584716796875, -5.076904296875, -4.84796142578125, -4.6190185546875, -4.39007568359375, -4.1611328125, -3.93218994140625, -3.7032470703125, -3.47430419921875, -3.245361328125, -3.01641845703125, -2.7874755859375, -2.55853271484375, -2.32958984375, -2.10064697265625, -1.8717041015625, -1.64276123046875, -1.413818359375, -1.18487548828125, -0.9559326171875, -0.72698974609375, -0.498046875, -0.26910400390625, -0.0401611328125, 0.18878173828125, 0.417724609375, 0.64666748046875, 0.8756103515625, 1.10455322265625, 1.33349609375, 1.56243896484375, 1.7913818359375, 2.02032470703125, 2.249267578125, 2.47821044921875, 2.7071533203125, 2.93609619140625, 3.1650390625, 3.39398193359375, 3.6229248046875, 3.85186767578125, 4.080810546875, 4.30975341796875, 4.5386962890625, 4.76763916015625, 4.99658203125, 5.22552490234375, 5.4544677734375, 5.68341064453125, 5.912353515625, 6.14129638671875, 6.3702392578125, 6.59918212890625, 6.828125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 6.0, 5.0, 4.0, 7.0, 14.0, 11.0, 20.0, 25.0, 32.0, 48.0, 78.0, 79.0, 140.0, 149.0, 244.0, 304.0, 531.0, 718.0, 1069.0, 1612.0, 2825.0, 5664.0, 17493.0, 118607.0, 739214.0, 127519.0, 18348.0, 5813.0, 2919.0, 1655.0, 1043.0, 679.0, 488.0, 335.0, 233.0, 160.0, 116.0, 91.0, 63.0, 45.0, 41.0, 34.0, 23.0, 10.0, 10.0, 8.0, 9.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-19.015625, -18.371337890625, -17.72705078125, -17.082763671875, -16.4384765625, -15.794189453125, -15.14990234375, -14.505615234375, -13.861328125, -13.217041015625, -12.57275390625, -11.928466796875, -11.2841796875, -10.639892578125, -9.99560546875, -9.351318359375, -8.70703125, -8.062744140625, -7.41845703125, -6.774169921875, -6.1298828125, -5.485595703125, -4.84130859375, -4.197021484375, -3.552734375, -2.908447265625, -2.26416015625, -1.619873046875, -0.9755859375, -0.331298828125, 0.31298828125, 0.957275390625, 1.6015625, 2.245849609375, 2.89013671875, 3.534423828125, 4.1787109375, 4.822998046875, 5.46728515625, 6.111572265625, 6.755859375, 7.400146484375, 8.04443359375, 8.688720703125, 9.3330078125, 9.977294921875, 10.62158203125, 11.265869140625, 11.91015625, 12.554443359375, 13.19873046875, 13.843017578125, 14.4873046875, 15.131591796875, 15.77587890625, 16.420166015625, 17.064453125, 17.708740234375, 18.35302734375, 18.997314453125, 19.6416015625, 20.285888671875, 20.93017578125, 21.574462890625, 22.21875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 5.0, 4.0, 9.0, 1.0, 5.0, 6.0, 8.0, 11.0, 10.0, 15.0, 21.0, 20.0, 21.0, 23.0, 48.0, 48.0, 53.0, 64.0, 96.0, 156.0, 1488.0, 357.0, 145.0, 93.0, 54.0, 42.0, 39.0, 38.0, 31.0, 27.0, 22.0, 18.0, 22.0, 8.0, 10.0, 11.0, 7.0, 6.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-23.671875, -22.973388671875, -22.27490234375, -21.576416015625, -20.8779296875, -20.179443359375, -19.48095703125, -18.782470703125, -18.083984375, -17.385498046875, -16.68701171875, -15.988525390625, -15.2900390625, -14.591552734375, -13.89306640625, -13.194580078125, -12.49609375, -11.797607421875, -11.09912109375, -10.400634765625, -9.7021484375, -9.003662109375, -8.30517578125, -7.606689453125, -6.908203125, -6.209716796875, -5.51123046875, -4.812744140625, -4.1142578125, -3.415771484375, -2.71728515625, -2.018798828125, -1.3203125, -0.621826171875, 0.07666015625, 0.775146484375, 1.4736328125, 2.172119140625, 2.87060546875, 3.569091796875, 4.267578125, 4.966064453125, 5.66455078125, 6.363037109375, 7.0615234375, 7.760009765625, 8.45849609375, 9.156982421875, 9.85546875, 10.553955078125, 11.25244140625, 11.950927734375, 12.6494140625, 13.347900390625, 14.04638671875, 14.744873046875, 15.443359375, 16.141845703125, 16.84033203125, 17.538818359375, 18.2373046875, 18.935791015625, 19.63427734375, 20.332763671875, 21.03125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 12.0, 11.0, 16.0, 27.0, 26.0, 45.0, 61.0, 94.0, 149.0, 243.0, 525.0, 1277.0, 59353.0, 3079315.0, 2978.0, 667.0, 338.0, 185.0, 94.0, 80.0, 53.0, 32.0, 34.0, 22.0, 21.0, 13.0, 5.0, 6.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.625, -82.0771484375, -79.529296875, -76.9814453125, -74.43359375, -71.8857421875, -69.337890625, -66.7900390625, -64.2421875, -61.6943359375, -59.146484375, -56.5986328125, -54.05078125, -51.5029296875, -48.955078125, -46.4072265625, -43.859375, -41.3115234375, -38.763671875, -36.2158203125, -33.66796875, -31.1201171875, -28.572265625, -26.0244140625, -23.4765625, -20.9287109375, -18.380859375, -15.8330078125, -13.28515625, -10.7373046875, -8.189453125, -5.6416015625, -3.09375, -0.5458984375, 2.001953125, 4.5498046875, 7.09765625, 9.6455078125, 12.193359375, 14.7412109375, 17.2890625, 19.8369140625, 22.384765625, 24.9326171875, 27.48046875, 30.0283203125, 32.576171875, 35.1240234375, 37.671875, 40.2197265625, 42.767578125, 45.3154296875, 47.86328125, 50.4111328125, 52.958984375, 55.5068359375, 58.0546875, 60.6025390625, 63.150390625, 65.6982421875, 68.24609375, 70.7939453125, 73.341796875, 75.8896484375, 78.4375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 15.0, 47.0, 139.0, 346.0, 300.0, 124.0, 33.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.02149200439453, -51.31443786621094, -46.60737991333008, -41.90032196044922, -37.193267822265625, -32.48621368408203, -27.779155731201172, -23.072097778320312, -18.36504364013672, -13.657987594604492, -8.950931549072266, -4.243875503540039, 0.4631805419921875, 5.170236587524414, 9.87729263305664, 14.5843505859375, 19.291404724121094, 23.99846076965332, 28.705516815185547, 33.412574768066406, 38.11962890625, 42.826683044433594, 47.53374099731445, 52.24079895019531, 56.947853088378906, 61.6549072265625, 66.36196899414062, 71.06902313232422, 75.77607727050781, 80.4831314086914, 85.190185546875, 89.89724731445312, 94.60430908203125, 99.31136322021484, 104.01841735839844, 108.72547912597656, 113.43253326416016, 118.13958740234375, 122.84664916992188, 127.55370330810547, 132.26075744628906, 136.9678192138672, 141.67486572265625, 146.38192749023438, 151.0889892578125, 155.79603576660156, 160.5030975341797, 165.21014404296875, 169.91720581054688, 174.624267578125, 179.33131408691406, 184.0383758544922, 188.74542236328125, 193.45248413085938, 198.1595458984375, 202.86660766601562, 207.5736541748047, 212.2807159423828, 216.98776245117188, 221.69482421875, 226.40188598632812, 231.1089324951172, 235.8159942626953, 240.52304077148438, 245.2301025390625]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 7.0, 8.0, 13.0, 12.0, 10.0, 26.0, 21.0, 17.0, 17.0, 21.0, 31.0, 36.0, 32.0, 34.0, 35.0, 39.0, 45.0, 46.0, 44.0, 41.0, 45.0, 53.0, 36.0, 39.0, 31.0, 26.0, 32.0, 28.0, 25.0, 19.0, 15.0, 11.0, 17.0, 10.0, 15.0, 15.0, 8.0, 10.0, 6.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-57.607154846191406, -55.86639404296875, -54.12563705444336, -52.3848762512207, -50.64411926269531, -48.903358459472656, -47.16259765625, -45.421836853027344, -43.68107986450195, -41.9403190612793, -40.199562072753906, -38.45880126953125, -36.718040466308594, -34.9772834777832, -33.23652267456055, -31.495763778686523, -29.7550048828125, -28.014245986938477, -26.273487091064453, -24.532726287841797, -22.791967391967773, -21.05120849609375, -19.310447692871094, -17.56968879699707, -15.828929901123047, -14.088171005249023, -12.347411155700684, -10.606651306152344, -8.86589241027832, -7.125133514404297, -5.384373664855957, -3.643613815307617, -1.9028549194335938, -0.1620955467224121, 1.5786638259887695, 3.319423198699951, 5.060182571411133, 6.800941467285156, 8.541701316833496, 10.282461166381836, 12.02322006225586, 13.763978958129883, 15.504738807678223, 17.245498657226562, 18.986257553100586, 20.72701644897461, 22.467777252197266, 24.20853614807129, 25.949295043945312, 27.690053939819336, 29.43081283569336, 31.171573638916016, 32.912330627441406, 34.65309143066406, 36.39385223388672, 38.134613037109375, 39.875370025634766, 41.61613082885742, 43.35688781738281, 45.09764862060547, 46.838409423828125, 48.579166412353516, 50.31992721557617, 52.06068420410156, 53.80144500732422]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 7.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 5.0, 7.0, 5.0, 6.0, 11.0, 9.0, 18.0, 19.0, 11.0, 17.0, 21.0, 24.0, 17.0, 31.0, 27.0, 37.0, 34.0, 37.0, 31.0, 29.0, 41.0, 45.0, 37.0, 44.0, 44.0, 32.0, 25.0, 38.0, 26.0, 26.0, 28.0, 21.0, 28.0, 22.0, 29.0, 17.0, 18.0, 12.0, 17.0, 14.0, 4.0, 9.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.2421875, -7.01568603515625, -6.7891845703125, -6.56268310546875, -6.336181640625, -6.10968017578125, -5.8831787109375, -5.65667724609375, -5.43017578125, -5.20367431640625, -4.9771728515625, -4.75067138671875, -4.524169921875, -4.29766845703125, -4.0711669921875, -3.84466552734375, -3.6181640625, -3.39166259765625, -3.1651611328125, -2.93865966796875, -2.712158203125, -2.48565673828125, -2.2591552734375, -2.03265380859375, -1.80615234375, -1.57965087890625, -1.3531494140625, -1.12664794921875, -0.900146484375, -0.67364501953125, -0.4471435546875, -0.22064208984375, 0.005859375, 0.23236083984375, 0.4588623046875, 0.68536376953125, 0.911865234375, 1.13836669921875, 1.3648681640625, 1.59136962890625, 1.81787109375, 2.04437255859375, 2.2708740234375, 2.49737548828125, 2.723876953125, 2.95037841796875, 3.1768798828125, 3.40338134765625, 3.6298828125, 3.85638427734375, 4.0828857421875, 4.30938720703125, 4.535888671875, 4.76239013671875, 4.9888916015625, 5.21539306640625, 5.44189453125, 5.66839599609375, 5.8948974609375, 6.12139892578125, 6.347900390625, 6.57440185546875, 6.8009033203125, 7.02740478515625, 7.25390625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 11.0, 12.0, 21.0, 32.0, 35.0, 46.0, 46.0, 61.0, 105.0, 115.0, 162.0, 186.0, 242.0, 309.0, 362.0, 467.0, 548.0, 906.0, 1613.0, 3145.0, 7535.0, 23057.0, 176975.0, 2478511.0, 1381085.0, 89566.0, 15997.0, 5729.0, 2587.0, 1455.0, 871.0, 525.0, 413.0, 347.0, 250.0, 212.0, 171.0, 132.0, 105.0, 78.0, 62.0, 41.0, 27.0, 29.0, 19.0, 18.0, 15.0, 11.0, 11.0, 5.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-21.765625, -21.08251953125, -20.3994140625, -19.71630859375, -19.033203125, -18.35009765625, -17.6669921875, -16.98388671875, -16.30078125, -15.61767578125, -14.9345703125, -14.25146484375, -13.568359375, -12.88525390625, -12.2021484375, -11.51904296875, -10.8359375, -10.15283203125, -9.4697265625, -8.78662109375, -8.103515625, -7.42041015625, -6.7373046875, -6.05419921875, -5.37109375, -4.68798828125, -4.0048828125, -3.32177734375, -2.638671875, -1.95556640625, -1.2724609375, -0.58935546875, 0.09375, 0.77685546875, 1.4599609375, 2.14306640625, 2.826171875, 3.50927734375, 4.1923828125, 4.87548828125, 5.55859375, 6.24169921875, 6.9248046875, 7.60791015625, 8.291015625, 8.97412109375, 9.6572265625, 10.34033203125, 11.0234375, 11.70654296875, 12.3896484375, 13.07275390625, 13.755859375, 14.43896484375, 15.1220703125, 15.80517578125, 16.48828125, 17.17138671875, 17.8544921875, 18.53759765625, 19.220703125, 19.90380859375, 20.5869140625, 21.27001953125, 21.953125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 2.0, 7.0, 10.0, 9.0, 25.0, 25.0, 50.0, 63.0, 106.0, 157.0, 299.0, 460.0, 667.0, 770.0, 507.0, 325.0, 201.0, 110.0, 103.0, 53.0, 48.0, 26.0, 13.0, 11.0, 9.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2421875, -13.6754150390625, -13.108642578125, -12.5418701171875, -11.97509765625, -11.4083251953125, -10.841552734375, -10.2747802734375, -9.7080078125, -9.1412353515625, -8.574462890625, -8.0076904296875, -7.44091796875, -6.8741455078125, -6.307373046875, -5.7406005859375, -5.173828125, -4.6070556640625, -4.040283203125, -3.4735107421875, -2.90673828125, -2.3399658203125, -1.773193359375, -1.2064208984375, -0.6396484375, -0.0728759765625, 0.493896484375, 1.0606689453125, 1.62744140625, 2.1942138671875, 2.760986328125, 3.3277587890625, 3.89453125, 4.4613037109375, 5.028076171875, 5.5948486328125, 6.16162109375, 6.7283935546875, 7.295166015625, 7.8619384765625, 8.4287109375, 8.9954833984375, 9.562255859375, 10.1290283203125, 10.69580078125, 11.2625732421875, 11.829345703125, 12.3961181640625, 12.962890625, 13.5296630859375, 14.096435546875, 14.6632080078125, 15.22998046875, 15.7967529296875, 16.363525390625, 16.9302978515625, 17.4970703125, 18.0638427734375, 18.630615234375, 19.1973876953125, 19.76416015625, 20.3309326171875, 20.897705078125, 21.4644775390625, 22.03125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 5.0, 3.0, 6.0, 11.0, 12.0, 24.0, 23.0, 46.0, 83.0, 127.0, 240.0, 464.0, 1211.0, 3792.0, 23922.0, 1217139.0, 2904382.0, 35606.0, 4727.0, 1350.0, 522.0, 236.0, 125.0, 78.0, 49.0, 45.0, 17.0, 7.0, 10.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-47.125, -45.85400390625, -44.5830078125, -43.31201171875, -42.041015625, -40.77001953125, -39.4990234375, -38.22802734375, -36.95703125, -35.68603515625, -34.4150390625, -33.14404296875, -31.873046875, -30.60205078125, -29.3310546875, -28.06005859375, -26.7890625, -25.51806640625, -24.2470703125, -22.97607421875, -21.705078125, -20.43408203125, -19.1630859375, -17.89208984375, -16.62109375, -15.35009765625, -14.0791015625, -12.80810546875, -11.537109375, -10.26611328125, -8.9951171875, -7.72412109375, -6.453125, -5.18212890625, -3.9111328125, -2.64013671875, -1.369140625, -0.09814453125, 1.1728515625, 2.44384765625, 3.71484375, 4.98583984375, 6.2568359375, 7.52783203125, 8.798828125, 10.06982421875, 11.3408203125, 12.61181640625, 13.8828125, 15.15380859375, 16.4248046875, 17.69580078125, 18.966796875, 20.23779296875, 21.5087890625, 22.77978515625, 24.05078125, 25.32177734375, 26.5927734375, 27.86376953125, 29.134765625, 30.40576171875, 31.6767578125, 32.94775390625, 34.21875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 27.0, 39.0, 107.0, 225.0, 273.0, 194.0, 82.0, 33.0, 17.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-210.18653869628906, -205.9167022705078, -201.64686584472656, -197.3770294189453, -193.10720825195312, -188.83737182617188, -184.56753540039062, -180.29769897460938, -176.02786254882812, -171.75802612304688, -167.48818969726562, -163.21835327148438, -158.94851684570312, -154.67869567871094, -150.4088592529297, -146.13902282714844, -141.8691864013672, -137.59934997558594, -133.3295135498047, -129.05967712402344, -124.78984832763672, -120.52001190185547, -116.25018310546875, -111.9803466796875, -107.71051025390625, -103.440673828125, -99.17083740234375, -94.90100860595703, -90.63117218017578, -86.36133575439453, -82.09150695800781, -77.82167053222656, -73.55183410644531, -69.28199768066406, -65.01216125488281, -60.742332458496094, -56.472496032714844, -52.202659606933594, -47.93282699584961, -43.662994384765625, -39.393157958984375, -35.123321533203125, -30.85348892211914, -26.583654403686523, -22.313819885253906, -18.04398536682129, -13.774150848388672, -9.504316329956055, -5.2344818115234375, -0.9646472930908203, 3.305187225341797, 7.575021743774414, 11.844856262207031, 16.11469078063965, 20.384525299072266, 24.654359817504883, 28.9241943359375, 33.19403076171875, 37.463863372802734, 41.73369598388672, 46.00353240966797, 50.27336883544922, 54.5432014465332, 58.81303405761719, 63.08287048339844]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 3.0, 9.0, 10.0, 6.0, 13.0, 12.0, 6.0, 16.0, 16.0, 20.0, 24.0, 20.0, 30.0, 36.0, 32.0, 29.0, 28.0, 55.0, 42.0, 39.0, 39.0, 46.0, 43.0, 30.0, 36.0, 32.0, 32.0, 36.0, 34.0, 29.0, 30.0, 27.0, 19.0, 30.0, 15.0, 10.0, 11.0, 10.0, 9.0, 7.0, 8.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.1527099609375, -43.715240478515625, -42.27777099609375, -40.840301513671875, -39.40283203125, -37.96535873413086, -36.527889251708984, -35.09041976928711, -33.652950286865234, -32.21548080444336, -30.778011322021484, -29.340539932250977, -27.9030704498291, -26.465600967407227, -25.02812957763672, -23.590660095214844, -22.15319061279297, -20.715721130371094, -19.27825164794922, -17.84078025817871, -16.403310775756836, -14.965841293334961, -13.52837085723877, -12.090900421142578, -10.653430938720703, -9.215961456298828, -7.778491020202637, -6.3410210609436035, -4.90355110168457, -3.466081142425537, -2.028611183166504, -0.5911407470703125, 0.8463287353515625, 2.2837986946105957, 3.721268653869629, 5.158738613128662, 6.596208572387695, 8.03367805480957, 9.471148490905762, 10.908618927001953, 12.346088409423828, 13.783557891845703, 15.221028327941895, 16.658498764038086, 18.09596824645996, 19.533437728881836, 20.970909118652344, 22.40837860107422, 23.845848083496094, 25.28331756591797, 26.720787048339844, 28.15825843811035, 29.595727920532227, 31.0331974029541, 32.47066879272461, 33.908138275146484, 35.34560775756836, 36.783077239990234, 38.22054672241211, 39.658016204833984, 41.095489501953125, 42.532958984375, 43.970428466796875, 45.40789794921875, 46.845367431640625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 3.0, 8.0, 10.0, 15.0, 11.0, 16.0, 10.0, 15.0, 20.0, 15.0, 15.0, 41.0, 28.0, 29.0, 34.0, 35.0, 40.0, 38.0, 41.0, 38.0, 47.0, 47.0, 49.0, 42.0, 44.0, 31.0, 38.0, 31.0, 38.0, 28.0, 25.0, 17.0, 23.0, 16.0, 15.0, 6.0, 7.0, 6.0, 6.0, 7.0, 2.0, 5.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-7.4453125, -7.22900390625, -7.0126953125, -6.79638671875, -6.580078125, -6.36376953125, -6.1474609375, -5.93115234375, -5.71484375, -5.49853515625, -5.2822265625, -5.06591796875, -4.849609375, -4.63330078125, -4.4169921875, -4.20068359375, -3.984375, -3.76806640625, -3.5517578125, -3.33544921875, -3.119140625, -2.90283203125, -2.6865234375, -2.47021484375, -2.25390625, -2.03759765625, -1.8212890625, -1.60498046875, -1.388671875, -1.17236328125, -0.9560546875, -0.73974609375, -0.5234375, -0.30712890625, -0.0908203125, 0.12548828125, 0.341796875, 0.55810546875, 0.7744140625, 0.99072265625, 1.20703125, 1.42333984375, 1.6396484375, 1.85595703125, 2.072265625, 2.28857421875, 2.5048828125, 2.72119140625, 2.9375, 3.15380859375, 3.3701171875, 3.58642578125, 3.802734375, 4.01904296875, 4.2353515625, 4.45166015625, 4.66796875, 4.88427734375, 5.1005859375, 5.31689453125, 5.533203125, 5.74951171875, 5.9658203125, 6.18212890625, 6.3984375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 1.0, 9.0, 12.0, 14.0, 20.0, 33.0, 50.0, 64.0, 109.0, 115.0, 179.0, 235.0, 369.0, 508.0, 746.0, 1119.0, 1546.0, 2176.0, 3108.0, 4607.0, 6846.0, 9944.0, 14764.0, 22608.0, 33736.0, 52134.0, 82466.0, 132018.0, 190833.0, 172878.0, 110993.0, 69813.0, 44718.0, 29054.0, 19228.0, 13159.0, 8824.0, 6073.0, 4081.0, 2874.0, 1948.0, 1422.0, 916.0, 670.0, 464.0, 316.0, 229.0, 168.0, 102.0, 92.0, 49.0, 39.0, 30.0, 20.0, 15.0, 9.0, 5.0, 5.0, 3.0, 2.0], "bins": [-0.63037109375, -0.6111679077148438, -0.5919647216796875, -0.5727615356445312, -0.553558349609375, -0.5343551635742188, -0.5151519775390625, -0.49594879150390625, -0.47674560546875, -0.45754241943359375, -0.4383392333984375, -0.41913604736328125, -0.399932861328125, -0.38072967529296875, -0.3615264892578125, -0.34232330322265625, -0.3231201171875, -0.30391693115234375, -0.2847137451171875, -0.26551055908203125, -0.246307373046875, -0.22710418701171875, -0.2079010009765625, -0.18869781494140625, -0.16949462890625, -0.15029144287109375, -0.1310882568359375, -0.11188507080078125, -0.092681884765625, -0.07347869873046875, -0.0542755126953125, -0.03507232666015625, -0.015869140625, 0.00333404541015625, 0.0225372314453125, 0.04174041748046875, 0.060943603515625, 0.08014678955078125, 0.0993499755859375, 0.11855316162109375, 0.13775634765625, 0.15695953369140625, 0.1761627197265625, 0.19536590576171875, 0.214569091796875, 0.23377227783203125, 0.2529754638671875, 0.27217864990234375, 0.2913818359375, 0.31058502197265625, 0.3297882080078125, 0.34899139404296875, 0.368194580078125, 0.38739776611328125, 0.4066009521484375, 0.42580413818359375, 0.44500732421875, 0.46421051025390625, 0.4834136962890625, 0.5026168823242188, 0.521820068359375, 0.5410232543945312, 0.5602264404296875, 0.5794296264648438, 0.5986328125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 8.0, 4.0, 10.0, 8.0, 12.0, 9.0, 9.0, 6.0, 14.0, 12.0, 22.0, 20.0, 26.0, 27.0, 45.0, 31.0, 22.0, 39.0, 39.0, 31.0, 34.0, 31.0, 35.0, 1072.0, 42.0, 31.0, 37.0, 28.0, 30.0, 31.0, 31.0, 32.0, 21.0, 25.0, 23.0, 20.0, 16.0, 21.0, 16.0, 8.0, 9.0, 4.0, 6.0, 7.0, 8.0, 3.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.9140625, -3.78399658203125, -3.6539306640625, -3.52386474609375, -3.393798828125, -3.26373291015625, -3.1336669921875, -3.00360107421875, -2.87353515625, -2.74346923828125, -2.6134033203125, -2.48333740234375, -2.353271484375, -2.22320556640625, -2.0931396484375, -1.96307373046875, -1.8330078125, -1.70294189453125, -1.5728759765625, -1.44281005859375, -1.312744140625, -1.18267822265625, -1.0526123046875, -0.92254638671875, -0.79248046875, -0.66241455078125, -0.5323486328125, -0.40228271484375, -0.272216796875, -0.14215087890625, -0.0120849609375, 0.11798095703125, 0.248046875, 0.37811279296875, 0.5081787109375, 0.63824462890625, 0.768310546875, 0.89837646484375, 1.0284423828125, 1.15850830078125, 1.28857421875, 1.41864013671875, 1.5487060546875, 1.67877197265625, 1.808837890625, 1.93890380859375, 2.0689697265625, 2.19903564453125, 2.3291015625, 2.45916748046875, 2.5892333984375, 2.71929931640625, 2.849365234375, 2.97943115234375, 3.1094970703125, 3.23956298828125, 3.36962890625, 3.49969482421875, 3.6297607421875, 3.75982666015625, 3.889892578125, 4.01995849609375, 4.1500244140625, 4.28009033203125, 4.41015625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 8.0, 12.0, 13.0, 36.0, 37.0, 60.0, 87.0, 148.0, 262.0, 398.0, 510.0, 875.0, 1282.0, 1859.0, 2943.0, 4553.0, 6928.0, 10692.0, 16568.0, 26284.0, 43599.0, 75220.0, 132054.0, 1120677.0, 335958.0, 128597.0, 73351.0, 42528.0, 25685.0, 15933.0, 10538.0, 6660.0, 4506.0, 2861.0, 1826.0, 1223.0, 816.0, 511.0, 364.0, 274.0, 158.0, 83.0, 58.0, 34.0, 29.0, 19.0, 8.0, 5.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53076171875, -0.5130538940429688, -0.4953460693359375, -0.47763824462890625, -0.459930419921875, -0.44222259521484375, -0.4245147705078125, -0.40680694580078125, -0.38909912109375, -0.37139129638671875, -0.3536834716796875, -0.33597564697265625, -0.318267822265625, -0.30055999755859375, -0.2828521728515625, -0.26514434814453125, -0.2474365234375, -0.22972869873046875, -0.2120208740234375, -0.19431304931640625, -0.176605224609375, -0.15889739990234375, -0.1411895751953125, -0.12348175048828125, -0.10577392578125, -0.08806610107421875, -0.0703582763671875, -0.05265045166015625, -0.034942626953125, -0.01723480224609375, 0.0004730224609375, 0.01818084716796875, 0.035888671875, 0.05359649658203125, 0.0713043212890625, 0.08901214599609375, 0.106719970703125, 0.12442779541015625, 0.1421356201171875, 0.15984344482421875, 0.17755126953125, 0.19525909423828125, 0.2129669189453125, 0.23067474365234375, 0.248382568359375, 0.26609039306640625, 0.2837982177734375, 0.30150604248046875, 0.3192138671875, 0.33692169189453125, 0.3546295166015625, 0.37233734130859375, 0.390045166015625, 0.40775299072265625, 0.4254608154296875, 0.44316864013671875, 0.46087646484375, 0.47858428955078125, 0.4962921142578125, 0.5139999389648438, 0.531707763671875, 0.5494155883789062, 0.5671234130859375, 0.5848312377929688, 0.6025390625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 0.0, 4.0, 4.0, 11.0, 11.0, 17.0, 25.0, 35.0, 47.0, 74.0, 87.0, 132.0, 122.0, 107.0, 77.0, 83.0, 52.0, 29.0, 24.0, 17.0, 6.0, 14.0, 4.0, 3.0, 1.0, 9.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0130157470703125, -0.012669086456298828, -0.012322425842285156, -0.011975765228271484, -0.011629104614257812, -0.01128244400024414, -0.010935783386230469, -0.010589122772216797, -0.010242462158203125, -0.009895801544189453, -0.009549140930175781, -0.00920248031616211, -0.008855819702148438, -0.008509159088134766, -0.008162498474121094, -0.007815837860107422, -0.00746917724609375, -0.007122516632080078, -0.006775856018066406, -0.006429195404052734, -0.0060825347900390625, -0.005735874176025391, -0.005389213562011719, -0.005042552947998047, -0.004695892333984375, -0.004349231719970703, -0.004002571105957031, -0.0036559104919433594, -0.0033092498779296875, -0.0029625892639160156, -0.0026159286499023438, -0.002269268035888672, -0.001922607421875, -0.0015759468078613281, -0.0012292861938476562, -0.0008826255798339844, -0.0005359649658203125, -0.00018930435180664062, 0.00015735626220703125, 0.0005040168762207031, 0.000850677490234375, 0.0011973381042480469, 0.0015439987182617188, 0.0018906593322753906, 0.0022373199462890625, 0.0025839805603027344, 0.0029306411743164062, 0.003277301788330078, 0.00362396240234375, 0.003970623016357422, 0.004317283630371094, 0.004663944244384766, 0.0050106048583984375, 0.005357265472412109, 0.005703926086425781, 0.006050586700439453, 0.006397247314453125, 0.006743907928466797, 0.007090568542480469, 0.007437229156494141, 0.0077838897705078125, 0.008130550384521484, 0.008477210998535156, 0.008823871612548828, 0.0091705322265625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 6.0, 7.0, 3.0, 9.0, 11.0, 26.0, 23.0, 26.0, 32.0, 58.0, 54.0, 111.0, 123.0, 214.0, 335.0, 508.0, 1674.0, 707806.0, 334451.0, 1527.0, 543.0, 315.0, 207.0, 130.0, 80.0, 66.0, 54.0, 31.0, 31.0, 27.0, 17.0, 8.0, 9.0, 5.0, 4.0, 1.0, 6.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1705322265625, -0.1650257110595703, -0.15951919555664062, -0.15401268005371094, -0.14850616455078125, -0.14299964904785156, -0.13749313354492188, -0.1319866180419922, -0.1264801025390625, -0.12097358703613281, -0.11546707153320312, -0.10996055603027344, -0.10445404052734375, -0.09894752502441406, -0.09344100952148438, -0.08793449401855469, -0.082427978515625, -0.07692146301269531, -0.07141494750976562, -0.06590843200683594, -0.06040191650390625, -0.05489540100097656, -0.049388885498046875, -0.04388236999511719, -0.0383758544921875, -0.03286933898925781, -0.027362823486328125, -0.021856307983398438, -0.01634979248046875, -0.010843276977539062, -0.005336761474609375, 0.0001697540283203125, 0.00567626953125, 0.011182785034179688, 0.016689300537109375, 0.022195816040039062, 0.02770233154296875, 0.03320884704589844, 0.038715362548828125, 0.04422187805175781, 0.0497283935546875, 0.05523490905761719, 0.060741424560546875, 0.06624794006347656, 0.07175445556640625, 0.07726097106933594, 0.08276748657226562, 0.08827400207519531, 0.093780517578125, 0.09928703308105469, 0.10479354858398438, 0.11030006408691406, 0.11580657958984375, 0.12131309509277344, 0.12681961059570312, 0.1323261260986328, 0.1378326416015625, 0.1433391571044922, 0.14884567260742188, 0.15435218811035156, 0.15985870361328125, 0.16536521911621094, 0.17087173461914062, 0.1763782501220703, 0.181884765625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 355.0, 648.0, 9.0], "bins": [-0.24799008667469025, -0.2439933568239212, -0.23999662697315216, -0.23599989712238312, -0.23200316727161407, -0.22800645232200623, -0.22400972247123718, -0.22001299262046814, -0.2160162627696991, -0.21201953291893005, -0.208022803068161, -0.20402607321739197, -0.20002934336662292, -0.19603261351585388, -0.19203588366508484, -0.188039168715477, -0.18404242396354675, -0.1800456941127777, -0.17604896426200867, -0.17205223441123962, -0.16805550456047058, -0.16405877470970154, -0.1600620448589325, -0.15606532990932465, -0.1520686000585556, -0.14807187020778656, -0.14407514035701752, -0.14007841050624847, -0.13608168065547943, -0.13208496570587158, -0.12808823585510254, -0.1240914985537529, -0.12009478360414505, -0.11609805375337601, -0.11210132390260696, -0.10810460150241852, -0.10410787165164948, -0.10011114180088043, -0.09611441195011139, -0.09211768209934235, -0.0881209596991539, -0.08412422984838486, -0.08012749999761581, -0.07613077759742737, -0.07213404774665833, -0.06813731789588928, -0.06414058804512024, -0.060143858194351196, -0.05614712834358215, -0.05215039849281311, -0.048153672367334366, -0.04415694251656532, -0.04016021639108658, -0.036163486540317535, -0.03216675668954849, -0.0281700287014246, -0.024173300713300705, -0.02017657272517681, -0.016179844737052917, -0.012183114886283875, -0.00818638689815998, -0.004189658910036087, -0.00019292905926704407, 0.0038037989288568497, 0.007800525985658169]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 5.0, 4.0, 6.0, 12.0, 22.0, 24.0, 19.0, 20.0, 41.0, 40.0, 29.0, 37.0, 47.0, 47.0, 42.0, 53.0, 50.0, 35.0, 54.0, 42.0, 55.0, 33.0, 40.0, 35.0, 47.0, 30.0, 29.0, 19.0, 16.0, 10.0, 13.0, 11.0, 9.0, 6.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.006684422492980957, -0.006505077704787254, -0.006325732916593552, -0.006146388128399849, -0.005967043340206146, -0.0057876985520124435, -0.005608353763818741, -0.005429008975625038, -0.0052496641874313354, -0.005070319399237633, -0.00489097461104393, -0.004711629822850227, -0.004532285034656525, -0.004352940246462822, -0.004173595458269119, -0.0039942506700754166, -0.003814905881881714, -0.003635561093688011, -0.0034562163054943085, -0.0032768715173006058, -0.003097526729106903, -0.0029181819409132004, -0.0027388371527194977, -0.002559492364525795, -0.0023801475763320923, -0.0022008027881383896, -0.002021457999944687, -0.0018421132117509842, -0.0016627684235572815, -0.0014834236353635788, -0.001304078847169876, -0.0011247340589761734, -0.0009453892707824707, -0.000766044482588768, -0.0005866996943950653, -0.0004073549062013626, -0.0002280101180076599, -4.8665329813957214e-05, 0.00013067945837974548, 0.0003100242465734482, 0.0004893690347671509, 0.0006687138229608536, 0.0008480586111545563, 0.001027403399348259, 0.0012067481875419617, 0.0013860929757356644, 0.001565437763929367, 0.0017447825521230698, 0.0019241273403167725, 0.002103472128510475, 0.002282816916704178, 0.0024621617048978806, 0.0026415064930915833, 0.002820851281285286, 0.0030001960694789886, 0.0031795408576726913, 0.003358885645866394, 0.0035382304340600967, 0.0037175752222537994, 0.003896920010447502, 0.004076264798641205, 0.0042556095868349075, 0.00443495437502861, 0.004614299163222313, 0.004793643951416016]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 3.0, 8.0, 10.0, 15.0, 10.0, 17.0, 10.0, 15.0, 20.0, 15.0, 15.0, 41.0, 28.0, 29.0, 34.0, 35.0, 40.0, 38.0, 40.0, 39.0, 47.0, 46.0, 50.0, 42.0, 44.0, 31.0, 38.0, 30.0, 39.0, 28.0, 25.0, 17.0, 23.0, 16.0, 14.0, 7.0, 7.0, 6.0, 6.0, 7.0, 2.0, 5.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-7.4453125, -7.22906494140625, -7.0128173828125, -6.79656982421875, -6.580322265625, -6.36407470703125, -6.1478271484375, -5.93157958984375, -5.71533203125, -5.49908447265625, -5.2828369140625, -5.06658935546875, -4.850341796875, -4.63409423828125, -4.4178466796875, -4.20159912109375, -3.9853515625, -3.76910400390625, -3.5528564453125, -3.33660888671875, -3.120361328125, -2.90411376953125, -2.6878662109375, -2.47161865234375, -2.25537109375, -2.03912353515625, -1.8228759765625, -1.60662841796875, -1.390380859375, -1.17413330078125, -0.9578857421875, -0.74163818359375, -0.525390625, -0.30914306640625, -0.0928955078125, 0.12335205078125, 0.339599609375, 0.55584716796875, 0.7720947265625, 0.98834228515625, 1.20458984375, 1.42083740234375, 1.6370849609375, 1.85333251953125, 2.069580078125, 2.28582763671875, 2.5020751953125, 2.71832275390625, 2.9345703125, 3.15081787109375, 3.3670654296875, 3.58331298828125, 3.799560546875, 4.01580810546875, 4.2320556640625, 4.44830322265625, 4.66455078125, 4.88079833984375, 5.0970458984375, 5.31329345703125, 5.529541015625, 5.74578857421875, 5.9620361328125, 6.17828369140625, 6.39453125]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 3.0, 3.0, 10.0, 6.0, 9.0, 17.0, 29.0, 32.0, 42.0, 53.0, 77.0, 85.0, 136.0, 153.0, 197.0, 335.0, 434.0, 754.0, 1276.0, 2470.0, 5084.0, 13306.0, 43767.0, 211011.0, 570344.0, 145750.0, 33017.0, 10446.0, 4270.0, 2096.0, 1108.0, 699.0, 437.0, 311.0, 209.0, 135.0, 123.0, 92.0, 46.0, 39.0, 28.0, 29.0, 21.0, 18.0, 12.0, 13.0, 6.0, 4.0, 6.0, 2.0, 6.0, 0.0, 1.0, 0.0, 3.0], "bins": [-11.1484375, -10.8145751953125, -10.480712890625, -10.1468505859375, -9.81298828125, -9.4791259765625, -9.145263671875, -8.8114013671875, -8.4775390625, -8.1436767578125, -7.809814453125, -7.4759521484375, -7.14208984375, -6.8082275390625, -6.474365234375, -6.1405029296875, -5.806640625, -5.4727783203125, -5.138916015625, -4.8050537109375, -4.47119140625, -4.1373291015625, -3.803466796875, -3.4696044921875, -3.1357421875, -2.8018798828125, -2.468017578125, -2.1341552734375, -1.80029296875, -1.4664306640625, -1.132568359375, -0.7987060546875, -0.46484375, -0.1309814453125, 0.202880859375, 0.5367431640625, 0.87060546875, 1.2044677734375, 1.538330078125, 1.8721923828125, 2.2060546875, 2.5399169921875, 2.873779296875, 3.2076416015625, 3.54150390625, 3.8753662109375, 4.209228515625, 4.5430908203125, 4.876953125, 5.2108154296875, 5.544677734375, 5.8785400390625, 6.21240234375, 6.5462646484375, 6.880126953125, 7.2139892578125, 7.5478515625, 7.8817138671875, 8.215576171875, 8.5494384765625, 8.88330078125, 9.2171630859375, 9.551025390625, 9.8848876953125, 10.21875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 4.0, 5.0, 3.0, 5.0, 2.0, 8.0, 11.0, 9.0, 10.0, 17.0, 9.0, 18.0, 24.0, 29.0, 27.0, 28.0, 39.0, 43.0, 50.0, 72.0, 178.0, 1464.0, 390.0, 148.0, 85.0, 70.0, 42.0, 39.0, 46.0, 35.0, 15.0, 23.0, 19.0, 22.0, 12.0, 11.0, 10.0, 8.0, 5.0, 5.0, 3.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.34375, -16.74462890625, -16.1455078125, -15.54638671875, -14.947265625, -14.34814453125, -13.7490234375, -13.14990234375, -12.55078125, -11.95166015625, -11.3525390625, -10.75341796875, -10.154296875, -9.55517578125, -8.9560546875, -8.35693359375, -7.7578125, -7.15869140625, -6.5595703125, -5.96044921875, -5.361328125, -4.76220703125, -4.1630859375, -3.56396484375, -2.96484375, -2.36572265625, -1.7666015625, -1.16748046875, -0.568359375, 0.03076171875, 0.6298828125, 1.22900390625, 1.828125, 2.42724609375, 3.0263671875, 3.62548828125, 4.224609375, 4.82373046875, 5.4228515625, 6.02197265625, 6.62109375, 7.22021484375, 7.8193359375, 8.41845703125, 9.017578125, 9.61669921875, 10.2158203125, 10.81494140625, 11.4140625, 12.01318359375, 12.6123046875, 13.21142578125, 13.810546875, 14.40966796875, 15.0087890625, 15.60791015625, 16.20703125, 16.80615234375, 17.4052734375, 18.00439453125, 18.603515625, 19.20263671875, 19.8017578125, 20.40087890625, 21.0]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 4.0, 6.0, 8.0, 8.0, 6.0, 18.0, 17.0, 24.0, 30.0, 41.0, 61.0, 118.0, 189.0, 343.0, 507.0, 1316.0, 60195.0, 3077888.0, 3183.0, 707.0, 366.0, 226.0, 123.0, 88.0, 62.0, 48.0, 27.0, 27.0, 11.0, 8.0, 17.0, 4.0, 5.0, 6.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-57.59375, -56.00439453125, -54.4150390625, -52.82568359375, -51.236328125, -49.64697265625, -48.0576171875, -46.46826171875, -44.87890625, -43.28955078125, -41.7001953125, -40.11083984375, -38.521484375, -36.93212890625, -35.3427734375, -33.75341796875, -32.1640625, -30.57470703125, -28.9853515625, -27.39599609375, -25.806640625, -24.21728515625, -22.6279296875, -21.03857421875, -19.44921875, -17.85986328125, -16.2705078125, -14.68115234375, -13.091796875, -11.50244140625, -9.9130859375, -8.32373046875, -6.734375, -5.14501953125, -3.5556640625, -1.96630859375, -0.376953125, 1.21240234375, 2.8017578125, 4.39111328125, 5.98046875, 7.56982421875, 9.1591796875, 10.74853515625, 12.337890625, 13.92724609375, 15.5166015625, 17.10595703125, 18.6953125, 20.28466796875, 21.8740234375, 23.46337890625, 25.052734375, 26.64208984375, 28.2314453125, 29.82080078125, 31.41015625, 32.99951171875, 34.5888671875, 36.17822265625, 37.767578125, 39.35693359375, 40.9462890625, 42.53564453125, 44.125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [6.0, 602.0, 405.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.456827163696289, -7.366308212280273, 0.7242107391357422, 8.814729690551758, 16.905248641967773, 24.99576759338379, 33.08628845214844, 41.17680358886719, 49.26732635498047, 57.357845306396484, 65.4483642578125, 73.53887939453125, 81.62940216064453, 89.71992492675781, 97.81044006347656, 105.90095520019531, 113.9914779663086, 122.08200073242188, 130.17251586914062, 138.26303100585938, 146.35354614257812, 154.44407653808594, 162.5345916748047, 170.62510681152344, 178.7156219482422, 186.80613708496094, 194.89666748046875, 202.9871826171875, 211.07769775390625, 219.168212890625, 227.25872802734375, 235.34925842285156, 243.43975830078125, 251.5302734375, 259.62078857421875, 267.7113037109375, 275.80181884765625, 283.8923645019531, 291.9828796386719, 300.0733947753906, 308.1639099121094, 316.2544250488281, 324.3449401855469, 332.4354553222656, 340.5260009765625, 348.61651611328125, 356.70703125, 364.79754638671875, 372.8880615234375, 380.97857666015625, 389.069091796875, 397.15960693359375, 405.2501220703125, 413.3406677246094, 421.4311828613281, 429.5216979980469, 437.6122131347656, 445.7027282714844, 453.7932434082031, 461.8837585449219, 469.97430419921875, 478.0648193359375, 486.15533447265625, 494.245849609375, 502.33636474609375]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 8.0, 6.0, 8.0, 13.0, 15.0, 18.0, 18.0, 19.0, 25.0, 24.0, 20.0, 51.0, 45.0, 24.0, 45.0, 42.0, 41.0, 53.0, 47.0, 37.0, 48.0, 38.0, 41.0, 45.0, 36.0, 33.0, 31.0, 32.0, 25.0, 22.0, 16.0, 14.0, 9.0, 12.0, 13.0, 7.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-41.781192779541016, -40.37506866455078, -38.96894073486328, -37.56281280517578, -36.15668869018555, -34.75056457519531, -33.34443664550781, -31.938310623168945, -30.532184600830078, -29.12605857849121, -27.719932556152344, -26.313806533813477, -24.90768051147461, -23.501554489135742, -22.095428466796875, -20.689302444458008, -19.28317642211914, -17.877050399780273, -16.470924377441406, -15.064798355102539, -13.658672332763672, -12.252546310424805, -10.846420288085938, -9.44029426574707, -8.034168243408203, -6.628042221069336, -5.221916198730469, -3.8157901763916016, -2.4096641540527344, -1.0035381317138672, 0.402587890625, 1.8087139129638672, 3.2148361206054688, 4.620962142944336, 6.027088165283203, 7.43321418762207, 8.839340209960938, 10.245466232299805, 11.651592254638672, 13.057718276977539, 14.463844299316406, 15.869970321655273, 17.27609634399414, 18.682222366333008, 20.088348388671875, 21.494474411010742, 22.90060043334961, 24.306726455688477, 25.712852478027344, 27.11897850036621, 28.525104522705078, 29.931230545043945, 31.337356567382812, 32.74348449707031, 34.14960861206055, 35.55573272705078, 36.96186065673828, 38.36798858642578, 39.774112701416016, 41.18023681640625, 42.58636474609375, 43.99249267578125, 45.398616790771484, 46.80474090576172, 48.21086883544922]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 4.0, 11.0, 11.0, 12.0, 16.0, 10.0, 24.0, 34.0, 24.0, 25.0, 25.0, 37.0, 40.0, 40.0, 44.0, 51.0, 51.0, 45.0, 45.0, 45.0, 45.0, 41.0, 46.0, 38.0, 37.0, 39.0, 26.0, 24.0, 13.0, 22.0, 11.0, 9.0, 12.0, 8.0, 10.0, 7.0, 4.0, 8.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1015625, -7.837646484375, -7.57373046875, -7.309814453125, -7.0458984375, -6.781982421875, -6.51806640625, -6.254150390625, -5.990234375, -5.726318359375, -5.46240234375, -5.198486328125, -4.9345703125, -4.670654296875, -4.40673828125, -4.142822265625, -3.87890625, -3.614990234375, -3.35107421875, -3.087158203125, -2.8232421875, -2.559326171875, -2.29541015625, -2.031494140625, -1.767578125, -1.503662109375, -1.23974609375, -0.975830078125, -0.7119140625, -0.447998046875, -0.18408203125, 0.079833984375, 0.34375, 0.607666015625, 0.87158203125, 1.135498046875, 1.3994140625, 1.663330078125, 1.92724609375, 2.191162109375, 2.455078125, 2.718994140625, 2.98291015625, 3.246826171875, 3.5107421875, 3.774658203125, 4.03857421875, 4.302490234375, 4.56640625, 4.830322265625, 5.09423828125, 5.358154296875, 5.6220703125, 5.885986328125, 6.14990234375, 6.413818359375, 6.677734375, 6.941650390625, 7.20556640625, 7.469482421875, 7.7333984375, 7.997314453125, 8.26123046875, 8.525146484375, 8.7890625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 7.0, 7.0, 7.0, 16.0, 20.0, 35.0, 42.0, 57.0, 77.0, 99.0, 123.0, 188.0, 281.0, 397.0, 637.0, 1168.0, 2761.0, 8557.0, 48924.0, 2799786.0, 1291074.0, 28682.0, 6300.0, 2251.0, 1003.0, 520.0, 376.0, 251.0, 167.0, 119.0, 92.0, 75.0, 51.0, 33.0, 23.0, 18.0, 12.0, 11.0, 9.0, 8.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.09375, -38.79541015625, -37.4970703125, -36.19873046875, -34.900390625, -33.60205078125, -32.3037109375, -31.00537109375, -29.70703125, -28.40869140625, -27.1103515625, -25.81201171875, -24.513671875, -23.21533203125, -21.9169921875, -20.61865234375, -19.3203125, -18.02197265625, -16.7236328125, -15.42529296875, -14.126953125, -12.82861328125, -11.5302734375, -10.23193359375, -8.93359375, -7.63525390625, -6.3369140625, -5.03857421875, -3.740234375, -2.44189453125, -1.1435546875, 0.15478515625, 1.453125, 2.75146484375, 4.0498046875, 5.34814453125, 6.646484375, 7.94482421875, 9.2431640625, 10.54150390625, 11.83984375, 13.13818359375, 14.4365234375, 15.73486328125, 17.033203125, 18.33154296875, 19.6298828125, 20.92822265625, 22.2265625, 23.52490234375, 24.8232421875, 26.12158203125, 27.419921875, 28.71826171875, 30.0166015625, 31.31494140625, 32.61328125, 33.91162109375, 35.2099609375, 36.50830078125, 37.806640625, 39.10498046875, 40.4033203125, 41.70166015625, 43.0]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 2.0, 7.0, 13.0, 5.0, 11.0, 13.0, 26.0, 29.0, 34.0, 58.0, 70.0, 103.0, 148.0, 226.0, 385.0, 542.0, 698.0, 594.0, 374.0, 256.0, 152.0, 92.0, 69.0, 49.0, 29.0, 20.0, 18.0, 8.0, 7.0, 3.0, 11.0, 8.0, 4.0, 2.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1953125, -12.6353759765625, -12.075439453125, -11.5155029296875, -10.95556640625, -10.3956298828125, -9.835693359375, -9.2757568359375, -8.7158203125, -8.1558837890625, -7.595947265625, -7.0360107421875, -6.47607421875, -5.9161376953125, -5.356201171875, -4.7962646484375, -4.236328125, -3.6763916015625, -3.116455078125, -2.5565185546875, -1.99658203125, -1.4366455078125, -0.876708984375, -0.3167724609375, 0.2431640625, 0.8031005859375, 1.363037109375, 1.9229736328125, 2.48291015625, 3.0428466796875, 3.602783203125, 4.1627197265625, 4.72265625, 5.2825927734375, 5.842529296875, 6.4024658203125, 6.96240234375, 7.5223388671875, 8.082275390625, 8.6422119140625, 9.2021484375, 9.7620849609375, 10.322021484375, 10.8819580078125, 11.44189453125, 12.0018310546875, 12.561767578125, 13.1217041015625, 13.681640625, 14.2415771484375, 14.801513671875, 15.3614501953125, 15.92138671875, 16.4813232421875, 17.041259765625, 17.6011962890625, 18.1611328125, 18.7210693359375, 19.281005859375, 19.8409423828125, 20.40087890625, 20.9608154296875, 21.520751953125, 22.0806884765625, 22.640625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 6.0, 14.0, 24.0, 34.0, 54.0, 125.0, 252.0, 613.0, 1309.0, 3214.0, 8192.0, 23694.0, 100226.0, 1120731.0, 2681881.0, 197572.0, 37249.0, 11461.0, 4300.0, 1776.0, 865.0, 369.0, 159.0, 81.0, 36.0, 20.0, 15.0, 3.0, 7.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.71875, -16.103515625, -15.48828125, -14.873046875, -14.2578125, -13.642578125, -13.02734375, -12.412109375, -11.796875, -11.181640625, -10.56640625, -9.951171875, -9.3359375, -8.720703125, -8.10546875, -7.490234375, -6.875, -6.259765625, -5.64453125, -5.029296875, -4.4140625, -3.798828125, -3.18359375, -2.568359375, -1.953125, -1.337890625, -0.72265625, -0.107421875, 0.5078125, 1.123046875, 1.73828125, 2.353515625, 2.96875, 3.583984375, 4.19921875, 4.814453125, 5.4296875, 6.044921875, 6.66015625, 7.275390625, 7.890625, 8.505859375, 9.12109375, 9.736328125, 10.3515625, 10.966796875, 11.58203125, 12.197265625, 12.8125, 13.427734375, 14.04296875, 14.658203125, 15.2734375, 15.888671875, 16.50390625, 17.119140625, 17.734375, 18.349609375, 18.96484375, 19.580078125, 20.1953125, 20.810546875, 21.42578125, 22.041015625, 22.65625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 10.0, 9.0, 12.0, 11.0, 17.0, 18.0, 24.0, 24.0, 36.0, 55.0, 54.0, 65.0, 85.0, 79.0, 81.0, 83.0, 67.0, 51.0, 43.0, 39.0, 29.0, 22.0, 15.0, 11.0, 13.0, 5.0, 6.0, 4.0, 5.0, 3.0, 0.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.84513092041016, -65.29803466796875, -62.75093078613281, -60.20383071899414, -57.65673065185547, -55.1096305847168, -52.562530517578125, -50.01543045043945, -47.46833038330078, -44.92123031616211, -42.37413024902344, -39.827030181884766, -37.279930114746094, -34.73283004760742, -32.18572998046875, -29.638629913330078, -27.091529846191406, -24.544429779052734, -21.997329711914062, -19.45022964477539, -16.90312957763672, -14.356029510498047, -11.808929443359375, -9.261829376220703, -6.714729309082031, -4.167629241943359, -1.6205291748046875, 0.9265708923339844, 3.4736709594726562, 6.020771026611328, 8.56787109375, 11.114971160888672, 13.662063598632812, 16.209163665771484, 18.756263732910156, 21.303363800048828, 23.8504638671875, 26.397563934326172, 28.944664001464844, 31.491764068603516, 34.03886413574219, 36.58596420288086, 39.13306427001953, 41.6801643371582, 44.227264404296875, 46.77436447143555, 49.32146453857422, 51.86856460571289, 54.41566467285156, 56.962764739990234, 59.509864807128906, 62.05696487426758, 64.60406494140625, 67.15116882324219, 69.6982650756836, 72.245361328125, 74.79246520996094, 77.33956909179688, 79.88666534423828, 82.43376159667969, 84.98086547851562, 87.52796936035156, 90.07506561279297, 92.62216186523438, 95.16926574707031]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 2.0, 6.0, 4.0, 11.0, 17.0, 11.0, 11.0, 19.0, 27.0, 29.0, 27.0, 32.0, 32.0, 35.0, 42.0, 39.0, 35.0, 30.0, 43.0, 36.0, 42.0, 58.0, 43.0, 28.0, 36.0, 29.0, 31.0, 32.0, 26.0, 18.0, 22.0, 24.0, 16.0, 15.0, 13.0, 13.0, 14.0, 10.0, 11.0, 4.0, 6.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-61.7271842956543, -59.909019470214844, -58.090850830078125, -56.27268600463867, -54.45451736450195, -52.6363525390625, -50.81818389892578, -49.00001907348633, -47.181854248046875, -45.36368942260742, -43.5455207824707, -41.72735595703125, -39.90918731689453, -38.09102249145508, -36.272857666015625, -34.454689025878906, -32.63652038574219, -30.8183536529541, -29.000186920166016, -27.182022094726562, -25.363855361938477, -23.54568862915039, -21.727521896362305, -19.90935516357422, -18.091190338134766, -16.27302360534668, -14.45485782623291, -12.636691093444824, -10.818525314331055, -9.000358581542969, -7.182191848754883, -5.364026069641113, -3.5458602905273438, -1.7276939153671265, 0.09047245979309082, 1.9086389541625977, 3.7268052101135254, 5.544971466064453, 7.363138198852539, 9.181303977966309, 10.999470710754395, 12.81763744354248, 14.63580322265625, 16.453969955444336, 18.272136688232422, 20.090301513671875, 21.908470153808594, 23.726634979248047, 25.544801712036133, 27.36296844482422, 29.181135177612305, 30.99930191040039, 32.817466735839844, 34.63563537597656, 36.453800201416016, 38.27196502685547, 40.09013366699219, 41.90829849243164, 43.72646713256836, 45.54463195800781, 47.36280059814453, 49.180965423583984, 50.99913024902344, 52.817298889160156, 54.63546371459961]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 2.0, 8.0, 3.0, 2.0, 14.0, 7.0, 15.0, 16.0, 22.0, 20.0, 34.0, 36.0, 24.0, 39.0, 26.0, 44.0, 49.0, 40.0, 35.0, 44.0, 55.0, 63.0, 37.0, 35.0, 39.0, 32.0, 34.0, 26.0, 28.0, 29.0, 13.0, 23.0, 18.0, 13.0, 8.0, 11.0, 20.0, 5.0, 5.0, 3.0, 8.0, 1.0, 9.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-113.5625, -110.328125, -107.09375, -103.859375, -100.625, -97.390625, -94.15625, -90.921875, -87.6875, -84.453125, -81.21875, -77.984375, -74.75, -71.515625, -68.28125, -65.046875, -61.8125, -58.578125, -55.34375, -52.109375, -48.875, -45.640625, -42.40625, -39.171875, -35.9375, -32.703125, -29.46875, -26.234375, -23.0, -19.765625, -16.53125, -13.296875, -10.0625, -6.828125, -3.59375, -0.359375, 2.875, 6.109375, 9.34375, 12.578125, 15.8125, 19.046875, 22.28125, 25.515625, 28.75, 31.984375, 35.21875, 38.453125, 41.6875, 44.921875, 48.15625, 51.390625, 54.625, 57.859375, 61.09375, 64.328125, 67.5625, 70.796875, 74.03125, 77.265625, 80.5, 83.734375, 86.96875, 90.203125, 93.4375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 14.0, 18.0, 14.0, 31.0, 44.0, 50.0, 92.0, 127.0, 185.0, 254.0, 357.0, 561.0, 828.0, 1094.0, 1590.0, 2291.0, 3427.0, 4870.0, 7568.0, 11777.0, 18989.0, 31306.0, 55693.0, 105002.0, 201601.0, 254912.0, 153540.0, 79290.0, 43140.0, 25238.0, 15376.0, 9704.0, 6216.0, 4198.0, 2845.0, 1877.0, 1365.0, 918.0, 628.0, 472.0, 323.0, 225.0, 164.0, 91.0, 87.0, 56.0, 46.0, 21.0, 12.0, 11.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 4.0], "bins": [-10.71875, -10.38671875, -10.0546875, -9.72265625, -9.390625, -9.05859375, -8.7265625, -8.39453125, -8.0625, -7.73046875, -7.3984375, -7.06640625, -6.734375, -6.40234375, -6.0703125, -5.73828125, -5.40625, -5.07421875, -4.7421875, -4.41015625, -4.078125, -3.74609375, -3.4140625, -3.08203125, -2.75, -2.41796875, -2.0859375, -1.75390625, -1.421875, -1.08984375, -0.7578125, -0.42578125, -0.09375, 0.23828125, 0.5703125, 0.90234375, 1.234375, 1.56640625, 1.8984375, 2.23046875, 2.5625, 2.89453125, 3.2265625, 3.55859375, 3.890625, 4.22265625, 4.5546875, 4.88671875, 5.21875, 5.55078125, 5.8828125, 6.21484375, 6.546875, 6.87890625, 7.2109375, 7.54296875, 7.875, 8.20703125, 8.5390625, 8.87109375, 9.203125, 9.53515625, 9.8671875, 10.19921875, 10.53125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 6.0, 3.0, 10.0, 7.0, 20.0, 18.0, 14.0, 18.0, 31.0, 30.0, 29.0, 34.0, 37.0, 42.0, 42.0, 53.0, 57.0, 54.0, 1074.0, 36.0, 52.0, 48.0, 37.0, 44.0, 31.0, 39.0, 25.0, 31.0, 14.0, 13.0, 21.0, 20.0, 16.0, 5.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.875, -64.5712890625, -62.267578125, -59.9638671875, -57.66015625, -55.3564453125, -53.052734375, -50.7490234375, -48.4453125, -46.1416015625, -43.837890625, -41.5341796875, -39.23046875, -36.9267578125, -34.623046875, -32.3193359375, -30.015625, -27.7119140625, -25.408203125, -23.1044921875, -20.80078125, -18.4970703125, -16.193359375, -13.8896484375, -11.5859375, -9.2822265625, -6.978515625, -4.6748046875, -2.37109375, -0.0673828125, 2.236328125, 4.5400390625, 6.84375, 9.1474609375, 11.451171875, 13.7548828125, 16.05859375, 18.3623046875, 20.666015625, 22.9697265625, 25.2734375, 27.5771484375, 29.880859375, 32.1845703125, 34.48828125, 36.7919921875, 39.095703125, 41.3994140625, 43.703125, 46.0068359375, 48.310546875, 50.6142578125, 52.91796875, 55.2216796875, 57.525390625, 59.8291015625, 62.1328125, 64.4365234375, 66.740234375, 69.0439453125, 71.34765625, 73.6513671875, 75.955078125, 78.2587890625, 80.5625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 9.0, 15.0, 29.0, 43.0, 64.0, 107.0, 119.0, 202.0, 347.0, 462.0, 709.0, 1016.0, 1478.0, 2273.0, 3171.0, 4771.0, 6929.0, 10396.0, 15638.0, 23745.0, 38285.0, 65530.0, 117168.0, 192131.0, 1260437.0, 142462.0, 80170.0, 46061.0, 28198.0, 18238.0, 11937.0, 8062.0, 5408.0, 3733.0, 2598.0, 1696.0, 1186.0, 736.0, 528.0, 349.0, 254.0, 159.0, 89.0, 61.0, 49.0, 32.0, 18.0, 14.0, 6.0, 5.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.3125, -7.0701904296875, -6.827880859375, -6.5855712890625, -6.34326171875, -6.1009521484375, -5.858642578125, -5.6163330078125, -5.3740234375, -5.1317138671875, -4.889404296875, -4.6470947265625, -4.40478515625, -4.1624755859375, -3.920166015625, -3.6778564453125, -3.435546875, -3.1932373046875, -2.950927734375, -2.7086181640625, -2.46630859375, -2.2239990234375, -1.981689453125, -1.7393798828125, -1.4970703125, -1.2547607421875, -1.012451171875, -0.7701416015625, -0.52783203125, -0.2855224609375, -0.043212890625, 0.1990966796875, 0.44140625, 0.6837158203125, 0.926025390625, 1.1683349609375, 1.41064453125, 1.6529541015625, 1.895263671875, 2.1375732421875, 2.3798828125, 2.6221923828125, 2.864501953125, 3.1068115234375, 3.34912109375, 3.5914306640625, 3.833740234375, 4.0760498046875, 4.318359375, 4.5606689453125, 4.802978515625, 5.0452880859375, 5.28759765625, 5.5299072265625, 5.772216796875, 6.0145263671875, 6.2568359375, 6.4991455078125, 6.741455078125, 6.9837646484375, 7.22607421875, 7.4683837890625, 7.710693359375, 7.9530029296875, 8.1953125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 2.0, 7.0, 9.0, 9.0, 4.0, 9.0, 10.0, 17.0, 15.0, 16.0, 19.0, 28.0, 31.0, 32.0, 40.0, 42.0, 48.0, 47.0, 39.0, 44.0, 59.0, 39.0, 43.0, 44.0, 37.0, 35.0, 32.0, 32.0, 30.0, 32.0, 22.0, 22.0, 20.0, 19.0, 11.0, 13.0, 3.0, 7.0, 5.0, 5.0, 5.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0238037109375, -0.023006916046142578, -0.022210121154785156, -0.021413326263427734, -0.020616531372070312, -0.01981973648071289, -0.01902294158935547, -0.018226146697998047, -0.017429351806640625, -0.016632556915283203, -0.01583576202392578, -0.01503896713256836, -0.014242172241210938, -0.013445377349853516, -0.012648582458496094, -0.011851787567138672, -0.01105499267578125, -0.010258197784423828, -0.009461402893066406, -0.008664608001708984, -0.007867813110351562, -0.007071018218994141, -0.006274223327636719, -0.005477428436279297, -0.004680633544921875, -0.003883838653564453, -0.0030870437622070312, -0.0022902488708496094, -0.0014934539794921875, -0.0006966590881347656, 0.00010013580322265625, 0.0008969306945800781, 0.0016937255859375, 0.002490520477294922, 0.0032873153686523438, 0.004084110260009766, 0.0048809051513671875, 0.005677700042724609, 0.006474494934082031, 0.007271289825439453, 0.008068084716796875, 0.008864879608154297, 0.009661674499511719, 0.01045846939086914, 0.011255264282226562, 0.012052059173583984, 0.012848854064941406, 0.013645648956298828, 0.01444244384765625, 0.015239238739013672, 0.016036033630371094, 0.016832828521728516, 0.017629623413085938, 0.01842641830444336, 0.01922321319580078, 0.020020008087158203, 0.020816802978515625, 0.021613597869873047, 0.02241039276123047, 0.02320718765258789, 0.024003982543945312, 0.024800777435302734, 0.025597572326660156, 0.026394367218017578, 0.027191162109375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 7.0, 5.0, 4.0, 5.0, 8.0, 7.0, 11.0, 19.0, 15.0, 36.0, 32.0, 42.0, 63.0, 99.0, 146.0, 251.0, 456.0, 1079.0, 3382.0, 14128.0, 103725.0, 639985.0, 247963.0, 28440.0, 5510.0, 1557.0, 661.0, 325.0, 200.0, 109.0, 88.0, 36.0, 27.0, 27.0, 25.0, 22.0, 13.0, 8.0, 7.0, 5.0, 7.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.316162109375, -0.3067779541015625, -0.297393798828125, -0.2880096435546875, -0.27862548828125, -0.2692413330078125, -0.259857177734375, -0.2504730224609375, -0.2410888671875, -0.2317047119140625, -0.222320556640625, -0.2129364013671875, -0.20355224609375, -0.1941680908203125, -0.184783935546875, -0.1753997802734375, -0.166015625, -0.1566314697265625, -0.147247314453125, -0.1378631591796875, -0.12847900390625, -0.1190948486328125, -0.109710693359375, -0.1003265380859375, -0.0909423828125, -0.0815582275390625, -0.072174072265625, -0.0627899169921875, -0.05340576171875, -0.0440216064453125, -0.034637451171875, -0.0252532958984375, -0.015869140625, -0.0064849853515625, 0.002899169921875, 0.0122833251953125, 0.02166748046875, 0.0310516357421875, 0.040435791015625, 0.0498199462890625, 0.0592041015625, 0.0685882568359375, 0.077972412109375, 0.0873565673828125, 0.09674072265625, 0.1061248779296875, 0.115509033203125, 0.1248931884765625, 0.13427734375, 0.1436614990234375, 0.153045654296875, 0.1624298095703125, 0.17181396484375, 0.1811981201171875, 0.190582275390625, 0.1999664306640625, 0.2093505859375, 0.2187347412109375, 0.228118896484375, 0.2375030517578125, 0.24688720703125, 0.2562713623046875, 0.265655517578125, 0.2750396728515625, 0.284423828125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 9.0, 35.0, 61.0, 214.0, 448.0, 195.0, 35.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10440338402986526, -0.09808691591024399, -0.09177044034004211, -0.08545397222042084, -0.07913750410079956, -0.07282103598117828, -0.06650456041097641, -0.06018809229135513, -0.05387162044644356, -0.04755514860153198, -0.041238680481910706, -0.03492220863699913, -0.028605738654732704, -0.022289268672466278, -0.015972796827554703, -0.009656328707933426, -0.0033398568630218506, 0.002976613584905863, 0.009293084032833576, 0.015609554946422577, 0.021926024928689003, 0.02824249491095543, 0.034558966755867004, 0.04087543487548828, 0.04719190672039986, 0.05350837856531143, 0.05982484668493271, 0.06614132225513458, 0.07245779037475586, 0.07877425849437714, 0.08509072661399841, 0.09140719473361969, 0.09772367775440216, 0.10404014587402344, 0.11035662144422531, 0.11667308956384659, 0.12298955768346786, 0.12930603325366974, 0.13562250137329102, 0.1419389694929123, 0.14825543761253357, 0.15457190573215485, 0.16088837385177612, 0.1672048568725586, 0.17352132499217987, 0.17983779311180115, 0.18615426123142242, 0.1924707293510437, 0.19878721237182617, 0.20510368049144745, 0.21142014861106873, 0.2177366316318512, 0.22405309975147247, 0.23036956787109375, 0.23668603599071503, 0.2430025041103363, 0.24931897222995758, 0.25563544034957886, 0.26195192337036133, 0.2682683765888214, 0.2745848596096039, 0.28090131282806396, 0.28721779584884644, 0.2935342788696289, 0.299850732088089]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 8.0, 3.0, 6.0, 10.0, 15.0, 15.0, 16.0, 23.0, 15.0, 24.0, 19.0, 29.0, 17.0, 33.0, 30.0, 30.0, 26.0, 59.0, 33.0, 41.0, 36.0, 44.0, 28.0, 42.0, 41.0, 40.0, 33.0, 30.0, 29.0, 29.0, 27.0, 13.0, 20.0, 23.0, 24.0, 18.0, 14.0, 12.0, 16.0, 7.0, 4.0, 9.0, 3.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02394580841064453, -0.023098502308130264, -0.022251196205615997, -0.02140389010310173, -0.020556584000587463, -0.019709277898073196, -0.01886197179555893, -0.018014665693044662, -0.017167359590530396, -0.01632005348801613, -0.015472747385501862, -0.014625441282987595, -0.013778135180473328, -0.01293082907795906, -0.012083522975444794, -0.011236216872930527, -0.01038891077041626, -0.009541604667901993, -0.008694298565387726, -0.007846992462873459, -0.006999686360359192, -0.006152380257844925, -0.005305074155330658, -0.004457768052816391, -0.003610461950302124, -0.002763155847787857, -0.00191584974527359, -0.0010685436427593231, -0.00022123754024505615, 0.0006260685622692108, 0.0014733746647834778, 0.0023206807672977448, 0.0031679868698120117, 0.004015292972326279, 0.004862599074840546, 0.005709905177354813, 0.00655721127986908, 0.0074045173823833466, 0.008251823484897614, 0.00909912958741188, 0.009946435689926147, 0.010793741792440414, 0.011641047894954681, 0.012488353997468948, 0.013335660099983215, 0.014182966202497482, 0.01503027230501175, 0.015877578407526016, 0.016724884510040283, 0.01757219061255455, 0.018419496715068817, 0.019266802817583084, 0.02011410892009735, 0.020961415022611618, 0.021808721125125885, 0.022656027227640152, 0.02350333333015442, 0.024350639432668686, 0.025197945535182953, 0.02604525163769722, 0.026892557740211487, 0.027739863842725754, 0.02858716994524002, 0.029434476047754288, 0.030281782150268555]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 3.0, 8.0, 3.0, 2.0, 14.0, 7.0, 15.0, 16.0, 22.0, 20.0, 33.0, 36.0, 25.0, 38.0, 27.0, 43.0, 49.0, 40.0, 36.0, 43.0, 55.0, 62.0, 39.0, 35.0, 37.0, 34.0, 33.0, 25.0, 29.0, 30.0, 13.0, 22.0, 19.0, 11.0, 10.0, 10.0, 20.0, 6.0, 5.0, 3.0, 8.0, 1.0, 9.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-113.5625, -110.330078125, -107.09765625, -103.865234375, -100.6328125, -97.400390625, -94.16796875, -90.935546875, -87.703125, -84.470703125, -81.23828125, -78.005859375, -74.7734375, -71.541015625, -68.30859375, -65.076171875, -61.84375, -58.611328125, -55.37890625, -52.146484375, -48.9140625, -45.681640625, -42.44921875, -39.216796875, -35.984375, -32.751953125, -29.51953125, -26.287109375, -23.0546875, -19.822265625, -16.58984375, -13.357421875, -10.125, -6.892578125, -3.66015625, -0.427734375, 2.8046875, 6.037109375, 9.26953125, 12.501953125, 15.734375, 18.966796875, 22.19921875, 25.431640625, 28.6640625, 31.896484375, 35.12890625, 38.361328125, 41.59375, 44.826171875, 48.05859375, 51.291015625, 54.5234375, 57.755859375, 60.98828125, 64.220703125, 67.453125, 70.685546875, 73.91796875, 77.150390625, 80.3828125, 83.615234375, 86.84765625, 90.080078125, 93.3125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 9.0, 9.0, 11.0, 16.0, 16.0, 19.0, 25.0, 29.0, 50.0, 53.0, 75.0, 128.0, 173.0, 282.0, 421.0, 712.0, 1321.0, 3020.0, 8485.0, 26752.0, 109766.0, 454466.0, 336853.0, 74866.0, 19453.0, 6203.0, 2439.0, 1108.0, 588.0, 387.0, 233.0, 141.0, 109.0, 77.0, 54.0, 60.0, 37.0, 26.0, 18.0, 16.0, 17.0, 15.0, 11.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.328125, -16.784423828125, -16.24072265625, -15.697021484375, -15.1533203125, -14.609619140625, -14.06591796875, -13.522216796875, -12.978515625, -12.434814453125, -11.89111328125, -11.347412109375, -10.8037109375, -10.260009765625, -9.71630859375, -9.172607421875, -8.62890625, -8.085205078125, -7.54150390625, -6.997802734375, -6.4541015625, -5.910400390625, -5.36669921875, -4.822998046875, -4.279296875, -3.735595703125, -3.19189453125, -2.648193359375, -2.1044921875, -1.560791015625, -1.01708984375, -0.473388671875, 0.0703125, 0.614013671875, 1.15771484375, 1.701416015625, 2.2451171875, 2.788818359375, 3.33251953125, 3.876220703125, 4.419921875, 4.963623046875, 5.50732421875, 6.051025390625, 6.5947265625, 7.138427734375, 7.68212890625, 8.225830078125, 8.76953125, 9.313232421875, 9.85693359375, 10.400634765625, 10.9443359375, 11.488037109375, 12.03173828125, 12.575439453125, 13.119140625, 13.662841796875, 14.20654296875, 14.750244140625, 15.2939453125, 15.837646484375, 16.38134765625, 16.925048828125, 17.46875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 6.0, 6.0, 16.0, 24.0, 22.0, 28.0, 32.0, 56.0, 45.0, 51.0, 79.0, 60.0, 2118.0, 106.0, 69.0, 65.0, 61.0, 46.0, 29.0, 34.0, 29.0, 19.0, 13.0, 10.0, 10.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-208.375, -201.568359375, -194.76171875, -187.955078125, -181.1484375, -174.341796875, -167.53515625, -160.728515625, -153.921875, -147.115234375, -140.30859375, -133.501953125, -126.6953125, -119.888671875, -113.08203125, -106.275390625, -99.46875, -92.662109375, -85.85546875, -79.048828125, -72.2421875, -65.435546875, -58.62890625, -51.822265625, -45.015625, -38.208984375, -31.40234375, -24.595703125, -17.7890625, -10.982421875, -4.17578125, 2.630859375, 9.4375, 16.244140625, 23.05078125, 29.857421875, 36.6640625, 43.470703125, 50.27734375, 57.083984375, 63.890625, 70.697265625, 77.50390625, 84.310546875, 91.1171875, 97.923828125, 104.73046875, 111.537109375, 118.34375, 125.150390625, 131.95703125, 138.763671875, 145.5703125, 152.376953125, 159.18359375, 165.990234375, 172.796875, 179.603515625, 186.41015625, 193.216796875, 200.0234375, 206.830078125, 213.63671875, 220.443359375, 227.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 9.0, 6.0, 16.0, 35.0, 37.0, 58.0, 113.0, 185.0, 370.0, 763.0, 1899.0, 10646.0, 598353.0, 2517830.0, 11785.0, 1935.0, 819.0, 387.0, 200.0, 100.0, 66.0, 47.0, 25.0, 7.0, 11.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.53125, -48.03125, -46.53125, -45.03125, -43.53125, -42.03125, -40.53125, -39.03125, -37.53125, -36.03125, -34.53125, -33.03125, -31.53125, -30.03125, -28.53125, -27.03125, -25.53125, -24.03125, -22.53125, -21.03125, -19.53125, -18.03125, -16.53125, -15.03125, -13.53125, -12.03125, -10.53125, -9.03125, -7.53125, -6.03125, -4.53125, -3.03125, -1.53125, -0.03125, 1.46875, 2.96875, 4.46875, 5.96875, 7.46875, 8.96875, 10.46875, 11.96875, 13.46875, 14.96875, 16.46875, 17.96875, 19.46875, 20.96875, 22.46875, 23.96875, 25.46875, 26.96875, 28.46875, 29.96875, 31.46875, 32.96875, 34.46875, 35.96875, 37.46875, 38.96875, 40.46875, 41.96875, 43.46875, 44.96875, 46.46875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 8.0, 24.0, 119.0, 275.0, 345.0, 145.0, 49.0, 21.0, 9.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-208.8161163330078, -191.63790893554688, -174.45970153808594, -157.281494140625, -140.10330200195312, -122.92508697509766, -105.74688720703125, -88.56867980957031, -71.39047241210938, -54.21226501464844, -37.034061431884766, -19.855857849121094, -2.6776504516601562, 14.500556945800781, 31.678756713867188, 48.856964111328125, 66.03517150878906, 83.21337890625, 100.39158630371094, 117.56978607177734, 134.74798583984375, 151.92620849609375, 169.10440063476562, 186.28260803222656, 203.4608154296875, 220.63902282714844, 237.81723022460938, 254.99542236328125, 272.17364501953125, 289.3518371582031, 306.530029296875, 323.708251953125, 340.88641357421875, 358.0646057128906, 375.2428283691406, 392.4210205078125, 409.5992431640625, 426.7774353027344, 443.95562744140625, 461.13385009765625, 478.31207275390625, 495.4902648925781, 512.66845703125, 529.8466796875, 547.02490234375, 564.203125, 581.3812866210938, 598.5595092773438, 615.7376708984375, 632.9158935546875, 650.0940551757812, 667.2722778320312, 684.4505004882812, 701.6287231445312, 718.806884765625, 735.985107421875, 753.163330078125, 770.341552734375, 787.5197143554688, 804.6979370117188, 821.8761596679688, 839.0543823242188, 856.2325439453125, 873.4107666015625, 890.5889892578125]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 5.0, 5.0, 7.0, 7.0, 8.0, 7.0, 13.0, 13.0, 16.0, 21.0, 32.0, 38.0, 30.0, 38.0, 48.0, 34.0, 44.0, 54.0, 45.0, 49.0, 45.0, 42.0, 36.0, 36.0, 63.0, 40.0, 39.0, 34.0, 27.0, 15.0, 20.0, 18.0, 15.0, 18.0, 9.0, 5.0, 9.0, 13.0, 8.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.4662628173828, -202.9014892578125, -196.3367156982422, -189.77194213867188, -183.20716857910156, -176.64239501953125, -170.07763671875, -163.51284790039062, -156.94808959960938, -150.38331604003906, -143.81854248046875, -137.25376892089844, -130.68899536132812, -124.12422180175781, -117.55945587158203, -110.99468231201172, -104.42990112304688, -97.86512756347656, -91.30035400390625, -84.73558044433594, -78.17080688476562, -71.60603332519531, -65.04126739501953, -58.47649383544922, -51.911720275878906, -45.346946716308594, -38.78217315673828, -32.217403411865234, -25.652629852294922, -19.08785629272461, -12.523086547851562, -5.95831298828125, 0.6064453125, 7.171217918395996, 13.735990524291992, 20.300762176513672, 26.865535736083984, 33.4303092956543, 39.995079040527344, 46.559852600097656, 53.12462615966797, 59.68939971923828, 66.2541732788086, 72.81893920898438, 79.38371276855469, 85.948486328125, 92.51325988769531, 99.07803344726562, 105.64280700683594, 112.20758056640625, 118.77235412597656, 125.33712768554688, 131.9019012451172, 138.4666748046875, 145.03143310546875, 151.59622192382812, 158.16098022460938, 164.7257537841797, 171.29052734375, 177.8553009033203, 184.42007446289062, 190.98484802246094, 197.54962158203125, 204.1143798828125, 210.67916870117188]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 8.0, 8.0, 14.0, 16.0, 20.0, 31.0, 37.0, 40.0, 50.0, 71.0, 110.0, 141.0, 183.0, 257.0, 334.0, 523.0, 789.0, 1294.0, 1040768.0, 1265.0, 721.0, 524.0, 349.0, 250.0, 177.0, 135.0, 119.0, 64.0, 53.0, 33.0, 34.0, 36.0, 23.0, 7.0, 8.0, 15.0, 9.0, 8.0, 1.0, 2.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-68.3751449584961, -66.1307144165039, -63.88628387451172, -61.64185333251953, -59.397422790527344, -57.152992248535156, -54.9085578918457, -52.664127349853516, -50.41969680786133, -48.17526626586914, -45.93083572387695, -43.686405181884766, -41.44197082519531, -39.197540283203125, -36.95310974121094, -34.70867919921875, -32.46424865722656, -30.219818115234375, -27.975387573242188, -25.730955123901367, -23.48652458190918, -21.242094039916992, -18.997661590576172, -16.753231048583984, -14.508800506591797, -12.26436996459961, -10.019938468933105, -7.77550745010376, -5.531076431274414, -3.2866458892822266, -1.0422143936157227, 1.2022171020507812, 3.4466552734375, 5.691086292266846, 7.935517311096191, 10.179948806762695, 12.424379348754883, 14.66880989074707, 16.91324234008789, 19.157672882080078, 21.402103424072266, 23.646533966064453, 25.89096450805664, 28.13539695739746, 30.37982749938965, 32.62425994873047, 34.868690490722656, 37.113121032714844, 39.35755157470703, 41.60198211669922, 43.846412658691406, 46.090843200683594, 48.33527374267578, 50.57970428466797, 52.82413864135742, 55.06856918334961, 57.3129997253418, 59.557430267333984, 61.80186080932617, 64.04629516601562, 66.29072570800781, 68.53515625, 70.77958679199219, 73.02401733398438, 75.26844787597656]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 0.0, 4.0, 5.0, 18.0, 15.0, 15.0, 23.0, 64.0, 125.0, 51436560.0, 26224.0, 72.0, 48.0, 17.0, 11.0, 9.0, 5.0, 2.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2635.649169921875, -2541.3642578125, -2447.0791015625, -2352.7939453125, -2258.509033203125, -2164.22412109375, -2069.93896484375, -1975.6539306640625, -1881.368896484375, -1787.0838623046875, -1692.798828125, -1598.5137939453125, -1504.228759765625, -1409.9437255859375, -1315.65869140625, -1221.3736572265625, -1127.088623046875, -1032.8035888671875, -938.5185546875, -844.2335205078125, -749.948486328125, -655.6634521484375, -561.37841796875, -467.0933837890625, -372.808349609375, -278.5233154296875, -184.23828125, -89.9532470703125, 4.331787109375, 98.6168212890625, 192.90185546875, 287.1868896484375, 381.471923828125, 475.7569580078125, 570.0419921875, 664.3270263671875, 758.612060546875, 852.8970947265625, 947.18212890625, 1041.4671630859375, 1135.752197265625, 1230.0372314453125, 1324.322265625, 1418.6072998046875, 1512.892333984375, 1607.1773681640625, 1701.46240234375, 1795.7474365234375, 1890.032470703125, 1984.3175048828125, 2078.6025390625, 2172.8876953125, 2267.172607421875, 2361.45751953125, 2455.74267578125, 2550.02783203125, 2644.312744140625, 2738.59765625, 2832.8828125, 2927.16796875, 3021.452880859375, 3115.73779296875, 3210.02294921875, 3304.30810546875, 3398.593017578125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 6.0, 11.0, 3.0, 13.0, 18.0, 25.0, 46.0, 60.0, 78.0, 122.0, 204.0, 260.0, 352.0, 484.0, 714.0, 1110.0, 1584.0, 2194.0, 3108.0, 4722.0, 7062.0, 10433.0, 15966.0, 24337.0, 37573.0, 60190.0, 97009.0, 161106.0, 266758.0, 412008.0, 3164188.0, 1013206.0, 378992.0, 239682.0, 144758.0, 87484.0, 54618.0, 34385.0, 22245.0, 14476.0, 9521.0, 6540.0, 4341.0, 2924.0, 2013.0, 1344.0, 962.0, 686.0, 446.0, 303.0, 232.0, 170.0, 132.0, 89.0, 59.0, 16.0, 17.0, 22.0, 17.0, 16.0, 7.0, 5.0, 3.0], "bins": [-2.04296875, -1.978912353515625, -1.91485595703125, -1.850799560546875, -1.7867431640625, -1.722686767578125, -1.65863037109375, -1.594573974609375, -1.530517578125, -1.466461181640625, -1.40240478515625, -1.338348388671875, -1.2742919921875, -1.210235595703125, -1.14617919921875, -1.082122802734375, -1.01806640625, -0.954010009765625, -0.88995361328125, -0.825897216796875, -0.7618408203125, -0.697784423828125, -0.63372802734375, -0.569671630859375, -0.505615234375, -0.441558837890625, -0.37750244140625, -0.313446044921875, -0.2493896484375, -0.185333251953125, -0.12127685546875, -0.057220458984375, 0.0068359375, 0.070892333984375, 0.13494873046875, 0.199005126953125, 0.2630615234375, 0.327117919921875, 0.39117431640625, 0.455230712890625, 0.519287109375, 0.583343505859375, 0.64739990234375, 0.711456298828125, 0.7755126953125, 0.839569091796875, 0.90362548828125, 0.967681884765625, 1.03173828125, 1.095794677734375, 1.15985107421875, 1.223907470703125, 1.2879638671875, 1.352020263671875, 1.41607666015625, 1.480133056640625, 1.544189453125, 1.608245849609375, 1.67230224609375, 1.736358642578125, 1.8004150390625, 1.864471435546875, 1.92852783203125, 1.992584228515625, 2.056640625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 6.0, 4.0, 7.0, 6.0, 9.0, 2.0, 12.0, 10.0, 11.0, 12.0, 14.0, 19.0, 18.0, 18.0, 17.0, 22.0, 20.0, 32.0, 36.0, 42.0, 34.0, 34.0, 36.0, 34.0, 130.0, 846.0, 145.0, 38.0, 25.0, 34.0, 36.0, 38.0, 20.0, 28.0, 30.0, 20.0, 19.0, 23.0, 25.0, 17.0, 17.0, 17.0, 8.0, 9.0, 11.0, 8.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 5.0, 1.0, 3.0], "bins": [-17.84375, -17.2763671875, -16.708984375, -16.1416015625, -15.57421875, -15.0068359375, -14.439453125, -13.8720703125, -13.3046875, -12.7373046875, -12.169921875, -11.6025390625, -11.03515625, -10.4677734375, -9.900390625, -9.3330078125, -8.765625, -8.1982421875, -7.630859375, -7.0634765625, -6.49609375, -5.9287109375, -5.361328125, -4.7939453125, -4.2265625, -3.6591796875, -3.091796875, -2.5244140625, -1.95703125, -1.3896484375, -0.822265625, -0.2548828125, 0.3125, 0.8798828125, 1.447265625, 2.0146484375, 2.58203125, 3.1494140625, 3.716796875, 4.2841796875, 4.8515625, 5.4189453125, 5.986328125, 6.5537109375, 7.12109375, 7.6884765625, 8.255859375, 8.8232421875, 9.390625, 9.9580078125, 10.525390625, 11.0927734375, 11.66015625, 12.2275390625, 12.794921875, 13.3623046875, 13.9296875, 14.4970703125, 15.064453125, 15.6318359375, 16.19921875, 16.7666015625, 17.333984375, 17.9013671875, 18.46875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 7.0, 11.0, 15.0, 20.0, 32.0, 47.0, 84.0, 119.0, 188.0, 246.0, 397.0, 675.0, 978.0, 1539.0, 2548.0, 4100.0, 6430.0, 10448.0, 16949.0, 27420.0, 44406.0, 72342.0, 118071.0, 192147.0, 296640.0, 418137.0, 3475598.0, 612463.0, 356863.0, 240890.0, 150864.0, 92523.0, 56730.0, 35196.0, 21383.0, 13190.0, 8177.0, 5030.0, 3110.0, 1951.0, 1234.0, 738.0, 520.0, 353.0, 202.0, 146.0, 96.0, 52.0, 46.0, 28.0, 19.0, 16.0, 7.0, 7.0, 8.0, 3.0, 2.0], "bins": [-1.7060546875, -1.6555023193359375, -1.604949951171875, -1.5543975830078125, -1.50384521484375, -1.4532928466796875, -1.402740478515625, -1.3521881103515625, -1.3016357421875, -1.2510833740234375, -1.200531005859375, -1.1499786376953125, -1.09942626953125, -1.0488739013671875, -0.998321533203125, -0.9477691650390625, -0.897216796875, -0.8466644287109375, -0.796112060546875, -0.7455596923828125, -0.69500732421875, -0.6444549560546875, -0.593902587890625, -0.5433502197265625, -0.4927978515625, -0.4422454833984375, -0.391693115234375, -0.3411407470703125, -0.29058837890625, -0.2400360107421875, -0.189483642578125, -0.1389312744140625, -0.08837890625, -0.0378265380859375, 0.012725830078125, 0.0632781982421875, 0.11383056640625, 0.1643829345703125, 0.214935302734375, 0.2654876708984375, 0.3160400390625, 0.3665924072265625, 0.417144775390625, 0.4676971435546875, 0.51824951171875, 0.5688018798828125, 0.619354248046875, 0.6699066162109375, 0.720458984375, 0.7710113525390625, 0.821563720703125, 0.8721160888671875, 0.92266845703125, 0.9732208251953125, 1.023773193359375, 1.0743255615234375, 1.1248779296875, 1.1754302978515625, 1.225982666015625, 1.2765350341796875, 1.32708740234375, 1.3776397705078125, 1.428192138671875, 1.4787445068359375, 1.529296875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 7.0, 2.0, 4.0, 7.0, 2.0, 6.0, 12.0, 14.0, 8.0, 20.0, 19.0, 17.0, 24.0, 27.0, 29.0, 28.0, 27.0, 34.0, 41.0, 41.0, 41.0, 41.0, 79.0, 972.0, 98.0, 35.0, 35.0, 39.0, 40.0, 34.0, 35.0, 29.0, 25.0, 23.0, 27.0, 27.0, 12.0, 12.0, 16.0, 14.0, 5.0, 6.0, 6.0, 3.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.9140625, -14.3897705078125, -13.865478515625, -13.3411865234375, -12.81689453125, -12.2926025390625, -11.768310546875, -11.2440185546875, -10.7197265625, -10.1954345703125, -9.671142578125, -9.1468505859375, -8.62255859375, -8.0982666015625, -7.573974609375, -7.0496826171875, -6.525390625, -6.0010986328125, -5.476806640625, -4.9525146484375, -4.42822265625, -3.9039306640625, -3.379638671875, -2.8553466796875, -2.3310546875, -1.8067626953125, -1.282470703125, -0.7581787109375, -0.23388671875, 0.2904052734375, 0.814697265625, 1.3389892578125, 1.86328125, 2.3875732421875, 2.911865234375, 3.4361572265625, 3.96044921875, 4.4847412109375, 5.009033203125, 5.5333251953125, 6.0576171875, 6.5819091796875, 7.106201171875, 7.6304931640625, 8.15478515625, 8.6790771484375, 9.203369140625, 9.7276611328125, 10.251953125, 10.7762451171875, 11.300537109375, 11.8248291015625, 12.34912109375, 12.8734130859375, 13.397705078125, 13.9219970703125, 14.4462890625, 14.9705810546875, 15.494873046875, 16.0191650390625, 16.54345703125, 17.0677490234375, 17.592041015625, 18.1163330078125, 18.640625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 7.0, 11.0, 18.0, 10.0, 23.0, 44.0, 43.0, 75.0, 93.0, 162.0, 199.0, 300.0, 412.0, 650.0, 882.0, 1325.0, 1988.0, 3033.0, 4553.0, 7174.0, 11100.0, 17320.0, 27974.0, 44461.0, 71650.0, 123970.0, 5609537.0, 149308.0, 80058.0, 49346.0, 31318.0, 19730.0, 12180.0, 7589.0, 5005.0, 3283.0, 2162.0, 1421.0, 941.0, 618.0, 408.0, 300.0, 196.0, 167.0, 129.0, 75.0, 67.0, 32.0, 25.0, 23.0, 13.0, 4.0, 5.0, 9.0, 8.0, 2.0, 3.0], "bins": [-3.751953125, -3.64031982421875, -3.5286865234375, -3.41705322265625, -3.305419921875, -3.19378662109375, -3.0821533203125, -2.97052001953125, -2.85888671875, -2.74725341796875, -2.6356201171875, -2.52398681640625, -2.412353515625, -2.30072021484375, -2.1890869140625, -2.07745361328125, -1.9658203125, -1.85418701171875, -1.7425537109375, -1.63092041015625, -1.519287109375, -1.40765380859375, -1.2960205078125, -1.18438720703125, -1.07275390625, -0.96112060546875, -0.8494873046875, -0.73785400390625, -0.626220703125, -0.51458740234375, -0.4029541015625, -0.29132080078125, -0.1796875, -0.06805419921875, 0.0435791015625, 0.15521240234375, 0.266845703125, 0.37847900390625, 0.4901123046875, 0.60174560546875, 0.71337890625, 0.82501220703125, 0.9366455078125, 1.04827880859375, 1.159912109375, 1.27154541015625, 1.3831787109375, 1.49481201171875, 1.6064453125, 1.71807861328125, 1.8297119140625, 1.94134521484375, 2.052978515625, 2.16461181640625, 2.2762451171875, 2.38787841796875, 2.49951171875, 2.61114501953125, 2.7227783203125, 2.83441162109375, 2.946044921875, 3.05767822265625, 3.1693115234375, 3.28094482421875, 3.392578125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 1.0, 10.0, 5.0, 5.0, 16.0, 11.0, 11.0, 16.0, 17.0, 18.0, 26.0, 27.0, 24.0, 27.0, 34.0, 28.0, 31.0, 37.0, 51.0, 39.0, 45.0, 802.0, 290.0, 44.0, 37.0, 37.0, 45.0, 38.0, 36.0, 31.0, 26.0, 24.0, 23.0, 21.0, 17.0, 10.0, 8.0, 21.0, 10.0, 5.0, 8.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.03125, -12.608154296875, -12.18505859375, -11.761962890625, -11.3388671875, -10.915771484375, -10.49267578125, -10.069580078125, -9.646484375, -9.223388671875, -8.80029296875, -8.377197265625, -7.9541015625, -7.531005859375, -7.10791015625, -6.684814453125, -6.26171875, -5.838623046875, -5.41552734375, -4.992431640625, -4.5693359375, -4.146240234375, -3.72314453125, -3.300048828125, -2.876953125, -2.453857421875, -2.03076171875, -1.607666015625, -1.1845703125, -0.761474609375, -0.33837890625, 0.084716796875, 0.5078125, 0.930908203125, 1.35400390625, 1.777099609375, 2.2001953125, 2.623291015625, 3.04638671875, 3.469482421875, 3.892578125, 4.315673828125, 4.73876953125, 5.161865234375, 5.5849609375, 6.008056640625, 6.43115234375, 6.854248046875, 7.27734375, 7.700439453125, 8.12353515625, 8.546630859375, 8.9697265625, 9.392822265625, 9.81591796875, 10.239013671875, 10.662109375, 11.085205078125, 11.50830078125, 11.931396484375, 12.3544921875, 12.777587890625, 13.20068359375, 13.623779296875, 14.046875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 5.0, 21.0, 63.0, 144.0, 316.0, 279.0, 101.0, 34.0, 23.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.8656234741211, -85.40959167480469, -82.95355224609375, -80.49751281738281, -78.0414810180664, -75.58544921875, -73.12940979003906, -70.67337036132812, -68.21733856201172, -65.76130676269531, -63.305267333984375, -60.8492317199707, -58.39319610595703, -55.93716049194336, -53.48112487792969, -51.025089263916016, -48.569053649902344, -46.11301803588867, -43.656982421875, -41.20094680786133, -38.744911193847656, -36.288875579833984, -33.83283996582031, -31.37680435180664, -28.92076873779297, -26.464733123779297, -24.008697509765625, -21.552661895751953, -19.09662628173828, -16.64059066772461, -14.184555053710938, -11.728519439697266, -9.272476196289062, -6.816440582275391, -4.360404968261719, -1.9043693542480469, 0.551666259765625, 3.007701873779297, 5.463737487792969, 7.919773101806641, 10.375808715820312, 12.831844329833984, 15.287879943847656, 17.743915557861328, 20.199951171875, 22.655986785888672, 25.112022399902344, 27.568058013916016, 30.024093627929688, 32.48012924194336, 34.93616485595703, 37.3922004699707, 39.848236083984375, 42.30427169799805, 44.76030731201172, 47.21634292602539, 49.67237854003906, 52.128414154052734, 54.584449768066406, 57.04048538208008, 59.49652099609375, 61.95255661010742, 64.4085922241211, 66.8646240234375, 69.32066345214844]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 1.0, 5.0, 6.0, 9.0, 9.0, 13.0, 13.0, 26.0, 22.0, 31.0, 34.0, 32.0, 48.0, 43.0, 49.0, 42.0, 59.0, 49.0, 52.0, 38.0, 43.0, 42.0, 47.0, 34.0, 42.0, 41.0, 24.0, 33.0, 26.0, 17.0, 21.0, 5.0, 16.0, 10.0, 4.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.56077575683594, -41.389495849609375, -40.21821975708008, -39.046939849853516, -37.87565994262695, -36.704383850097656, -35.533103942871094, -34.36182403564453, -33.19054412841797, -32.019264221191406, -30.847986221313477, -29.676708221435547, -28.505428314208984, -27.334150314331055, -26.162872314453125, -24.991592407226562, -23.820316314697266, -22.649038314819336, -21.477758407592773, -20.306480407714844, -19.13520050048828, -17.96392250061035, -16.792644500732422, -15.621365547180176, -14.45008659362793, -13.278807640075684, -12.107528686523438, -10.936250686645508, -9.764971733093262, -8.593692779541016, -7.422414302825928, -6.25113582611084, -5.079856872558594, -3.9085781574249268, -2.7372994422912598, -1.5660207271575928, -0.3947420120239258, 0.7765369415283203, 1.9478154182434082, 3.119093894958496, 4.290372848510742, 5.461651802062988, 6.632930278778076, 7.804208755493164, 8.97548770904541, 10.146766662597656, 11.318044662475586, 12.489323616027832, 13.660602569580078, 14.831881523132324, 16.00316047668457, 17.1744384765625, 18.345718383789062, 19.516996383666992, 20.688274383544922, 21.859554290771484, 23.030832290649414, 24.202110290527344, 25.373390197753906, 26.544668197631836, 27.715946197509766, 28.887226104736328, 30.058504104614258, 31.229782104492188, 32.40106201171875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 1.0, 8.0, 5.0, 9.0, 7.0, 10.0, 20.0, 29.0, 37.0, 66.0, 60.0, 148.0, 172.0, 363.0, 664.0, 1347.0, 2929.0, 8087.0, 39112.0, 4018355.0, 102597.0, 13263.0, 3880.0, 1591.0, 710.0, 333.0, 193.0, 112.0, 60.0, 36.0, 26.0, 12.0, 11.0, 4.0, 8.0, 3.0, 4.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44384765625, -0.428375244140625, -0.41290283203125, -0.397430419921875, -0.3819580078125, -0.366485595703125, -0.35101318359375, -0.335540771484375, -0.320068359375, -0.304595947265625, -0.28912353515625, -0.273651123046875, -0.2581787109375, -0.242706298828125, -0.22723388671875, -0.211761474609375, -0.1962890625, -0.180816650390625, -0.16534423828125, -0.149871826171875, -0.1343994140625, -0.118927001953125, -0.10345458984375, -0.087982177734375, -0.072509765625, -0.057037353515625, -0.04156494140625, -0.026092529296875, -0.0106201171875, 0.004852294921875, 0.02032470703125, 0.035797119140625, 0.05126953125, 0.066741943359375, 0.08221435546875, 0.097686767578125, 0.1131591796875, 0.128631591796875, 0.14410400390625, 0.159576416015625, 0.175048828125, 0.190521240234375, 0.20599365234375, 0.221466064453125, 0.2369384765625, 0.252410888671875, 0.26788330078125, 0.283355712890625, 0.298828125, 0.314300537109375, 0.32977294921875, 0.345245361328125, 0.3607177734375, 0.376190185546875, 0.39166259765625, 0.407135009765625, 0.422607421875, 0.438079833984375, 0.45355224609375, 0.469024658203125, 0.4844970703125, 0.499969482421875, 0.51544189453125, 0.530914306640625, 0.54638671875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 4.0, 6.0, 4.0, 7.0, 9.0, 14.0, 11.0, 13.0, 11.0, 23.0, 751.0, 37.0, 19.0, 11.0, 6.0, 12.0, 11.0, 7.0, 6.0, 7.0, 7.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.17529296875, -0.17037391662597656, -0.16545486450195312, -0.1605358123779297, -0.15561676025390625, -0.1506977081298828, -0.14577865600585938, -0.14085960388183594, -0.1359405517578125, -0.13102149963378906, -0.12610244750976562, -0.12118339538574219, -0.11626434326171875, -0.11134529113769531, -0.10642623901367188, -0.10150718688964844, -0.096588134765625, -0.09166908264160156, -0.08675003051757812, -0.08183097839355469, -0.07691192626953125, -0.07199287414550781, -0.06707382202148438, -0.06215476989746094, -0.0572357177734375, -0.05231666564941406, -0.047397613525390625, -0.04247856140136719, -0.03755950927734375, -0.03264045715332031, -0.027721405029296875, -0.022802352905273438, -0.01788330078125, -0.012964248657226562, -0.008045196533203125, -0.0031261444091796875, 0.00179290771484375, 0.0067119598388671875, 0.011631011962890625, 0.016550064086914062, 0.0214691162109375, 0.026388168334960938, 0.031307220458984375, 0.03622627258300781, 0.04114532470703125, 0.04606437683105469, 0.050983428955078125, 0.05590248107910156, 0.060821533203125, 0.06574058532714844, 0.07065963745117188, 0.07557868957519531, 0.08049774169921875, 0.08541679382324219, 0.09033584594726562, 0.09525489807128906, 0.1001739501953125, 0.10509300231933594, 0.11001205444335938, 0.11493110656738281, 0.11985015869140625, 0.12476921081542969, 0.12968826293945312, 0.13460731506347656, 0.1395263671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 3.0, 5.0, 16.0, 18.0, 26.0, 38.0, 70.0, 120.0, 212.0, 370.0, 609.0, 1162.0, 2348.0, 4996.0, 11625.0, 33125.0, 155212.0, 3092514.0, 779167.0, 77507.0, 20900.0, 7443.0, 3272.0, 1503.0, 811.0, 445.0, 279.0, 174.0, 111.0, 50.0, 42.0, 31.0, 19.0, 15.0, 11.0, 12.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.350341796875, -0.3408203125, -0.331298828125, -0.32177734375, -0.312255859375, -0.302734375, -0.293212890625, -0.28369140625, -0.274169921875, -0.2646484375, -0.255126953125, -0.24560546875, -0.236083984375, -0.2265625, -0.217041015625, -0.20751953125, -0.197998046875, -0.1884765625, -0.178955078125, -0.16943359375, -0.159912109375, -0.150390625, -0.140869140625, -0.13134765625, -0.121826171875, -0.1123046875, -0.102783203125, -0.09326171875, -0.083740234375, -0.07421875, -0.064697265625, -0.05517578125, -0.045654296875, -0.0361328125, -0.026611328125, -0.01708984375, -0.007568359375, 0.001953125, 0.011474609375, 0.02099609375, 0.030517578125, 0.0400390625, 0.049560546875, 0.05908203125, 0.068603515625, 0.078125, 0.087646484375, 0.09716796875, 0.106689453125, 0.1162109375, 0.125732421875, 0.13525390625, 0.144775390625, 0.154296875, 0.163818359375, 0.17333984375, 0.182861328125, 0.1923828125, 0.201904296875, 0.21142578125, 0.220947265625, 0.23046875, 0.239990234375, 0.24951171875, 0.259033203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 10.0, 7.0, 3.0, 6.0, 11.0, 12.0, 15.0, 20.0, 40.0, 45.0, 75.0, 169.0, 299.0, 841.0, 1364.0, 557.0, 223.0, 114.0, 75.0, 66.0, 31.0, 25.0, 13.0, 15.0, 10.0, 5.0, 2.0, 3.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.145263671875, -0.1399364471435547, -0.13460922241210938, -0.12928199768066406, -0.12395477294921875, -0.11862754821777344, -0.11330032348632812, -0.10797309875488281, -0.1026458740234375, -0.09731864929199219, -0.09199142456054688, -0.08666419982910156, -0.08133697509765625, -0.07600975036621094, -0.07068252563476562, -0.06535530090332031, -0.060028076171875, -0.05470085144042969, -0.049373626708984375, -0.04404640197753906, -0.03871917724609375, -0.03339195251464844, -0.028064727783203125, -0.022737503051757812, -0.0174102783203125, -0.012083053588867188, -0.006755828857421875, -0.0014286041259765625, 0.00389862060546875, 0.009225845336914062, 0.014553070068359375, 0.019880294799804688, 0.02520751953125, 0.030534744262695312, 0.035861968994140625, 0.04118919372558594, 0.04651641845703125, 0.05184364318847656, 0.057170867919921875, 0.06249809265136719, 0.0678253173828125, 0.07315254211425781, 0.07847976684570312, 0.08380699157714844, 0.08913421630859375, 0.09446144104003906, 0.09978866577148438, 0.10511589050292969, 0.110443115234375, 0.11577033996582031, 0.12109756469726562, 0.12642478942871094, 0.13175201416015625, 0.13707923889160156, 0.14240646362304688, 0.1477336883544922, 0.1530609130859375, 0.1583881378173828, 0.16371536254882812, 0.16904258728027344, 0.17436981201171875, 0.17969703674316406, 0.18502426147460938, 0.1903514862060547, 0.1956787109375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 18.0, 108.0, 481.0, 327.0, 53.0, 12.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.786720037460327, -3.716315269470215, -3.6459105014801025, -3.5755057334899902, -3.505100965499878, -3.4346961975097656, -3.3642914295196533, -3.293886661529541, -3.223482131958008, -3.1530773639678955, -3.082672595977783, -3.012267827987671, -2.9418630599975586, -2.8714582920074463, -2.801053524017334, -2.730648994445801, -2.6602439880371094, -2.589839220046997, -2.5194344520568848, -2.4490296840667725, -2.37862491607666, -2.308220148086548, -2.2378153800964355, -2.1674108505249023, -2.097005844116211, -2.0266010761260986, -1.9561963081359863, -1.885791540145874, -1.8153867721557617, -1.7449820041656494, -1.6745773553848267, -1.6041725873947144, -1.5337679386138916, -1.4633631706237793, -1.392958402633667, -1.3225536346435547, -1.2521488666534424, -1.18174409866333, -1.1113394498825073, -1.040934681892395, -0.9705298542976379, -0.9001250863075256, -0.8297203779220581, -0.7593156099319458, -0.6889108419418335, -0.6185060739517212, -0.5481013059616089, -0.47769659757614136, -0.40729182958602905, -0.33688706159591675, -0.26648232340812683, -0.19607757031917572, -0.1256728172302246, -0.055268049240112305, 0.015136688947677612, 0.08554142713546753, 0.15594619512557983, 0.22635094821453094, 0.29675570130348206, 0.367160439491272, 0.4375652074813843, 0.5079699754714966, 0.5783747434616089, 0.6487794518470764, 0.7191842198371887]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 10.0, 2.0, 9.0, 11.0, 14.0, 20.0, 30.0, 36.0, 40.0, 66.0, 63.0, 63.0, 67.0, 75.0, 79.0, 70.0, 78.0, 54.0, 46.0, 44.0, 37.0, 20.0, 16.0, 20.0, 14.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.6763163208961487, -0.6550523042678833, -0.6337883472442627, -0.6125243306159973, -0.5912603139877319, -0.5699962973594666, -0.5487322807312012, -0.5274683237075806, -0.5062043070793152, -0.4849402904510498, -0.4636763036251068, -0.4424123167991638, -0.42114830017089844, -0.39988428354263306, -0.37862029671669006, -0.35735630989074707, -0.3360922932624817, -0.3148282766342163, -0.2935642898082733, -0.2723003029823303, -0.25103628635406494, -0.22977228462696075, -0.20850828289985657, -0.18724428117275238, -0.1659802794456482, -0.144716277718544, -0.12345227599143982, -0.10218827426433563, -0.08092427253723145, -0.05966027081012726, -0.03839626908302307, -0.017132267355918884, 0.004131793975830078, 0.025395795702934265, 0.04665979743003845, 0.06792379915714264, 0.08918780088424683, 0.11045180261135101, 0.1317158043384552, 0.1529798060655594, 0.17424380779266357, 0.19550780951976776, 0.21677181124687195, 0.23803581297397614, 0.2592998147010803, 0.2805638313293457, 0.3018278181552887, 0.3230918049812317, 0.34435582160949707, 0.36561983823776245, 0.38688382506370544, 0.40814781188964844, 0.4294118285179138, 0.4506758451461792, 0.4719398319721222, 0.4932038187980652, 0.5144678354263306, 0.535731852054596, 0.5569958686828613, 0.5782598257064819, 0.5995238423347473, 0.6207878589630127, 0.6420518159866333, 0.6633158326148987, 0.6845798492431641]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 3.0, 5.0, 6.0, 11.0, 15.0, 21.0, 40.0, 41.0, 65.0, 68.0, 130.0, 169.0, 274.0, 449.0, 672.0, 1157.0, 2015.0, 3678.0, 6718.0, 14294.0, 33401.0, 845278.0, 90388.0, 25353.0, 11327.0, 5641.0, 2948.0, 1681.0, 1000.0, 534.0, 385.0, 245.0, 165.0, 105.0, 68.0, 51.0, 38.0, 18.0, 25.0, 21.0, 12.0, 17.0, 12.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.82080078125, -0.7923507690429688, -0.7639007568359375, -0.7354507446289062, -0.707000732421875, -0.6785507202148438, -0.6501007080078125, -0.6216506958007812, -0.59320068359375, -0.5647506713867188, -0.5363006591796875, -0.5078506469726562, -0.479400634765625, -0.45095062255859375, -0.4225006103515625, -0.39405059814453125, -0.3656005859375, -0.33715057373046875, -0.3087005615234375, -0.28025054931640625, -0.251800537109375, -0.22335052490234375, -0.1949005126953125, -0.16645050048828125, -0.13800048828125, -0.10955047607421875, -0.0811004638671875, -0.05265045166015625, -0.024200439453125, 0.00424957275390625, 0.0326995849609375, 0.06114959716796875, 0.089599609375, 0.11804962158203125, 0.1464996337890625, 0.17494964599609375, 0.203399658203125, 0.23184967041015625, 0.2602996826171875, 0.28874969482421875, 0.31719970703125, 0.34564971923828125, 0.3740997314453125, 0.40254974365234375, 0.430999755859375, 0.45944976806640625, 0.4878997802734375, 0.5163497924804688, 0.5447998046875, 0.5732498168945312, 0.6016998291015625, 0.6301498413085938, 0.658599853515625, 0.6870498657226562, 0.7154998779296875, 0.7439498901367188, 0.77239990234375, 0.8008499145507812, 0.8292999267578125, 0.8577499389648438, 0.886199951171875, 0.9146499633789062, 0.9430999755859375, 0.9715499877929688, 1.0]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 6.0, 9.0, 11.0, 9.0, 12.0, 18.0, 15.0, 269.0, 516.0, 22.0, 12.0, 14.0, 5.0, 10.0, 13.0, 5.0, 4.0, 8.0, 5.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.164306640625, -0.15961074829101562, -0.15491485595703125, -0.15021896362304688, -0.1455230712890625, -0.14082717895507812, -0.13613128662109375, -0.13143539428710938, -0.126739501953125, -0.12204360961914062, -0.11734771728515625, -0.11265182495117188, -0.1079559326171875, -0.10326004028320312, -0.09856414794921875, -0.09386825561523438, -0.08917236328125, -0.08447647094726562, -0.07978057861328125, -0.07508468627929688, -0.0703887939453125, -0.06569290161132812, -0.06099700927734375, -0.056301116943359375, -0.051605224609375, -0.046909332275390625, -0.04221343994140625, -0.037517547607421875, -0.0328216552734375, -0.028125762939453125, -0.02342987060546875, -0.018733978271484375, -0.0140380859375, -0.009342193603515625, -0.00464630126953125, 4.9591064453125e-05, 0.0047454833984375, 0.009441375732421875, 0.01413726806640625, 0.018833160400390625, 0.023529052734375, 0.028224945068359375, 0.03292083740234375, 0.037616729736328125, 0.0423126220703125, 0.047008514404296875, 0.05170440673828125, 0.056400299072265625, 0.06109619140625, 0.06579208374023438, 0.07048797607421875, 0.07518386840820312, 0.0798797607421875, 0.08457565307617188, 0.08927154541015625, 0.09396743774414062, 0.098663330078125, 0.10335922241210938, 0.10805511474609375, 0.11275100708007812, 0.1174468994140625, 0.12214279174804688, 0.12683868408203125, 0.13153457641601562, 0.13623046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 9.0, 3.0, 8.0, 20.0, 16.0, 22.0, 37.0, 45.0, 55.0, 90.0, 126.0, 177.0, 260.0, 441.0, 646.0, 1163.0, 2092.0, 3888.0, 7631.0, 16006.0, 35130.0, 82991.0, 199821.0, 343872.0, 202017.0, 83255.0, 35296.0, 16255.0, 7788.0, 4066.0, 2157.0, 1151.0, 708.0, 412.0, 276.0, 176.0, 115.0, 87.0, 59.0, 44.0, 42.0, 26.0, 30.0, 11.0, 8.0, 10.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.36376953125, -0.3522224426269531, -0.34067535400390625, -0.3291282653808594, -0.3175811767578125, -0.3060340881347656, -0.29448699951171875, -0.2829399108886719, -0.271392822265625, -0.2598457336425781, -0.24829864501953125, -0.23675155639648438, -0.2252044677734375, -0.21365737915039062, -0.20211029052734375, -0.19056320190429688, -0.17901611328125, -0.16746902465820312, -0.15592193603515625, -0.14437484741210938, -0.1328277587890625, -0.12128067016601562, -0.10973358154296875, -0.09818649291992188, -0.086639404296875, -0.07509231567382812, -0.06354522705078125, -0.051998138427734375, -0.0404510498046875, -0.028903961181640625, -0.01735687255859375, -0.005809783935546875, 0.0057373046875, 0.017284393310546875, 0.02883148193359375, 0.040378570556640625, 0.0519256591796875, 0.06347274780273438, 0.07501983642578125, 0.08656692504882812, 0.098114013671875, 0.10966110229492188, 0.12120819091796875, 0.13275527954101562, 0.1443023681640625, 0.15584945678710938, 0.16739654541015625, 0.17894363403320312, 0.19049072265625, 0.20203781127929688, 0.21358489990234375, 0.22513198852539062, 0.2366790771484375, 0.24822616577148438, 0.25977325439453125, 0.2713203430175781, 0.282867431640625, 0.2944145202636719, 0.30596160888671875, 0.3175086975097656, 0.3290557861328125, 0.3406028747558594, 0.35214996337890625, 0.3636970520019531, 0.375244140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 9.0, 7.0, 15.0, 13.0, 9.0, 18.0, 16.0, 18.0, 21.0, 24.0, 29.0, 32.0, 31.0, 31.0, 37.0, 45.0, 45.0, 48.0, 39.0, 35.0, 43.0, 40.0, 55.0, 43.0, 38.0, 35.0, 27.0, 33.0, 15.0, 26.0, 22.0, 17.0, 20.0, 11.0, 13.0, 10.0, 6.0, 9.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.537109375, -0.5199966430664062, -0.5028839111328125, -0.48577117919921875, -0.468658447265625, -0.45154571533203125, -0.4344329833984375, -0.41732025146484375, -0.40020751953125, -0.38309478759765625, -0.3659820556640625, -0.34886932373046875, -0.331756591796875, -0.31464385986328125, -0.2975311279296875, -0.28041839599609375, -0.2633056640625, -0.24619293212890625, -0.2290802001953125, -0.21196746826171875, -0.194854736328125, -0.17774200439453125, -0.1606292724609375, -0.14351654052734375, -0.12640380859375, -0.10929107666015625, -0.0921783447265625, -0.07506561279296875, -0.057952880859375, -0.04084014892578125, -0.0237274169921875, -0.00661468505859375, 0.010498046875, 0.02761077880859375, 0.0447235107421875, 0.06183624267578125, 0.078948974609375, 0.09606170654296875, 0.1131744384765625, 0.13028717041015625, 0.14739990234375, 0.16451263427734375, 0.1816253662109375, 0.19873809814453125, 0.215850830078125, 0.23296356201171875, 0.2500762939453125, 0.26718902587890625, 0.2843017578125, 0.30141448974609375, 0.3185272216796875, 0.33563995361328125, 0.352752685546875, 0.36986541748046875, 0.3869781494140625, 0.40409088134765625, 0.42120361328125, 0.43831634521484375, 0.4554290771484375, 0.47254180908203125, 0.489654541015625, 0.5067672729492188, 0.5238800048828125, 0.5409927368164062, 0.55810546875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 7.0, 13.0, 17.0, 18.0, 38.0, 57.0, 102.0, 147.0, 259.0, 501.0, 1124.0, 2898.0, 10898.0, 114289.0, 871400.0, 36633.0, 6399.0, 2028.0, 779.0, 392.0, 215.0, 105.0, 65.0, 55.0, 33.0, 20.0, 15.0, 12.0, 12.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.658203125, -0.6357498168945312, -0.6132965087890625, -0.5908432006835938, -0.568389892578125, -0.5459365844726562, -0.5234832763671875, -0.5010299682617188, -0.47857666015625, -0.45612335205078125, -0.4336700439453125, -0.41121673583984375, -0.388763427734375, -0.36631011962890625, -0.3438568115234375, -0.32140350341796875, -0.2989501953125, -0.27649688720703125, -0.2540435791015625, -0.23159027099609375, -0.209136962890625, -0.18668365478515625, -0.1642303466796875, -0.14177703857421875, -0.11932373046875, -0.09687042236328125, -0.0744171142578125, -0.05196380615234375, -0.029510498046875, -0.00705718994140625, 0.0153961181640625, 0.03784942626953125, 0.060302734375, 0.08275604248046875, 0.1052093505859375, 0.12766265869140625, 0.150115966796875, 0.17256927490234375, 0.1950225830078125, 0.21747589111328125, 0.23992919921875, 0.26238250732421875, 0.2848358154296875, 0.30728912353515625, 0.329742431640625, 0.35219573974609375, 0.3746490478515625, 0.39710235595703125, 0.4195556640625, 0.44200897216796875, 0.4644622802734375, 0.48691558837890625, 0.509368896484375, 0.5318222045898438, 0.5542755126953125, 0.5767288208007812, 0.59918212890625, 0.6216354370117188, 0.6440887451171875, 0.6665420532226562, 0.688995361328125, 0.7114486694335938, 0.7339019775390625, 0.7563552856445312, 0.77880859375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 10.0, 14.0, 19.0, 23.0, 61.0, 70.0, 97.0, 161.0, 154.0, 135.0, 83.0, 56.0, 49.0, 23.0, 14.0, 12.0, 11.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.072355270385742e-05, -4.915241152048111e-05, -4.75812703371048e-05, -4.6010129153728485e-05, -4.443898797035217e-05, -4.286784678697586e-05, -4.129670560359955e-05, -3.9725564420223236e-05, -3.8154423236846924e-05, -3.658328205347061e-05, -3.50121408700943e-05, -3.344099968671799e-05, -3.1869858503341675e-05, -3.0298717319965363e-05, -2.872757613658905e-05, -2.7156434953212738e-05, -2.5585293769836426e-05, -2.4014152586460114e-05, -2.24430114030838e-05, -2.087187021970749e-05, -1.9300729036331177e-05, -1.7729587852954865e-05, -1.6158446669578552e-05, -1.458730548620224e-05, -1.3016164302825928e-05, -1.1445023119449615e-05, -9.873881936073303e-06, -8.302740752696991e-06, -6.731599569320679e-06, -5.1604583859443665e-06, -3.589317202568054e-06, -2.018176019191742e-06, -4.470348358154297e-07, 1.1241063475608826e-06, 2.695247530937195e-06, 4.266388714313507e-06, 5.837529897689819e-06, 7.408671081066132e-06, 8.979812264442444e-06, 1.0550953447818756e-05, 1.2122094631195068e-05, 1.369323581457138e-05, 1.5264376997947693e-05, 1.6835518181324005e-05, 1.8406659364700317e-05, 1.997780054807663e-05, 2.1548941731452942e-05, 2.3120082914829254e-05, 2.4691224098205566e-05, 2.626236528158188e-05, 2.783350646495819e-05, 2.9404647648334503e-05, 3.0975788831710815e-05, 3.254693001508713e-05, 3.411807119846344e-05, 3.568921238183975e-05, 3.7260353565216064e-05, 3.883149474859238e-05, 4.040263593196869e-05, 4.1973777115345e-05, 4.3544918298721313e-05, 4.5116059482097626e-05, 4.668720066547394e-05, 4.825834184885025e-05, 4.982948303222656e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 1.0, 1.0, 3.0, 9.0, 12.0, 22.0, 16.0, 18.0, 34.0, 48.0, 65.0, 98.0, 136.0, 157.0, 311.0, 500.0, 712.0, 1239.0, 2217.0, 4069.0, 8727.0, 21787.0, 70175.0, 324699.0, 460006.0, 103002.0, 28707.0, 10685.0, 4791.0, 2522.0, 1385.0, 857.0, 515.0, 325.0, 207.0, 128.0, 100.0, 73.0, 41.0, 44.0, 24.0, 26.0, 17.0, 9.0, 10.0, 5.0, 4.0, 2.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.371337890625, -0.36013031005859375, -0.3489227294921875, -0.33771514892578125, -0.326507568359375, -0.31529998779296875, -0.3040924072265625, -0.29288482666015625, -0.28167724609375, -0.27046966552734375, -0.2592620849609375, -0.24805450439453125, -0.236846923828125, -0.22563934326171875, -0.2144317626953125, -0.20322418212890625, -0.1920166015625, -0.18080902099609375, -0.1696014404296875, -0.15839385986328125, -0.147186279296875, -0.13597869873046875, -0.1247711181640625, -0.11356353759765625, -0.10235595703125, -0.09114837646484375, -0.0799407958984375, -0.06873321533203125, -0.057525634765625, -0.04631805419921875, -0.0351104736328125, -0.02390289306640625, -0.0126953125, -0.00148773193359375, 0.0097198486328125, 0.02092742919921875, 0.032135009765625, 0.04334259033203125, 0.0545501708984375, 0.06575775146484375, 0.07696533203125, 0.08817291259765625, 0.0993804931640625, 0.11058807373046875, 0.121795654296875, 0.13300323486328125, 0.1442108154296875, 0.15541839599609375, 0.1666259765625, 0.17783355712890625, 0.1890411376953125, 0.20024871826171875, 0.211456298828125, 0.22266387939453125, 0.2338714599609375, 0.24507904052734375, 0.25628662109375, 0.26749420166015625, 0.2787017822265625, 0.28990936279296875, 0.301116943359375, 0.31232452392578125, 0.3235321044921875, 0.33473968505859375, 0.345947265625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 4.0, 9.0, 11.0, 15.0, 17.0, 20.0, 31.0, 24.0, 27.0, 43.0, 32.0, 53.0, 67.0, 86.0, 77.0, 55.0, 76.0, 57.0, 60.0, 50.0, 35.0, 34.0, 19.0, 18.0, 21.0, 11.0, 11.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.50634765625, -0.4898834228515625, -0.473419189453125, -0.4569549560546875, -0.44049072265625, -0.4240264892578125, -0.407562255859375, -0.3910980224609375, -0.3746337890625, -0.3581695556640625, -0.341705322265625, -0.3252410888671875, -0.30877685546875, -0.2923126220703125, -0.275848388671875, -0.2593841552734375, -0.242919921875, -0.2264556884765625, -0.209991455078125, -0.1935272216796875, -0.17706298828125, -0.1605987548828125, -0.144134521484375, -0.1276702880859375, -0.1112060546875, -0.0947418212890625, -0.078277587890625, -0.0618133544921875, -0.04534912109375, -0.0288848876953125, -0.012420654296875, 0.0040435791015625, 0.0205078125, 0.0369720458984375, 0.053436279296875, 0.0699005126953125, 0.08636474609375, 0.1028289794921875, 0.119293212890625, 0.1357574462890625, 0.1522216796875, 0.1686859130859375, 0.185150146484375, 0.2016143798828125, 0.21807861328125, 0.2345428466796875, 0.251007080078125, 0.2674713134765625, 0.283935546875, 0.3003997802734375, 0.316864013671875, 0.3333282470703125, 0.34979248046875, 0.3662567138671875, 0.382720947265625, 0.3991851806640625, 0.4156494140625, 0.4321136474609375, 0.448577880859375, 0.4650421142578125, 0.48150634765625, 0.4979705810546875, 0.514434814453125, 0.5308990478515625, 0.54736328125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 10.0, 28.0, 52.0, 153.0, 386.0, 232.0, 90.0, 20.0, 13.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.209859848022461, -13.842630386352539, -13.4753999710083, -13.108170509338379, -12.740941047668457, -12.373710632324219, -12.006481170654297, -11.639251708984375, -11.272022247314453, -10.904792785644531, -10.537562370300293, -10.170332908630371, -9.80310344696045, -9.435873031616211, -9.068643569946289, -8.701414108276367, -8.334183692932129, -7.966953754425049, -7.599724292755127, -7.232494354248047, -6.865264892578125, -6.498034954071045, -6.130805015563965, -5.763575553894043, -5.396345615386963, -5.029115676879883, -4.661886215209961, -4.294656276702881, -3.92742657661438, -3.560196876525879, -3.192966938018799, -2.825737237930298, -2.4585084915161133, -2.0912787914276123, -1.7240489721298218, -1.3568191528320312, -0.9895894527435303, -0.6223597526550293, -0.2551298141479492, 0.11209988594055176, 0.47932958602905273, 0.8465593457221985, 1.2137891054153442, 1.5810189247131348, 1.9482486248016357, 2.3154783248901367, 2.682708263397217, 3.0499379634857178, 3.4171676635742188, 3.7843973636627197, 4.151627063751221, 4.518857002258301, 4.886086463928223, 5.253316402435303, 5.620546340942383, 5.987775802612305, 6.355005741119385, 6.722235679626465, 7.089465141296387, 7.456695079803467, 7.823925018310547, 8.191154479980469, 8.55838394165039, 8.925614356994629, 9.29284381866455]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 7.0, 3.0, 7.0, 17.0, 12.0, 17.0, 41.0, 37.0, 86.0, 111.0, 139.0, 134.0, 113.0, 76.0, 58.0, 46.0, 26.0, 14.0, 7.0, 7.0, 3.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.37216567993164, -10.048008918762207, -9.723852157592773, -9.39969539642334, -9.075538635253906, -8.751382827758789, -8.427226066589355, -8.103069305419922, -7.778912544250488, -7.454755783081055, -7.130599021911621, -6.806442737579346, -6.482285976409912, -6.1581292152404785, -5.833972930908203, -5.5098161697387695, -5.185659408569336, -4.861502647399902, -4.537345886230469, -4.213189601898193, -3.8890328407287598, -3.564876079559326, -3.2407195568084717, -2.916563034057617, -2.5924062728881836, -2.26824951171875, -1.9440929889678955, -1.6199363470077515, -1.2957797050476074, -0.9716230630874634, -0.6474664211273193, -0.32330989837646484, 0.00084686279296875, 0.3250035047531128, 0.6491601467132568, 0.9733167886734009, 1.297473430633545, 1.621630072593689, 1.945786714553833, 2.2699432373046875, 2.594099998474121, 2.9182567596435547, 3.242413282394409, 3.5665698051452637, 3.8907265663146973, 4.214883327484131, 4.539039611816406, 4.86319637298584, 5.187353134155273, 5.511509895324707, 5.835666656494141, 6.159822940826416, 6.48397970199585, 6.808136463165283, 7.132292747497559, 7.456449508666992, 7.780606269836426, 8.10476303100586, 8.428919792175293, 8.753076553344727, 9.077232360839844, 9.401389122009277, 9.725545883178711, 10.049702644348145, 10.373859405517578]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 12.0, 17.0, 26.0, 49.0, 74.0, 152.0, 240.0, 477.0, 1016.0, 2413.0, 6504.0, 22931.0, 237135.0, 3864807.0, 44261.0, 9098.0, 2926.0, 1155.0, 451.0, 208.0, 132.0, 69.0, 44.0, 30.0, 10.0, 8.0, 11.0, 4.0, 2.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.384765625, -1.33892822265625, -1.2930908203125, -1.24725341796875, -1.201416015625, -1.15557861328125, -1.1097412109375, -1.06390380859375, -1.01806640625, -0.97222900390625, -0.9263916015625, -0.88055419921875, -0.834716796875, -0.78887939453125, -0.7430419921875, -0.69720458984375, -0.6513671875, -0.60552978515625, -0.5596923828125, -0.51385498046875, -0.468017578125, -0.42218017578125, -0.3763427734375, -0.33050537109375, -0.28466796875, -0.23883056640625, -0.1929931640625, -0.14715576171875, -0.101318359375, -0.05548095703125, -0.0096435546875, 0.03619384765625, 0.08203125, 0.12786865234375, 0.1737060546875, 0.21954345703125, 0.265380859375, 0.31121826171875, 0.3570556640625, 0.40289306640625, 0.44873046875, 0.49456787109375, 0.5404052734375, 0.58624267578125, 0.632080078125, 0.67791748046875, 0.7237548828125, 0.76959228515625, 0.8154296875, 0.86126708984375, 0.9071044921875, 0.95294189453125, 0.998779296875, 1.04461669921875, 1.0904541015625, 1.13629150390625, 1.18212890625, 1.22796630859375, 1.2738037109375, 1.31964111328125, 1.365478515625, 1.41131591796875, 1.4571533203125, 1.50299072265625, 1.548828125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 8.0, 7.0, 6.0, 10.0, 9.0, 11.0, 21.0, 29.0, 88.0, 254.0, 252.0, 136.0, 53.0, 24.0, 13.0, 12.0, 13.0, 6.0, 6.0, 3.0, 8.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10723876953125, -0.10378456115722656, -0.10033035278320312, -0.09687614440917969, -0.09342193603515625, -0.08996772766113281, -0.08651351928710938, -0.08305931091308594, -0.0796051025390625, -0.07615089416503906, -0.07269668579101562, -0.06924247741699219, -0.06578826904296875, -0.06233406066894531, -0.058879852294921875, -0.05542564392089844, -0.051971435546875, -0.04851722717285156, -0.045063018798828125, -0.04160881042480469, -0.03815460205078125, -0.03470039367675781, -0.031246185302734375, -0.027791976928710938, -0.0243377685546875, -0.020883560180664062, -0.017429351806640625, -0.013975143432617188, -0.01052093505859375, -0.0070667266845703125, -0.003612518310546875, -0.0001583099365234375, 0.0032958984375, 0.0067501068115234375, 0.010204315185546875, 0.013658523559570312, 0.01711273193359375, 0.020566940307617188, 0.024021148681640625, 0.027475357055664062, 0.0309295654296875, 0.03438377380371094, 0.037837982177734375, 0.04129219055175781, 0.04474639892578125, 0.04820060729980469, 0.051654815673828125, 0.05510902404785156, 0.058563232421875, 0.06201744079589844, 0.06547164916992188, 0.06892585754394531, 0.07238006591796875, 0.07583427429199219, 0.07928848266601562, 0.08274269104003906, 0.0861968994140625, 0.08965110778808594, 0.09310531616210938, 0.09655952453613281, 0.10001373291015625, 0.10346794128417969, 0.10692214965820312, 0.11037635803222656, 0.11383056640625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 10.0, 19.0, 28.0, 29.0, 48.0, 61.0, 84.0, 132.0, 202.0, 323.0, 600.0, 1029.0, 1852.0, 3746.0, 8169.0, 19684.0, 60572.0, 348907.0, 3339545.0, 317426.0, 57386.0, 18811.0, 7752.0, 3609.0, 1779.0, 976.0, 529.0, 329.0, 201.0, 131.0, 83.0, 63.0, 41.0, 41.0, 23.0, 13.0, 16.0, 9.0, 4.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.517578125, -0.5000228881835938, -0.4824676513671875, -0.46491241455078125, -0.447357177734375, -0.42980194091796875, -0.4122467041015625, -0.39469146728515625, -0.37713623046875, -0.35958099365234375, -0.3420257568359375, -0.32447052001953125, -0.306915283203125, -0.28936004638671875, -0.2718048095703125, -0.25424957275390625, -0.2366943359375, -0.21913909912109375, -0.2015838623046875, -0.18402862548828125, -0.166473388671875, -0.14891815185546875, -0.1313629150390625, -0.11380767822265625, -0.09625244140625, -0.07869720458984375, -0.0611419677734375, -0.04358673095703125, -0.026031494140625, -0.00847625732421875, 0.0090789794921875, 0.02663421630859375, 0.044189453125, 0.06174468994140625, 0.0792999267578125, 0.09685516357421875, 0.114410400390625, 0.13196563720703125, 0.1495208740234375, 0.16707611083984375, 0.18463134765625, 0.20218658447265625, 0.2197418212890625, 0.23729705810546875, 0.254852294921875, 0.27240753173828125, 0.2899627685546875, 0.30751800537109375, 0.3250732421875, 0.34262847900390625, 0.3601837158203125, 0.37773895263671875, 0.395294189453125, 0.41284942626953125, 0.4304046630859375, 0.44795989990234375, 0.46551513671875, 0.48307037353515625, 0.5006256103515625, 0.5181808471679688, 0.535736083984375, 0.5532913208007812, 0.5708465576171875, 0.5884017944335938, 0.60595703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 2.0, 7.0, 3.0, 2.0, 6.0, 8.0, 16.0, 9.0, 21.0, 28.0, 27.0, 35.0, 65.0, 89.0, 178.0, 323.0, 661.0, 1384.0, 571.0, 226.0, 132.0, 68.0, 44.0, 40.0, 28.0, 18.0, 12.0, 13.0, 8.0, 5.0, 11.0, 5.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09295654296875, -0.0891561508178711, -0.08535575866699219, -0.08155536651611328, -0.07775497436523438, -0.07395458221435547, -0.07015419006347656, -0.06635379791259766, -0.06255340576171875, -0.058753013610839844, -0.05495262145996094, -0.05115222930908203, -0.047351837158203125, -0.04355144500732422, -0.03975105285644531, -0.035950660705566406, -0.0321502685546875, -0.028349876403808594, -0.024549484252929688, -0.02074909210205078, -0.016948699951171875, -0.013148307800292969, -0.009347915649414062, -0.005547523498535156, -0.00174713134765625, 0.0020532608032226562, 0.0058536529541015625, 0.009654045104980469, 0.013454437255859375, 0.01725482940673828, 0.021055221557617188, 0.024855613708496094, 0.028656005859375, 0.032456398010253906, 0.03625679016113281, 0.04005718231201172, 0.043857574462890625, 0.04765796661376953, 0.05145835876464844, 0.055258750915527344, 0.05905914306640625, 0.06285953521728516, 0.06665992736816406, 0.07046031951904297, 0.07426071166992188, 0.07806110382080078, 0.08186149597167969, 0.0856618881225586, 0.0894622802734375, 0.0932626724243164, 0.09706306457519531, 0.10086345672607422, 0.10466384887695312, 0.10846424102783203, 0.11226463317871094, 0.11606502532958984, 0.11986541748046875, 0.12366580963134766, 0.12746620178222656, 0.13126659393310547, 0.13506698608398438, 0.13886737823486328, 0.1426677703857422, 0.1464681625366211, 0.1502685546875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 8.0, 7.0, 17.0, 103.0, 657.0, 189.0, 14.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3823251724243164, -2.2728469371795654, -2.1633689403533936, -2.0538907051086426, -1.9444127082824707, -1.8349344730377197, -1.7254564762115479, -1.6159782409667969, -1.506500244140625, -1.3970221281051636, -1.2875440120697021, -1.1780658960342407, -1.0685877799987793, -0.9591096043586731, -0.8496314883232117, -0.7401533722877502, -0.630675196647644, -0.5211970806121826, -0.4117189645767212, -0.3022408187389374, -0.19276270270347595, -0.08328455686569214, 0.026193559169769287, 0.1356716752052307, 0.24514979124069214, 0.35462790727615356, 0.464106023311615, 0.5735841989517212, 0.6830623149871826, 0.792540431022644, 0.9020185470581055, 1.011496663093567, 1.1209747791290283, 1.2304528951644897, 1.3399310111999512, 1.4494091272354126, 1.558887243270874, 1.668365478515625, 1.7778434753417969, 1.8873217105865479, 1.9967997074127197, 2.1062779426574707, 2.2157559394836426, 2.3252341747283936, 2.4347121715545654, 2.5441904067993164, 2.6536684036254883, 2.7631466388702393, 2.8726248741149902, 2.982103109359741, 3.091581106185913, 3.201059341430664, 3.310537338256836, 3.420015573501587, 3.529493570327759, 3.6389718055725098, 3.7484498023986816, 3.8579280376434326, 3.9674060344696045, 4.0768842697143555, 4.186362266540527, 4.295840263366699, 4.405318737030029, 4.514796733856201, 4.624274730682373]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 8.0, 2.0, 4.0, 4.0, 6.0, 9.0, 16.0, 12.0, 27.0, 30.0, 31.0, 55.0, 58.0, 56.0, 85.0, 71.0, 86.0, 73.0, 81.0, 80.0, 44.0, 34.0, 35.0, 17.0, 20.0, 18.0, 7.0, 7.0, 4.0, 4.0, 6.0, 2.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7327967286109924, -0.7100450396537781, -0.6872933506965637, -0.6645417213439941, -0.6417900323867798, -0.6190383434295654, -0.5962866544723511, -0.5735349655151367, -0.5507832765579224, -0.528031587600708, -0.5052798986434937, -0.4825282394886017, -0.45977655053138733, -0.43702489137649536, -0.414273202419281, -0.39152151346206665, -0.3687698543071747, -0.3460181653499603, -0.32326650619506836, -0.300514817237854, -0.27776312828063965, -0.2550114393234253, -0.23225978016853333, -0.20950809121131897, -0.1867564171552658, -0.16400474309921265, -0.1412530541419983, -0.11850138008594513, -0.09574969857931137, -0.07299801707267761, -0.05024634301662445, -0.027494654059410095, -0.004742980003356934, 0.018008699640631676, 0.040760379284620285, 0.06351205706596375, 0.0862637385725975, 0.10901542007923126, 0.13176709413528442, 0.15451878309249878, 0.17727045714855194, 0.2000221312046051, 0.22277382016181946, 0.24552549421787262, 0.2682771682739258, 0.29102885723114014, 0.3137805461883545, 0.33653223514556885, 0.3592838943004608, 0.38203558325767517, 0.40478724241256714, 0.4275389313697815, 0.45029062032699585, 0.4730423092842102, 0.4957939684391022, 0.5185456275939941, 0.5412973165512085, 0.5640490055084229, 0.5868006944656372, 0.6095523834228516, 0.6323040127754211, 0.6550557017326355, 0.6778073906898499, 0.7005590796470642, 0.7233107686042786]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 4.0, 13.0, 13.0, 18.0, 24.0, 29.0, 46.0, 49.0, 80.0, 128.0, 189.0, 293.0, 459.0, 721.0, 1155.0, 1926.0, 3389.0, 6515.0, 13029.0, 29355.0, 135659.0, 724044.0, 82336.0, 24356.0, 11247.0, 5765.0, 3071.0, 1751.0, 989.0, 636.0, 386.0, 269.0, 197.0, 133.0, 95.0, 61.0, 40.0, 28.0, 23.0, 8.0, 9.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.724609375, -0.702239990234375, -0.67987060546875, -0.657501220703125, -0.6351318359375, -0.612762451171875, -0.59039306640625, -0.568023681640625, -0.545654296875, -0.523284912109375, -0.50091552734375, -0.478546142578125, -0.4561767578125, -0.433807373046875, -0.41143798828125, -0.389068603515625, -0.36669921875, -0.344329833984375, -0.32196044921875, -0.299591064453125, -0.2772216796875, -0.254852294921875, -0.23248291015625, -0.210113525390625, -0.187744140625, -0.165374755859375, -0.14300537109375, -0.120635986328125, -0.0982666015625, -0.075897216796875, -0.05352783203125, -0.031158447265625, -0.0087890625, 0.013580322265625, 0.03594970703125, 0.058319091796875, 0.0806884765625, 0.103057861328125, 0.12542724609375, 0.147796630859375, 0.170166015625, 0.192535400390625, 0.21490478515625, 0.237274169921875, 0.2596435546875, 0.282012939453125, 0.30438232421875, 0.326751708984375, 0.34912109375, 0.371490478515625, 0.39385986328125, 0.416229248046875, 0.4385986328125, 0.460968017578125, 0.48333740234375, 0.505706787109375, 0.528076171875, 0.550445556640625, 0.57281494140625, 0.595184326171875, 0.6175537109375, 0.639923095703125, 0.66229248046875, 0.684661865234375, 0.70703125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 8.0, 9.0, 6.0, 11.0, 14.0, 12.0, 22.0, 36.0, 123.0, 212.0, 238.0, 141.0, 53.0, 37.0, 13.0, 13.0, 11.0, 8.0, 6.0, 1.0, 7.0, 1.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10198974609375, -0.09858417510986328, -0.09517860412597656, -0.09177303314208984, -0.08836746215820312, -0.0849618911743164, -0.08155632019042969, -0.07815074920654297, -0.07474517822265625, -0.07133960723876953, -0.06793403625488281, -0.0645284652709961, -0.061122894287109375, -0.057717323303222656, -0.05431175231933594, -0.05090618133544922, -0.0475006103515625, -0.04409503936767578, -0.04068946838378906, -0.037283897399902344, -0.033878326416015625, -0.030472755432128906, -0.027067184448242188, -0.02366161346435547, -0.02025604248046875, -0.01685047149658203, -0.013444900512695312, -0.010039329528808594, -0.006633758544921875, -0.0032281875610351562, 0.0001773834228515625, 0.0035829544067382812, 0.006988525390625, 0.010394096374511719, 0.013799667358398438, 0.017205238342285156, 0.020610809326171875, 0.024016380310058594, 0.027421951293945312, 0.03082752227783203, 0.03423309326171875, 0.03763866424560547, 0.04104423522949219, 0.044449806213378906, 0.047855377197265625, 0.051260948181152344, 0.05466651916503906, 0.05807209014892578, 0.0614776611328125, 0.06488323211669922, 0.06828880310058594, 0.07169437408447266, 0.07509994506835938, 0.0785055160522461, 0.08191108703613281, 0.08531665802001953, 0.08872222900390625, 0.09212779998779297, 0.09553337097167969, 0.0989389419555664, 0.10234451293945312, 0.10575008392333984, 0.10915565490722656, 0.11256122589111328, 0.115966796875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 12.0, 42.0, 155.0, 627.0, 2914.0, 25821.0, 500616.0, 489666.0, 24984.0, 2842.0, 649.0, 151.0, 30.0, 11.0, 10.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.3525390625, -1.3169403076171875, -1.281341552734375, -1.2457427978515625, -1.21014404296875, -1.1745452880859375, -1.138946533203125, -1.1033477783203125, -1.0677490234375, -1.0321502685546875, -0.996551513671875, -0.9609527587890625, -0.92535400390625, -0.8897552490234375, -0.854156494140625, -0.8185577392578125, -0.782958984375, -0.7473602294921875, -0.711761474609375, -0.6761627197265625, -0.64056396484375, -0.6049652099609375, -0.569366455078125, -0.5337677001953125, -0.4981689453125, -0.4625701904296875, -0.426971435546875, -0.3913726806640625, -0.35577392578125, -0.3201751708984375, -0.284576416015625, -0.2489776611328125, -0.21337890625, -0.1777801513671875, -0.142181396484375, -0.1065826416015625, -0.07098388671875, -0.0353851318359375, 0.000213623046875, 0.0358123779296875, 0.0714111328125, 0.1070098876953125, 0.142608642578125, 0.1782073974609375, 0.21380615234375, 0.2494049072265625, 0.285003662109375, 0.3206024169921875, 0.356201171875, 0.3917999267578125, 0.427398681640625, 0.4629974365234375, 0.49859619140625, 0.5341949462890625, 0.569793701171875, 0.6053924560546875, 0.6409912109375, 0.6765899658203125, 0.712188720703125, 0.7477874755859375, 0.78338623046875, 0.8189849853515625, 0.854583740234375, 0.8901824951171875, 0.92578125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 9.0, 7.0, 11.0, 9.0, 16.0, 13.0, 18.0, 24.0, 23.0, 20.0, 35.0, 28.0, 41.0, 40.0, 45.0, 59.0, 46.0, 55.0, 46.0, 55.0, 53.0, 49.0, 42.0, 49.0, 24.0, 28.0, 35.0, 19.0, 23.0, 15.0, 14.0, 18.0, 13.0, 7.0, 9.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.404541015625, -0.39459228515625, -0.3846435546875, -0.37469482421875, -0.36474609375, -0.35479736328125, -0.3448486328125, -0.33489990234375, -0.324951171875, -0.31500244140625, -0.3050537109375, -0.29510498046875, -0.28515625, -0.27520751953125, -0.2652587890625, -0.25531005859375, -0.245361328125, -0.23541259765625, -0.2254638671875, -0.21551513671875, -0.20556640625, -0.19561767578125, -0.1856689453125, -0.17572021484375, -0.165771484375, -0.15582275390625, -0.1458740234375, -0.13592529296875, -0.1259765625, -0.11602783203125, -0.1060791015625, -0.09613037109375, -0.086181640625, -0.07623291015625, -0.0662841796875, -0.05633544921875, -0.04638671875, -0.03643798828125, -0.0264892578125, -0.01654052734375, -0.006591796875, 0.00335693359375, 0.0133056640625, 0.02325439453125, 0.033203125, 0.04315185546875, 0.0531005859375, 0.06304931640625, 0.072998046875, 0.08294677734375, 0.0928955078125, 0.10284423828125, 0.11279296875, 0.12274169921875, 0.1326904296875, 0.14263916015625, 0.152587890625, 0.16253662109375, 0.1724853515625, 0.18243408203125, 0.1923828125, 0.20233154296875, 0.2122802734375, 0.22222900390625, 0.232177734375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 8.0, 12.0, 4.0, 9.0, 28.0, 41.0, 40.0, 85.0, 154.0, 327.0, 976.0, 4774.0, 129978.0, 896073.0, 13231.0, 1800.0, 487.0, 234.0, 119.0, 55.0, 28.0, 30.0, 12.0, 10.0, 7.0, 6.0, 9.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.662109375, -1.6149139404296875, -1.567718505859375, -1.5205230712890625, -1.47332763671875, -1.4261322021484375, -1.378936767578125, -1.3317413330078125, -1.2845458984375, -1.2373504638671875, -1.190155029296875, -1.1429595947265625, -1.09576416015625, -1.0485687255859375, -1.001373291015625, -0.9541778564453125, -0.906982421875, -0.8597869873046875, -0.812591552734375, -0.7653961181640625, -0.71820068359375, -0.6710052490234375, -0.623809814453125, -0.5766143798828125, -0.5294189453125, -0.4822235107421875, -0.435028076171875, -0.3878326416015625, -0.34063720703125, -0.2934417724609375, -0.246246337890625, -0.1990509033203125, -0.15185546875, -0.1046600341796875, -0.057464599609375, -0.0102691650390625, 0.03692626953125, 0.0841217041015625, 0.131317138671875, 0.1785125732421875, 0.2257080078125, 0.2729034423828125, 0.320098876953125, 0.3672943115234375, 0.41448974609375, 0.4616851806640625, 0.508880615234375, 0.5560760498046875, 0.603271484375, 0.6504669189453125, 0.697662353515625, 0.7448577880859375, 0.79205322265625, 0.8392486572265625, 0.886444091796875, 0.9336395263671875, 0.9808349609375, 1.0280303955078125, 1.075225830078125, 1.1224212646484375, 1.16961669921875, 1.2168121337890625, 1.264007568359375, 1.3112030029296875, 1.3583984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 3.0, 10.0, 11.0, 13.0, 18.0, 48.0, 53.0, 80.0, 113.0, 100.0, 164.0, 103.0, 75.0, 49.0, 44.0, 34.0, 13.0, 23.0, 11.0, 7.0, 4.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8160552978515625e-05, -4.656333476305008e-05, -4.4966116547584534e-05, -4.336889833211899e-05, -4.177168011665344e-05, -4.01744619011879e-05, -3.857724368572235e-05, -3.6980025470256805e-05, -3.538280725479126e-05, -3.3785589039325714e-05, -3.218837082386017e-05, -3.059115260839462e-05, -2.8993934392929077e-05, -2.739671617746353e-05, -2.5799497961997986e-05, -2.420227974653244e-05, -2.2605061531066895e-05, -2.100784331560135e-05, -1.9410625100135803e-05, -1.7813406884670258e-05, -1.6216188669204712e-05, -1.4618970453739166e-05, -1.302175223827362e-05, -1.1424534022808075e-05, -9.82731580734253e-06, -8.230097591876984e-06, -6.632879376411438e-06, -5.035661160945892e-06, -3.4384429454803467e-06, -1.841224730014801e-06, -2.4400651454925537e-07, 1.3532117009162903e-06, 2.950429916381836e-06, 4.547648131847382e-06, 6.144866347312927e-06, 7.742084562778473e-06, 9.339302778244019e-06, 1.0936520993709564e-05, 1.253373920917511e-05, 1.4130957424640656e-05, 1.57281756401062e-05, 1.7325393855571747e-05, 1.8922612071037292e-05, 2.0519830286502838e-05, 2.2117048501968384e-05, 2.371426671743393e-05, 2.5311484932899475e-05, 2.690870314836502e-05, 2.8505921363830566e-05, 3.0103139579296112e-05, 3.170035779476166e-05, 3.32975760102272e-05, 3.489479422569275e-05, 3.6492012441158295e-05, 3.808923065662384e-05, 3.9686448872089386e-05, 4.128366708755493e-05, 4.288088530302048e-05, 4.447810351848602e-05, 4.607532173395157e-05, 4.7672539949417114e-05, 4.926975816488266e-05, 5.0866976380348206e-05, 5.246419459581375e-05, 5.40614128112793e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 2.0, 8.0, 10.0, 14.0, 12.0, 32.0, 43.0, 68.0, 84.0, 163.0, 306.0, 507.0, 1072.0, 2495.0, 7182.0, 29450.0, 226701.0, 651595.0, 103442.0, 17182.0, 4607.0, 1752.0, 805.0, 383.0, 249.0, 132.0, 92.0, 49.0, 37.0, 18.0, 21.0, 12.0, 6.0, 4.0, 2.0, 5.0, 4.0, 4.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55712890625, -0.5393447875976562, -0.5215606689453125, -0.5037765502929688, -0.485992431640625, -0.46820831298828125, -0.4504241943359375, -0.43264007568359375, -0.41485595703125, -0.39707183837890625, -0.3792877197265625, -0.36150360107421875, -0.343719482421875, -0.32593536376953125, -0.3081512451171875, -0.29036712646484375, -0.2725830078125, -0.25479888916015625, -0.2370147705078125, -0.21923065185546875, -0.201446533203125, -0.18366241455078125, -0.1658782958984375, -0.14809417724609375, -0.13031005859375, -0.11252593994140625, -0.0947418212890625, -0.07695770263671875, -0.059173583984375, -0.04138946533203125, -0.0236053466796875, -0.00582122802734375, 0.011962890625, 0.02974700927734375, 0.0475311279296875, 0.06531524658203125, 0.083099365234375, 0.10088348388671875, 0.1186676025390625, 0.13645172119140625, 0.15423583984375, 0.17201995849609375, 0.1898040771484375, 0.20758819580078125, 0.225372314453125, 0.24315643310546875, 0.2609405517578125, 0.27872467041015625, 0.2965087890625, 0.31429290771484375, 0.3320770263671875, 0.34986114501953125, 0.367645263671875, 0.38542938232421875, 0.4032135009765625, 0.42099761962890625, 0.43878173828125, 0.45656585693359375, 0.4743499755859375, 0.49213409423828125, 0.509918212890625, 0.5277023315429688, 0.5454864501953125, 0.5632705688476562, 0.5810546875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 7.0, 10.0, 5.0, 10.0, 16.0, 21.0, 29.0, 52.0, 70.0, 88.0, 100.0, 132.0, 93.0, 101.0, 88.0, 57.0, 44.0, 25.0, 22.0, 16.0, 8.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.433349609375, -0.4177589416503906, -0.40216827392578125, -0.3865776062011719, -0.3709869384765625, -0.3553962707519531, -0.33980560302734375, -0.3242149353027344, -0.308624267578125, -0.2930335998535156, -0.27744293212890625, -0.2618522644042969, -0.2462615966796875, -0.23067092895507812, -0.21508026123046875, -0.19948959350585938, -0.18389892578125, -0.16830825805664062, -0.15271759033203125, -0.13712692260742188, -0.1215362548828125, -0.10594558715820312, -0.09035491943359375, -0.07476425170898438, -0.059173583984375, -0.043582916259765625, -0.02799224853515625, -0.012401580810546875, 0.0031890869140625, 0.018779754638671875, 0.03437042236328125, 0.049961090087890625, 0.0655517578125, 0.08114242553710938, 0.09673309326171875, 0.11232376098632812, 0.1279144287109375, 0.14350509643554688, 0.15909576416015625, 0.17468643188476562, 0.190277099609375, 0.20586776733398438, 0.22145843505859375, 0.23704910278320312, 0.2526397705078125, 0.2682304382324219, 0.28382110595703125, 0.2994117736816406, 0.31500244140625, 0.3305931091308594, 0.34618377685546875, 0.3617744445800781, 0.3773651123046875, 0.3929557800292969, 0.40854644775390625, 0.4241371154785156, 0.439727783203125, 0.4553184509277344, 0.47090911865234375, 0.4864997863769531, 0.5020904541015625, 0.5176811218261719, 0.5332717895507812, 0.5488624572753906, 0.564453125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 16.0, 96.0, 649.0, 216.0, 14.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4247407913208, -11.9757661819458, -11.5267915725708, -11.0778169631958, -10.6288423538208, -10.1798677444458, -9.730894088745117, -9.281919479370117, -8.832944869995117, -8.383970260620117, -7.934995651245117, -7.486021041870117, -7.037046432495117, -6.588071823120117, -6.139097690582275, -5.690123081207275, -5.241147994995117, -4.792173385620117, -4.343198776245117, -3.8942244052886963, -3.4452497959136963, -2.9962751865386963, -2.5473008155822754, -2.0983262062072754, -1.6493515968322754, -1.2003769874572754, -0.7514024972915649, -0.3024280071258545, 0.1465466022491455, 0.5955212116241455, 1.0444955825805664, 1.4934701919555664, 1.9424457550048828, 2.391420364379883, 2.840394973754883, 3.2893693447113037, 3.7383439540863037, 4.187318801879883, 4.636292934417725, 5.085267543792725, 5.534242153167725, 5.983216762542725, 6.432191371917725, 6.881165504455566, 7.330140113830566, 7.779114723205566, 8.228089332580566, 8.677063941955566, 9.126038551330566, 9.575013160705566, 10.023987770080566, 10.472962379455566, 10.921936988830566, 11.370911598205566, 11.81988525390625, 12.26885986328125, 12.71783447265625, 13.16680908203125, 13.61578369140625, 14.06475830078125, 14.51373291015625, 14.96270751953125, 15.41168212890625, 15.86065673828125, 16.30963134765625]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 6.0, 4.0, 8.0, 10.0, 12.0, 12.0, 25.0, 34.0, 46.0, 65.0, 78.0, 98.0, 109.0, 101.0, 93.0, 61.0, 70.0, 52.0, 37.0, 22.0, 18.0, 13.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.923542499542236, -4.799688816070557, -4.675835609436035, -4.5519819259643555, -4.428128242492676, -4.304275035858154, -4.180421352386475, -4.056567668914795, -3.9327144622802734, -3.808861017227173, -3.685007333755493, -3.5611538887023926, -3.437300443649292, -3.3134469985961914, -3.1895933151245117, -3.065739870071411, -2.9418861865997314, -2.818032741546631, -2.694179058074951, -2.5703256130218506, -2.44647216796875, -2.3226184844970703, -2.1987650394439697, -2.074911594390869, -1.951058030128479, -1.8272044658660889, -1.7033510208129883, -1.5794974565505981, -1.455643892288208, -1.3317904472351074, -1.2079368829727173, -1.0840833187103271, -0.9602298736572266, -0.8363763689994812, -0.7125228643417358, -0.5886693000793457, -0.46481579542160034, -0.340962290763855, -0.21710872650146484, -0.09325522184371948, 0.03059828281402588, 0.15445180237293243, 0.278305321931839, 0.40215885639190674, 0.5260123610496521, 0.6498658657073975, 0.7737194299697876, 0.897572934627533, 1.0214264392852783, 1.1452800035476685, 1.269133448600769, 1.3929870128631592, 1.5168404579162598, 1.64069402217865, 1.76454758644104, 1.8884010314941406, 2.0122547149658203, 2.136108160018921, 2.2599618434906006, 2.383815288543701, 2.5076687335968018, 2.6315221786499023, 2.755375862121582, 2.8792293071746826, 3.003082752227783]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 2.0, 1.0, 6.0, 6.0, 4.0, 2.0, 12.0, 8.0, 16.0, 11.0, 20.0, 29.0, 37.0, 45.0, 56.0, 98.0, 116.0, 196.0, 313.0, 562.0, 1043.0, 2126.0, 5984.0, 40127.0, 4090465.0, 42854.0, 6186.0, 2020.0, 858.0, 425.0, 246.0, 120.0, 86.0, 65.0, 25.0, 31.0, 23.0, 16.0, 12.0, 7.0, 9.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.775390625, -2.69256591796875, -2.6097412109375, -2.52691650390625, -2.444091796875, -2.36126708984375, -2.2784423828125, -2.19561767578125, -2.11279296875, -2.02996826171875, -1.9471435546875, -1.86431884765625, -1.781494140625, -1.69866943359375, -1.6158447265625, -1.53302001953125, -1.4501953125, -1.36737060546875, -1.2845458984375, -1.20172119140625, -1.118896484375, -1.03607177734375, -0.9532470703125, -0.87042236328125, -0.78759765625, -0.70477294921875, -0.6219482421875, -0.53912353515625, -0.456298828125, -0.37347412109375, -0.2906494140625, -0.20782470703125, -0.125, -0.04217529296875, 0.0406494140625, 0.12347412109375, 0.206298828125, 0.28912353515625, 0.3719482421875, 0.45477294921875, 0.53759765625, 0.62042236328125, 0.7032470703125, 0.78607177734375, 0.868896484375, 0.95172119140625, 1.0345458984375, 1.11737060546875, 1.2001953125, 1.28302001953125, 1.3658447265625, 1.44866943359375, 1.531494140625, 1.61431884765625, 1.6971435546875, 1.77996826171875, 1.86279296875, 1.94561767578125, 2.0284423828125, 2.11126708984375, 2.194091796875, 2.27691650390625, 2.3597412109375, 2.44256591796875, 2.525390625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 3.0, 7.0, 13.0, 11.0, 11.0, 22.0, 50.0, 109.0, 210.0, 232.0, 159.0, 58.0, 40.0, 27.0, 17.0, 11.0, 4.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12939453125, -0.12560462951660156, -0.12181472778320312, -0.11802482604980469, -0.11423492431640625, -0.11044502258300781, -0.10665512084960938, -0.10286521911621094, -0.0990753173828125, -0.09528541564941406, -0.09149551391601562, -0.08770561218261719, -0.08391571044921875, -0.08012580871582031, -0.07633590698242188, -0.07254600524902344, -0.068756103515625, -0.06496620178222656, -0.061176300048828125, -0.05738639831542969, -0.05359649658203125, -0.04980659484863281, -0.046016693115234375, -0.04222679138183594, -0.0384368896484375, -0.03464698791503906, -0.030857086181640625, -0.027067184448242188, -0.02327728271484375, -0.019487380981445312, -0.015697479248046875, -0.011907577514648438, -0.00811767578125, -0.0043277740478515625, -0.000537872314453125, 0.0032520294189453125, 0.00704193115234375, 0.010831832885742188, 0.014621734619140625, 0.018411636352539062, 0.0222015380859375, 0.025991439819335938, 0.029781341552734375, 0.03357124328613281, 0.03736114501953125, 0.04115104675292969, 0.044940948486328125, 0.04873085021972656, 0.052520751953125, 0.05631065368652344, 0.060100555419921875, 0.06389045715332031, 0.06768035888671875, 0.07147026062011719, 0.07526016235351562, 0.07905006408691406, 0.0828399658203125, 0.08662986755371094, 0.09041976928710938, 0.09420967102050781, 0.09799957275390625, 0.10178947448730469, 0.10557937622070312, 0.10936927795410156, 0.1131591796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 5.0, 7.0, 8.0, 7.0, 3.0, 17.0, 17.0, 47.0, 45.0, 139.0, 267.0, 849.0, 8828.0, 4024276.0, 155764.0, 3003.0, 525.0, 213.0, 90.0, 41.0, 28.0, 20.0, 11.0, 11.0, 10.0, 15.0, 4.0, 7.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.29296875, -3.182525634765625, -3.07208251953125, -2.961639404296875, -2.8511962890625, -2.740753173828125, -2.63031005859375, -2.519866943359375, -2.409423828125, -2.298980712890625, -2.18853759765625, -2.078094482421875, -1.9676513671875, -1.857208251953125, -1.74676513671875, -1.636322021484375, -1.52587890625, -1.415435791015625, -1.30499267578125, -1.194549560546875, -1.0841064453125, -0.973663330078125, -0.86322021484375, -0.752777099609375, -0.642333984375, -0.531890869140625, -0.42144775390625, -0.311004638671875, -0.2005615234375, -0.090118408203125, 0.02032470703125, 0.130767822265625, 0.2412109375, 0.351654052734375, 0.46209716796875, 0.572540283203125, 0.6829833984375, 0.793426513671875, 0.90386962890625, 1.014312744140625, 1.124755859375, 1.235198974609375, 1.34564208984375, 1.456085205078125, 1.5665283203125, 1.676971435546875, 1.78741455078125, 1.897857666015625, 2.00830078125, 2.118743896484375, 2.22918701171875, 2.339630126953125, 2.4500732421875, 2.560516357421875, 2.67095947265625, 2.781402587890625, 2.891845703125, 3.002288818359375, 3.11273193359375, 3.223175048828125, 3.3336181640625, 3.444061279296875, 3.55450439453125, 3.664947509765625, 3.775390625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 8.0, 9.0, 5.0, 10.0, 18.0, 24.0, 30.0, 51.0, 76.0, 136.0, 380.0, 1337.0, 1249.0, 377.0, 154.0, 79.0, 49.0, 22.0, 9.0, 10.0, 11.0, 3.0, 8.0, 4.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.205810546875, -0.200531005859375, -0.19525146484375, -0.189971923828125, -0.1846923828125, -0.179412841796875, -0.17413330078125, -0.168853759765625, -0.16357421875, -0.158294677734375, -0.15301513671875, -0.147735595703125, -0.1424560546875, -0.137176513671875, -0.13189697265625, -0.126617431640625, -0.121337890625, -0.116058349609375, -0.11077880859375, -0.105499267578125, -0.1002197265625, -0.094940185546875, -0.08966064453125, -0.084381103515625, -0.0791015625, -0.073822021484375, -0.06854248046875, -0.063262939453125, -0.0579833984375, -0.052703857421875, -0.04742431640625, -0.042144775390625, -0.036865234375, -0.031585693359375, -0.02630615234375, -0.021026611328125, -0.0157470703125, -0.010467529296875, -0.00518798828125, 9.1552734375e-05, 0.00537109375, 0.010650634765625, 0.01593017578125, 0.021209716796875, 0.0264892578125, 0.031768798828125, 0.03704833984375, 0.042327880859375, 0.047607421875, 0.052886962890625, 0.05816650390625, 0.063446044921875, 0.0687255859375, 0.074005126953125, 0.07928466796875, 0.084564208984375, 0.08984375, 0.095123291015625, 0.10040283203125, 0.105682373046875, 0.1109619140625, 0.116241455078125, 0.12152099609375, 0.126800537109375, 0.132080078125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 10.0, 97.0, 587.0, 248.0, 36.0, 15.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7675652503967285, -7.60786247253418, -7.448160171508789, -7.28845739364624, -7.128754615783691, -6.969052314758301, -6.809349536895752, -6.649646759033203, -6.4899444580078125, -6.330241680145264, -6.170539379119873, -6.010836601257324, -5.851134300231934, -5.691431522369385, -5.531728744506836, -5.372026443481445, -5.2123236656188965, -5.052620887756348, -4.892918586730957, -4.733215808868408, -4.573513031005859, -4.413810729980469, -4.25410795211792, -4.094405174255371, -3.9347028732299805, -3.7750003337860107, -3.615297794342041, -3.455595016479492, -3.2958924770355225, -3.1361899375915527, -2.976487159729004, -2.816784620285034, -2.6570825576782227, -2.497380018234253, -2.337677478790283, -2.1779747009277344, -2.0182721614837646, -1.858569622039795, -1.6988669633865356, -1.5391643047332764, -1.3794617652893066, -1.219759225845337, -1.0600565671920776, -0.9003539681434631, -0.7406513690948486, -0.5809487700462341, -0.42124617099761963, -0.26154351234436035, -0.10184097290039062, 0.05786162614822388, 0.21756422519683838, 0.3772668242454529, 0.5369694232940674, 0.6966720223426819, 0.8563746213912964, 1.0160772800445557, 1.1757798194885254, 1.3354823589324951, 1.4951850175857544, 1.6548876762390137, 1.8145902156829834, 1.9742927551269531, 2.133995532989502, 2.2936980724334717, 2.4534006118774414]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 15.0, 32.0, 51.0, 92.0, 149.0, 198.0, 177.0, 144.0, 79.0, 36.0, 23.0, 11.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.243463516235352, -4.161136150360107, -4.078808784484863, -3.9964816570281982, -3.914154291152954, -3.83182692527771, -3.749499559402466, -3.6671721935272217, -3.5848450660705566, -3.5025177001953125, -3.4201903343200684, -3.3378632068634033, -3.255535840988159, -3.173208475112915, -3.090881109237671, -3.0085537433624268, -2.9262263774871826, -2.8438990116119385, -2.7615716457366943, -2.6792445182800293, -2.596917152404785, -2.514589786529541, -2.432262420654297, -2.3499350547790527, -2.2676076889038086, -2.1852803230285645, -2.1029529571533203, -2.0206258296966553, -1.9382984638214111, -1.855971097946167, -1.7736437320709229, -1.6913163661956787, -1.6089894771575928, -1.5266621112823486, -1.444334864616394, -1.36200749874115, -1.2796802520751953, -1.1973528861999512, -1.115025520324707, -1.032698154449463, -0.9503709077835083, -0.8680436015129089, -0.7857162952423096, -0.7033889293670654, -0.6210616230964661, -0.5387343168258667, -0.45640698075294495, -0.3740796446800232, -0.29175233840942383, -0.20942501723766327, -0.1270976960659027, -0.04477037489414215, 0.03755694627761841, 0.11988425254821777, 0.20221158862113953, 0.2845389246940613, 0.36686623096466064, 0.44919353723526, 0.5315208435058594, 0.6138482093811035, 0.6961755156517029, 0.7785028219223022, 0.8608301877975464, 0.9431574940681458, 1.0254848003387451]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 2.0, 6.0, 5.0, 7.0, 15.0, 12.0, 18.0, 29.0, 37.0, 42.0, 55.0, 52.0, 160.0, 10835.0, 1036351.0, 538.0, 83.0, 64.0, 51.0, 38.0, 32.0, 28.0, 19.0, 14.0, 13.0, 8.0, 2.0, 8.0, 9.0, 1.0, 3.0, 6.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.921875, -10.5350341796875, -10.148193359375, -9.7613525390625, -9.37451171875, -8.9876708984375, -8.600830078125, -8.2139892578125, -7.8271484375, -7.4403076171875, -7.053466796875, -6.6666259765625, -6.27978515625, -5.8929443359375, -5.506103515625, -5.1192626953125, -4.732421875, -4.3455810546875, -3.958740234375, -3.5718994140625, -3.18505859375, -2.7982177734375, -2.411376953125, -2.0245361328125, -1.6376953125, -1.2508544921875, -0.864013671875, -0.4771728515625, -0.09033203125, 0.2965087890625, 0.683349609375, 1.0701904296875, 1.45703125, 1.8438720703125, 2.230712890625, 2.6175537109375, 3.00439453125, 3.3912353515625, 3.778076171875, 4.1649169921875, 4.5517578125, 4.9385986328125, 5.325439453125, 5.7122802734375, 6.09912109375, 6.4859619140625, 6.872802734375, 7.2596435546875, 7.646484375, 8.0333251953125, 8.420166015625, 8.8070068359375, 9.19384765625, 9.5806884765625, 9.967529296875, 10.3543701171875, 10.7412109375, 11.1280517578125, 11.514892578125, 11.9017333984375, 12.28857421875, 12.6754150390625, 13.062255859375, 13.4490966796875, 13.8359375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 21.0, 98.0, 583.0, 270.0, 33.0, 7.0, 2.0, 1.0, 1.0], "bins": [-0.97705078125, -0.9601030349731445, -0.9431552886962891, -0.9262075424194336, -0.9092597961425781, -0.8923120498657227, -0.8753643035888672, -0.8584165573120117, -0.8414688110351562, -0.8245210647583008, -0.8075733184814453, -0.7906255722045898, -0.7736778259277344, -0.7567300796508789, -0.7397823333740234, -0.722834587097168, -0.7058868408203125, -0.688939094543457, -0.6719913482666016, -0.6550436019897461, -0.6380958557128906, -0.6211481094360352, -0.6042003631591797, -0.5872526168823242, -0.5703048706054688, -0.5533571243286133, -0.5364093780517578, -0.5194616317749023, -0.5025138854980469, -0.4855661392211914, -0.46861839294433594, -0.45167064666748047, -0.434722900390625, -0.41777515411376953, -0.40082740783691406, -0.3838796615600586, -0.3669319152832031, -0.34998416900634766, -0.3330364227294922, -0.3160886764526367, -0.29914093017578125, -0.2821931838989258, -0.2652454376220703, -0.24829769134521484, -0.23134994506835938, -0.2144021987915039, -0.19745445251464844, -0.18050670623779297, -0.1635589599609375, -0.14661121368408203, -0.12966346740722656, -0.1127157211303711, -0.09576797485351562, -0.07882022857666016, -0.06187248229980469, -0.04492473602294922, -0.02797698974609375, -0.011029243469238281, 0.0059185028076171875, 0.022866249084472656, 0.039813995361328125, 0.056761741638183594, 0.07370948791503906, 0.09065723419189453, 0.10760498046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 4.0, 8.0, 13.0, 7.0, 19.0, 33.0, 40.0, 58.0, 98.0, 136.0, 239.0, 428.0, 913.0, 2368.0, 7774.0, 37346.0, 306776.0, 593258.0, 79468.0, 13321.0, 3610.0, 1289.0, 547.0, 294.0, 158.0, 107.0, 63.0, 50.0, 36.0, 24.0, 18.0, 13.0, 11.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.01953125, -1.9586944580078125, -1.897857666015625, -1.8370208740234375, -1.77618408203125, -1.7153472900390625, -1.654510498046875, -1.5936737060546875, -1.5328369140625, -1.4720001220703125, -1.411163330078125, -1.3503265380859375, -1.28948974609375, -1.2286529541015625, -1.167816162109375, -1.1069793701171875, -1.046142578125, -0.9853057861328125, -0.924468994140625, -0.8636322021484375, -0.80279541015625, -0.7419586181640625, -0.681121826171875, -0.6202850341796875, -0.5594482421875, -0.4986114501953125, -0.437774658203125, -0.3769378662109375, -0.31610107421875, -0.2552642822265625, -0.194427490234375, -0.1335906982421875, -0.07275390625, -0.0119171142578125, 0.048919677734375, 0.1097564697265625, 0.17059326171875, 0.2314300537109375, 0.292266845703125, 0.3531036376953125, 0.4139404296875, 0.4747772216796875, 0.535614013671875, 0.5964508056640625, 0.65728759765625, 0.7181243896484375, 0.778961181640625, 0.8397979736328125, 0.900634765625, 0.9614715576171875, 1.022308349609375, 1.0831451416015625, 1.14398193359375, 1.2048187255859375, 1.265655517578125, 1.3264923095703125, 1.3873291015625, 1.4481658935546875, 1.509002685546875, 1.5698394775390625, 1.63067626953125, 1.6915130615234375, 1.752349853515625, 1.8131866455078125, 1.8740234375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 1.0, 2.0, 9.0, 9.0, 9.0, 12.0, 17.0, 16.0, 22.0, 23.0, 44.0, 32.0, 50.0, 60.0, 49.0, 55.0, 58.0, 77.0, 66.0, 64.0, 53.0, 52.0, 53.0, 43.0, 27.0, 25.0, 17.0, 14.0, 14.0, 6.0, 8.0, 4.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75146484375, -0.7248458862304688, -0.6982269287109375, -0.6716079711914062, -0.644989013671875, -0.6183700561523438, -0.5917510986328125, -0.5651321411132812, -0.53851318359375, -0.5118942260742188, -0.4852752685546875, -0.45865631103515625, -0.432037353515625, -0.40541839599609375, -0.3787994384765625, -0.35218048095703125, -0.3255615234375, -0.29894256591796875, -0.2723236083984375, -0.24570465087890625, -0.219085693359375, -0.19246673583984375, -0.1658477783203125, -0.13922882080078125, -0.11260986328125, -0.08599090576171875, -0.0593719482421875, -0.03275299072265625, -0.006134033203125, 0.02048492431640625, 0.0471038818359375, 0.07372283935546875, 0.100341796875, 0.12696075439453125, 0.1535797119140625, 0.18019866943359375, 0.206817626953125, 0.23343658447265625, 0.2600555419921875, 0.28667449951171875, 0.31329345703125, 0.33991241455078125, 0.3665313720703125, 0.39315032958984375, 0.419769287109375, 0.44638824462890625, 0.4730072021484375, 0.49962615966796875, 0.5262451171875, 0.5528640747070312, 0.5794830322265625, 0.6061019897460938, 0.632720947265625, 0.6593399047851562, 0.6859588623046875, 0.7125778198242188, 0.73919677734375, 0.7658157348632812, 0.7924346923828125, 0.8190536499023438, 0.845672607421875, 0.8722915649414062, 0.8989105224609375, 0.9255294799804688, 0.9521484375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 14.0, 21.0, 21.0, 34.0, 62.0, 126.0, 288.0, 637.0, 2071.0, 11878.0, 377765.0, 636795.0, 15105.0, 2415.0, 736.0, 267.0, 138.0, 53.0, 36.0, 30.0, 20.0, 6.0, 8.0, 5.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.564453125, -1.490142822265625, -1.41583251953125, -1.341522216796875, -1.2672119140625, -1.192901611328125, -1.11859130859375, -1.044281005859375, -0.969970703125, -0.895660400390625, -0.82135009765625, -0.747039794921875, -0.6727294921875, -0.598419189453125, -0.52410888671875, -0.449798583984375, -0.37548828125, -0.301177978515625, -0.22686767578125, -0.152557373046875, -0.0782470703125, -0.003936767578125, 0.07037353515625, 0.144683837890625, 0.218994140625, 0.293304443359375, 0.36761474609375, 0.441925048828125, 0.5162353515625, 0.590545654296875, 0.66485595703125, 0.739166259765625, 0.8134765625, 0.887786865234375, 0.96209716796875, 1.036407470703125, 1.1107177734375, 1.185028076171875, 1.25933837890625, 1.333648681640625, 1.407958984375, 1.482269287109375, 1.55657958984375, 1.630889892578125, 1.7052001953125, 1.779510498046875, 1.85382080078125, 1.928131103515625, 2.00244140625, 2.076751708984375, 2.15106201171875, 2.225372314453125, 2.2996826171875, 2.373992919921875, 2.44830322265625, 2.522613525390625, 2.596923828125, 2.671234130859375, 2.74554443359375, 2.819854736328125, 2.8941650390625, 2.968475341796875, 3.04278564453125, 3.117095947265625, 3.19140625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 12.0, 18.0, 24.0, 43.0, 67.0, 154.0, 247.0, 175.0, 91.0, 64.0, 34.0, 21.0, 13.0, 12.0, 3.0, 8.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001614093780517578, -0.00015537068247795105, -0.0001493319869041443, -0.00014329329133033752, -0.00013725459575653076, -0.000131215900182724, -0.00012517720460891724, -0.00011913850903511047, -0.00011309981346130371, -0.00010706111788749695, -0.00010102242231369019, -9.498372673988342e-05, -8.894503116607666e-05, -8.29063355922699e-05, -7.686764001846313e-05, -7.082894444465637e-05, -6.479024887084961e-05, -5.875155329704285e-05, -5.2712857723236084e-05, -4.667416214942932e-05, -4.063546657562256e-05, -3.4596771001815796e-05, -2.8558075428009033e-05, -2.251937985420227e-05, -1.6480684280395508e-05, -1.0441988706588745e-05, -4.403293132781982e-06, 1.6354024410247803e-06, 7.674098014831543e-06, 1.3712793588638306e-05, 1.975148916244507e-05, 2.579018473625183e-05, 3.1828880310058594e-05, 3.7867575883865356e-05, 4.390627145767212e-05, 4.994496703147888e-05, 5.5983662605285645e-05, 6.202235817909241e-05, 6.806105375289917e-05, 7.409974932670593e-05, 8.01384449005127e-05, 8.617714047431946e-05, 9.221583604812622e-05, 9.825453162193298e-05, 0.00010429322719573975, 0.00011033192276954651, 0.00011637061834335327, 0.00012240931391716003, 0.0001284480094909668, 0.00013448670506477356, 0.00014052540063858032, 0.00014656409621238708, 0.00015260279178619385, 0.0001586414873600006, 0.00016468018293380737, 0.00017071887850761414, 0.0001767575740814209, 0.00018279626965522766, 0.00018883496522903442, 0.0001948736608028412, 0.00020091235637664795, 0.0002069510519504547, 0.00021298974752426147, 0.00021902844309806824, 0.000225067138671875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 5.0, 6.0, 9.0, 9.0, 22.0, 25.0, 34.0, 59.0, 106.0, 205.0, 401.0, 1084.0, 2930.0, 10556.0, 97898.0, 863240.0, 59297.0, 8386.0, 2522.0, 924.0, 395.0, 158.0, 96.0, 48.0, 43.0, 26.0, 19.0, 9.0, 12.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.76171875, -1.7089996337890625, -1.656280517578125, -1.6035614013671875, -1.55084228515625, -1.4981231689453125, -1.445404052734375, -1.3926849365234375, -1.3399658203125, -1.2872467041015625, -1.234527587890625, -1.1818084716796875, -1.12908935546875, -1.0763702392578125, -1.023651123046875, -0.9709320068359375, -0.918212890625, -0.8654937744140625, -0.812774658203125, -0.7600555419921875, -0.70733642578125, -0.6546173095703125, -0.601898193359375, -0.5491790771484375, -0.4964599609375, -0.4437408447265625, -0.391021728515625, -0.3383026123046875, -0.28558349609375, -0.2328643798828125, -0.180145263671875, -0.1274261474609375, -0.07470703125, -0.0219879150390625, 0.030731201171875, 0.0834503173828125, 0.13616943359375, 0.1888885498046875, 0.241607666015625, 0.2943267822265625, 0.3470458984375, 0.3997650146484375, 0.452484130859375, 0.5052032470703125, 0.55792236328125, 0.6106414794921875, 0.663360595703125, 0.7160797119140625, 0.768798828125, 0.8215179443359375, 0.874237060546875, 0.9269561767578125, 0.97967529296875, 1.0323944091796875, 1.085113525390625, 1.1378326416015625, 1.1905517578125, 1.2432708740234375, 1.295989990234375, 1.3487091064453125, 1.40142822265625, 1.4541473388671875, 1.506866455078125, 1.5595855712890625, 1.6123046875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 12.0, 14.0, 25.0, 37.0, 63.0, 84.0, 106.0, 130.0, 135.0, 116.0, 79.0, 58.0, 33.0, 25.0, 25.0, 13.0, 9.0, 4.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53759765625, -0.5192184448242188, -0.5008392333984375, -0.48246002197265625, -0.464080810546875, -0.44570159912109375, -0.4273223876953125, -0.40894317626953125, -0.39056396484375, -0.37218475341796875, -0.3538055419921875, -0.33542633056640625, -0.317047119140625, -0.29866790771484375, -0.2802886962890625, -0.26190948486328125, -0.2435302734375, -0.22515106201171875, -0.2067718505859375, -0.18839263916015625, -0.170013427734375, -0.15163421630859375, -0.1332550048828125, -0.11487579345703125, -0.09649658203125, -0.07811737060546875, -0.0597381591796875, -0.04135894775390625, -0.022979736328125, -0.00460052490234375, 0.0137786865234375, 0.03215789794921875, 0.050537109375, 0.06891632080078125, 0.0872955322265625, 0.10567474365234375, 0.124053955078125, 0.14243316650390625, 0.1608123779296875, 0.17919158935546875, 0.19757080078125, 0.21595001220703125, 0.2343292236328125, 0.25270843505859375, 0.271087646484375, 0.28946685791015625, 0.3078460693359375, 0.32622528076171875, 0.3446044921875, 0.36298370361328125, 0.3813629150390625, 0.39974212646484375, 0.418121337890625, 0.43650054931640625, 0.4548797607421875, 0.47325897216796875, 0.49163818359375, 0.5100173950195312, 0.5283966064453125, 0.5467758178710938, 0.565155029296875, 0.5835342407226562, 0.6019134521484375, 0.6202926635742188, 0.638671875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 28.0, 121.0, 338.0, 319.0, 126.0, 39.0, 13.0, 7.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.267534255981445, -20.719139099121094, -20.17074203491211, -19.622344970703125, -19.073949813842773, -18.525554656982422, -17.977157592773438, -17.428760528564453, -16.8803653717041, -16.33197021484375, -15.783573150634766, -15.235177040100098, -14.68678092956543, -14.138384819030762, -13.589988708496094, -13.041592597961426, -12.493196487426758, -11.94480037689209, -11.396404266357422, -10.848008155822754, -10.299612045288086, -9.751215934753418, -9.20281982421875, -8.654423713684082, -8.106027603149414, -7.557631492614746, -7.009235382080078, -6.46083927154541, -5.912443161010742, -5.364047050476074, -4.815650939941406, -4.267254829406738, -3.7188568115234375, -3.1704607009887695, -2.6220645904541016, -2.0736684799194336, -1.5252723693847656, -0.9768762588500977, -0.4284801483154297, 0.11991596221923828, 0.6683120727539062, 1.2167081832885742, 1.7651042938232422, 2.31350040435791, 2.861896514892578, 3.410292625427246, 3.958688735961914, 4.507084846496582, 5.05548095703125, 5.603877067565918, 6.152273178100586, 6.700669288635254, 7.249065399169922, 7.79746150970459, 8.345857620239258, 8.894253730773926, 9.442649841308594, 9.991045951843262, 10.53944206237793, 11.087838172912598, 11.636234283447266, 12.184630393981934, 12.733026504516602, 13.28142261505127, 13.829818725585938]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 2.0, 8.0, 6.0, 5.0, 17.0, 13.0, 16.0, 19.0, 23.0, 30.0, 32.0, 36.0, 31.0, 46.0, 54.0, 36.0, 43.0, 56.0, 65.0, 52.0, 59.0, 43.0, 36.0, 51.0, 35.0, 31.0, 25.0, 25.0, 13.0, 23.0, 14.0, 9.0, 7.0, 13.0, 6.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.192131042480469, -5.040441989898682, -4.8887529373168945, -4.737063884735107, -4.58537483215332, -4.433686256408691, -4.281997203826904, -4.130308151245117, -3.97861909866333, -3.826930046081543, -3.675240993499756, -3.523552179336548, -3.3718631267547607, -3.2201740741729736, -3.0684852600097656, -2.9167962074279785, -2.7651071548461914, -2.6134181022644043, -2.461729049682617, -2.310040235519409, -2.158351182937622, -2.006662130355835, -1.8549731969833374, -1.7032842636108398, -1.5515952110290527, -1.3999061584472656, -1.248217225074768, -1.0965282917022705, -0.9448392391204834, -0.7931502461433411, -0.6414612531661987, -0.48977231979370117, -0.33808279037475586, -0.18639379739761353, -0.03470480442047119, 0.11698418855667114, 0.2686731815338135, 0.4203621745109558, 0.5720511674880981, 0.7237401008605957, 0.8754291534423828, 1.02711820602417, 1.1788071393966675, 1.330496072769165, 1.4821851253509521, 1.6338741779327393, 1.7855631113052368, 1.9372520446777344, 2.0889410972595215, 2.2406301498413086, 2.3923192024230957, 2.5440080165863037, 2.695697069168091, 2.847386121749878, 2.999074935913086, 3.150763988494873, 3.30245304107666, 3.4541420936584473, 3.6058311462402344, 3.7575199604034424, 3.9092090129852295, 4.0608978271484375, 4.212586879730225, 4.364275932312012, 4.515964984893799]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 7.0, 4.0, 3.0, 9.0, 17.0, 13.0, 23.0, 23.0, 23.0, 34.0, 53.0, 54.0, 68.0, 145.0, 531.0, 3943929.0, 248943.0, 331.0, 49.0, 19.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-37.0, -36.3143310546875, -35.628662109375, -34.9429931640625, -34.25732421875, -33.5716552734375, -32.885986328125, -32.2003173828125, -31.5146484375, -30.8289794921875, -30.143310546875, -29.4576416015625, -28.77197265625, -28.0863037109375, -27.400634765625, -26.7149658203125, -26.029296875, -25.3436279296875, -24.657958984375, -23.9722900390625, -23.28662109375, -22.6009521484375, -21.915283203125, -21.2296142578125, -20.5439453125, -19.8582763671875, -19.172607421875, -18.4869384765625, -17.80126953125, -17.1156005859375, -16.429931640625, -15.7442626953125, -15.05859375, -14.3729248046875, -13.687255859375, -13.0015869140625, -12.31591796875, -11.6302490234375, -10.944580078125, -10.2589111328125, -9.5732421875, -8.8875732421875, -8.201904296875, -7.5162353515625, -6.83056640625, -6.1448974609375, -5.459228515625, -4.7735595703125, -4.087890625, -3.4022216796875, -2.716552734375, -2.0308837890625, -1.34521484375, -0.6595458984375, 0.026123046875, 0.7117919921875, 1.3974609375, 2.0831298828125, 2.768798828125, 3.4544677734375, 4.14013671875, 4.8258056640625, 5.511474609375, 6.1971435546875, 6.8828125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 2.0, 16.0, 63.0, 177.0, 318.0, 267.0, 120.0, 30.0, 9.0, 5.0, 3.0, 0.0, 1.0], "bins": [-0.99853515625, -0.9806003570556641, -0.9626655578613281, -0.9447307586669922, -0.9267959594726562, -0.9088611602783203, -0.8909263610839844, -0.8729915618896484, -0.8550567626953125, -0.8371219635009766, -0.8191871643066406, -0.8012523651123047, -0.7833175659179688, -0.7653827667236328, -0.7474479675292969, -0.7295131683349609, -0.711578369140625, -0.6936435699462891, -0.6757087707519531, -0.6577739715576172, -0.6398391723632812, -0.6219043731689453, -0.6039695739746094, -0.5860347747802734, -0.5680999755859375, -0.5501651763916016, -0.5322303771972656, -0.5142955780029297, -0.49636077880859375, -0.4784259796142578, -0.4604911804199219, -0.44255638122558594, -0.42462158203125, -0.40668678283691406, -0.3887519836425781, -0.3708171844482422, -0.35288238525390625, -0.3349475860595703, -0.3170127868652344, -0.29907798767089844, -0.2811431884765625, -0.26320838928222656, -0.24527359008789062, -0.2273387908935547, -0.20940399169921875, -0.1914691925048828, -0.17353439331054688, -0.15559959411621094, -0.137664794921875, -0.11972999572753906, -0.10179519653320312, -0.08386039733886719, -0.06592559814453125, -0.04799079895019531, -0.030055999755859375, -0.012121200561523438, 0.0058135986328125, 0.023748397827148438, 0.041683197021484375, 0.05961799621582031, 0.07755279541015625, 0.09548759460449219, 0.11342239379882812, 0.13135719299316406, 0.1492919921875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0, 3.0, 4.0, 11.0, 7.0, 11.0, 30.0, 30.0, 33.0, 45.0, 54.0, 80.0, 100.0, 134.0, 151.0, 174.0, 906.0, 4122480.0, 68775.0, 588.0, 178.0, 119.0, 119.0, 65.0, 47.0, 50.0, 29.0, 23.0, 10.0, 13.0, 11.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-26.203125, -25.191162109375, -24.17919921875, -23.167236328125, -22.1552734375, -21.143310546875, -20.13134765625, -19.119384765625, -18.107421875, -17.095458984375, -16.08349609375, -15.071533203125, -14.0595703125, -13.047607421875, -12.03564453125, -11.023681640625, -10.01171875, -8.999755859375, -7.98779296875, -6.975830078125, -5.9638671875, -4.951904296875, -3.93994140625, -2.927978515625, -1.916015625, -0.904052734375, 0.10791015625, 1.119873046875, 2.1318359375, 3.143798828125, 4.15576171875, 5.167724609375, 6.1796875, 7.191650390625, 8.20361328125, 9.215576171875, 10.2275390625, 11.239501953125, 12.25146484375, 13.263427734375, 14.275390625, 15.287353515625, 16.29931640625, 17.311279296875, 18.3232421875, 19.335205078125, 20.34716796875, 21.359130859375, 22.37109375, 23.383056640625, 24.39501953125, 25.406982421875, 26.4189453125, 27.430908203125, 28.44287109375, 29.454833984375, 30.466796875, 31.478759765625, 32.49072265625, 33.502685546875, 34.5146484375, 35.526611328125, 36.53857421875, 37.550537109375, 38.5625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 9.0, 31.0, 695.0, 3216.0, 95.0, 28.0, 7.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3046875, -5.2008514404296875, -5.097015380859375, -4.9931793212890625, -4.88934326171875, -4.7855072021484375, -4.681671142578125, -4.5778350830078125, -4.4739990234375, -4.3701629638671875, -4.266326904296875, -4.1624908447265625, -4.05865478515625, -3.9548187255859375, -3.850982666015625, -3.7471466064453125, -3.643310546875, -3.5394744873046875, -3.435638427734375, -3.3318023681640625, -3.22796630859375, -3.1241302490234375, -3.020294189453125, -2.9164581298828125, -2.8126220703125, -2.7087860107421875, -2.604949951171875, -2.5011138916015625, -2.39727783203125, -2.2934417724609375, -2.189605712890625, -2.0857696533203125, -1.98193359375, -1.8780975341796875, -1.774261474609375, -1.6704254150390625, -1.56658935546875, -1.4627532958984375, -1.358917236328125, -1.2550811767578125, -1.1512451171875, -1.0474090576171875, -0.943572998046875, -0.8397369384765625, -0.73590087890625, -0.6320648193359375, -0.528228759765625, -0.4243927001953125, -0.320556640625, -0.2167205810546875, -0.112884521484375, -0.0090484619140625, 0.09478759765625, 0.1986236572265625, 0.302459716796875, 0.4062957763671875, 0.5101318359375, 0.6139678955078125, 0.717803955078125, 0.8216400146484375, 0.92547607421875, 1.0293121337890625, 1.133148193359375, 1.2369842529296875, 1.3408203125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 6.0, 11.0, 59.0, 191.0, 528.0, 132.0, 42.0, 13.0, 8.0, 10.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.91761016845703, -33.957275390625, -32.9969367980957, -32.03660202026367, -31.076265335083008, -30.115928649902344, -29.155593872070312, -28.19525718688965, -27.234920501708984, -26.27458381652832, -25.31424903869629, -24.353912353515625, -23.39357566833496, -22.433238983154297, -21.472904205322266, -20.5125675201416, -19.55223274230957, -18.591896057128906, -17.631561279296875, -16.67122459411621, -15.710887908935547, -14.7505521774292, -13.790216445922852, -12.829879760742188, -11.86954402923584, -10.909208297729492, -9.948871612548828, -8.98853588104248, -8.028200149536133, -7.067863464355469, -6.107527732849121, -5.147191524505615, -4.186855316162109, -3.2265191078186035, -2.2661831378936768, -1.30584716796875, -0.34551095962524414, 0.6148252487182617, 1.5751609802246094, 2.5354971885681152, 3.495833396911621, 4.456169605255127, 5.416505813598633, 6.3768415451049805, 7.337177753448486, 8.297513961791992, 9.25784969329834, 10.218185424804688, 11.178522109985352, 12.1388578414917, 13.099194526672363, 14.059530258178711, 15.019866943359375, 15.980202674865723, 16.94053840637207, 17.900875091552734, 18.861209869384766, 19.82154655456543, 20.78188133239746, 21.742218017578125, 22.70255470275879, 23.662891387939453, 24.623226165771484, 25.58356285095215, 26.543899536132812]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 18.0, 23.0, 42.0, 83.0, 137.0, 147.0, 143.0, 152.0, 104.0, 69.0, 42.0, 18.0, 10.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.900402069091797, -17.323759078979492, -16.747116088867188, -16.170475006103516, -15.593832015991211, -15.017189025878906, -14.440546989440918, -13.86390495300293, -13.287261962890625, -12.71061897277832, -12.133976936340332, -11.557334899902344, -10.980691909790039, -10.404048919677734, -9.827406883239746, -9.250764846801758, -8.674121856689453, -8.097478866577148, -7.52083683013916, -6.944194316864014, -6.367551803588867, -5.790909290313721, -5.214266777038574, -4.637624263763428, -4.060981750488281, -3.4843392372131348, -2.9076967239379883, -2.331054210662842, -1.7544116973876953, -1.1777691841125488, -0.6011266708374023, -0.02448415756225586, 0.5521602630615234, 1.12880277633667, 1.7054452896118164, 2.282087802886963, 2.8587303161621094, 3.435372829437256, 4.012015342712402, 4.588657855987549, 5.165300369262695, 5.741942882537842, 6.318585395812988, 6.895227909088135, 7.471870422363281, 8.048513412475586, 8.625155448913574, 9.201797485351562, 9.778440475463867, 10.355083465576172, 10.93172550201416, 11.508367538452148, 12.085010528564453, 12.661653518676758, 13.238295555114746, 13.814937591552734, 14.391580581665039, 14.968223571777344, 15.544865608215332, 16.12150764465332, 16.698150634765625, 17.27479362487793, 17.851436614990234, 18.428077697753906, 19.00472068786621]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 5.0, 8.0, 12.0, 8.0, 10.0, 19.0, 25.0, 42.0, 56.0, 82.0, 137.0, 223.0, 472.0, 1221.0, 4247.0, 36116.0, 846199.0, 146645.0, 9496.0, 2023.0, 728.0, 316.0, 156.0, 97.0, 61.0, 31.0, 34.0, 24.0, 18.0, 13.0, 9.0, 3.0, 10.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-12.296875, -11.9873046875, -11.677734375, -11.3681640625, -11.05859375, -10.7490234375, -10.439453125, -10.1298828125, -9.8203125, -9.5107421875, -9.201171875, -8.8916015625, -8.58203125, -8.2724609375, -7.962890625, -7.6533203125, -7.34375, -7.0341796875, -6.724609375, -6.4150390625, -6.10546875, -5.7958984375, -5.486328125, -5.1767578125, -4.8671875, -4.5576171875, -4.248046875, -3.9384765625, -3.62890625, -3.3193359375, -3.009765625, -2.7001953125, -2.390625, -2.0810546875, -1.771484375, -1.4619140625, -1.15234375, -0.8427734375, -0.533203125, -0.2236328125, 0.0859375, 0.3955078125, 0.705078125, 1.0146484375, 1.32421875, 1.6337890625, 1.943359375, 2.2529296875, 2.5625, 2.8720703125, 3.181640625, 3.4912109375, 3.80078125, 4.1103515625, 4.419921875, 4.7294921875, 5.0390625, 5.3486328125, 5.658203125, 5.9677734375, 6.27734375, 6.5869140625, 6.896484375, 7.2060546875, 7.515625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 10.0, 33.0, 45.0, 82.0, 113.0, 175.0, 175.0, 148.0, 97.0, 70.0, 26.0, 16.0, 7.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.416015625, -1.3846282958984375, -1.353240966796875, -1.3218536376953125, -1.29046630859375, -1.2590789794921875, -1.227691650390625, -1.1963043212890625, -1.1649169921875, -1.1335296630859375, -1.102142333984375, -1.0707550048828125, -1.03936767578125, -1.0079803466796875, -0.976593017578125, -0.9452056884765625, -0.913818359375, -0.8824310302734375, -0.851043701171875, -0.8196563720703125, -0.78826904296875, -0.7568817138671875, -0.725494384765625, -0.6941070556640625, -0.6627197265625, -0.6313323974609375, -0.599945068359375, -0.5685577392578125, -0.53717041015625, -0.5057830810546875, -0.474395751953125, -0.4430084228515625, -0.41162109375, -0.3802337646484375, -0.348846435546875, -0.3174591064453125, -0.28607177734375, -0.2546844482421875, -0.223297119140625, -0.1919097900390625, -0.1605224609375, -0.1291351318359375, -0.097747802734375, -0.0663604736328125, -0.03497314453125, -0.0035858154296875, 0.027801513671875, 0.0591888427734375, 0.090576171875, 0.1219635009765625, 0.153350830078125, 0.1847381591796875, 0.21612548828125, 0.2475128173828125, 0.278900146484375, 0.3102874755859375, 0.3416748046875, 0.3730621337890625, 0.404449462890625, 0.4358367919921875, 0.46722412109375, 0.4986114501953125, 0.529998779296875, 0.5613861083984375, 0.5927734375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 7.0, 15.0, 17.0, 30.0, 24.0, 41.0, 48.0, 85.0, 118.0, 205.0, 309.0, 522.0, 978.0, 2166.0, 5188.0, 14144.0, 50524.0, 264538.0, 562995.0, 106394.0, 25639.0, 8138.0, 3120.0, 1372.0, 696.0, 424.0, 245.0, 170.0, 105.0, 75.0, 56.0, 33.0, 27.0, 26.0, 19.0, 18.0, 9.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.9296875, -2.838836669921875, -2.74798583984375, -2.657135009765625, -2.5662841796875, -2.475433349609375, -2.38458251953125, -2.293731689453125, -2.202880859375, -2.112030029296875, -2.02117919921875, -1.930328369140625, -1.8394775390625, -1.748626708984375, -1.65777587890625, -1.566925048828125, -1.47607421875, -1.385223388671875, -1.29437255859375, -1.203521728515625, -1.1126708984375, -1.021820068359375, -0.93096923828125, -0.840118408203125, -0.749267578125, -0.658416748046875, -0.56756591796875, -0.476715087890625, -0.3858642578125, -0.295013427734375, -0.20416259765625, -0.113311767578125, -0.0224609375, 0.068389892578125, 0.15924072265625, 0.250091552734375, 0.3409423828125, 0.431793212890625, 0.52264404296875, 0.613494873046875, 0.704345703125, 0.795196533203125, 0.88604736328125, 0.976898193359375, 1.0677490234375, 1.158599853515625, 1.24945068359375, 1.340301513671875, 1.43115234375, 1.522003173828125, 1.61285400390625, 1.703704833984375, 1.7945556640625, 1.885406494140625, 1.97625732421875, 2.067108154296875, 2.157958984375, 2.248809814453125, 2.33966064453125, 2.430511474609375, 2.5213623046875, 2.612213134765625, 2.70306396484375, 2.793914794921875, 2.884765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 4.0, 3.0, 4.0, 8.0, 6.0, 12.0, 12.0, 15.0, 26.0, 39.0, 44.0, 52.0, 57.0, 63.0, 64.0, 56.0, 55.0, 67.0, 57.0, 52.0, 52.0, 44.0, 47.0, 23.0, 26.0, 32.0, 16.0, 14.0, 8.0, 14.0, 7.0, 1.0, 8.0, 3.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8857421875, -1.8245391845703125, -1.763336181640625, -1.7021331787109375, -1.64093017578125, -1.5797271728515625, -1.518524169921875, -1.4573211669921875, -1.3961181640625, -1.3349151611328125, -1.273712158203125, -1.2125091552734375, -1.15130615234375, -1.0901031494140625, -1.028900146484375, -0.9676971435546875, -0.906494140625, -0.8452911376953125, -0.784088134765625, -0.7228851318359375, -0.66168212890625, -0.6004791259765625, -0.539276123046875, -0.4780731201171875, -0.4168701171875, -0.3556671142578125, -0.294464111328125, -0.2332611083984375, -0.17205810546875, -0.1108551025390625, -0.049652099609375, 0.0115509033203125, 0.07275390625, 0.1339569091796875, 0.195159912109375, 0.2563629150390625, 0.31756591796875, 0.3787689208984375, 0.439971923828125, 0.5011749267578125, 0.5623779296875, 0.6235809326171875, 0.684783935546875, 0.7459869384765625, 0.80718994140625, 0.8683929443359375, 0.929595947265625, 0.9907989501953125, 1.052001953125, 1.1132049560546875, 1.174407958984375, 1.2356109619140625, 1.29681396484375, 1.3580169677734375, 1.419219970703125, 1.4804229736328125, 1.5416259765625, 1.6028289794921875, 1.664031982421875, 1.7252349853515625, 1.78643798828125, 1.8476409912109375, 1.908843994140625, 1.9700469970703125, 2.03125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 8.0, 7.0, 12.0, 13.0, 20.0, 31.0, 67.0, 136.0, 321.0, 901.0, 3570.0, 30665.0, 967866.0, 39163.0, 4117.0, 1025.0, 339.0, 126.0, 73.0, 40.0, 24.0, 7.0, 6.0, 11.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.625, -8.4222412109375, -8.219482421875, -8.0167236328125, -7.81396484375, -7.6112060546875, -7.408447265625, -7.2056884765625, -7.0029296875, -6.8001708984375, -6.597412109375, -6.3946533203125, -6.19189453125, -5.9891357421875, -5.786376953125, -5.5836181640625, -5.380859375, -5.1781005859375, -4.975341796875, -4.7725830078125, -4.56982421875, -4.3670654296875, -4.164306640625, -3.9615478515625, -3.7587890625, -3.5560302734375, -3.353271484375, -3.1505126953125, -2.94775390625, -2.7449951171875, -2.542236328125, -2.3394775390625, -2.13671875, -1.9339599609375, -1.731201171875, -1.5284423828125, -1.32568359375, -1.1229248046875, -0.920166015625, -0.7174072265625, -0.5146484375, -0.3118896484375, -0.109130859375, 0.0936279296875, 0.29638671875, 0.4991455078125, 0.701904296875, 0.9046630859375, 1.107421875, 1.3101806640625, 1.512939453125, 1.7156982421875, 1.91845703125, 2.1212158203125, 2.323974609375, 2.5267333984375, 2.7294921875, 2.9322509765625, 3.135009765625, 3.3377685546875, 3.54052734375, 3.7432861328125, 3.946044921875, 4.1488037109375, 4.3515625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 4.0, 6.0, 14.0, 18.0, 18.0, 37.0, 54.0, 104.0, 163.0, 242.0, 130.0, 72.0, 54.0, 29.0, 18.0, 14.0, 10.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004093647003173828, -0.0003977753221988678, -0.0003861859440803528, -0.00037459656596183777, -0.00036300718784332275, -0.00035141780972480774, -0.0003398284316062927, -0.0003282390534877777, -0.0003166496753692627, -0.0003050602972507477, -0.00029347091913223267, -0.00028188154101371765, -0.00027029216289520264, -0.0002587027847766876, -0.0002471134066581726, -0.0002355240285396576, -0.00022393465042114258, -0.00021234527230262756, -0.00020075589418411255, -0.00018916651606559753, -0.00017757713794708252, -0.0001659877598285675, -0.0001543983817100525, -0.00014280900359153748, -0.00013121962547302246, -0.00011963024735450745, -0.00010804086923599243, -9.645149111747742e-05, -8.48621129989624e-05, -7.327273488044739e-05, -6.168335676193237e-05, -5.009397864341736e-05, -3.8504600524902344e-05, -2.691522240638733e-05, -1.5325844287872314e-05, -3.7364661693573e-06, 7.852911949157715e-06, 1.944229006767273e-05, 3.1031668186187744e-05, 4.262104630470276e-05, 5.4210424423217773e-05, 6.579980254173279e-05, 7.73891806602478e-05, 8.897855877876282e-05, 0.00010056793689727783, 0.00011215731501579285, 0.00012374669313430786, 0.00013533607125282288, 0.0001469254493713379, 0.0001585148274898529, 0.00017010420560836792, 0.00018169358372688293, 0.00019328296184539795, 0.00020487233996391296, 0.00021646171808242798, 0.000228051096200943, 0.000239640474319458, 0.000251229852437973, 0.00026281923055648804, 0.00027440860867500305, 0.00028599798679351807, 0.0002975873649120331, 0.0003091767430305481, 0.0003207661211490631, 0.0003323554992675781]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 1.0, 5.0, 4.0, 5.0, 13.0, 15.0, 21.0, 30.0, 41.0, 84.0, 152.0, 260.0, 622.0, 1559.0, 5368.0, 27997.0, 854306.0, 141064.0, 12005.0, 2997.0, 1016.0, 428.0, 235.0, 124.0, 75.0, 52.0, 24.0, 23.0, 8.0, 10.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.53125, -4.39300537109375, -4.2547607421875, -4.11651611328125, -3.978271484375, -3.84002685546875, -3.7017822265625, -3.56353759765625, -3.42529296875, -3.28704833984375, -3.1488037109375, -3.01055908203125, -2.872314453125, -2.73406982421875, -2.5958251953125, -2.45758056640625, -2.3193359375, -2.18109130859375, -2.0428466796875, -1.90460205078125, -1.766357421875, -1.62811279296875, -1.4898681640625, -1.35162353515625, -1.21337890625, -1.07513427734375, -0.9368896484375, -0.79864501953125, -0.660400390625, -0.52215576171875, -0.3839111328125, -0.24566650390625, -0.107421875, 0.03082275390625, 0.1690673828125, 0.30731201171875, 0.445556640625, 0.58380126953125, 0.7220458984375, 0.86029052734375, 0.99853515625, 1.13677978515625, 1.2750244140625, 1.41326904296875, 1.551513671875, 1.68975830078125, 1.8280029296875, 1.96624755859375, 2.1044921875, 2.24273681640625, 2.3809814453125, 2.51922607421875, 2.657470703125, 2.79571533203125, 2.9339599609375, 3.07220458984375, 3.21044921875, 3.34869384765625, 3.4869384765625, 3.62518310546875, 3.763427734375, 3.90167236328125, 4.0399169921875, 4.17816162109375, 4.31640625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 12.0, 8.0, 8.0, 18.0, 10.0, 32.0, 66.0, 116.0, 172.0, 194.0, 153.0, 75.0, 50.0, 31.0, 12.0, 11.0, 5.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.787109375, -1.72991943359375, -1.6727294921875, -1.61553955078125, -1.558349609375, -1.50115966796875, -1.4439697265625, -1.38677978515625, -1.32958984375, -1.27239990234375, -1.2152099609375, -1.15802001953125, -1.100830078125, -1.04364013671875, -0.9864501953125, -0.92926025390625, -0.8720703125, -0.81488037109375, -0.7576904296875, -0.70050048828125, -0.643310546875, -0.58612060546875, -0.5289306640625, -0.47174072265625, -0.41455078125, -0.35736083984375, -0.3001708984375, -0.24298095703125, -0.185791015625, -0.12860107421875, -0.0714111328125, -0.01422119140625, 0.04296875, 0.10015869140625, 0.1573486328125, 0.21453857421875, 0.271728515625, 0.32891845703125, 0.3861083984375, 0.44329833984375, 0.50048828125, 0.55767822265625, 0.6148681640625, 0.67205810546875, 0.729248046875, 0.78643798828125, 0.8436279296875, 0.90081787109375, 0.9580078125, 1.01519775390625, 1.0723876953125, 1.12957763671875, 1.186767578125, 1.24395751953125, 1.3011474609375, 1.35833740234375, 1.41552734375, 1.47271728515625, 1.5299072265625, 1.58709716796875, 1.644287109375, 1.70147705078125, 1.7586669921875, 1.81585693359375, 1.873046875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 24.0, 385.0, 554.0, 40.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-150.13058471679688, -147.133056640625, -144.1355438232422, -141.13803100585938, -138.1405029296875, -135.14297485351562, -132.1454620361328, -129.14794921875, -126.15042114257812, -123.15290069580078, -120.15538024902344, -117.1578598022461, -114.16033935546875, -111.1628189086914, -108.16529846191406, -105.16777801513672, -102.17025756835938, -99.17273712158203, -96.17521667480469, -93.17769622802734, -90.18017578125, -87.18265533447266, -84.18513488769531, -81.18761444091797, -78.19009399414062, -75.19257354736328, -72.19505310058594, -69.1975326538086, -66.20001220703125, -63.202491760253906, -60.20497131347656, -57.20745086669922, -54.209930419921875, -51.21240997314453, -48.21488952636719, -45.217369079589844, -42.2198486328125, -39.222328186035156, -36.22480773925781, -33.22728729248047, -30.229766845703125, -27.23224639892578, -24.234725952148438, -21.237205505371094, -18.23968505859375, -15.242164611816406, -12.244644165039062, -9.247123718261719, -6.249603271484375, -3.2520828247070312, -0.2545623779296875, 2.7429580688476562, 5.740478515625, 8.737998962402344, 11.735519409179688, 14.733039855957031, 17.730560302734375, 20.72808074951172, 23.725601196289062, 26.723121643066406, 29.72064208984375, 32.718162536621094, 35.71568298339844, 38.71320343017578, 41.710723876953125]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 12.0, 11.0, 20.0, 20.0, 26.0, 40.0, 40.0, 45.0, 36.0, 54.0, 54.0, 45.0, 69.0, 54.0, 46.0, 55.0, 60.0, 54.0, 54.0, 37.0, 27.0, 22.0, 20.0, 22.0, 13.0, 18.0, 9.0, 6.0, 5.0, 6.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.633420944213867, -10.228638648986816, -9.823857307434082, -9.419075012207031, -9.01429271697998, -8.609511375427246, -8.204729080200195, -7.799947261810303, -7.39516544342041, -6.990383625030518, -6.585601329803467, -6.180819511413574, -5.776037693023682, -5.371255874633789, -4.966473579406738, -4.561691761016846, -4.156909465789795, -3.7521274089813232, -3.3473455905914307, -2.942563533782959, -2.5377817153930664, -2.1329996585845947, -1.728217601776123, -1.3234357833862305, -0.9186537265777588, -0.5138717889785767, -0.10908979177474976, 0.29569220542907715, 0.7004741430282593, 1.1052560806274414, 1.510038137435913, 1.9148199558258057, 2.3196020126342773, 2.724384069442749, 3.1291658878326416, 3.5339479446411133, 3.938729763031006, 4.343511581420898, 4.748293876647949, 5.153075695037842, 5.557857513427734, 5.962639331817627, 6.367421627044678, 6.77220344543457, 7.176985263824463, 7.5817670822143555, 7.986549377441406, 8.39133071899414, 8.796113967895508, 9.200896263122559, 9.605677604675293, 10.010459899902344, 10.415242195129395, 10.820023536682129, 11.22480583190918, 11.629587173461914, 12.034369468688965, 12.439151763916016, 12.84393310546875, 13.2487154006958, 13.653497695922852, 14.058279037475586, 14.463061332702637, 14.867843627929688, 15.272624969482422]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 1.0, 3.0, 1.0, 5.0, 7.0, 8.0, 7.0, 7.0, 5.0, 12.0, 8.0, 19.0, 21.0, 25.0, 31.0, 52.0, 67.0, 102.0, 148.0, 252.0, 467.0, 1197.0, 4314.0, 26137.0, 4049533.0, 98200.0, 10349.0, 2191.0, 645.0, 249.0, 98.0, 61.0, 33.0, 15.0, 13.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.375, -18.96044921875, -18.5458984375, -18.13134765625, -17.716796875, -17.30224609375, -16.8876953125, -16.47314453125, -16.05859375, -15.64404296875, -15.2294921875, -14.81494140625, -14.400390625, -13.98583984375, -13.5712890625, -13.15673828125, -12.7421875, -12.32763671875, -11.9130859375, -11.49853515625, -11.083984375, -10.66943359375, -10.2548828125, -9.84033203125, -9.42578125, -9.01123046875, -8.5966796875, -8.18212890625, -7.767578125, -7.35302734375, -6.9384765625, -6.52392578125, -6.109375, -5.69482421875, -5.2802734375, -4.86572265625, -4.451171875, -4.03662109375, -3.6220703125, -3.20751953125, -2.79296875, -2.37841796875, -1.9638671875, -1.54931640625, -1.134765625, -0.72021484375, -0.3056640625, 0.10888671875, 0.5234375, 0.93798828125, 1.3525390625, 1.76708984375, 2.181640625, 2.59619140625, 3.0107421875, 3.42529296875, 3.83984375, 4.25439453125, 4.6689453125, 5.08349609375, 5.498046875, 5.91259765625, 6.3271484375, 6.74169921875, 7.15625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 8.0, 5.0, 13.0, 32.0, 52.0, 85.0, 106.0, 122.0, 141.0, 134.0, 116.0, 73.0, 46.0, 39.0, 18.0, 2.0, 2.0, 5.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.287109375, -1.2593917846679688, -1.2316741943359375, -1.2039566040039062, -1.176239013671875, -1.1485214233398438, -1.1208038330078125, -1.0930862426757812, -1.06536865234375, -1.0376510620117188, -1.0099334716796875, -0.9822158813476562, -0.954498291015625, -0.9267807006835938, -0.8990631103515625, -0.8713455200195312, -0.8436279296875, -0.8159103393554688, -0.7881927490234375, -0.7604751586914062, -0.732757568359375, -0.7050399780273438, -0.6773223876953125, -0.6496047973632812, -0.62188720703125, -0.5941696166992188, -0.5664520263671875, -0.5387344360351562, -0.511016845703125, -0.48329925537109375, -0.4555816650390625, -0.42786407470703125, -0.400146484375, -0.37242889404296875, -0.3447113037109375, -0.31699371337890625, -0.289276123046875, -0.26155853271484375, -0.2338409423828125, -0.20612335205078125, -0.17840576171875, -0.15068817138671875, -0.1229705810546875, -0.09525299072265625, -0.067535400390625, -0.03981781005859375, -0.0121002197265625, 0.01561737060546875, 0.0433349609375, 0.07105255126953125, 0.0987701416015625, 0.12648773193359375, 0.154205322265625, 0.18192291259765625, 0.2096405029296875, 0.23735809326171875, 0.26507568359375, 0.29279327392578125, 0.3205108642578125, 0.34822845458984375, 0.375946044921875, 0.40366363525390625, 0.4313812255859375, 0.45909881591796875, 0.48681640625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 8.0, 8.0, 18.0, 20.0, 32.0, 46.0, 73.0, 108.0, 233.0, 381.0, 1162.0, 49429.0, 4138417.0, 3408.0, 479.0, 222.0, 95.0, 56.0, 37.0, 19.0, 15.0, 9.0, 4.0, 1.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-36.375, -35.37060546875, -34.3662109375, -33.36181640625, -32.357421875, -31.35302734375, -30.3486328125, -29.34423828125, -28.33984375, -27.33544921875, -26.3310546875, -25.32666015625, -24.322265625, -23.31787109375, -22.3134765625, -21.30908203125, -20.3046875, -19.30029296875, -18.2958984375, -17.29150390625, -16.287109375, -15.28271484375, -14.2783203125, -13.27392578125, -12.26953125, -11.26513671875, -10.2607421875, -9.25634765625, -8.251953125, -7.24755859375, -6.2431640625, -5.23876953125, -4.234375, -3.22998046875, -2.2255859375, -1.22119140625, -0.216796875, 0.78759765625, 1.7919921875, 2.79638671875, 3.80078125, 4.80517578125, 5.8095703125, 6.81396484375, 7.818359375, 8.82275390625, 9.8271484375, 10.83154296875, 11.8359375, 12.84033203125, 13.8447265625, 14.84912109375, 15.853515625, 16.85791015625, 17.8623046875, 18.86669921875, 19.87109375, 20.87548828125, 21.8798828125, 22.88427734375, 23.888671875, 24.89306640625, 25.8974609375, 26.90185546875, 27.90625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 20.0, 41.0, 89.0, 2745.0, 997.0, 90.0, 44.0, 24.0, 18.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.69140625, -5.583892822265625, -5.47637939453125, -5.368865966796875, -5.2613525390625, -5.153839111328125, -5.04632568359375, -4.938812255859375, -4.831298828125, -4.723785400390625, -4.61627197265625, -4.508758544921875, -4.4012451171875, -4.293731689453125, -4.18621826171875, -4.078704833984375, -3.97119140625, -3.863677978515625, -3.75616455078125, -3.648651123046875, -3.5411376953125, -3.433624267578125, -3.32611083984375, -3.218597412109375, -3.111083984375, -3.003570556640625, -2.89605712890625, -2.788543701171875, -2.6810302734375, -2.573516845703125, -2.46600341796875, -2.358489990234375, -2.2509765625, -2.143463134765625, -2.03594970703125, -1.928436279296875, -1.8209228515625, -1.713409423828125, -1.60589599609375, -1.498382568359375, -1.390869140625, -1.283355712890625, -1.17584228515625, -1.068328857421875, -0.9608154296875, -0.853302001953125, -0.74578857421875, -0.638275146484375, -0.53076171875, -0.423248291015625, -0.31573486328125, -0.208221435546875, -0.1007080078125, 0.006805419921875, 0.11431884765625, 0.221832275390625, 0.329345703125, 0.436859130859375, 0.54437255859375, 0.651885986328125, 0.7593994140625, 0.866912841796875, 0.97442626953125, 1.081939697265625, 1.189453125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 15.0, 62.0, 485.0, 366.0, 48.0, 10.0, 9.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.46833038330078, -21.216089248657227, -19.963848114013672, -18.711606979370117, -17.459365844726562, -16.207122802734375, -14.95488166809082, -13.702640533447266, -12.450399398803711, -11.198158264160156, -9.945917129516602, -8.69367504119873, -7.441433906555176, -6.189192771911621, -4.936951160430908, -3.6847095489501953, -2.4324684143066406, -1.1802270412445068, 0.07201433181762695, 1.3242557048797607, 2.5764970779418945, 3.828738212585449, 5.080979824066162, 6.333221435546875, 7.58546257019043, 8.837703704833984, 10.089944839477539, 11.34218692779541, 12.594428062438965, 13.84666919708252, 15.09891128540039, 16.351152420043945, 17.603397369384766, 18.85563850402832, 20.107879638671875, 21.36012077331543, 22.612361907958984, 23.864604949951172, 25.116846084594727, 26.36908721923828, 27.621328353881836, 28.87356948852539, 30.125810623168945, 31.3780517578125, 32.63029479980469, 33.88253402709961, 35.1347770690918, 36.38701629638672, 37.639259338378906, 38.891502380371094, 40.143741607666016, 41.3959846496582, 42.648223876953125, 43.90046691894531, 45.152706146240234, 46.40494918823242, 47.657188415527344, 48.90943145751953, 50.16167068481445, 51.41391372680664, 52.66615295410156, 53.91839599609375, 55.17063522338867, 56.42287826538086, 57.67512130737305]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 10.0, 24.0, 37.0, 50.0, 67.0, 90.0, 97.0, 99.0, 91.0, 105.0, 74.0, 65.0, 60.0, 46.0, 31.0, 13.0, 9.0, 13.0, 5.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.894081115722656, -8.588213920593262, -8.28234577178955, -7.976478099822998, -7.670610427856445, -7.364743232727051, -7.058875560760498, -6.753007888793945, -6.447140216827393, -6.14127254486084, -5.835404872894287, -5.529537200927734, -5.22367000579834, -4.917801856994629, -4.611934661865234, -4.306066989898682, -4.000199317932129, -3.694331645965576, -3.3884639739990234, -3.08259654045105, -2.776728868484497, -2.4708611965179443, -2.1649937629699707, -1.859126091003418, -1.5532584190368652, -1.2473907470703125, -0.9415231943130493, -0.6356555819511414, -0.3297879695892334, -0.023920297622680664, 0.2819472551345825, 0.5878148078918457, 0.8936834335327148, 1.1995511054992676, 1.5054186582565308, 1.811286211013794, 2.1171538829803467, 2.4230215549468994, 2.728888988494873, 3.034756660461426, 3.3406243324279785, 3.6464920043945312, 3.952359676361084, 4.258227348327637, 4.564094543457031, 4.869962692260742, 5.175829887390137, 5.4816975593566895, 5.787565231323242, 6.093432903289795, 6.399300575256348, 6.7051682472229, 7.011035919189453, 7.316903114318848, 7.6227707862854, 7.928638458251953, 8.234506607055664, 8.540373802185059, 8.84624195098877, 9.152109146118164, 9.457977294921875, 9.76384449005127, 10.06971263885498, 10.375579833984375, 10.68144702911377]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 8.0, 14.0, 15.0, 15.0, 30.0, 51.0, 62.0, 93.0, 121.0, 204.0, 297.0, 522.0, 1014.0, 2372.0, 7421.0, 32821.0, 291166.0, 636005.0, 58661.0, 11321.0, 3315.0, 1325.0, 635.0, 354.0, 217.0, 131.0, 83.0, 73.0, 51.0, 37.0, 19.0, 16.0, 18.0, 16.0, 12.0, 2.0, 11.0, 6.0, 1.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-6.29296875, -6.0972900390625, -5.901611328125, -5.7059326171875, -5.51025390625, -5.3145751953125, -5.118896484375, -4.9232177734375, -4.7275390625, -4.5318603515625, -4.336181640625, -4.1405029296875, -3.94482421875, -3.7491455078125, -3.553466796875, -3.3577880859375, -3.162109375, -2.9664306640625, -2.770751953125, -2.5750732421875, -2.37939453125, -2.1837158203125, -1.988037109375, -1.7923583984375, -1.5966796875, -1.4010009765625, -1.205322265625, -1.0096435546875, -0.81396484375, -0.6182861328125, -0.422607421875, -0.2269287109375, -0.03125, 0.1644287109375, 0.360107421875, 0.5557861328125, 0.75146484375, 0.9471435546875, 1.142822265625, 1.3385009765625, 1.5341796875, 1.7298583984375, 1.925537109375, 2.1212158203125, 2.31689453125, 2.5125732421875, 2.708251953125, 2.9039306640625, 3.099609375, 3.2952880859375, 3.490966796875, 3.6866455078125, 3.88232421875, 4.0780029296875, 4.273681640625, 4.4693603515625, 4.6650390625, 4.8607177734375, 5.056396484375, 5.2520751953125, 5.44775390625, 5.6434326171875, 5.839111328125, 6.0347900390625, 6.23046875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 11.0, 5.0, 13.0, 21.0, 27.0, 67.0, 73.0, 91.0, 104.0, 122.0, 114.0, 124.0, 82.0, 49.0, 36.0, 28.0, 21.0, 8.0, 4.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.330078125, -1.2981491088867188, -1.2662200927734375, -1.2342910766601562, -1.202362060546875, -1.1704330444335938, -1.1385040283203125, -1.1065750122070312, -1.07464599609375, -1.0427169799804688, -1.0107879638671875, -0.9788589477539062, -0.946929931640625, -0.9150009155273438, -0.8830718994140625, -0.8511428833007812, -0.8192138671875, -0.7872848510742188, -0.7553558349609375, -0.7234268188476562, -0.691497802734375, -0.6595687866210938, -0.6276397705078125, -0.5957107543945312, -0.56378173828125, -0.5318527221679688, -0.4999237060546875, -0.46799468994140625, -0.436065673828125, -0.40413665771484375, -0.3722076416015625, -0.34027862548828125, -0.308349609375, -0.27642059326171875, -0.2444915771484375, -0.21256256103515625, -0.180633544921875, -0.14870452880859375, -0.1167755126953125, -0.08484649658203125, -0.05291748046875, -0.02098846435546875, 0.0109405517578125, 0.04286956787109375, 0.074798583984375, 0.10672760009765625, 0.1386566162109375, 0.17058563232421875, 0.2025146484375, 0.23444366455078125, 0.2663726806640625, 0.29830169677734375, 0.330230712890625, 0.36215972900390625, 0.3940887451171875, 0.42601776123046875, 0.45794677734375, 0.48987579345703125, 0.5218048095703125, 0.5537338256835938, 0.585662841796875, 0.6175918579101562, 0.6495208740234375, 0.6814498901367188, 0.71337890625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 8.0, 10.0, 12.0, 12.0, 21.0, 26.0, 45.0, 62.0, 63.0, 112.0, 190.0, 263.0, 399.0, 656.0, 1131.0, 2052.0, 3952.0, 8366.0, 19560.0, 52918.0, 179884.0, 498880.0, 187312.0, 54275.0, 20514.0, 8718.0, 4052.0, 2041.0, 1118.0, 673.0, 395.0, 263.0, 164.0, 120.0, 76.0, 63.0, 36.0, 24.0, 22.0, 20.0, 16.0, 10.0, 8.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.650390625, -2.568878173828125, -2.48736572265625, -2.405853271484375, -2.3243408203125, -2.242828369140625, -2.16131591796875, -2.079803466796875, -1.998291015625, -1.916778564453125, -1.83526611328125, -1.753753662109375, -1.6722412109375, -1.590728759765625, -1.50921630859375, -1.427703857421875, -1.34619140625, -1.264678955078125, -1.18316650390625, -1.101654052734375, -1.0201416015625, -0.938629150390625, -0.85711669921875, -0.775604248046875, -0.694091796875, -0.612579345703125, -0.53106689453125, -0.449554443359375, -0.3680419921875, -0.286529541015625, -0.20501708984375, -0.123504638671875, -0.0419921875, 0.039520263671875, 0.12103271484375, 0.202545166015625, 0.2840576171875, 0.365570068359375, 0.44708251953125, 0.528594970703125, 0.610107421875, 0.691619873046875, 0.77313232421875, 0.854644775390625, 0.9361572265625, 1.017669677734375, 1.09918212890625, 1.180694580078125, 1.26220703125, 1.343719482421875, 1.42523193359375, 1.506744384765625, 1.5882568359375, 1.669769287109375, 1.75128173828125, 1.832794189453125, 1.914306640625, 1.995819091796875, 2.07733154296875, 2.158843994140625, 2.2403564453125, 2.321868896484375, 2.40338134765625, 2.484893798828125, 2.56640625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 9.0, 7.0, 8.0, 16.0, 9.0, 11.0, 20.0, 22.0, 26.0, 22.0, 22.0, 34.0, 38.0, 47.0, 55.0, 46.0, 29.0, 53.0, 49.0, 47.0, 51.0, 49.0, 48.0, 46.0, 34.0, 34.0, 31.0, 30.0, 24.0, 19.0, 13.0, 16.0, 8.0, 8.0, 6.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.421875, -2.350616455078125, -2.27935791015625, -2.208099365234375, -2.1368408203125, -2.065582275390625, -1.99432373046875, -1.923065185546875, -1.851806640625, -1.780548095703125, -1.70928955078125, -1.638031005859375, -1.5667724609375, -1.495513916015625, -1.42425537109375, -1.352996826171875, -1.28173828125, -1.210479736328125, -1.13922119140625, -1.067962646484375, -0.9967041015625, -0.925445556640625, -0.85418701171875, -0.782928466796875, -0.711669921875, -0.640411376953125, -0.56915283203125, -0.497894287109375, -0.4266357421875, -0.355377197265625, -0.28411865234375, -0.212860107421875, -0.1416015625, -0.070343017578125, 0.00091552734375, 0.072174072265625, 0.1434326171875, 0.214691162109375, 0.28594970703125, 0.357208251953125, 0.428466796875, 0.499725341796875, 0.57098388671875, 0.642242431640625, 0.7135009765625, 0.784759521484375, 0.85601806640625, 0.927276611328125, 0.99853515625, 1.069793701171875, 1.14105224609375, 1.212310791015625, 1.2835693359375, 1.354827880859375, 1.42608642578125, 1.497344970703125, 1.568603515625, 1.639862060546875, 1.71112060546875, 1.782379150390625, 1.8536376953125, 1.924896240234375, 1.99615478515625, 2.067413330078125, 2.138671875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 14.0, 4.0, 16.0, 21.0, 29.0, 45.0, 79.0, 128.0, 228.0, 402.0, 922.0, 2523.0, 9003.0, 66907.0, 886867.0, 68004.0, 8983.0, 2517.0, 853.0, 413.0, 237.0, 121.0, 73.0, 59.0, 31.0, 25.0, 15.0, 8.0, 5.0, 8.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.5625, -4.444000244140625, -4.32550048828125, -4.207000732421875, -4.0885009765625, -3.970001220703125, -3.85150146484375, -3.733001708984375, -3.614501953125, -3.496002197265625, -3.37750244140625, -3.259002685546875, -3.1405029296875, -3.022003173828125, -2.90350341796875, -2.785003662109375, -2.66650390625, -2.548004150390625, -2.42950439453125, -2.311004638671875, -2.1925048828125, -2.074005126953125, -1.95550537109375, -1.837005615234375, -1.718505859375, -1.600006103515625, -1.48150634765625, -1.363006591796875, -1.2445068359375, -1.126007080078125, -1.00750732421875, -0.889007568359375, -0.7705078125, -0.652008056640625, -0.53350830078125, -0.415008544921875, -0.2965087890625, -0.178009033203125, -0.05950927734375, 0.058990478515625, 0.177490234375, 0.295989990234375, 0.41448974609375, 0.532989501953125, 0.6514892578125, 0.769989013671875, 0.88848876953125, 1.006988525390625, 1.12548828125, 1.243988037109375, 1.36248779296875, 1.480987548828125, 1.5994873046875, 1.717987060546875, 1.83648681640625, 1.954986572265625, 2.073486328125, 2.191986083984375, 2.31048583984375, 2.428985595703125, 2.5474853515625, 2.665985107421875, 2.78448486328125, 2.902984619140625, 3.021484375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 7.0, 8.0, 18.0, 22.0, 29.0, 47.0, 70.0, 173.0, 236.0, 164.0, 70.0, 45.0, 26.0, 20.0, 18.0, 15.0, 7.0, 8.0, 3.0, 7.0, 3.0, 1.0, 1.0, 2.0, 5.0, 0.0, 1.0], "bins": [-0.0006036758422851562, -0.0005904026329517365, -0.0005771294236183167, -0.0005638562142848969, -0.000550583004951477, -0.0005373097956180573, -0.0005240365862846375, -0.0005107633769512177, -0.0004974901676177979, -0.00048421695828437805, -0.00047094374895095825, -0.00045767053961753845, -0.00044439733028411865, -0.00043112412095069885, -0.00041785091161727905, -0.00040457770228385925, -0.00039130449295043945, -0.00037803128361701965, -0.00036475807428359985, -0.00035148486495018005, -0.00033821165561676025, -0.00032493844628334045, -0.00031166523694992065, -0.00029839202761650085, -0.00028511881828308105, -0.00027184560894966125, -0.00025857239961624146, -0.00024529919028282166, -0.00023202598094940186, -0.00021875277161598206, -0.00020547956228256226, -0.00019220635294914246, -0.00017893314361572266, -0.00016565993428230286, -0.00015238672494888306, -0.00013911351561546326, -0.00012584030628204346, -0.00011256709694862366, -9.929388761520386e-05, -8.602067828178406e-05, -7.274746894836426e-05, -5.947425961494446e-05, -4.620105028152466e-05, -3.292784094810486e-05, -1.965463161468506e-05, -6.381422281265259e-06, 6.891787052154541e-06, 2.016499638557434e-05, 3.343820571899414e-05, 4.671141505241394e-05, 5.998462438583374e-05, 7.325783371925354e-05, 8.653104305267334e-05, 9.980425238609314e-05, 0.00011307746171951294, 0.00012635067105293274, 0.00013962388038635254, 0.00015289708971977234, 0.00016617029905319214, 0.00017944350838661194, 0.00019271671772003174, 0.00020598992705345154, 0.00021926313638687134, 0.00023253634572029114, 0.00024580955505371094]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 8.0, 14.0, 9.0, 13.0, 13.0, 24.0, 22.0, 38.0, 72.0, 75.0, 111.0, 207.0, 265.0, 490.0, 793.0, 1411.0, 2649.0, 5336.0, 12444.0, 36278.0, 183814.0, 670083.0, 92419.0, 23748.0, 8889.0, 4184.0, 2111.0, 1191.0, 660.0, 431.0, 263.0, 161.0, 105.0, 74.0, 39.0, 28.0, 23.0, 13.0, 14.0, 5.0, 4.0, 6.0, 5.0, 3.0, 5.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.7705078125, -1.715728759765625, -1.66094970703125, -1.606170654296875, -1.5513916015625, -1.496612548828125, -1.44183349609375, -1.387054443359375, -1.332275390625, -1.277496337890625, -1.22271728515625, -1.167938232421875, -1.1131591796875, -1.058380126953125, -1.00360107421875, -0.948822021484375, -0.89404296875, -0.839263916015625, -0.78448486328125, -0.729705810546875, -0.6749267578125, -0.620147705078125, -0.56536865234375, -0.510589599609375, -0.455810546875, -0.401031494140625, -0.34625244140625, -0.291473388671875, -0.2366943359375, -0.181915283203125, -0.12713623046875, -0.072357177734375, -0.017578125, 0.037200927734375, 0.09197998046875, 0.146759033203125, 0.2015380859375, 0.256317138671875, 0.31109619140625, 0.365875244140625, 0.420654296875, 0.475433349609375, 0.53021240234375, 0.584991455078125, 0.6397705078125, 0.694549560546875, 0.74932861328125, 0.804107666015625, 0.85888671875, 0.913665771484375, 0.96844482421875, 1.023223876953125, 1.0780029296875, 1.132781982421875, 1.18756103515625, 1.242340087890625, 1.297119140625, 1.351898193359375, 1.40667724609375, 1.461456298828125, 1.5162353515625, 1.571014404296875, 1.62579345703125, 1.680572509765625, 1.7353515625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 10.0, 12.0, 13.0, 6.0, 16.0, 27.0, 35.0, 38.0, 54.0, 52.0, 84.0, 85.0, 104.0, 97.0, 61.0, 65.0, 48.0, 29.0, 29.0, 26.0, 22.0, 16.0, 10.0, 10.0, 6.0, 7.0, 7.0, 3.0, 3.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0546875, -1.0212249755859375, -0.987762451171875, -0.9542999267578125, -0.92083740234375, -0.8873748779296875, -0.853912353515625, -0.8204498291015625, -0.7869873046875, -0.7535247802734375, -0.720062255859375, -0.6865997314453125, -0.65313720703125, -0.6196746826171875, -0.586212158203125, -0.5527496337890625, -0.519287109375, -0.4858245849609375, -0.452362060546875, -0.4188995361328125, -0.38543701171875, -0.3519744873046875, -0.318511962890625, -0.2850494384765625, -0.2515869140625, -0.2181243896484375, -0.184661865234375, -0.1511993408203125, -0.11773681640625, -0.0842742919921875, -0.050811767578125, -0.0173492431640625, 0.01611328125, 0.0495758056640625, 0.083038330078125, 0.1165008544921875, 0.14996337890625, 0.1834259033203125, 0.216888427734375, 0.2503509521484375, 0.2838134765625, 0.3172760009765625, 0.350738525390625, 0.3842010498046875, 0.41766357421875, 0.4511260986328125, 0.484588623046875, 0.5180511474609375, 0.551513671875, 0.5849761962890625, 0.618438720703125, 0.6519012451171875, 0.68536376953125, 0.7188262939453125, 0.752288818359375, 0.7857513427734375, 0.8192138671875, 0.8526763916015625, 0.886138916015625, 0.9196014404296875, 0.95306396484375, 0.9865264892578125, 1.019989013671875, 1.0534515380859375, 1.0869140625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 33.0, 69.0, 156.0, 255.0, 224.0, 125.0, 62.0, 36.0, 11.0, 9.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.6658992767334, -27.667036056518555, -26.668170928955078, -25.669307708740234, -24.67044448852539, -23.671581268310547, -22.67271614074707, -21.673852920532227, -20.67498779296875, -19.676124572753906, -18.67725944519043, -17.678396224975586, -16.679533004760742, -15.680668830871582, -14.681804656982422, -13.682941436767578, -12.684078216552734, -11.685214042663574, -10.68635082244873, -9.68748664855957, -8.688623428344727, -7.689759254455566, -6.690895080566406, -5.692031383514404, -4.693167686462402, -3.6943039894104004, -2.6954400539398193, -1.6965761184692383, -0.6977124214172363, 0.3011512756347656, 1.3000154495239258, 2.2988791465759277, 3.2977447509765625, 4.2966084480285645, 5.295472145080566, 6.294336318969727, 7.2932000160217285, 8.29206371307373, 9.29092788696289, 10.289791107177734, 11.288655281066895, 12.287519454956055, 13.286382675170898, 14.285246849060059, 15.284111022949219, 16.282974243164062, 17.281837463378906, 18.280702590942383, 19.279565811157227, 20.27842903137207, 21.277294158935547, 22.27615737915039, 23.275020599365234, 24.273883819580078, 25.272748947143555, 26.2716121673584, 27.270477294921875, 28.26934051513672, 29.268205642700195, 30.26706886291504, 31.265932083129883, 32.26479721069336, 33.2636604309082, 34.26252365112305, 35.26138687133789]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 5.0, 9.0, 12.0, 19.0, 23.0, 22.0, 35.0, 35.0, 41.0, 60.0, 72.0, 73.0, 69.0, 77.0, 77.0, 57.0, 55.0, 63.0, 35.0, 36.0, 32.0, 28.0, 23.0, 15.0, 12.0, 6.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.603023529052734, -10.003554344177246, -9.404086112976074, -8.804616928100586, -8.205147743225098, -7.605679035186768, -7.0062103271484375, -6.406741142272949, -5.807272434234619, -5.207803726196289, -4.608334541320801, -4.008865833282471, -3.4093968868255615, -2.8099279403686523, -2.2104592323303223, -1.610990047454834, -1.011521339416504, -0.4120524525642395, 0.1874164342880249, 0.7868852615356445, 1.3863542079925537, 1.985823154449463, 2.585291862487793, 3.1847610473632812, 3.7842297554016113, 4.383698463439941, 4.98316764831543, 5.58263635635376, 6.18210506439209, 6.781574249267578, 7.381042957305908, 7.9805121421813965, 8.579980850219727, 9.179450035095215, 9.778918266296387, 10.378387451171875, 10.977856636047363, 11.577325820922852, 12.176794052124023, 12.776263236999512, 13.375732421875, 13.975201606750488, 14.57466983795166, 15.174139022827148, 15.773608207702637, 16.373077392578125, 16.972545623779297, 17.57201385498047, 18.17148208618164, 18.770950317382812, 19.370420455932617, 19.96988868713379, 20.56935691833496, 21.168827056884766, 21.768295288085938, 22.36776351928711, 22.967233657836914, 23.566701889038086, 24.16617202758789, 24.765640258789062, 25.365108489990234, 25.96457862854004, 26.56404685974121, 27.163516998291016, 27.762985229492188]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 7.0, 5.0, 5.0, 7.0, 6.0, 12.0, 10.0, 16.0, 19.0, 17.0, 24.0, 27.0, 27.0, 41.0, 56.0, 82.0, 101.0, 137.0, 206.0, 409.0, 851.0, 1976.0, 5782.0, 21060.0, 3967749.0, 172456.0, 15320.0, 4585.0, 1646.0, 715.0, 395.0, 202.0, 113.0, 62.0, 54.0, 31.0, 21.0, 13.0, 10.0, 6.0, 7.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0], "bins": [-14.390625, -14.03857421875, -13.6865234375, -13.33447265625, -12.982421875, -12.63037109375, -12.2783203125, -11.92626953125, -11.57421875, -11.22216796875, -10.8701171875, -10.51806640625, -10.166015625, -9.81396484375, -9.4619140625, -9.10986328125, -8.7578125, -8.40576171875, -8.0537109375, -7.70166015625, -7.349609375, -6.99755859375, -6.6455078125, -6.29345703125, -5.94140625, -5.58935546875, -5.2373046875, -4.88525390625, -4.533203125, -4.18115234375, -3.8291015625, -3.47705078125, -3.125, -2.77294921875, -2.4208984375, -2.06884765625, -1.716796875, -1.36474609375, -1.0126953125, -0.66064453125, -0.30859375, 0.04345703125, 0.3955078125, 0.74755859375, 1.099609375, 1.45166015625, 1.8037109375, 2.15576171875, 2.5078125, 2.85986328125, 3.2119140625, 3.56396484375, 3.916015625, 4.26806640625, 4.6201171875, 4.97216796875, 5.32421875, 5.67626953125, 6.0283203125, 6.38037109375, 6.732421875, 7.08447265625, 7.4365234375, 7.78857421875, 8.140625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 29.0, 42.0, 52.0, 79.0, 98.0, 115.0, 125.0, 138.0, 92.0, 77.0, 55.0, 34.0, 27.0, 10.0, 10.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3408203125, -1.3050918579101562, -1.2693634033203125, -1.2336349487304688, -1.197906494140625, -1.1621780395507812, -1.1264495849609375, -1.0907211303710938, -1.05499267578125, -1.0192642211914062, -0.9835357666015625, -0.9478073120117188, -0.912078857421875, -0.8763504028320312, -0.8406219482421875, -0.8048934936523438, -0.7691650390625, -0.7334365844726562, -0.6977081298828125, -0.6619796752929688, -0.626251220703125, -0.5905227661132812, -0.5547943115234375, -0.5190658569335938, -0.48333740234375, -0.44760894775390625, -0.4118804931640625, -0.37615203857421875, -0.340423583984375, -0.30469512939453125, -0.2689666748046875, -0.23323822021484375, -0.197509765625, -0.16178131103515625, -0.1260528564453125, -0.09032440185546875, -0.054595947265625, -0.01886749267578125, 0.0168609619140625, 0.05258941650390625, 0.08831787109375, 0.12404632568359375, 0.1597747802734375, 0.19550323486328125, 0.231231689453125, 0.26696014404296875, 0.3026885986328125, 0.33841705322265625, 0.3741455078125, 0.40987396240234375, 0.4456024169921875, 0.48133087158203125, 0.517059326171875, 0.5527877807617188, 0.5885162353515625, 0.6242446899414062, 0.65997314453125, 0.6957015991210938, 0.7314300537109375, 0.7671585083007812, 0.802886962890625, 0.8386154174804688, 0.8743438720703125, 0.9100723266601562, 0.94580078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 5.0, 16.0, 29.0, 35.0, 50.0, 79.0, 129.0, 223.0, 313.0, 491.0, 742.0, 1546.0, 3437.0, 9400.0, 40112.0, 3780604.0, 319205.0, 25076.0, 6956.0, 2566.0, 1274.0, 775.0, 433.0, 242.0, 155.0, 120.0, 77.0, 61.0, 37.0, 29.0, 17.0, 13.0, 10.0, 6.0, 4.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.68359375, -7.4566650390625, -7.229736328125, -7.0028076171875, -6.77587890625, -6.5489501953125, -6.322021484375, -6.0950927734375, -5.8681640625, -5.6412353515625, -5.414306640625, -5.1873779296875, -4.96044921875, -4.7335205078125, -4.506591796875, -4.2796630859375, -4.052734375, -3.8258056640625, -3.598876953125, -3.3719482421875, -3.14501953125, -2.9180908203125, -2.691162109375, -2.4642333984375, -2.2373046875, -2.0103759765625, -1.783447265625, -1.5565185546875, -1.32958984375, -1.1026611328125, -0.875732421875, -0.6488037109375, -0.421875, -0.1949462890625, 0.031982421875, 0.2589111328125, 0.48583984375, 0.7127685546875, 0.939697265625, 1.1666259765625, 1.3935546875, 1.6204833984375, 1.847412109375, 2.0743408203125, 2.30126953125, 2.5281982421875, 2.755126953125, 2.9820556640625, 3.208984375, 3.4359130859375, 3.662841796875, 3.8897705078125, 4.11669921875, 4.3436279296875, 4.570556640625, 4.7974853515625, 5.0244140625, 5.2513427734375, 5.478271484375, 5.7052001953125, 5.93212890625, 6.1590576171875, 6.385986328125, 6.6129150390625, 6.83984375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 8.0, 12.0, 11.0, 15.0, 17.0, 41.0, 65.0, 142.0, 866.0, 2524.0, 167.0, 70.0, 45.0, 35.0, 13.0, 16.0, 9.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6279296875, -1.5720367431640625, -1.516143798828125, -1.4602508544921875, -1.40435791015625, -1.3484649658203125, -1.292572021484375, -1.2366790771484375, -1.1807861328125, -1.1248931884765625, -1.069000244140625, -1.0131072998046875, -0.95721435546875, -0.9013214111328125, -0.845428466796875, -0.7895355224609375, -0.733642578125, -0.6777496337890625, -0.621856689453125, -0.5659637451171875, -0.51007080078125, -0.4541778564453125, -0.398284912109375, -0.3423919677734375, -0.2864990234375, -0.2306060791015625, -0.174713134765625, -0.1188201904296875, -0.06292724609375, -0.0070343017578125, 0.048858642578125, 0.1047515869140625, 0.16064453125, 0.2165374755859375, 0.272430419921875, 0.3283233642578125, 0.38421630859375, 0.4401092529296875, 0.496002197265625, 0.5518951416015625, 0.6077880859375, 0.6636810302734375, 0.719573974609375, 0.7754669189453125, 0.83135986328125, 0.8872528076171875, 0.943145751953125, 0.9990386962890625, 1.054931640625, 1.1108245849609375, 1.166717529296875, 1.2226104736328125, 1.27850341796875, 1.3343963623046875, 1.390289306640625, 1.4461822509765625, 1.5020751953125, 1.5579681396484375, 1.613861083984375, 1.6697540283203125, 1.72564697265625, 1.7815399169921875, 1.837432861328125, 1.8933258056640625, 1.94921875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 17.0, 26.0, 89.0, 210.0, 375.0, 153.0, 65.0, 30.0, 8.0, 9.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.586057662963867, -18.125606536865234, -17.66515350341797, -17.204702377319336, -16.744251251220703, -16.28380012512207, -15.823347091674805, -15.362895965576172, -14.902444839477539, -14.44199275970459, -13.981541633605957, -13.521089553833008, -13.060638427734375, -12.600186347961426, -12.139734268188477, -11.679283142089844, -11.218831062316895, -10.758378982543945, -10.297927856445312, -9.837475776672363, -9.37702465057373, -8.916572570800781, -8.456121444702148, -7.995669364929199, -7.535217761993408, -7.074766159057617, -6.614314556121826, -6.153862953186035, -5.693410873413086, -5.232959747314453, -4.772507667541504, -4.312056064605713, -3.8516054153442383, -3.3911538124084473, -2.9307022094726562, -2.470250368118286, -2.009798765182495, -1.549347162246704, -1.088895320892334, -0.628443717956543, -0.16799211502075195, 0.29245954751968384, 0.7529112100601196, 1.2133629322052002, 1.6738145351409912, 2.1342661380767822, 2.5947179794311523, 3.0551695823669434, 3.5156211853027344, 3.9760727882385254, 4.436524391174316, 4.896976470947266, 5.357427597045898, 5.817879676818848, 6.278331279754639, 6.73878288269043, 7.199234485626221, 7.659686088562012, 8.120138168334961, 8.580589294433594, 9.041041374206543, 9.501492500305176, 9.961944580078125, 10.422395706176758, 10.882847785949707]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 5.0, 13.0, 18.0, 19.0, 23.0, 19.0, 23.0, 38.0, 34.0, 43.0, 60.0, 53.0, 63.0, 67.0, 69.0, 52.0, 64.0, 52.0, 49.0, 38.0, 26.0, 27.0, 32.0, 27.0, 20.0, 6.0, 12.0, 13.0, 6.0, 9.0, 4.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.373544216156006, -5.224605560302734, -5.075666427612305, -4.926727771759033, -4.7777886390686035, -4.628849983215332, -4.479910850524902, -4.330972194671631, -4.182033538818359, -4.033094882965088, -3.884155750274658, -3.7352168560028076, -3.586277961730957, -3.4373393058776855, -3.288400411605835, -3.1394615173339844, -2.9905223846435547, -2.841583490371704, -2.6926445960998535, -2.543705701828003, -2.3947668075561523, -2.245828151702881, -2.0968892574310303, -1.9479503631591797, -1.799011468887329, -1.6500725746154785, -1.501133680343628, -1.352194905281067, -1.2032560110092163, -1.0543171167373657, -0.9053782820701599, -0.7564394474029541, -0.6075010299682617, -0.4585621654987335, -0.3096233010292053, -0.16068443655967712, -0.011745572090148926, 0.13719332218170166, 0.28613215684890747, 0.4350709915161133, 0.5840098857879639, 0.7329487800598145, 0.8818876147270203, 1.030826449394226, 1.1797653436660767, 1.3287042379379272, 1.4776430130004883, 1.6265819072723389, 1.7755208015441895, 1.92445969581604, 2.0733985900878906, 2.222337484359741, 2.371276378631592, 2.5202150344848633, 2.669153928756714, 2.8180928230285645, 2.967031717300415, 3.1159706115722656, 3.264909505844116, 3.413848400115967, 3.5627870559692383, 3.711726188659668, 3.8606648445129395, 4.009603500366211, 4.158542633056641]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 8.0, 8.0, 20.0, 24.0, 25.0, 54.0, 59.0, 127.0, 241.0, 469.0, 1122.0, 3346.0, 19682.0, 471591.0, 524810.0, 21185.0, 3490.0, 1117.0, 508.0, 273.0, 151.0, 69.0, 50.0, 44.0, 20.0, 18.0, 8.0, 10.0, 4.0, 2.0, 3.0, 6.0, 1.0, 1.0, 0.0, 2.0], "bins": [-14.09375, -13.75830078125, -13.4228515625, -13.08740234375, -12.751953125, -12.41650390625, -12.0810546875, -11.74560546875, -11.41015625, -11.07470703125, -10.7392578125, -10.40380859375, -10.068359375, -9.73291015625, -9.3974609375, -9.06201171875, -8.7265625, -8.39111328125, -8.0556640625, -7.72021484375, -7.384765625, -7.04931640625, -6.7138671875, -6.37841796875, -6.04296875, -5.70751953125, -5.3720703125, -5.03662109375, -4.701171875, -4.36572265625, -4.0302734375, -3.69482421875, -3.359375, -3.02392578125, -2.6884765625, -2.35302734375, -2.017578125, -1.68212890625, -1.3466796875, -1.01123046875, -0.67578125, -0.34033203125, -0.0048828125, 0.33056640625, 0.666015625, 1.00146484375, 1.3369140625, 1.67236328125, 2.0078125, 2.34326171875, 2.6787109375, 3.01416015625, 3.349609375, 3.68505859375, 4.0205078125, 4.35595703125, 4.69140625, 5.02685546875, 5.3623046875, 5.69775390625, 6.033203125, 6.36865234375, 6.7041015625, 7.03955078125, 7.375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 7.0, 11.0, 25.0, 49.0, 47.0, 81.0, 91.0, 113.0, 110.0, 134.0, 105.0, 85.0, 52.0, 32.0, 28.0, 9.0, 13.0, 1.0, 3.0, 0.0, 0.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5966796875, -1.5582046508789062, -1.5197296142578125, -1.4812545776367188, -1.442779541015625, -1.4043045043945312, -1.3658294677734375, -1.3273544311523438, -1.28887939453125, -1.2504043579101562, -1.2119293212890625, -1.1734542846679688, -1.134979248046875, -1.0965042114257812, -1.0580291748046875, -1.0195541381835938, -0.9810791015625, -0.9426040649414062, -0.9041290283203125, -0.8656539916992188, -0.827178955078125, -0.7887039184570312, -0.7502288818359375, -0.7117538452148438, -0.67327880859375, -0.6348037719726562, -0.5963287353515625, -0.5578536987304688, -0.519378662109375, -0.48090362548828125, -0.4424285888671875, -0.40395355224609375, -0.365478515625, -0.32700347900390625, -0.2885284423828125, -0.25005340576171875, -0.211578369140625, -0.17310333251953125, -0.1346282958984375, -0.09615325927734375, -0.05767822265625, -0.01920318603515625, 0.0192718505859375, 0.05774688720703125, 0.096221923828125, 0.13469696044921875, 0.1731719970703125, 0.21164703369140625, 0.2501220703125, 0.28859710693359375, 0.3270721435546875, 0.36554718017578125, 0.404022216796875, 0.44249725341796875, 0.4809722900390625, 0.5194473266601562, 0.55792236328125, 0.5963973999023438, 0.6348724365234375, 0.6733474731445312, 0.711822509765625, 0.7502975463867188, 0.7887725830078125, 0.8272476196289062, 0.86572265625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 9.0, 11.0, 13.0, 13.0, 30.0, 29.0, 47.0, 83.0, 106.0, 221.0, 417.0, 830.0, 1914.0, 5098.0, 17049.0, 92411.0, 674073.0, 213399.0, 30167.0, 7619.0, 2625.0, 1123.0, 549.0, 292.0, 165.0, 79.0, 67.0, 31.0, 27.0, 20.0, 8.0, 8.0, 5.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7578125, -4.57952880859375, -4.4012451171875, -4.22296142578125, -4.044677734375, -3.86639404296875, -3.6881103515625, -3.50982666015625, -3.33154296875, -3.15325927734375, -2.9749755859375, -2.79669189453125, -2.618408203125, -2.44012451171875, -2.2618408203125, -2.08355712890625, -1.9052734375, -1.72698974609375, -1.5487060546875, -1.37042236328125, -1.192138671875, -1.01385498046875, -0.8355712890625, -0.65728759765625, -0.47900390625, -0.30072021484375, -0.1224365234375, 0.05584716796875, 0.234130859375, 0.41241455078125, 0.5906982421875, 0.76898193359375, 0.947265625, 1.12554931640625, 1.3038330078125, 1.48211669921875, 1.660400390625, 1.83868408203125, 2.0169677734375, 2.19525146484375, 2.37353515625, 2.55181884765625, 2.7301025390625, 2.90838623046875, 3.086669921875, 3.26495361328125, 3.4432373046875, 3.62152099609375, 3.7998046875, 3.97808837890625, 4.1563720703125, 4.33465576171875, 4.512939453125, 4.69122314453125, 4.8695068359375, 5.04779052734375, 5.22607421875, 5.40435791015625, 5.5826416015625, 5.76092529296875, 5.939208984375, 6.11749267578125, 6.2957763671875, 6.47406005859375, 6.65234375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 2.0, 6.0, 7.0, 10.0, 15.0, 23.0, 21.0, 28.0, 28.0, 30.0, 54.0, 65.0, 77.0, 73.0, 77.0, 64.0, 82.0, 62.0, 53.0, 44.0, 47.0, 41.0, 27.0, 18.0, 12.0, 7.0, 14.0, 4.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.25390625, -5.13104248046875, -5.0081787109375, -4.88531494140625, -4.762451171875, -4.63958740234375, -4.5167236328125, -4.39385986328125, -4.27099609375, -4.14813232421875, -4.0252685546875, -3.90240478515625, -3.779541015625, -3.65667724609375, -3.5338134765625, -3.41094970703125, -3.2880859375, -3.16522216796875, -3.0423583984375, -2.91949462890625, -2.796630859375, -2.67376708984375, -2.5509033203125, -2.42803955078125, -2.30517578125, -2.18231201171875, -2.0594482421875, -1.93658447265625, -1.813720703125, -1.69085693359375, -1.5679931640625, -1.44512939453125, -1.322265625, -1.19940185546875, -1.0765380859375, -0.95367431640625, -0.830810546875, -0.70794677734375, -0.5850830078125, -0.46221923828125, -0.33935546875, -0.21649169921875, -0.0936279296875, 0.02923583984375, 0.152099609375, 0.27496337890625, 0.3978271484375, 0.52069091796875, 0.6435546875, 0.76641845703125, 0.8892822265625, 1.01214599609375, 1.135009765625, 1.25787353515625, 1.3807373046875, 1.50360107421875, 1.62646484375, 1.74932861328125, 1.8721923828125, 1.99505615234375, 2.117919921875, 2.24078369140625, 2.3636474609375, 2.48651123046875, 2.609375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 9.0, 10.0, 11.0, 14.0, 14.0, 18.0, 32.0, 42.0, 81.0, 97.0, 182.0, 269.0, 549.0, 1037.0, 2174.0, 5177.0, 14085.0, 47862.0, 275760.0, 573292.0, 91188.0, 22845.0, 7671.0, 3069.0, 1345.0, 697.0, 374.0, 225.0, 149.0, 62.0, 72.0, 32.0, 28.0, 31.0, 15.0, 13.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3427734375, -1.293426513671875, -1.24407958984375, -1.194732666015625, -1.1453857421875, -1.096038818359375, -1.04669189453125, -0.997344970703125, -0.947998046875, -0.898651123046875, -0.84930419921875, -0.799957275390625, -0.7506103515625, -0.701263427734375, -0.65191650390625, -0.602569580078125, -0.55322265625, -0.503875732421875, -0.45452880859375, -0.405181884765625, -0.3558349609375, -0.306488037109375, -0.25714111328125, -0.207794189453125, -0.158447265625, -0.109100341796875, -0.05975341796875, -0.010406494140625, 0.0389404296875, 0.088287353515625, 0.13763427734375, 0.186981201171875, 0.236328125, 0.285675048828125, 0.33502197265625, 0.384368896484375, 0.4337158203125, 0.483062744140625, 0.53240966796875, 0.581756591796875, 0.631103515625, 0.680450439453125, 0.72979736328125, 0.779144287109375, 0.8284912109375, 0.877838134765625, 0.92718505859375, 0.976531982421875, 1.02587890625, 1.075225830078125, 1.12457275390625, 1.173919677734375, 1.2232666015625, 1.272613525390625, 1.32196044921875, 1.371307373046875, 1.420654296875, 1.470001220703125, 1.51934814453125, 1.568695068359375, 1.6180419921875, 1.667388916015625, 1.71673583984375, 1.766082763671875, 1.8154296875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 7.0, 9.0, 10.0, 7.0, 14.0, 45.0, 74.0, 168.0, 273.0, 197.0, 72.0, 37.0, 31.0, 15.0, 10.0, 5.0, 4.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005288124084472656, -0.0005089044570922852, -0.0004889965057373047, -0.0004690885543823242, -0.00044918060302734375, -0.0004292726516723633, -0.0004093647003173828, -0.00038945674896240234, -0.0003695487976074219, -0.0003496408462524414, -0.00032973289489746094, -0.00030982494354248047, -0.0002899169921875, -0.00027000904083251953, -0.00025010108947753906, -0.0002301931381225586, -0.00021028518676757812, -0.00019037723541259766, -0.0001704692840576172, -0.00015056133270263672, -0.00013065338134765625, -0.00011074542999267578, -9.083747863769531e-05, -7.092952728271484e-05, -5.1021575927734375e-05, -3.1113624572753906e-05, -1.1205673217773438e-05, 8.702278137207031e-06, 2.86102294921875e-05, 4.851818084716797e-05, 6.842613220214844e-05, 8.83340835571289e-05, 0.00010824203491210938, 0.00012814998626708984, 0.0001480579376220703, 0.00016796588897705078, 0.00018787384033203125, 0.00020778179168701172, 0.0002276897430419922, 0.00024759769439697266, 0.0002675056457519531, 0.0002874135971069336, 0.00030732154846191406, 0.00032722949981689453, 0.000347137451171875, 0.00036704540252685547, 0.00038695335388183594, 0.0004068613052368164, 0.0004267692565917969, 0.00044667720794677734, 0.0004665851593017578, 0.0004864931106567383, 0.0005064010620117188, 0.0005263090133666992, 0.0005462169647216797, 0.0005661249160766602, 0.0005860328674316406, 0.0006059408187866211, 0.0006258487701416016, 0.000645756721496582, 0.0006656646728515625, 0.000685572624206543, 0.0007054805755615234, 0.0007253885269165039, 0.0007452964782714844]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 3.0, 10.0, 11.0, 19.0, 25.0, 34.0, 63.0, 77.0, 134.0, 215.0, 407.0, 761.0, 1657.0, 4027.0, 12506.0, 49634.0, 370933.0, 518415.0, 65541.0, 15136.0, 5055.0, 1980.0, 880.0, 399.0, 253.0, 128.0, 89.0, 46.0, 32.0, 23.0, 16.0, 10.0, 10.0, 4.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.29296875, -1.241424560546875, -1.18988037109375, -1.138336181640625, -1.0867919921875, -1.035247802734375, -0.98370361328125, -0.932159423828125, -0.880615234375, -0.829071044921875, -0.77752685546875, -0.725982666015625, -0.6744384765625, -0.622894287109375, -0.57135009765625, -0.519805908203125, -0.46826171875, -0.416717529296875, -0.36517333984375, -0.313629150390625, -0.2620849609375, -0.210540771484375, -0.15899658203125, -0.107452392578125, -0.055908203125, -0.004364013671875, 0.04718017578125, 0.098724365234375, 0.1502685546875, 0.201812744140625, 0.25335693359375, 0.304901123046875, 0.3564453125, 0.407989501953125, 0.45953369140625, 0.511077880859375, 0.5626220703125, 0.614166259765625, 0.66571044921875, 0.717254638671875, 0.768798828125, 0.820343017578125, 0.87188720703125, 0.923431396484375, 0.9749755859375, 1.026519775390625, 1.07806396484375, 1.129608154296875, 1.18115234375, 1.232696533203125, 1.28424072265625, 1.335784912109375, 1.3873291015625, 1.438873291015625, 1.49041748046875, 1.541961669921875, 1.593505859375, 1.645050048828125, 1.69659423828125, 1.748138427734375, 1.7996826171875, 1.851226806640625, 1.90277099609375, 1.954315185546875, 2.005859375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 8.0, 6.0, 10.0, 10.0, 8.0, 28.0, 23.0, 41.0, 52.0, 78.0, 89.0, 89.0, 102.0, 92.0, 91.0, 61.0, 57.0, 41.0, 35.0, 17.0, 17.0, 15.0, 8.0, 6.0, 1.0, 8.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.390625, -1.3564834594726562, -1.3223419189453125, -1.2882003784179688, -1.254058837890625, -1.2199172973632812, -1.1857757568359375, -1.1516342163085938, -1.11749267578125, -1.0833511352539062, -1.0492095947265625, -1.0150680541992188, -0.980926513671875, -0.9467849731445312, -0.9126434326171875, -0.8785018920898438, -0.8443603515625, -0.8102188110351562, -0.7760772705078125, -0.7419357299804688, -0.707794189453125, -0.6736526489257812, -0.6395111083984375, -0.6053695678710938, -0.57122802734375, -0.5370864868164062, -0.5029449462890625, -0.46880340576171875, -0.434661865234375, -0.40052032470703125, -0.3663787841796875, -0.33223724365234375, -0.298095703125, -0.26395416259765625, -0.2298126220703125, -0.19567108154296875, -0.161529541015625, -0.12738800048828125, -0.0932464599609375, -0.05910491943359375, -0.02496337890625, 0.00917816162109375, 0.0433197021484375, 0.07746124267578125, 0.111602783203125, 0.14574432373046875, 0.1798858642578125, 0.21402740478515625, 0.2481689453125, 0.28231048583984375, 0.3164520263671875, 0.35059356689453125, 0.384735107421875, 0.41887664794921875, 0.4530181884765625, 0.48715972900390625, 0.52130126953125, 0.5554428100585938, 0.5895843505859375, 0.6237258911132812, 0.657867431640625, 0.6920089721679688, 0.7261505126953125, 0.7602920532226562, 0.79443359375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 11.0, 56.0, 227.0, 464.0, 178.0, 45.0, 13.0, 10.0, 4.0, 5.0], "bins": [-138.11410522460938, -135.7060546875, -133.29798889160156, -130.8899383544922, -128.4818878173828, -126.0738296508789, -123.66577911376953, -121.25772094726562, -118.84967041015625, -116.44161224365234, -114.03356170654297, -111.62550354003906, -109.21745300292969, -106.80939483642578, -104.4013442993164, -101.9932861328125, -99.58523559570312, -97.17717742919922, -94.76912689208984, -92.36106872558594, -89.95301818847656, -87.54496002197266, -85.13690948486328, -82.72885131835938, -80.32079315185547, -77.91273498535156, -75.50468444824219, -73.09662628173828, -70.6885757446289, -68.280517578125, -65.87246704101562, -63.46440887451172, -61.05635070800781, -58.64829635620117, -56.24024200439453, -53.83218765258789, -51.42413330078125, -49.01607894897461, -46.60802459716797, -44.19996643066406, -41.79191589355469, -39.38386154174805, -36.975807189941406, -34.567752838134766, -32.159698486328125, -29.751644134521484, -27.34358787536621, -24.93553352355957, -22.52747917175293, -20.11942481994629, -17.71137046813965, -15.303315162658691, -12.89526081085205, -10.48720645904541, -8.079151153564453, -5.6710968017578125, -3.263042449951172, -0.8549878597259521, 1.5530667304992676, 3.9611215591430664, 6.369175910949707, 8.777230262756348, 11.185285568237305, 13.593339920043945, 16.001394271850586]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 5.0, 6.0, 19.0, 8.0, 17.0, 20.0, 26.0, 42.0, 53.0, 53.0, 49.0, 70.0, 70.0, 70.0, 81.0, 72.0, 73.0, 60.0, 46.0, 40.0, 28.0, 34.0, 12.0, 13.0, 10.0, 8.0, 7.0, 8.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.717491149902344, -26.97990608215332, -26.242321014404297, -25.504735946655273, -24.76715087890625, -24.029565811157227, -23.291980743408203, -22.554393768310547, -21.816810607910156, -21.079225540161133, -20.34164047241211, -19.604055404663086, -18.866470336914062, -18.12888526916504, -17.391300201416016, -16.65371322631836, -15.916128158569336, -15.178543090820312, -14.440958023071289, -13.703372955322266, -12.965787887573242, -12.228202819824219, -11.490616798400879, -10.753031730651855, -10.015446662902832, -9.277861595153809, -8.540276527404785, -7.8026909828186035, -7.06510591506958, -6.327520847320557, -5.589935302734375, -4.852350234985352, -4.114765167236328, -3.3771800994873047, -2.639594793319702, -1.9020094871520996, -1.1644244194030762, -0.42683935165405273, 0.3107461929321289, 1.0483312606811523, 1.7859163284301758, 2.523501396179199, 3.2610867023468018, 3.9986720085144043, 4.736257076263428, 5.473842144012451, 6.211427688598633, 6.949012756347656, 7.68659782409668, 8.424182891845703, 9.161767959594727, 9.89935302734375, 10.636938095092773, 11.374523162841797, 12.112109184265137, 12.84969425201416, 13.587279319763184, 14.324864387512207, 15.06244945526123, 15.80003547668457, 16.537620544433594, 17.275205612182617, 18.01279067993164, 18.750375747680664, 19.487960815429688]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 4.0, 2.0, 12.0, 4.0, 8.0, 6.0, 7.0, 5.0, 9.0, 16.0, 20.0, 31.0, 20.0, 37.0, 43.0, 48.0, 59.0, 49.0, 94.0, 120.0, 178.0, 270.0, 440.0, 884.0, 2121.0, 5556.0, 17471.0, 89500.0, 3990216.0, 64448.0, 14664.0, 4721.0, 1667.0, 709.0, 323.0, 162.0, 113.0, 74.0, 67.0, 44.0, 24.0, 9.0, 8.0, 6.0, 6.0, 1.0, 2.0], "bins": [-14.3046875, -13.98968505859375, -13.6746826171875, -13.35968017578125, -13.044677734375, -12.72967529296875, -12.4146728515625, -12.09967041015625, -11.78466796875, -11.46966552734375, -11.1546630859375, -10.83966064453125, -10.524658203125, -10.20965576171875, -9.8946533203125, -9.57965087890625, -9.2646484375, -8.94964599609375, -8.6346435546875, -8.31964111328125, -8.004638671875, -7.68963623046875, -7.3746337890625, -7.05963134765625, -6.74462890625, -6.42962646484375, -6.1146240234375, -5.79962158203125, -5.484619140625, -5.16961669921875, -4.8546142578125, -4.53961181640625, -4.224609375, -3.90960693359375, -3.5946044921875, -3.27960205078125, -2.964599609375, -2.64959716796875, -2.3345947265625, -2.01959228515625, -1.70458984375, -1.38958740234375, -1.0745849609375, -0.75958251953125, -0.444580078125, -0.12957763671875, 0.1854248046875, 0.50042724609375, 0.8154296875, 1.13043212890625, 1.4454345703125, 1.76043701171875, 2.075439453125, 2.39044189453125, 2.7054443359375, 3.02044677734375, 3.33544921875, 3.65045166015625, 3.9654541015625, 4.28045654296875, 4.595458984375, 4.91046142578125, 5.2254638671875, 5.54046630859375, 5.85546875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 4.0, 4.0, 9.0, 15.0, 26.0, 35.0, 59.0, 67.0, 75.0, 117.0, 102.0, 118.0, 106.0, 80.0, 56.0, 57.0, 27.0, 22.0, 15.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.638671875, -1.6002883911132812, -1.5619049072265625, -1.5235214233398438, -1.485137939453125, -1.4467544555664062, -1.4083709716796875, -1.3699874877929688, -1.33160400390625, -1.2932205200195312, -1.2548370361328125, -1.2164535522460938, -1.178070068359375, -1.1396865844726562, -1.1013031005859375, -1.0629196166992188, -1.0245361328125, -0.9861526489257812, -0.9477691650390625, -0.9093856811523438, -0.871002197265625, -0.8326187133789062, -0.7942352294921875, -0.7558517456054688, -0.71746826171875, -0.6790847778320312, -0.6407012939453125, -0.6023178100585938, -0.563934326171875, -0.5255508422851562, -0.4871673583984375, -0.44878387451171875, -0.410400390625, -0.37201690673828125, -0.3336334228515625, -0.29524993896484375, -0.256866455078125, -0.21848297119140625, -0.1800994873046875, -0.14171600341796875, -0.10333251953125, -0.06494903564453125, -0.0265655517578125, 0.01181793212890625, 0.050201416015625, 0.08858489990234375, 0.1269683837890625, 0.16535186767578125, 0.2037353515625, 0.24211883544921875, 0.2805023193359375, 0.31888580322265625, 0.357269287109375, 0.39565277099609375, 0.4340362548828125, 0.47241973876953125, 0.51080322265625, 0.5491867065429688, 0.5875701904296875, 0.6259536743164062, 0.664337158203125, 0.7027206420898438, 0.7411041259765625, 0.7794876098632812, 0.81787109375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 10.0, 10.0, 18.0, 21.0, 29.0, 46.0, 61.0, 126.0, 229.0, 491.0, 1173.0, 3850.0, 22350.0, 4026566.0, 127855.0, 8135.0, 1967.0, 687.0, 286.0, 128.0, 93.0, 50.0, 30.0, 22.0, 13.0, 11.0, 7.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.953125, -13.3662109375, -12.779296875, -12.1923828125, -11.60546875, -11.0185546875, -10.431640625, -9.8447265625, -9.2578125, -8.6708984375, -8.083984375, -7.4970703125, -6.91015625, -6.3232421875, -5.736328125, -5.1494140625, -4.5625, -3.9755859375, -3.388671875, -2.8017578125, -2.21484375, -1.6279296875, -1.041015625, -0.4541015625, 0.1328125, 0.7197265625, 1.306640625, 1.8935546875, 2.48046875, 3.0673828125, 3.654296875, 4.2412109375, 4.828125, 5.4150390625, 6.001953125, 6.5888671875, 7.17578125, 7.7626953125, 8.349609375, 8.9365234375, 9.5234375, 10.1103515625, 10.697265625, 11.2841796875, 11.87109375, 12.4580078125, 13.044921875, 13.6318359375, 14.21875, 14.8056640625, 15.392578125, 15.9794921875, 16.56640625, 17.1533203125, 17.740234375, 18.3271484375, 18.9140625, 19.5009765625, 20.087890625, 20.6748046875, 21.26171875, 21.8486328125, 22.435546875, 23.0224609375, 23.609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 11.0, 4.0, 22.0, 18.0, 35.0, 47.0, 116.0, 570.0, 2838.0, 228.0, 85.0, 39.0, 22.0, 16.0, 6.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-6.54296875, -6.4100799560546875, -6.277191162109375, -6.1443023681640625, -6.01141357421875, -5.8785247802734375, -5.745635986328125, -5.6127471923828125, -5.4798583984375, -5.3469696044921875, -5.214080810546875, -5.0811920166015625, -4.94830322265625, -4.8154144287109375, -4.682525634765625, -4.5496368408203125, -4.416748046875, -4.2838592529296875, -4.150970458984375, -4.0180816650390625, -3.88519287109375, -3.7523040771484375, -3.619415283203125, -3.4865264892578125, -3.3536376953125, -3.2207489013671875, -3.087860107421875, -2.9549713134765625, -2.82208251953125, -2.6891937255859375, -2.556304931640625, -2.4234161376953125, -2.29052734375, -2.1576385498046875, -2.024749755859375, -1.8918609619140625, -1.75897216796875, -1.6260833740234375, -1.493194580078125, -1.3603057861328125, -1.2274169921875, -1.0945281982421875, -0.961639404296875, -0.8287506103515625, -0.69586181640625, -0.5629730224609375, -0.430084228515625, -0.2971954345703125, -0.164306640625, -0.0314178466796875, 0.101470947265625, 0.2343597412109375, 0.36724853515625, 0.5001373291015625, 0.633026123046875, 0.7659149169921875, 0.8988037109375, 1.0316925048828125, 1.164581298828125, 1.2974700927734375, 1.43035888671875, 1.5632476806640625, 1.696136474609375, 1.8290252685546875, 1.9619140625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 7.0, 11.0, 32.0, 78.0, 254.0, 381.0, 163.0, 47.0, 13.0, 11.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.16647720336914, -41.94157409667969, -40.71666717529297, -39.491764068603516, -38.26686096191406, -37.04195785522461, -35.817054748535156, -34.59214782714844, -33.367244720458984, -32.14234161376953, -30.917436599731445, -29.69253158569336, -28.467628479003906, -27.242725372314453, -26.017820358276367, -24.79291534423828, -23.568012237548828, -22.343109130859375, -21.11820411682129, -19.893299102783203, -18.66839599609375, -17.443492889404297, -16.21858787536621, -14.993683815002441, -13.768779754638672, -12.543875694274902, -11.318971633911133, -10.094067573547363, -8.869163513183594, -7.644259452819824, -6.419355392456055, -5.194451332092285, -3.96954345703125, -2.7446393966674805, -1.519735336303711, -0.2948312759399414, 0.9300727844238281, 2.1549768447875977, 3.379880905151367, 4.604784965515137, 5.829689025878906, 7.054593086242676, 8.279497146606445, 9.504401206970215, 10.729305267333984, 11.954209327697754, 13.179113388061523, 14.404017448425293, 15.628921508789062, 16.853824615478516, 18.0787296295166, 19.303634643554688, 20.52853775024414, 21.753440856933594, 22.97834587097168, 24.203250885009766, 25.42815399169922, 26.653057098388672, 27.877962112426758, 29.102867126464844, 30.327770233154297, 31.55267333984375, 32.77758026123047, 34.00248336791992, 35.227386474609375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 7.0, 16.0, 17.0, 29.0, 51.0, 48.0, 82.0, 97.0, 101.0, 115.0, 110.0, 85.0, 73.0, 53.0, 45.0, 32.0, 14.0, 14.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.67136001586914, -19.122207641601562, -18.573057174682617, -18.02390480041504, -17.47475242614746, -16.925601959228516, -16.376449584960938, -15.82729721069336, -15.278145790100098, -14.728994369506836, -14.179841995239258, -13.630690574645996, -13.081539154052734, -12.532386779785156, -11.983235359191895, -11.434083938598633, -10.884931564331055, -10.335780143737793, -9.786627769470215, -9.237476348876953, -8.688323974609375, -8.139172554016113, -7.590021133422852, -7.040869235992432, -6.491717338562012, -5.942565441131592, -5.393413543701172, -4.84426212310791, -4.29511022567749, -3.7459583282470703, -3.1968066692352295, -2.6476550102233887, -2.098504066467285, -1.5493522882461548, -1.0002005100250244, -0.45104873180389404, 0.09810304641723633, 0.6472549438476562, 1.196406602859497, 1.745558261871338, 2.294710159301758, 2.8438620567321777, 3.3930137157440186, 3.9421653747558594, 4.491317272186279, 5.040469169616699, 5.589620590209961, 6.138772487640381, 6.687924385070801, 7.237076282501221, 7.786228179931641, 8.335379600524902, 8.884531021118164, 9.433683395385742, 9.982834815979004, 10.531986236572266, 11.081138610839844, 11.630290031433105, 12.179442405700684, 12.728593826293945, 13.277746200561523, 13.826897621154785, 14.376049041748047, 14.925201416015625, 15.474352836608887]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 1.0, 2.0, 4.0, 15.0, 11.0, 12.0, 23.0, 23.0, 29.0, 51.0, 72.0, 78.0, 142.0, 188.0, 314.0, 542.0, 1041.0, 2697.0, 11568.0, 90878.0, 786134.0, 133566.0, 15077.0, 3267.0, 1205.0, 581.0, 324.0, 223.0, 141.0, 91.0, 70.0, 45.0, 34.0, 27.0, 18.0, 14.0, 23.0, 4.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.7890625, -8.52728271484375, -8.2655029296875, -8.00372314453125, -7.741943359375, -7.48016357421875, -7.2183837890625, -6.95660400390625, -6.69482421875, -6.43304443359375, -6.1712646484375, -5.90948486328125, -5.647705078125, -5.38592529296875, -5.1241455078125, -4.86236572265625, -4.6005859375, -4.33880615234375, -4.0770263671875, -3.81524658203125, -3.553466796875, -3.29168701171875, -3.0299072265625, -2.76812744140625, -2.50634765625, -2.24456787109375, -1.9827880859375, -1.72100830078125, -1.459228515625, -1.19744873046875, -0.9356689453125, -0.67388916015625, -0.412109375, -0.15032958984375, 0.1114501953125, 0.37322998046875, 0.635009765625, 0.89678955078125, 1.1585693359375, 1.42034912109375, 1.68212890625, 1.94390869140625, 2.2056884765625, 2.46746826171875, 2.729248046875, 2.99102783203125, 3.2528076171875, 3.51458740234375, 3.7763671875, 4.03814697265625, 4.2999267578125, 4.56170654296875, 4.823486328125, 5.08526611328125, 5.3470458984375, 5.60882568359375, 5.87060546875, 6.13238525390625, 6.3941650390625, 6.65594482421875, 6.917724609375, 7.17950439453125, 7.4412841796875, 7.70306396484375, 7.96484375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 17.0, 24.0, 45.0, 51.0, 107.0, 100.0, 135.0, 154.0, 95.0, 89.0, 74.0, 42.0, 30.0, 17.0, 9.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8642578125, -1.817596435546875, -1.77093505859375, -1.724273681640625, -1.6776123046875, -1.630950927734375, -1.58428955078125, -1.537628173828125, -1.490966796875, -1.444305419921875, -1.39764404296875, -1.350982666015625, -1.3043212890625, -1.257659912109375, -1.21099853515625, -1.164337158203125, -1.11767578125, -1.071014404296875, -1.02435302734375, -0.977691650390625, -0.9310302734375, -0.884368896484375, -0.83770751953125, -0.791046142578125, -0.744384765625, -0.697723388671875, -0.65106201171875, -0.604400634765625, -0.5577392578125, -0.511077880859375, -0.46441650390625, -0.417755126953125, -0.37109375, -0.324432373046875, -0.27777099609375, -0.231109619140625, -0.1844482421875, -0.137786865234375, -0.09112548828125, -0.044464111328125, 0.002197265625, 0.048858642578125, 0.09552001953125, 0.142181396484375, 0.1888427734375, 0.235504150390625, 0.28216552734375, 0.328826904296875, 0.37548828125, 0.422149658203125, 0.46881103515625, 0.515472412109375, 0.5621337890625, 0.608795166015625, 0.65545654296875, 0.702117919921875, 0.748779296875, 0.795440673828125, 0.84210205078125, 0.888763427734375, 0.9354248046875, 0.982086181640625, 1.02874755859375, 1.075408935546875, 1.1220703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 11.0, 15.0, 9.0, 19.0, 29.0, 34.0, 57.0, 96.0, 154.0, 261.0, 546.0, 1083.0, 2426.0, 5693.0, 15341.0, 46706.0, 186560.0, 538740.0, 180414.0, 45372.0, 14829.0, 5434.0, 2358.0, 1069.0, 556.0, 303.0, 170.0, 102.0, 59.0, 37.0, 24.0, 16.0, 8.0, 11.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.921875, -3.8172607421875, -3.712646484375, -3.6080322265625, -3.50341796875, -3.3988037109375, -3.294189453125, -3.1895751953125, -3.0849609375, -2.9803466796875, -2.875732421875, -2.7711181640625, -2.66650390625, -2.5618896484375, -2.457275390625, -2.3526611328125, -2.248046875, -2.1434326171875, -2.038818359375, -1.9342041015625, -1.82958984375, -1.7249755859375, -1.620361328125, -1.5157470703125, -1.4111328125, -1.3065185546875, -1.201904296875, -1.0972900390625, -0.99267578125, -0.8880615234375, -0.783447265625, -0.6788330078125, -0.57421875, -0.4696044921875, -0.364990234375, -0.2603759765625, -0.15576171875, -0.0511474609375, 0.053466796875, 0.1580810546875, 0.2626953125, 0.3673095703125, 0.471923828125, 0.5765380859375, 0.68115234375, 0.7857666015625, 0.890380859375, 0.9949951171875, 1.099609375, 1.2042236328125, 1.308837890625, 1.4134521484375, 1.51806640625, 1.6226806640625, 1.727294921875, 1.8319091796875, 1.9365234375, 2.0411376953125, 2.145751953125, 2.2503662109375, 2.35498046875, 2.4595947265625, 2.564208984375, 2.6688232421875, 2.7734375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 4.0, 7.0, 7.0, 7.0, 6.0, 13.0, 10.0, 24.0, 18.0, 18.0, 25.0, 32.0, 23.0, 40.0, 38.0, 28.0, 39.0, 57.0, 38.0, 39.0, 41.0, 40.0, 50.0, 38.0, 35.0, 37.0, 44.0, 29.0, 34.0, 21.0, 30.0, 21.0, 17.0, 13.0, 13.0, 16.0, 7.0, 8.0, 10.0, 8.0, 6.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.533203125, -2.457855224609375, -2.38250732421875, -2.307159423828125, -2.2318115234375, -2.156463623046875, -2.08111572265625, -2.005767822265625, -1.930419921875, -1.855072021484375, -1.77972412109375, -1.704376220703125, -1.6290283203125, -1.553680419921875, -1.47833251953125, -1.402984619140625, -1.32763671875, -1.252288818359375, -1.17694091796875, -1.101593017578125, -1.0262451171875, -0.950897216796875, -0.87554931640625, -0.800201416015625, -0.724853515625, -0.649505615234375, -0.57415771484375, -0.498809814453125, -0.4234619140625, -0.348114013671875, -0.27276611328125, -0.197418212890625, -0.1220703125, -0.046722412109375, 0.02862548828125, 0.103973388671875, 0.1793212890625, 0.254669189453125, 0.33001708984375, 0.405364990234375, 0.480712890625, 0.556060791015625, 0.63140869140625, 0.706756591796875, 0.7821044921875, 0.857452392578125, 0.93280029296875, 1.008148193359375, 1.08349609375, 1.158843994140625, 1.23419189453125, 1.309539794921875, 1.3848876953125, 1.460235595703125, 1.53558349609375, 1.610931396484375, 1.686279296875, 1.761627197265625, 1.83697509765625, 1.912322998046875, 1.9876708984375, 2.063018798828125, 2.13836669921875, 2.213714599609375, 2.2890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 12.0, 6.0, 4.0, 10.0, 11.0, 25.0, 44.0, 38.0, 52.0, 90.0, 162.0, 258.0, 540.0, 1113.0, 2742.0, 8099.0, 31990.0, 203831.0, 666326.0, 103744.0, 19912.0, 5653.0, 1993.0, 837.0, 431.0, 214.0, 144.0, 91.0, 45.0, 28.0, 34.0, 19.0, 11.0, 12.0, 5.0, 5.0, 5.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1328125, -2.06011962890625, -1.9874267578125, -1.91473388671875, -1.842041015625, -1.76934814453125, -1.6966552734375, -1.62396240234375, -1.55126953125, -1.47857666015625, -1.4058837890625, -1.33319091796875, -1.260498046875, -1.18780517578125, -1.1151123046875, -1.04241943359375, -0.9697265625, -0.89703369140625, -0.8243408203125, -0.75164794921875, -0.678955078125, -0.60626220703125, -0.5335693359375, -0.46087646484375, -0.38818359375, -0.31549072265625, -0.2427978515625, -0.17010498046875, -0.097412109375, -0.02471923828125, 0.0479736328125, 0.12066650390625, 0.193359375, 0.26605224609375, 0.3387451171875, 0.41143798828125, 0.484130859375, 0.55682373046875, 0.6295166015625, 0.70220947265625, 0.77490234375, 0.84759521484375, 0.9202880859375, 0.99298095703125, 1.065673828125, 1.13836669921875, 1.2110595703125, 1.28375244140625, 1.3564453125, 1.42913818359375, 1.5018310546875, 1.57452392578125, 1.647216796875, 1.71990966796875, 1.7926025390625, 1.86529541015625, 1.93798828125, 2.01068115234375, 2.0833740234375, 2.15606689453125, 2.228759765625, 2.30145263671875, 2.3741455078125, 2.44683837890625, 2.51953125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 6.0, 9.0, 6.0, 12.0, 20.0, 17.0, 40.0, 44.0, 60.0, 62.0, 106.0, 130.0, 120.0, 105.0, 63.0, 52.0, 34.0, 39.0, 13.0, 12.0, 15.0, 6.0, 4.0, 7.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00032639503479003906, -0.00031581148505210876, -0.00030522793531417847, -0.00029464438557624817, -0.00028406083583831787, -0.0002734772861003876, -0.0002628937363624573, -0.000252310186624527, -0.00024172663688659668, -0.00023114308714866638, -0.00022055953741073608, -0.00020997598767280579, -0.0001993924379348755, -0.0001888088881969452, -0.0001782253384590149, -0.0001676417887210846, -0.0001570582389831543, -0.000146474689245224, -0.0001358911395072937, -0.0001253075897693634, -0.0001147240400314331, -0.00010414049029350281, -9.355694055557251e-05, -8.297339081764221e-05, -7.238984107971191e-05, -6.180629134178162e-05, -5.122274160385132e-05, -4.063919186592102e-05, -3.0055642127990723e-05, -1.9472092390060425e-05, -8.888542652130127e-06, 1.695007085800171e-06, 1.2278556823730469e-05, 2.2862106561660767e-05, 3.3445656299591064e-05, 4.402920603752136e-05, 5.461275577545166e-05, 6.519630551338196e-05, 7.577985525131226e-05, 8.636340498924255e-05, 9.694695472717285e-05, 0.00010753050446510315, 0.00011811405420303345, 0.00012869760394096375, 0.00013928115367889404, 0.00014986470341682434, 0.00016044825315475464, 0.00017103180289268494, 0.00018161535263061523, 0.00019219890236854553, 0.00020278245210647583, 0.00021336600184440613, 0.00022394955158233643, 0.00023453310132026672, 0.000245116651058197, 0.0002557002007961273, 0.0002662837505340576, 0.0002768673002719879, 0.0002874508500099182, 0.0002980343997478485, 0.0003086179494857788, 0.0003192014992237091, 0.0003297850489616394, 0.0003403685986995697, 0.0003509521484375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 8.0, 7.0, 7.0, 13.0, 21.0, 39.0, 54.0, 100.0, 141.0, 221.0, 351.0, 630.0, 1200.0, 2626.0, 6335.0, 17884.0, 71663.0, 528840.0, 344210.0, 50695.0, 13788.0, 5075.0, 2114.0, 1102.0, 575.0, 328.0, 188.0, 112.0, 81.0, 50.0, 30.0, 23.0, 22.0, 7.0, 5.0, 6.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.181640625, -2.119110107421875, -2.05657958984375, -1.994049072265625, -1.9315185546875, -1.868988037109375, -1.80645751953125, -1.743927001953125, -1.681396484375, -1.618865966796875, -1.55633544921875, -1.493804931640625, -1.4312744140625, -1.368743896484375, -1.30621337890625, -1.243682861328125, -1.18115234375, -1.118621826171875, -1.05609130859375, -0.993560791015625, -0.9310302734375, -0.868499755859375, -0.80596923828125, -0.743438720703125, -0.680908203125, -0.618377685546875, -0.55584716796875, -0.493316650390625, -0.4307861328125, -0.368255615234375, -0.30572509765625, -0.243194580078125, -0.1806640625, -0.118133544921875, -0.05560302734375, 0.006927490234375, 0.0694580078125, 0.131988525390625, 0.19451904296875, 0.257049560546875, 0.319580078125, 0.382110595703125, 0.44464111328125, 0.507171630859375, 0.5697021484375, 0.632232666015625, 0.69476318359375, 0.757293701171875, 0.81982421875, 0.882354736328125, 0.94488525390625, 1.007415771484375, 1.0699462890625, 1.132476806640625, 1.19500732421875, 1.257537841796875, 1.320068359375, 1.382598876953125, 1.44512939453125, 1.507659912109375, 1.5701904296875, 1.632720947265625, 1.69525146484375, 1.757781982421875, 1.8203125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 5.0, 4.0, 10.0, 17.0, 14.0, 21.0, 26.0, 52.0, 77.0, 71.0, 104.0, 106.0, 103.0, 106.0, 76.0, 44.0, 46.0, 27.0, 20.0, 13.0, 13.0, 12.0, 12.0, 6.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.736328125, -1.6866607666015625, -1.636993408203125, -1.5873260498046875, -1.53765869140625, -1.4879913330078125, -1.438323974609375, -1.3886566162109375, -1.3389892578125, -1.2893218994140625, -1.239654541015625, -1.1899871826171875, -1.14031982421875, -1.0906524658203125, -1.040985107421875, -0.9913177490234375, -0.941650390625, -0.8919830322265625, -0.842315673828125, -0.7926483154296875, -0.74298095703125, -0.6933135986328125, -0.643646240234375, -0.5939788818359375, -0.5443115234375, -0.4946441650390625, -0.444976806640625, -0.3953094482421875, -0.34564208984375, -0.2959747314453125, -0.246307373046875, -0.1966400146484375, -0.14697265625, -0.0973052978515625, -0.047637939453125, 0.0020294189453125, 0.05169677734375, 0.1013641357421875, 0.151031494140625, 0.2006988525390625, 0.2503662109375, 0.3000335693359375, 0.349700927734375, 0.3993682861328125, 0.44903564453125, 0.4987030029296875, 0.548370361328125, 0.5980377197265625, 0.647705078125, 0.6973724365234375, 0.747039794921875, 0.7967071533203125, 0.84637451171875, 0.8960418701171875, 0.945709228515625, 0.9953765869140625, 1.0450439453125, 1.0947113037109375, 1.144378662109375, 1.1940460205078125, 1.24371337890625, 1.2933807373046875, 1.343048095703125, 1.3927154541015625, 1.4423828125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 19.0, 51.0, 187.0, 355.0, 221.0, 96.0, 39.0, 20.0, 8.0, 2.0, 4.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.96515655517578, -68.32442474365234, -66.68370056152344, -65.04296875, -63.40224075317383, -61.761512756347656, -60.12078094482422, -58.48005294799805, -56.839324951171875, -55.1985969543457, -53.557865142822266, -51.917137145996094, -50.27640914916992, -48.63568115234375, -46.99494934082031, -45.35422134399414, -43.71349334716797, -42.0727653503418, -40.43203353881836, -38.79130554199219, -37.150577545166016, -35.509849548339844, -33.869117736816406, -32.228389739990234, -30.587657928466797, -28.946928024291992, -27.30620002746582, -25.665470123291016, -24.024742126464844, -22.38401222229004, -20.743282318115234, -19.102554321289062, -17.46182632446289, -15.821097373962402, -14.180368423461914, -12.53963851928711, -10.898910522460938, -9.258180618286133, -7.6174516677856445, -5.976722717285156, -4.335993766784668, -2.6952648162841797, -1.0545356273651123, 0.5861935615539551, 2.2269225120544434, 3.86765193939209, 5.508380889892578, 7.149109840393066, 8.789838790893555, 10.430567741394043, 12.071296691894531, 13.712026596069336, 15.352754592895508, 16.993484497070312, 18.634212493896484, 20.27494239807129, 21.915672302246094, 23.5564022064209, 25.19713020324707, 26.837860107421875, 28.478588104248047, 30.11931800842285, 31.760047912597656, 33.40077590942383, 35.04150390625]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 6.0, 10.0, 11.0, 16.0, 19.0, 27.0, 23.0, 19.0, 24.0, 33.0, 36.0, 43.0, 44.0, 52.0, 48.0, 45.0, 48.0, 36.0, 54.0, 43.0, 48.0, 57.0, 40.0, 27.0, 27.0, 28.0, 29.0, 22.0, 29.0, 9.0, 9.0, 8.0, 10.0, 8.0, 1.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-17.02634048461914, -16.503665924072266, -15.980989456176758, -15.458313941955566, -14.935638427734375, -14.412962913513184, -13.890287399291992, -13.367612838745117, -12.84493637084961, -12.322260856628418, -11.799585342407227, -11.276909828186035, -10.754234313964844, -10.231558799743652, -9.708883285522461, -9.186208724975586, -8.663533210754395, -8.140857696533203, -7.618182182312012, -7.09550666809082, -6.572831153869629, -6.0501556396484375, -5.527480602264404, -5.004805088043213, -4.4821295738220215, -3.95945405960083, -3.4367785453796387, -2.9141032695770264, -2.391427755355835, -1.8687522411346436, -1.3460769653320312, -0.8234014511108398, -0.30072593688964844, 0.2219495177268982, 0.7446249723434448, 1.2673003673553467, 1.789975881576538, 2.3126513957977295, 2.835326671600342, 3.358002185821533, 3.8806777000427246, 4.403353214263916, 4.926028728485107, 5.448703765869141, 5.971379280090332, 6.494054794311523, 7.016730308532715, 7.539405822753906, 8.062081336975098, 8.584756851196289, 9.10743236541748, 9.630107879638672, 10.152783393859863, 10.675458908081055, 11.19813346862793, 11.720809936523438, 12.243484497070312, 12.766160011291504, 13.288835525512695, 13.811511039733887, 14.334186553955078, 14.85686206817627, 15.379537582397461, 15.902212142944336, 16.424888610839844]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 4.0, 6.0, 3.0, 6.0, 9.0, 7.0, 11.0, 19.0, 19.0, 19.0, 25.0, 30.0, 39.0, 53.0, 69.0, 108.0, 167.0, 239.0, 593.0, 1606.0, 5917.0, 40207.0, 4105124.0, 31995.0, 5433.0, 1454.0, 524.0, 229.0, 134.0, 74.0, 53.0, 31.0, 24.0, 11.0, 12.0, 8.0, 7.0, 6.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-18.890625, -18.423583984375, -17.95654296875, -17.489501953125, -17.0224609375, -16.555419921875, -16.08837890625, -15.621337890625, -15.154296875, -14.687255859375, -14.22021484375, -13.753173828125, -13.2861328125, -12.819091796875, -12.35205078125, -11.885009765625, -11.41796875, -10.950927734375, -10.48388671875, -10.016845703125, -9.5498046875, -9.082763671875, -8.61572265625, -8.148681640625, -7.681640625, -7.214599609375, -6.74755859375, -6.280517578125, -5.8134765625, -5.346435546875, -4.87939453125, -4.412353515625, -3.9453125, -3.478271484375, -3.01123046875, -2.544189453125, -2.0771484375, -1.610107421875, -1.14306640625, -0.676025390625, -0.208984375, 0.258056640625, 0.72509765625, 1.192138671875, 1.6591796875, 2.126220703125, 2.59326171875, 3.060302734375, 3.52734375, 3.994384765625, 4.46142578125, 4.928466796875, 5.3955078125, 5.862548828125, 6.32958984375, 6.796630859375, 7.263671875, 7.730712890625, 8.19775390625, 8.664794921875, 9.1318359375, 9.598876953125, 10.06591796875, 10.532958984375, 11.0]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 10.0, 13.0, 25.0, 26.0, 48.0, 84.0, 94.0, 99.0, 128.0, 112.0, 94.0, 76.0, 81.0, 43.0, 26.0, 17.0, 13.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.796875, -1.75164794921875, -1.7064208984375, -1.66119384765625, -1.615966796875, -1.57073974609375, -1.5255126953125, -1.48028564453125, -1.43505859375, -1.38983154296875, -1.3446044921875, -1.29937744140625, -1.254150390625, -1.20892333984375, -1.1636962890625, -1.11846923828125, -1.0732421875, -1.02801513671875, -0.9827880859375, -0.93756103515625, -0.892333984375, -0.84710693359375, -0.8018798828125, -0.75665283203125, -0.71142578125, -0.66619873046875, -0.6209716796875, -0.57574462890625, -0.530517578125, -0.48529052734375, -0.4400634765625, -0.39483642578125, -0.349609375, -0.30438232421875, -0.2591552734375, -0.21392822265625, -0.168701171875, -0.12347412109375, -0.0782470703125, -0.03302001953125, 0.01220703125, 0.05743408203125, 0.1026611328125, 0.14788818359375, 0.193115234375, 0.23834228515625, 0.2835693359375, 0.32879638671875, 0.3740234375, 0.41925048828125, 0.4644775390625, 0.50970458984375, 0.554931640625, 0.60015869140625, 0.6453857421875, 0.69061279296875, 0.73583984375, 0.78106689453125, 0.8262939453125, 0.87152099609375, 0.916748046875, 0.96197509765625, 1.0072021484375, 1.05242919921875, 1.09765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 4.0, 5.0, 4.0, 9.0, 17.0, 18.0, 21.0, 41.0, 61.0, 97.0, 125.0, 188.0, 364.0, 656.0, 1258.0, 2546.0, 5485.0, 13196.0, 43051.0, 1040174.0, 3013660.0, 47778.0, 13814.0, 5784.0, 2648.0, 1408.0, 774.0, 409.0, 241.0, 142.0, 85.0, 56.0, 55.0, 33.0, 16.0, 15.0, 11.0, 13.0, 4.0, 4.0, 5.0, 3.0, 3.0, 2.0], "bins": [-7.15625, -6.97747802734375, -6.7987060546875, -6.61993408203125, -6.441162109375, -6.26239013671875, -6.0836181640625, -5.90484619140625, -5.72607421875, -5.54730224609375, -5.3685302734375, -5.18975830078125, -5.010986328125, -4.83221435546875, -4.6534423828125, -4.47467041015625, -4.2958984375, -4.11712646484375, -3.9383544921875, -3.75958251953125, -3.580810546875, -3.40203857421875, -3.2232666015625, -3.04449462890625, -2.86572265625, -2.68695068359375, -2.5081787109375, -2.32940673828125, -2.150634765625, -1.97186279296875, -1.7930908203125, -1.61431884765625, -1.435546875, -1.25677490234375, -1.0780029296875, -0.89923095703125, -0.720458984375, -0.54168701171875, -0.3629150390625, -0.18414306640625, -0.00537109375, 0.17340087890625, 0.3521728515625, 0.53094482421875, 0.709716796875, 0.88848876953125, 1.0672607421875, 1.24603271484375, 1.4248046875, 1.60357666015625, 1.7823486328125, 1.96112060546875, 2.139892578125, 2.31866455078125, 2.4974365234375, 2.67620849609375, 2.85498046875, 3.03375244140625, 3.2125244140625, 3.39129638671875, 3.570068359375, 3.74884033203125, 3.9276123046875, 4.10638427734375, 4.28515625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 1.0, 2.0, 3.0, 8.0, 9.0, 12.0, 10.0, 21.0, 21.0, 46.0, 61.0, 141.0, 590.0, 2597.0, 245.0, 120.0, 56.0, 36.0, 26.0, 16.0, 11.0, 5.0, 5.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3974609375, -1.3373870849609375, -1.277313232421875, -1.2172393798828125, -1.15716552734375, -1.0970916748046875, -1.037017822265625, -0.9769439697265625, -0.9168701171875, -0.8567962646484375, -0.796722412109375, -0.7366485595703125, -0.67657470703125, -0.6165008544921875, -0.556427001953125, -0.4963531494140625, -0.436279296875, -0.3762054443359375, -0.316131591796875, -0.2560577392578125, -0.19598388671875, -0.1359100341796875, -0.075836181640625, -0.0157623291015625, 0.0443115234375, 0.1043853759765625, 0.164459228515625, 0.2245330810546875, 0.28460693359375, 0.3446807861328125, 0.404754638671875, 0.4648284912109375, 0.52490234375, 0.5849761962890625, 0.645050048828125, 0.7051239013671875, 0.76519775390625, 0.8252716064453125, 0.885345458984375, 0.9454193115234375, 1.0054931640625, 1.0655670166015625, 1.125640869140625, 1.1857147216796875, 1.24578857421875, 1.3058624267578125, 1.365936279296875, 1.4260101318359375, 1.486083984375, 1.5461578369140625, 1.606231689453125, 1.6663055419921875, 1.72637939453125, 1.7864532470703125, 1.846527099609375, 1.9066009521484375, 1.9666748046875, 2.0267486572265625, 2.086822509765625, 2.1468963623046875, 2.20697021484375, 2.2670440673828125, 2.327117919921875, 2.3871917724609375, 2.447265625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 14.0, 37.0, 53.0, 143.0, 366.0, 240.0, 98.0, 39.0, 14.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.569042205810547, -8.864547729492188, -8.160053253173828, -7.4555583000183105, -6.751063346862793, -6.046568870544434, -5.342074394226074, -4.637579441070557, -3.9330849647521973, -3.228590250015259, -2.5240955352783203, -1.819601058959961, -1.1151063442230225, -0.410611629486084, 0.2938828468322754, 0.998377799987793, 1.7028722763061523, 2.407366991043091, 3.1118617057800293, 3.8163561820983887, 4.520851135253906, 5.225345611572266, 5.929840087890625, 6.634335041046143, 7.338829517364502, 8.04332447052002, 8.747818946838379, 9.452313423156738, 10.156807899475098, 10.861303329467773, 11.565797805786133, 12.270292282104492, 12.974786758422852, 13.679281234741211, 14.38377571105957, 15.08827018737793, 15.792765617370605, 16.49726104736328, 17.20175552368164, 17.90625, 18.61074447631836, 19.31523895263672, 20.019733428955078, 20.724227905273438, 21.428722381591797, 22.133216857910156, 22.837711334228516, 23.542207717895508, 24.246700286865234, 24.951194763183594, 25.655689239501953, 26.360183715820312, 27.064678192138672, 27.76917266845703, 28.47366714477539, 29.178163528442383, 29.882658004760742, 30.5871524810791, 31.29164695739746, 31.99614143371582, 32.70063781738281, 33.40513229370117, 34.10962677001953, 34.81412124633789, 35.51861572265625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 3.0, 7.0, 9.0, 7.0, 9.0, 12.0, 9.0, 17.0, 22.0, 25.0, 18.0, 20.0, 33.0, 38.0, 35.0, 33.0, 40.0, 48.0, 48.0, 48.0, 47.0, 36.0, 41.0, 46.0, 32.0, 37.0, 38.0, 37.0, 26.0, 23.0, 21.0, 19.0, 24.0, 15.0, 14.0, 14.0, 15.0, 10.0, 6.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.502102375030518, -4.361291408538818, -4.220480918884277, -4.079669952392578, -3.938858985900879, -3.7980480194091797, -3.6572372913360596, -3.5164265632629395, -3.3756155967712402, -3.234804630279541, -3.093993902206421, -2.953183174133301, -2.8123722076416016, -2.6715612411499023, -2.5307505130767822, -2.389939785003662, -2.249128818511963, -2.1083178520202637, -1.9675071239471436, -1.8266962766647339, -1.6858854293823242, -1.5450745820999146, -1.4042637348175049, -1.2634528875350952, -1.1226420402526855, -0.9818311929702759, -0.8410203456878662, -0.7002094984054565, -0.5593986511230469, -0.4185878038406372, -0.27777695655822754, -0.13696610927581787, 0.0038442611694335938, 0.14465510845184326, 0.28546595573425293, 0.4262768030166626, 0.5670876502990723, 0.7078984975814819, 0.8487093448638916, 0.9895201921463013, 1.130331039428711, 1.2711418867111206, 1.4119527339935303, 1.55276358127594, 1.6935744285583496, 1.8343852758407593, 1.975196123123169, 2.116006851196289, 2.2568178176879883, 2.3976287841796875, 2.5384395122528076, 2.6792502403259277, 2.820061206817627, 2.960872173309326, 3.1016829013824463, 3.2424936294555664, 3.3833045959472656, 3.524115562438965, 3.664926290512085, 3.805737018585205, 3.9465479850769043, 4.0873589515686035, 4.2281694412231445, 4.368980407714844, 4.509791374206543]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 4.0, 9.0, 4.0, 10.0, 10.0, 20.0, 27.0, 31.0, 44.0, 42.0, 72.0, 86.0, 141.0, 186.0, 291.0, 573.0, 1162.0, 2852.0, 9939.0, 49648.0, 470731.0, 449127.0, 48361.0, 9777.0, 2807.0, 1097.0, 506.0, 284.0, 226.0, 140.0, 94.0, 58.0, 44.0, 34.0, 37.0, 16.0, 19.0, 7.0, 5.0, 4.0, 8.0, 1.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.38671875, -6.15008544921875, -5.9134521484375, -5.67681884765625, -5.440185546875, -5.20355224609375, -4.9669189453125, -4.73028564453125, -4.49365234375, -4.25701904296875, -4.0203857421875, -3.78375244140625, -3.547119140625, -3.31048583984375, -3.0738525390625, -2.83721923828125, -2.6005859375, -2.36395263671875, -2.1273193359375, -1.89068603515625, -1.654052734375, -1.41741943359375, -1.1807861328125, -0.94415283203125, -0.70751953125, -0.47088623046875, -0.2342529296875, 0.00238037109375, 0.239013671875, 0.47564697265625, 0.7122802734375, 0.94891357421875, 1.185546875, 1.42218017578125, 1.6588134765625, 1.89544677734375, 2.132080078125, 2.36871337890625, 2.6053466796875, 2.84197998046875, 3.07861328125, 3.31524658203125, 3.5518798828125, 3.78851318359375, 4.025146484375, 4.26177978515625, 4.4984130859375, 4.73504638671875, 4.9716796875, 5.20831298828125, 5.4449462890625, 5.68157958984375, 5.918212890625, 6.15484619140625, 6.3914794921875, 6.62811279296875, 6.86474609375, 7.10137939453125, 7.3380126953125, 7.57464599609375, 7.811279296875, 8.04791259765625, 8.2845458984375, 8.52117919921875, 8.7578125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 10.0, 13.0, 20.0, 34.0, 40.0, 79.0, 90.0, 113.0, 118.0, 111.0, 99.0, 83.0, 79.0, 40.0, 35.0, 16.0, 13.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8642578125, -1.8174896240234375, -1.770721435546875, -1.7239532470703125, -1.67718505859375, -1.6304168701171875, -1.583648681640625, -1.5368804931640625, -1.4901123046875, -1.4433441162109375, -1.396575927734375, -1.3498077392578125, -1.30303955078125, -1.2562713623046875, -1.209503173828125, -1.1627349853515625, -1.115966796875, -1.0691986083984375, -1.022430419921875, -0.9756622314453125, -0.92889404296875, -0.8821258544921875, -0.835357666015625, -0.7885894775390625, -0.7418212890625, -0.6950531005859375, -0.648284912109375, -0.6015167236328125, -0.55474853515625, -0.5079803466796875, -0.461212158203125, -0.4144439697265625, -0.36767578125, -0.3209075927734375, -0.274139404296875, -0.2273712158203125, -0.18060302734375, -0.1338348388671875, -0.087066650390625, -0.0402984619140625, 0.0064697265625, 0.0532379150390625, 0.100006103515625, 0.1467742919921875, 0.19354248046875, 0.2403106689453125, 0.287078857421875, 0.3338470458984375, 0.380615234375, 0.4273834228515625, 0.474151611328125, 0.5209197998046875, 0.56768798828125, 0.6144561767578125, 0.661224365234375, 0.7079925537109375, 0.7547607421875, 0.8015289306640625, 0.848297119140625, 0.8950653076171875, 0.94183349609375, 0.9886016845703125, 1.035369873046875, 1.0821380615234375, 1.12890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 4.0, 0.0, 6.0, 6.0, 15.0, 10.0, 18.0, 25.0, 37.0, 48.0, 62.0, 111.0, 182.0, 315.0, 496.0, 824.0, 1678.0, 3114.0, 6576.0, 14697.0, 37467.0, 115752.0, 412144.0, 314975.0, 86827.0, 29617.0, 12138.0, 5418.0, 2736.0, 1351.0, 760.0, 411.0, 247.0, 158.0, 112.0, 83.0, 38.0, 32.0, 22.0, 19.0, 9.0, 5.0, 9.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.65625, -2.55743408203125, -2.4586181640625, -2.35980224609375, -2.260986328125, -2.16217041015625, -2.0633544921875, -1.96453857421875, -1.86572265625, -1.76690673828125, -1.6680908203125, -1.56927490234375, -1.470458984375, -1.37164306640625, -1.2728271484375, -1.17401123046875, -1.0751953125, -0.97637939453125, -0.8775634765625, -0.77874755859375, -0.679931640625, -0.58111572265625, -0.4822998046875, -0.38348388671875, -0.28466796875, -0.18585205078125, -0.0870361328125, 0.01177978515625, 0.110595703125, 0.20941162109375, 0.3082275390625, 0.40704345703125, 0.505859375, 0.60467529296875, 0.7034912109375, 0.80230712890625, 0.901123046875, 0.99993896484375, 1.0987548828125, 1.19757080078125, 1.29638671875, 1.39520263671875, 1.4940185546875, 1.59283447265625, 1.691650390625, 1.79046630859375, 1.8892822265625, 1.98809814453125, 2.0869140625, 2.18572998046875, 2.2845458984375, 2.38336181640625, 2.482177734375, 2.58099365234375, 2.6798095703125, 2.77862548828125, 2.87744140625, 2.97625732421875, 3.0750732421875, 3.17388916015625, 3.272705078125, 3.37152099609375, 3.4703369140625, 3.56915283203125, 3.66796875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 2.0, 7.0, 5.0, 5.0, 8.0, 13.0, 10.0, 10.0, 25.0, 15.0, 32.0, 19.0, 37.0, 25.0, 35.0, 36.0, 52.0, 40.0, 47.0, 54.0, 59.0, 49.0, 44.0, 42.0, 40.0, 36.0, 28.0, 37.0, 23.0, 24.0, 24.0, 16.0, 19.0, 17.0, 13.0, 12.0, 5.0, 9.0, 7.0, 3.0, 3.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.263671875, -3.17266845703125, -3.0816650390625, -2.99066162109375, -2.899658203125, -2.80865478515625, -2.7176513671875, -2.62664794921875, -2.53564453125, -2.44464111328125, -2.3536376953125, -2.26263427734375, -2.171630859375, -2.08062744140625, -1.9896240234375, -1.89862060546875, -1.8076171875, -1.71661376953125, -1.6256103515625, -1.53460693359375, -1.443603515625, -1.35260009765625, -1.2615966796875, -1.17059326171875, -1.07958984375, -0.98858642578125, -0.8975830078125, -0.80657958984375, -0.715576171875, -0.62457275390625, -0.5335693359375, -0.44256591796875, -0.3515625, -0.26055908203125, -0.1695556640625, -0.07855224609375, 0.012451171875, 0.10345458984375, 0.1944580078125, 0.28546142578125, 0.37646484375, 0.46746826171875, 0.5584716796875, 0.64947509765625, 0.740478515625, 0.83148193359375, 0.9224853515625, 1.01348876953125, 1.1044921875, 1.19549560546875, 1.2864990234375, 1.37750244140625, 1.468505859375, 1.55950927734375, 1.6505126953125, 1.74151611328125, 1.83251953125, 1.92352294921875, 2.0145263671875, 2.10552978515625, 2.196533203125, 2.28753662109375, 2.3785400390625, 2.46954345703125, 2.560546875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 12.0, 10.0, 11.0, 20.0, 24.0, 34.0, 58.0, 69.0, 98.0, 175.0, 270.0, 400.0, 780.0, 1568.0, 3321.0, 8562.0, 27594.0, 117833.0, 575363.0, 243454.0, 46196.0, 13351.0, 4689.0, 2159.0, 1019.0, 560.0, 361.0, 181.0, 114.0, 60.0, 55.0, 38.0, 27.0, 21.0, 12.0, 14.0, 11.0, 6.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.60546875, -1.5514068603515625, -1.497344970703125, -1.4432830810546875, -1.38922119140625, -1.3351593017578125, -1.281097412109375, -1.2270355224609375, -1.1729736328125, -1.1189117431640625, -1.064849853515625, -1.0107879638671875, -0.95672607421875, -0.9026641845703125, -0.848602294921875, -0.7945404052734375, -0.740478515625, -0.6864166259765625, -0.632354736328125, -0.5782928466796875, -0.52423095703125, -0.4701690673828125, -0.416107177734375, -0.3620452880859375, -0.3079833984375, -0.2539215087890625, -0.199859619140625, -0.1457977294921875, -0.09173583984375, -0.0376739501953125, 0.016387939453125, 0.0704498291015625, 0.12451171875, 0.1785736083984375, 0.232635498046875, 0.2866973876953125, 0.34075927734375, 0.3948211669921875, 0.448883056640625, 0.5029449462890625, 0.5570068359375, 0.6110687255859375, 0.665130615234375, 0.7191925048828125, 0.77325439453125, 0.8273162841796875, 0.881378173828125, 0.9354400634765625, 0.989501953125, 1.0435638427734375, 1.097625732421875, 1.1516876220703125, 1.20574951171875, 1.2598114013671875, 1.313873291015625, 1.3679351806640625, 1.4219970703125, 1.4760589599609375, 1.530120849609375, 1.5841827392578125, 1.63824462890625, 1.6923065185546875, 1.746368408203125, 1.8004302978515625, 1.8544921875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 9.0, 9.0, 8.0, 22.0, 24.0, 37.0, 39.0, 88.0, 117.0, 155.0, 152.0, 101.0, 67.0, 42.0, 24.0, 13.0, 18.0, 14.0, 15.0, 8.0, 7.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004165172576904297, -0.0004025474190711975, -0.00038857758045196533, -0.00037460774183273315, -0.000360637903213501, -0.0003466680645942688, -0.0003326982259750366, -0.00031872838735580444, -0.00030475854873657227, -0.0002907887101173401, -0.0002768188714981079, -0.00026284903287887573, -0.00024887919425964355, -0.00023490935564041138, -0.0002209395170211792, -0.00020696967840194702, -0.00019299983978271484, -0.00017903000116348267, -0.0001650601625442505, -0.0001510903239250183, -0.00013712048530578613, -0.00012315064668655396, -0.00010918080806732178, -9.52109694480896e-05, -8.124113082885742e-05, -6.727129220962524e-05, -5.3301453590393066e-05, -3.933161497116089e-05, -2.536177635192871e-05, -1.1391937732696533e-05, 2.5779008865356445e-06, 1.6547739505767822e-05, 3.0517578125e-05, 4.448741674423218e-05, 5.8457255363464355e-05, 7.242709398269653e-05, 8.639693260192871e-05, 0.00010036677122116089, 0.00011433660984039307, 0.00012830644845962524, 0.00014227628707885742, 0.0001562461256980896, 0.00017021596431732178, 0.00018418580293655396, 0.00019815564155578613, 0.0002121254801750183, 0.0002260953187942505, 0.00024006515741348267, 0.00025403499603271484, 0.000268004834651947, 0.0002819746732711792, 0.0002959445118904114, 0.00030991435050964355, 0.00032388418912887573, 0.0003378540277481079, 0.0003518238663673401, 0.00036579370498657227, 0.00037976354360580444, 0.0003937333822250366, 0.0004077032208442688, 0.000421673059463501, 0.00043564289808273315, 0.00044961273670196533, 0.0004635825753211975, 0.0004775524139404297]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 12.0, 7.0, 20.0, 15.0, 33.0, 46.0, 68.0, 108.0, 187.0, 308.0, 579.0, 1052.0, 2420.0, 6136.0, 19538.0, 91365.0, 571705.0, 290122.0, 45565.0, 11487.0, 3971.0, 1800.0, 897.0, 446.0, 247.0, 143.0, 95.0, 52.0, 47.0, 24.0, 20.0, 10.0, 10.0, 4.0, 1.0, 2.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.111328125, -2.0569000244140625, -2.002471923828125, -1.9480438232421875, -1.89361572265625, -1.8391876220703125, -1.784759521484375, -1.7303314208984375, -1.6759033203125, -1.6214752197265625, -1.567047119140625, -1.5126190185546875, -1.45819091796875, -1.4037628173828125, -1.349334716796875, -1.2949066162109375, -1.240478515625, -1.1860504150390625, -1.131622314453125, -1.0771942138671875, -1.02276611328125, -0.9683380126953125, -0.913909912109375, -0.8594818115234375, -0.8050537109375, -0.7506256103515625, -0.696197509765625, -0.6417694091796875, -0.58734130859375, -0.5329132080078125, -0.478485107421875, -0.4240570068359375, -0.36962890625, -0.3152008056640625, -0.260772705078125, -0.2063446044921875, -0.15191650390625, -0.0974884033203125, -0.043060302734375, 0.0113677978515625, 0.0657958984375, 0.1202239990234375, 0.174652099609375, 0.2290802001953125, 0.28350830078125, 0.3379364013671875, 0.392364501953125, 0.4467926025390625, 0.501220703125, 0.5556488037109375, 0.610076904296875, 0.6645050048828125, 0.71893310546875, 0.7733612060546875, 0.827789306640625, 0.8822174072265625, 0.9366455078125, 0.9910736083984375, 1.045501708984375, 1.0999298095703125, 1.15435791015625, 1.2087860107421875, 1.263214111328125, 1.3176422119140625, 1.3720703125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 9.0, 12.0, 23.0, 25.0, 31.0, 51.0, 59.0, 88.0, 107.0, 116.0, 102.0, 92.0, 67.0, 54.0, 46.0, 28.0, 25.0, 18.0, 7.0, 9.0, 6.0, 2.0, 0.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.36328125, -1.3189239501953125, -1.274566650390625, -1.2302093505859375, -1.18585205078125, -1.1414947509765625, -1.097137451171875, -1.0527801513671875, -1.0084228515625, -0.9640655517578125, -0.919708251953125, -0.8753509521484375, -0.83099365234375, -0.7866363525390625, -0.742279052734375, -0.6979217529296875, -0.653564453125, -0.6092071533203125, -0.564849853515625, -0.5204925537109375, -0.47613525390625, -0.4317779541015625, -0.387420654296875, -0.3430633544921875, -0.2987060546875, -0.2543487548828125, -0.209991455078125, -0.1656341552734375, -0.12127685546875, -0.0769195556640625, -0.032562255859375, 0.0117950439453125, 0.05615234375, 0.1005096435546875, 0.144866943359375, 0.1892242431640625, 0.23358154296875, 0.2779388427734375, 0.322296142578125, 0.3666534423828125, 0.4110107421875, 0.4553680419921875, 0.499725341796875, 0.5440826416015625, 0.58843994140625, 0.6327972412109375, 0.677154541015625, 0.7215118408203125, 0.765869140625, 0.8102264404296875, 0.854583740234375, 0.8989410400390625, 0.94329833984375, 0.9876556396484375, 1.032012939453125, 1.0763702392578125, 1.1207275390625, 1.1650848388671875, 1.209442138671875, 1.2537994384765625, 1.29815673828125, 1.3425140380859375, 1.386871337890625, 1.4312286376953125, 1.4755859375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 7.0, 16.0, 96.0, 402.0, 381.0, 79.0, 24.0, 6.0, 1.0, 0.0, 1.0], "bins": [-163.84609985351562, -160.96719360351562, -158.0883026123047, -155.2093963623047, -152.33050537109375, -149.45159912109375, -146.5727081298828, -143.6938018798828, -140.81491088867188, -137.93600463867188, -135.05711364746094, -132.17820739746094, -129.29931640625, -126.42041778564453, -123.54151916503906, -120.6626205444336, -117.78372192382812, -114.90482330322266, -112.02592468261719, -109.14702606201172, -106.26812744140625, -103.38922882080078, -100.51033020019531, -97.63143157958984, -94.75252532958984, -91.87362670898438, -88.9947280883789, -86.11582946777344, -83.23693084716797, -80.3580322265625, -77.47913360595703, -74.60023498535156, -71.72134399414062, -68.84244537353516, -65.96354675292969, -63.08464813232422, -60.20574951171875, -57.32685089111328, -54.44795227050781, -51.569053649902344, -48.690147399902344, -45.811248779296875, -42.932350158691406, -40.05345153808594, -37.17455291748047, -34.295654296875, -31.4167537689209, -28.53785514831543, -25.658958435058594, -22.780059814453125, -19.901161193847656, -17.022262573242188, -14.143362998962402, -11.264464378356934, -8.385564804077148, -5.50666618347168, -2.627767562866211, 0.2511312961578369, 3.1300301551818848, 6.008929252624512, 8.88782787322998, 11.76672649383545, 14.645626068115234, 17.524524688720703, 20.403423309326172]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 9.0, 9.0, 6.0, 6.0, 10.0, 16.0, 16.0, 24.0, 16.0, 13.0, 20.0, 33.0, 27.0, 25.0, 41.0, 46.0, 46.0, 48.0, 49.0, 46.0, 51.0, 43.0, 44.0, 34.0, 29.0, 30.0, 35.0, 36.0, 20.0, 36.0, 23.0, 16.0, 14.0, 10.0, 14.0, 9.0, 8.0, 6.0, 6.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-16.658592224121094, -16.147735595703125, -15.636880874633789, -15.12602424621582, -14.615168571472168, -14.104312896728516, -13.593456268310547, -13.082600593566895, -12.571744918823242, -12.06088924407959, -11.550033569335938, -11.039176940917969, -10.528321266174316, -10.017465591430664, -9.506608963012695, -8.995753288269043, -8.48489761352539, -7.974041938781738, -7.463185787200928, -6.952329635620117, -6.441473960876465, -5.9306182861328125, -5.419762134552002, -4.908905982971191, -4.398050308227539, -3.8871943950653076, -3.376338481903076, -2.8654825687408447, -2.3546266555786133, -1.8437707424163818, -1.3329148292541504, -0.822058916091919, -0.3112049102783203, 0.19965100288391113, 0.7105069160461426, 1.221362829208374, 1.7322187423706055, 2.243074655532837, 2.7539305686950684, 3.2647864818573, 3.7756423950195312, 4.286498069763184, 4.797354221343994, 5.308210372924805, 5.819066047668457, 6.329921722412109, 6.84077787399292, 7.3516340255737305, 7.862489700317383, 8.373345375061035, 8.884201049804688, 9.395057678222656, 9.905913352966309, 10.416769027709961, 10.92762565612793, 11.438481330871582, 11.949337005615234, 12.460192680358887, 12.971048355102539, 13.481904983520508, 13.99276065826416, 14.503616333007812, 15.014472961425781, 15.525328636169434, 16.036184310913086]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 10.0, 7.0, 10.0, 4.0, 7.0, 21.0, 13.0, 17.0, 19.0, 23.0, 34.0, 41.0, 41.0, 56.0, 67.0, 85.0, 182.0, 269.0, 535.0, 1267.0, 3139.0, 9761.0, 49327.0, 4038104.0, 72754.0, 11705.0, 3808.0, 1455.0, 655.0, 314.0, 191.0, 106.0, 72.0, 37.0, 44.0, 23.0, 17.0, 15.0, 13.0, 8.0, 4.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-13.2890625, -12.9532470703125, -12.617431640625, -12.2816162109375, -11.94580078125, -11.6099853515625, -11.274169921875, -10.9383544921875, -10.6025390625, -10.2667236328125, -9.930908203125, -9.5950927734375, -9.25927734375, -8.9234619140625, -8.587646484375, -8.2518310546875, -7.916015625, -7.5802001953125, -7.244384765625, -6.9085693359375, -6.57275390625, -6.2369384765625, -5.901123046875, -5.5653076171875, -5.2294921875, -4.8936767578125, -4.557861328125, -4.2220458984375, -3.88623046875, -3.5504150390625, -3.214599609375, -2.8787841796875, -2.54296875, -2.2071533203125, -1.871337890625, -1.5355224609375, -1.19970703125, -0.8638916015625, -0.528076171875, -0.1922607421875, 0.1435546875, 0.4793701171875, 0.815185546875, 1.1510009765625, 1.48681640625, 1.8226318359375, 2.158447265625, 2.4942626953125, 2.830078125, 3.1658935546875, 3.501708984375, 3.8375244140625, 4.17333984375, 4.5091552734375, 4.844970703125, 5.1807861328125, 5.5166015625, 5.8524169921875, 6.188232421875, 6.5240478515625, 6.85986328125, 7.1956787109375, 7.531494140625, 7.8673095703125, 8.203125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 11.0, 13.0, 16.0, 27.0, 36.0, 45.0, 53.0, 73.0, 89.0, 89.0, 107.0, 88.0, 83.0, 75.0, 60.0, 47.0, 28.0, 19.0, 17.0, 9.0, 9.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7119140625, -1.6672515869140625, -1.622589111328125, -1.5779266357421875, -1.53326416015625, -1.4886016845703125, -1.443939208984375, -1.3992767333984375, -1.3546142578125, -1.3099517822265625, -1.265289306640625, -1.2206268310546875, -1.17596435546875, -1.1313018798828125, -1.086639404296875, -1.0419769287109375, -0.997314453125, -0.9526519775390625, -0.907989501953125, -0.8633270263671875, -0.81866455078125, -0.7740020751953125, -0.729339599609375, -0.6846771240234375, -0.6400146484375, -0.5953521728515625, -0.550689697265625, -0.5060272216796875, -0.46136474609375, -0.4167022705078125, -0.372039794921875, -0.3273773193359375, -0.28271484375, -0.2380523681640625, -0.193389892578125, -0.1487274169921875, -0.10406494140625, -0.0594024658203125, -0.014739990234375, 0.0299224853515625, 0.0745849609375, 0.1192474365234375, 0.163909912109375, 0.2085723876953125, 0.25323486328125, 0.2978973388671875, 0.342559814453125, 0.3872222900390625, 0.431884765625, 0.4765472412109375, 0.521209716796875, 0.5658721923828125, 0.61053466796875, 0.6551971435546875, 0.699859619140625, 0.7445220947265625, 0.7891845703125, 0.8338470458984375, 0.878509521484375, 0.9231719970703125, 0.96783447265625, 1.0124969482421875, 1.057159423828125, 1.1018218994140625, 1.146484375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 9.0, 4.0, 14.0, 24.0, 29.0, 55.0, 50.0, 82.0, 182.0, 309.0, 559.0, 1232.0, 2962.0, 8207.0, 30413.0, 340601.0, 3736659.0, 53523.0, 12118.0, 4021.0, 1599.0, 732.0, 393.0, 205.0, 121.0, 57.0, 38.0, 24.0, 16.0, 11.0, 11.0, 9.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3984375, -6.1539306640625, -5.909423828125, -5.6649169921875, -5.42041015625, -5.1759033203125, -4.931396484375, -4.6868896484375, -4.4423828125, -4.1978759765625, -3.953369140625, -3.7088623046875, -3.46435546875, -3.2198486328125, -2.975341796875, -2.7308349609375, -2.486328125, -2.2418212890625, -1.997314453125, -1.7528076171875, -1.50830078125, -1.2637939453125, -1.019287109375, -0.7747802734375, -0.5302734375, -0.2857666015625, -0.041259765625, 0.2032470703125, 0.44775390625, 0.6922607421875, 0.936767578125, 1.1812744140625, 1.42578125, 1.6702880859375, 1.914794921875, 2.1593017578125, 2.40380859375, 2.6483154296875, 2.892822265625, 3.1373291015625, 3.3818359375, 3.6263427734375, 3.870849609375, 4.1153564453125, 4.35986328125, 4.6043701171875, 4.848876953125, 5.0933837890625, 5.337890625, 5.5823974609375, 5.826904296875, 6.0714111328125, 6.31591796875, 6.5604248046875, 6.804931640625, 7.0494384765625, 7.2939453125, 7.5384521484375, 7.782958984375, 8.0274658203125, 8.27197265625, 8.5164794921875, 8.760986328125, 9.0054931640625, 9.25]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 7.0, 8.0, 17.0, 12.0, 13.0, 32.0, 50.0, 71.0, 167.0, 911.0, 2331.0, 218.0, 84.0, 54.0, 31.0, 19.0, 14.0, 9.0, 4.0, 7.0, 2.0, 1.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.19921875, -4.104034423828125, -4.00885009765625, -3.913665771484375, -3.8184814453125, -3.723297119140625, -3.62811279296875, -3.532928466796875, -3.437744140625, -3.342559814453125, -3.24737548828125, -3.152191162109375, -3.0570068359375, -2.961822509765625, -2.86663818359375, -2.771453857421875, -2.67626953125, -2.581085205078125, -2.48590087890625, -2.390716552734375, -2.2955322265625, -2.200347900390625, -2.10516357421875, -2.009979248046875, -1.914794921875, -1.819610595703125, -1.72442626953125, -1.629241943359375, -1.5340576171875, -1.438873291015625, -1.34368896484375, -1.248504638671875, -1.1533203125, -1.058135986328125, -0.96295166015625, -0.867767333984375, -0.7725830078125, -0.677398681640625, -0.58221435546875, -0.487030029296875, -0.391845703125, -0.296661376953125, -0.20147705078125, -0.106292724609375, -0.0111083984375, 0.084075927734375, 0.17926025390625, 0.274444580078125, 0.36962890625, 0.464813232421875, 0.55999755859375, 0.655181884765625, 0.7503662109375, 0.845550537109375, 0.94073486328125, 1.035919189453125, 1.131103515625, 1.226287841796875, 1.32147216796875, 1.416656494140625, 1.5118408203125, 1.607025146484375, 1.70220947265625, 1.797393798828125, 1.892578125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 12.0, 5.0, 17.0, 27.0, 63.0, 83.0, 142.0, 204.0, 178.0, 133.0, 52.0, 41.0, 15.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.175186157226562, -19.668771743774414, -19.162357330322266, -18.655942916870117, -18.14952850341797, -17.643112182617188, -17.13669776916504, -16.63028335571289, -16.123868942260742, -15.617454528808594, -15.111040115356445, -14.60462474822998, -14.098210334777832, -13.591795921325684, -13.085380554199219, -12.57896614074707, -12.072551727294922, -11.566137313842773, -11.059722900390625, -10.55330753326416, -10.046893119812012, -9.540478706359863, -9.034063339233398, -8.52764892578125, -8.021234512329102, -7.514820098876953, -7.0084052085876465, -6.50199031829834, -5.995575904846191, -5.489161491394043, -4.982746601104736, -4.47633171081543, -3.969916343688965, -3.4635016918182373, -2.9570870399475098, -2.4506723880767822, -1.9442577362060547, -1.4378430843353271, -0.9314284324645996, -0.42501378059387207, 0.08140087127685547, 0.587815523147583, 1.0942301750183105, 1.600644826889038, 2.1070594787597656, 2.613474130630493, 3.1198887825012207, 3.6263034343719482, 4.132718086242676, 4.639132499694824, 5.145547389984131, 5.6519622802734375, 6.158376693725586, 6.664791107177734, 7.171205997467041, 7.677620887756348, 8.184035301208496, 8.690449714660645, 9.19686508178711, 9.703279495239258, 10.209693908691406, 10.716108322143555, 11.222522735595703, 11.728938102722168, 12.235352516174316]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 4.0, 6.0, 7.0, 8.0, 12.0, 17.0, 12.0, 23.0, 28.0, 23.0, 22.0, 45.0, 45.0, 52.0, 48.0, 53.0, 53.0, 47.0, 57.0, 55.0, 44.0, 49.0, 38.0, 45.0, 32.0, 24.0, 30.0, 30.0, 15.0, 12.0, 13.0, 24.0, 8.0, 5.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.596019268035889, -5.365468502044678, -5.134917259216309, -4.904366493225098, -4.6738152503967285, -4.443264484405518, -4.212713241577148, -3.9821624755859375, -3.7516114711761475, -3.5210604667663574, -3.2905094623565674, -3.0599584579467773, -2.8294076919555664, -2.5988564491271973, -2.3683056831359863, -2.1377546787261963, -1.9072036743164062, -1.6766526699066162, -1.4461016654968262, -1.2155507802963257, -0.9849997758865356, -0.7544487714767456, -0.5238978862762451, -0.2933468818664551, -0.06279587745666504, 0.1677550971508026, 0.39830607175827026, 0.6288570165634155, 0.8594080209732056, 1.0899590253829956, 1.320509910583496, 1.5510609149932861, 1.7816123962402344, 2.0121634006500244, 2.2427144050598145, 2.4732651710510254, 2.7038164138793945, 2.9343671798706055, 3.1649181842803955, 3.3954691886901855, 3.6260201930999756, 3.8565711975097656, 4.087121963500977, 4.317673206329346, 4.548223972320557, 4.778775215148926, 5.009325981140137, 5.239876747131348, 5.470427989959717, 5.700978755950928, 5.931529998779297, 6.162080764770508, 6.392632007598877, 6.623182773590088, 6.853734016418457, 7.084284782409668, 7.314835548400879, 7.54538631439209, 7.775937557220459, 8.006488800048828, 8.237039566040039, 8.46759033203125, 8.698141098022461, 8.928691864013672, 9.1592435836792]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 0.0, 5.0, 17.0, 13.0, 22.0, 33.0, 44.0, 59.0, 135.0, 234.0, 502.0, 1130.0, 4868.0, 36163.0, 860690.0, 130830.0, 10361.0, 2049.0, 678.0, 316.0, 160.0, 90.0, 41.0, 38.0, 21.0, 12.0, 11.0, 17.0, 2.0, 4.0, 0.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.5, -10.0916748046875, -9.683349609375, -9.2750244140625, -8.86669921875, -8.4583740234375, -8.050048828125, -7.6417236328125, -7.2333984375, -6.8250732421875, -6.416748046875, -6.0084228515625, -5.60009765625, -5.1917724609375, -4.783447265625, -4.3751220703125, -3.966796875, -3.5584716796875, -3.150146484375, -2.7418212890625, -2.33349609375, -1.9251708984375, -1.516845703125, -1.1085205078125, -0.7001953125, -0.2918701171875, 0.116455078125, 0.5247802734375, 0.93310546875, 1.3414306640625, 1.749755859375, 2.1580810546875, 2.56640625, 2.9747314453125, 3.383056640625, 3.7913818359375, 4.19970703125, 4.6080322265625, 5.016357421875, 5.4246826171875, 5.8330078125, 6.2413330078125, 6.649658203125, 7.0579833984375, 7.46630859375, 7.8746337890625, 8.282958984375, 8.6912841796875, 9.099609375, 9.5079345703125, 9.916259765625, 10.3245849609375, 10.73291015625, 11.1412353515625, 11.549560546875, 11.9578857421875, 12.3662109375, 12.7745361328125, 13.182861328125, 13.5911865234375, 13.99951171875, 14.4078369140625, 14.816162109375, 15.2244873046875, 15.6328125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 11.0, 20.0, 21.0, 32.0, 30.0, 58.0, 65.0, 82.0, 111.0, 106.0, 100.0, 78.0, 82.0, 71.0, 42.0, 26.0, 26.0, 16.0, 12.0, 1.0, 3.0, 6.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8740234375, -1.826690673828125, -1.77935791015625, -1.732025146484375, -1.6846923828125, -1.637359619140625, -1.59002685546875, -1.542694091796875, -1.495361328125, -1.448028564453125, -1.40069580078125, -1.353363037109375, -1.3060302734375, -1.258697509765625, -1.21136474609375, -1.164031982421875, -1.11669921875, -1.069366455078125, -1.02203369140625, -0.974700927734375, -0.9273681640625, -0.880035400390625, -0.83270263671875, -0.785369873046875, -0.738037109375, -0.690704345703125, -0.64337158203125, -0.596038818359375, -0.5487060546875, -0.501373291015625, -0.45404052734375, -0.406707763671875, -0.359375, -0.312042236328125, -0.26470947265625, -0.217376708984375, -0.1700439453125, -0.122711181640625, -0.07537841796875, -0.028045654296875, 0.019287109375, 0.066619873046875, 0.11395263671875, 0.161285400390625, 0.2086181640625, 0.255950927734375, 0.30328369140625, 0.350616455078125, 0.39794921875, 0.445281982421875, 0.49261474609375, 0.539947509765625, 0.5872802734375, 0.634613037109375, 0.68194580078125, 0.729278564453125, 0.776611328125, 0.823944091796875, 0.87127685546875, 0.918609619140625, 0.9659423828125, 1.013275146484375, 1.06060791015625, 1.107940673828125, 1.1552734375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 5.0, 3.0, 10.0, 9.0, 12.0, 18.0, 27.0, 26.0, 39.0, 40.0, 74.0, 93.0, 145.0, 212.0, 334.0, 538.0, 932.0, 1802.0, 3622.0, 7689.0, 18222.0, 49942.0, 181667.0, 555042.0, 153113.0, 44087.0, 16310.0, 6885.0, 3458.0, 1731.0, 914.0, 550.0, 319.0, 210.0, 139.0, 86.0, 70.0, 45.0, 34.0, 31.0, 17.0, 19.0, 7.0, 5.0, 6.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0], "bins": [-3.5, -3.39837646484375, -3.2967529296875, -3.19512939453125, -3.093505859375, -2.99188232421875, -2.8902587890625, -2.78863525390625, -2.68701171875, -2.58538818359375, -2.4837646484375, -2.38214111328125, -2.280517578125, -2.17889404296875, -2.0772705078125, -1.97564697265625, -1.8740234375, -1.77239990234375, -1.6707763671875, -1.56915283203125, -1.467529296875, -1.36590576171875, -1.2642822265625, -1.16265869140625, -1.06103515625, -0.95941162109375, -0.8577880859375, -0.75616455078125, -0.654541015625, -0.55291748046875, -0.4512939453125, -0.34967041015625, -0.248046875, -0.14642333984375, -0.0447998046875, 0.05682373046875, 0.158447265625, 0.26007080078125, 0.3616943359375, 0.46331787109375, 0.56494140625, 0.66656494140625, 0.7681884765625, 0.86981201171875, 0.971435546875, 1.07305908203125, 1.1746826171875, 1.27630615234375, 1.3779296875, 1.47955322265625, 1.5811767578125, 1.68280029296875, 1.784423828125, 1.88604736328125, 1.9876708984375, 2.08929443359375, 2.19091796875, 2.29254150390625, 2.3941650390625, 2.49578857421875, 2.597412109375, 2.69903564453125, 2.8006591796875, 2.90228271484375, 3.00390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 1.0, 7.0, 14.0, 15.0, 18.0, 25.0, 32.0, 23.0, 33.0, 36.0, 38.0, 39.0, 38.0, 53.0, 54.0, 50.0, 44.0, 50.0, 57.0, 52.0, 49.0, 46.0, 45.0, 34.0, 25.0, 22.0, 29.0, 18.0, 13.0, 8.0, 6.0, 1.0, 7.0, 2.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.626953125, -3.5125732421875, -3.398193359375, -3.2838134765625, -3.16943359375, -3.0550537109375, -2.940673828125, -2.8262939453125, -2.7119140625, -2.5975341796875, -2.483154296875, -2.3687744140625, -2.25439453125, -2.1400146484375, -2.025634765625, -1.9112548828125, -1.796875, -1.6824951171875, -1.568115234375, -1.4537353515625, -1.33935546875, -1.2249755859375, -1.110595703125, -0.9962158203125, -0.8818359375, -0.7674560546875, -0.653076171875, -0.5386962890625, -0.42431640625, -0.3099365234375, -0.195556640625, -0.0811767578125, 0.033203125, 0.1475830078125, 0.261962890625, 0.3763427734375, 0.49072265625, 0.6051025390625, 0.719482421875, 0.8338623046875, 0.9482421875, 1.0626220703125, 1.177001953125, 1.2913818359375, 1.40576171875, 1.5201416015625, 1.634521484375, 1.7489013671875, 1.86328125, 1.9776611328125, 2.092041015625, 2.2064208984375, 2.32080078125, 2.4351806640625, 2.549560546875, 2.6639404296875, 2.7783203125, 2.8927001953125, 3.007080078125, 3.1214599609375, 3.23583984375, 3.3502197265625, 3.464599609375, 3.5789794921875, 3.693359375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 7.0, 4.0, 15.0, 23.0, 32.0, 50.0, 99.0, 185.0, 367.0, 852.0, 2473.0, 10883.0, 127834.0, 857846.0, 38888.0, 6100.0, 1690.0, 619.0, 256.0, 138.0, 61.0, 40.0, 27.0, 16.0, 15.0, 8.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.658203125, -3.537506103515625, -3.41680908203125, -3.296112060546875, -3.1754150390625, -3.054718017578125, -2.93402099609375, -2.813323974609375, -2.692626953125, -2.571929931640625, -2.45123291015625, -2.330535888671875, -2.2098388671875, -2.089141845703125, -1.96844482421875, -1.847747802734375, -1.72705078125, -1.606353759765625, -1.48565673828125, -1.364959716796875, -1.2442626953125, -1.123565673828125, -1.00286865234375, -0.882171630859375, -0.761474609375, -0.640777587890625, -0.52008056640625, -0.399383544921875, -0.2786865234375, -0.157989501953125, -0.03729248046875, 0.083404541015625, 0.2041015625, 0.324798583984375, 0.44549560546875, 0.566192626953125, 0.6868896484375, 0.807586669921875, 0.92828369140625, 1.048980712890625, 1.169677734375, 1.290374755859375, 1.41107177734375, 1.531768798828125, 1.6524658203125, 1.773162841796875, 1.89385986328125, 2.014556884765625, 2.13525390625, 2.255950927734375, 2.37664794921875, 2.497344970703125, 2.6180419921875, 2.738739013671875, 2.85943603515625, 2.980133056640625, 3.100830078125, 3.221527099609375, 3.34222412109375, 3.462921142578125, 3.5836181640625, 3.704315185546875, 3.82501220703125, 3.945709228515625, 4.06640625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 3.0, 7.0, 9.0, 21.0, 27.0, 33.0, 82.0, 184.0, 273.0, 165.0, 92.0, 44.0, 19.0, 15.0, 9.0, 10.0, 4.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005245208740234375, -0.0005054250359535217, -0.00048632919788360596, -0.0004672333598136902, -0.0004481375217437744, -0.00042904168367385864, -0.00040994584560394287, -0.0003908500075340271, -0.00037175416946411133, -0.00035265833139419556, -0.0003335624933242798, -0.000314466655254364, -0.00029537081718444824, -0.00027627497911453247, -0.0002571791410446167, -0.00023808330297470093, -0.00021898746490478516, -0.00019989162683486938, -0.0001807957887649536, -0.00016169995069503784, -0.00014260411262512207, -0.0001235082745552063, -0.00010441243648529053, -8.531659841537476e-05, -6.622076034545898e-05, -4.712492227554321e-05, -2.802908420562744e-05, -8.93324613571167e-06, 1.0162591934204102e-05, 2.9258430004119873e-05, 4.8354268074035645e-05, 6.745010614395142e-05, 8.654594421386719e-05, 0.00010564178228378296, 0.00012473762035369873, 0.0001438334584236145, 0.00016292929649353027, 0.00018202513456344604, 0.00020112097263336182, 0.0002202168107032776, 0.00023931264877319336, 0.00025840848684310913, 0.0002775043249130249, 0.0002966001629829407, 0.00031569600105285645, 0.0003347918391227722, 0.000353887677192688, 0.00037298351526260376, 0.00039207935333251953, 0.0004111751914024353, 0.0004302710294723511, 0.00044936686754226685, 0.0004684627056121826, 0.0004875585436820984, 0.0005066543817520142, 0.0005257502198219299, 0.0005448460578918457, 0.0005639418959617615, 0.0005830377340316772, 0.000602133572101593, 0.0006212294101715088, 0.0006403252482414246, 0.0006594210863113403, 0.0006785169243812561, 0.0006976127624511719]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 6.0, 7.0, 12.0, 21.0, 21.0, 44.0, 44.0, 61.0, 119.0, 200.0, 481.0, 1578.0, 8545.0, 188721.0, 828651.0, 16272.0, 2456.0, 651.0, 262.0, 141.0, 93.0, 57.0, 49.0, 19.0, 16.0, 8.0, 2.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.96484375, -3.813232421875, -3.66162109375, -3.510009765625, -3.3583984375, -3.206787109375, -3.05517578125, -2.903564453125, -2.751953125, -2.600341796875, -2.44873046875, -2.297119140625, -2.1455078125, -1.993896484375, -1.84228515625, -1.690673828125, -1.5390625, -1.387451171875, -1.23583984375, -1.084228515625, -0.9326171875, -0.781005859375, -0.62939453125, -0.477783203125, -0.326171875, -0.174560546875, -0.02294921875, 0.128662109375, 0.2802734375, 0.431884765625, 0.58349609375, 0.735107421875, 0.88671875, 1.038330078125, 1.18994140625, 1.341552734375, 1.4931640625, 1.644775390625, 1.79638671875, 1.947998046875, 2.099609375, 2.251220703125, 2.40283203125, 2.554443359375, 2.7060546875, 2.857666015625, 3.00927734375, 3.160888671875, 3.3125, 3.464111328125, 3.61572265625, 3.767333984375, 3.9189453125, 4.070556640625, 4.22216796875, 4.373779296875, 4.525390625, 4.677001953125, 4.82861328125, 4.980224609375, 5.1318359375, 5.283447265625, 5.43505859375, 5.586669921875, 5.73828125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 7.0, 5.0, 15.0, 19.0, 59.0, 179.0, 443.0, 187.0, 50.0, 20.0, 12.0, 8.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.734375, -5.5814208984375, -5.428466796875, -5.2755126953125, -5.12255859375, -4.9696044921875, -4.816650390625, -4.6636962890625, -4.5107421875, -4.3577880859375, -4.204833984375, -4.0518798828125, -3.89892578125, -3.7459716796875, -3.593017578125, -3.4400634765625, -3.287109375, -3.1341552734375, -2.981201171875, -2.8282470703125, -2.67529296875, -2.5223388671875, -2.369384765625, -2.2164306640625, -2.0634765625, -1.9105224609375, -1.757568359375, -1.6046142578125, -1.45166015625, -1.2987060546875, -1.145751953125, -0.9927978515625, -0.83984375, -0.6868896484375, -0.533935546875, -0.3809814453125, -0.22802734375, -0.0750732421875, 0.077880859375, 0.2308349609375, 0.3837890625, 0.5367431640625, 0.689697265625, 0.8426513671875, 0.99560546875, 1.1485595703125, 1.301513671875, 1.4544677734375, 1.607421875, 1.7603759765625, 1.913330078125, 2.0662841796875, 2.21923828125, 2.3721923828125, 2.525146484375, 2.6781005859375, 2.8310546875, 2.9840087890625, 3.136962890625, 3.2899169921875, 3.44287109375, 3.5958251953125, 3.748779296875, 3.9017333984375, 4.0546875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 13.0, 19.0, 67.0, 110.0, 194.0, 189.0, 157.0, 112.0, 60.0, 34.0, 22.0, 10.0, 4.0, 6.0, 0.0, 2.0, 2.0, 3.0], "bins": [-59.06610107421875, -57.913002014160156, -56.75990295410156, -55.60680389404297, -54.453704833984375, -53.30060577392578, -52.14750671386719, -50.99440383911133, -49.841304779052734, -48.68820571899414, -47.53510665893555, -46.38200759887695, -45.22890853881836, -44.0758056640625, -42.922706604003906, -41.76960754394531, -40.61650848388672, -39.463409423828125, -38.31031036376953, -37.15721130371094, -36.004112243652344, -34.85101318359375, -33.697914123535156, -32.5448112487793, -31.39171600341797, -30.238616943359375, -29.08551788330078, -27.932418823242188, -26.77931785583496, -25.626218795776367, -24.473119735717773, -23.320018768310547, -22.166919708251953, -21.01382064819336, -19.860721588134766, -18.707622528076172, -17.554521560668945, -16.40142250061035, -15.248323440551758, -14.095223426818848, -12.942124366760254, -11.78902530670166, -10.63592529296875, -9.482826232910156, -8.329727172851562, -7.176627159118652, -6.023528099060059, -4.870428085327148, -3.7173290252685547, -2.5642294883728027, -1.4111301898956299, -0.25803089141845703, 0.8950686454772949, 2.048168182373047, 3.2012672424316406, 4.354367256164551, 5.5074663162231445, 6.6605658531188965, 7.813665390014648, 8.966764450073242, 10.119863510131836, 11.272963523864746, 12.42606258392334, 13.57916259765625, 14.732261657714844]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 8.0, 6.0, 16.0, 15.0, 26.0, 26.0, 23.0, 30.0, 22.0, 30.0, 29.0, 41.0, 37.0, 56.0, 41.0, 42.0, 46.0, 39.0, 51.0, 45.0, 33.0, 32.0, 36.0, 27.0, 31.0, 33.0, 28.0, 20.0, 25.0, 14.0, 21.0, 11.0, 10.0, 11.0, 10.0, 2.0, 7.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.634029388427734, -16.133546829223633, -15.633064270019531, -15.13258171081543, -14.632099151611328, -14.131616592407227, -13.631133079528809, -13.130650520324707, -12.630167961120605, -12.129685401916504, -11.629202842712402, -11.1287202835083, -10.628236770629883, -10.127754211425781, -9.62727165222168, -9.126789093017578, -8.626306533813477, -8.125823974609375, -7.625341415405273, -7.124858379364014, -6.624375820159912, -6.1238932609558105, -5.623410224914551, -5.122927665710449, -4.622445106506348, -4.121962547302246, -3.6214797496795654, -3.1209969520568848, -2.620514392852783, -2.1200318336486816, -1.619549036026001, -1.1190662384033203, -0.6185817718505859, -0.11809909343719482, 0.3823835849761963, 0.8828662633895874, 1.3833489418029785, 1.88383150100708, 2.3843142986297607, 2.8847970962524414, 3.385279655456543, 3.8857622146606445, 4.386244773864746, 4.886727809906006, 5.387210369110107, 5.887692928314209, 6.388175964355469, 6.88865852355957, 7.389141082763672, 7.889623641967773, 8.390106201171875, 8.890588760375977, 9.391071319580078, 9.89155387878418, 10.392037391662598, 10.8925199508667, 11.3930025100708, 11.893485069274902, 12.393967628479004, 12.894450187683105, 13.394933700561523, 13.895416259765625, 14.395898818969727, 14.896381378173828, 15.39686393737793]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 5.0, 2.0, 4.0, 8.0, 5.0, 7.0, 3.0, 1.0, 7.0, 9.0, 14.0, 14.0, 21.0, 27.0, 45.0, 86.0, 111.0, 186.0, 567.0, 1565.0, 5225.0, 35587.0, 4105473.0, 37296.0, 5293.0, 1621.0, 591.0, 216.0, 127.0, 63.0, 27.0, 30.0, 18.0, 12.0, 10.0, 8.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-17.09375, -16.6717529296875, -16.249755859375, -15.8277587890625, -15.40576171875, -14.9837646484375, -14.561767578125, -14.1397705078125, -13.7177734375, -13.2957763671875, -12.873779296875, -12.4517822265625, -12.02978515625, -11.6077880859375, -11.185791015625, -10.7637939453125, -10.341796875, -9.9197998046875, -9.497802734375, -9.0758056640625, -8.65380859375, -8.2318115234375, -7.809814453125, -7.3878173828125, -6.9658203125, -6.5438232421875, -6.121826171875, -5.6998291015625, -5.27783203125, -4.8558349609375, -4.433837890625, -4.0118408203125, -3.58984375, -3.1678466796875, -2.745849609375, -2.3238525390625, -1.90185546875, -1.4798583984375, -1.057861328125, -0.6358642578125, -0.2138671875, 0.2081298828125, 0.630126953125, 1.0521240234375, 1.47412109375, 1.8961181640625, 2.318115234375, 2.7401123046875, 3.162109375, 3.5841064453125, 4.006103515625, 4.4281005859375, 4.85009765625, 5.2720947265625, 5.694091796875, 6.1160888671875, 6.5380859375, 6.9600830078125, 7.382080078125, 7.8040771484375, 8.22607421875, 8.6480712890625, 9.070068359375, 9.4920654296875, 9.9140625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 13.0, 11.0, 20.0, 29.0, 30.0, 43.0, 53.0, 79.0, 72.0, 92.0, 98.0, 70.0, 87.0, 93.0, 56.0, 53.0, 33.0, 25.0, 15.0, 10.0, 12.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.884765625, -1.8371429443359375, -1.789520263671875, -1.7418975830078125, -1.69427490234375, -1.6466522216796875, -1.599029541015625, -1.5514068603515625, -1.5037841796875, -1.4561614990234375, -1.408538818359375, -1.3609161376953125, -1.31329345703125, -1.2656707763671875, -1.218048095703125, -1.1704254150390625, -1.122802734375, -1.0751800537109375, -1.027557373046875, -0.9799346923828125, -0.93231201171875, -0.8846893310546875, -0.837066650390625, -0.7894439697265625, -0.7418212890625, -0.6941986083984375, -0.646575927734375, -0.5989532470703125, -0.55133056640625, -0.5037078857421875, -0.456085205078125, -0.4084625244140625, -0.36083984375, -0.3132171630859375, -0.265594482421875, -0.2179718017578125, -0.17034912109375, -0.1227264404296875, -0.075103759765625, -0.0274810791015625, 0.0201416015625, 0.0677642822265625, 0.115386962890625, 0.1630096435546875, 0.21063232421875, 0.2582550048828125, 0.305877685546875, 0.3535003662109375, 0.401123046875, 0.4487457275390625, 0.496368408203125, 0.5439910888671875, 0.59161376953125, 0.6392364501953125, 0.686859130859375, 0.7344818115234375, 0.7821044921875, 0.8297271728515625, 0.877349853515625, 0.9249725341796875, 0.97259521484375, 1.0202178955078125, 1.067840576171875, 1.1154632568359375, 1.1630859375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 7.0, 6.0, 5.0, 11.0, 6.0, 16.0, 38.0, 43.0, 54.0, 72.0, 100.0, 155.0, 245.0, 361.0, 545.0, 794.0, 1325.0, 2311.0, 3839.0, 7082.0, 14463.0, 39211.0, 256737.0, 3743239.0, 78326.0, 22609.0, 9997.0, 5131.0, 2908.0, 1676.0, 1033.0, 646.0, 415.0, 257.0, 194.0, 102.0, 93.0, 78.0, 50.0, 27.0, 17.0, 17.0, 15.0, 14.0, 6.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.26953125, -4.12835693359375, -3.9871826171875, -3.84600830078125, -3.704833984375, -3.56365966796875, -3.4224853515625, -3.28131103515625, -3.14013671875, -2.99896240234375, -2.8577880859375, -2.71661376953125, -2.575439453125, -2.43426513671875, -2.2930908203125, -2.15191650390625, -2.0107421875, -1.86956787109375, -1.7283935546875, -1.58721923828125, -1.446044921875, -1.30487060546875, -1.1636962890625, -1.02252197265625, -0.88134765625, -0.74017333984375, -0.5989990234375, -0.45782470703125, -0.316650390625, -0.17547607421875, -0.0343017578125, 0.10687255859375, 0.248046875, 0.38922119140625, 0.5303955078125, 0.67156982421875, 0.812744140625, 0.95391845703125, 1.0950927734375, 1.23626708984375, 1.37744140625, 1.51861572265625, 1.6597900390625, 1.80096435546875, 1.942138671875, 2.08331298828125, 2.2244873046875, 2.36566162109375, 2.5068359375, 2.64801025390625, 2.7891845703125, 2.93035888671875, 3.071533203125, 3.21270751953125, 3.3538818359375, 3.49505615234375, 3.63623046875, 3.77740478515625, 3.9185791015625, 4.05975341796875, 4.200927734375, 4.34210205078125, 4.4832763671875, 4.62445068359375, 4.765625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 6.0, 4.0, 5.0, 6.0, 5.0, 6.0, 10.0, 19.0, 34.0, 41.0, 63.0, 207.0, 2882.0, 469.0, 127.0, 53.0, 23.0, 33.0, 16.0, 14.0, 9.0, 8.0, 3.0, 6.0, 3.0, 2.0, 4.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.33203125, -2.262908935546875, -2.19378662109375, -2.124664306640625, -2.0555419921875, -1.986419677734375, -1.91729736328125, -1.848175048828125, -1.779052734375, -1.709930419921875, -1.64080810546875, -1.571685791015625, -1.5025634765625, -1.433441162109375, -1.36431884765625, -1.295196533203125, -1.22607421875, -1.156951904296875, -1.08782958984375, -1.018707275390625, -0.9495849609375, -0.880462646484375, -0.81134033203125, -0.742218017578125, -0.673095703125, -0.603973388671875, -0.53485107421875, -0.465728759765625, -0.3966064453125, -0.327484130859375, -0.25836181640625, -0.189239501953125, -0.1201171875, -0.050994873046875, 0.01812744140625, 0.087249755859375, 0.1563720703125, 0.225494384765625, 0.29461669921875, 0.363739013671875, 0.432861328125, 0.501983642578125, 0.57110595703125, 0.640228271484375, 0.7093505859375, 0.778472900390625, 0.84759521484375, 0.916717529296875, 0.98583984375, 1.054962158203125, 1.12408447265625, 1.193206787109375, 1.2623291015625, 1.331451416015625, 1.40057373046875, 1.469696044921875, 1.538818359375, 1.607940673828125, 1.67706298828125, 1.746185302734375, 1.8153076171875, 1.884429931640625, 1.95355224609375, 2.022674560546875, 2.091796875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 8.0, 17.0, 23.0, 41.0, 71.0, 95.0, 136.0, 189.0, 135.0, 105.0, 63.0, 35.0, 30.0, 13.0, 11.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.80157470703125, -9.445779800415039, -9.089984893798828, -8.734189987182617, -8.378395080566406, -8.022600173950195, -7.666804790496826, -7.311009883880615, -6.955214977264404, -6.599420070648193, -6.243625164031982, -5.887829780578613, -5.532034873962402, -5.176239967346191, -4.8204450607299805, -4.4646501541137695, -4.108855247497559, -3.7530603408813477, -3.3972654342651367, -3.0414702892303467, -2.6856753826141357, -2.329880475997925, -1.9740853309631348, -1.6182904243469238, -1.262495517730713, -0.9067005515098572, -0.5509055852890015, -0.19511055946350098, 0.16068434715270996, 0.5164792537689209, 0.8722743988037109, 1.2280693054199219, 1.5838651657104492, 1.9396600723266602, 2.295454978942871, 2.651250123977661, 3.007045030593872, 3.362839937210083, 3.718635082244873, 4.074429988861084, 4.430224895477295, 4.786019802093506, 5.141814708709717, 5.497610092163086, 5.853404998779297, 6.209199905395508, 6.564994812011719, 6.92078971862793, 7.276584625244141, 7.632379531860352, 7.9881744384765625, 8.343969345092773, 8.699764251708984, 9.055559158325195, 9.411354064941406, 9.767148971557617, 10.122943878173828, 10.478738784790039, 10.83453369140625, 11.190328598022461, 11.546123504638672, 11.901918411254883, 12.257713317871094, 12.613508224487305, 12.969304084777832]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 4.0, 3.0, 1.0, 5.0, 4.0, 6.0, 10.0, 9.0, 8.0, 13.0, 12.0, 26.0, 21.0, 15.0, 32.0, 27.0, 35.0, 24.0, 36.0, 42.0, 39.0, 48.0, 38.0, 38.0, 45.0, 44.0, 40.0, 34.0, 43.0, 35.0, 34.0, 37.0, 25.0, 21.0, 25.0, 13.0, 18.0, 18.0, 15.0, 12.0, 9.0, 9.0, 4.0, 3.0, 7.0, 1.0, 3.0, 7.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.343256950378418, -4.184394836425781, -4.0255327224731445, -3.8666703701019287, -3.707808256149292, -3.5489461421966553, -3.3900837898254395, -3.2312216758728027, -3.072359561920166, -2.9134974479675293, -2.7546353340148926, -2.5957729816436768, -2.43691086769104, -2.2780487537384033, -2.1191864013671875, -1.9603242874145508, -1.801462173461914, -1.6426000595092773, -1.483737826347351, -1.3248755931854248, -1.166013479232788, -1.0071513652801514, -0.8482891321182251, -0.6894268989562988, -0.5305647850036621, -0.3717026114463806, -0.21284043788909912, -0.05397826433181763, 0.10488390922546387, 0.26374608278274536, 0.42260825634002686, 0.5814704895019531, 0.740333080291748, 0.8991952538490295, 1.058057427406311, 1.2169196605682373, 1.375781774520874, 1.5346438884735107, 1.693506121635437, 1.8523683547973633, 2.01123046875, 2.1700925827026367, 2.3289546966552734, 2.4878170490264893, 2.646679162979126, 2.8055412769317627, 2.9644036293029785, 3.1232657432556152, 3.282127857208252, 3.4409899711608887, 3.5998520851135254, 3.758714437484741, 3.917576551437378, 4.076438903808594, 4.2353010177612305, 4.394163131713867, 4.553025245666504, 4.711887359619141, 4.870749473571777, 5.029611587524414, 5.188473701477051, 5.347336292266846, 5.506198406219482, 5.665060520172119, 5.823922634124756]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 12.0, 8.0, 7.0, 10.0, 20.0, 45.0, 54.0, 101.0, 167.0, 364.0, 804.0, 2706.0, 14783.0, 312132.0, 689839.0, 22110.0, 3484.0, 979.0, 426.0, 199.0, 115.0, 66.0, 45.0, 26.0, 10.0, 10.0, 12.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-14.09375, -13.7237548828125, -13.353759765625, -12.9837646484375, -12.61376953125, -12.2437744140625, -11.873779296875, -11.5037841796875, -11.1337890625, -10.7637939453125, -10.393798828125, -10.0238037109375, -9.65380859375, -9.2838134765625, -8.913818359375, -8.5438232421875, -8.173828125, -7.8038330078125, -7.433837890625, -7.0638427734375, -6.69384765625, -6.3238525390625, -5.953857421875, -5.5838623046875, -5.2138671875, -4.8438720703125, -4.473876953125, -4.1038818359375, -3.73388671875, -3.3638916015625, -2.993896484375, -2.6239013671875, -2.25390625, -1.8839111328125, -1.513916015625, -1.1439208984375, -0.77392578125, -0.4039306640625, -0.033935546875, 0.3360595703125, 0.7060546875, 1.0760498046875, 1.446044921875, 1.8160400390625, 2.18603515625, 2.5560302734375, 2.926025390625, 3.2960205078125, 3.666015625, 4.0360107421875, 4.406005859375, 4.7760009765625, 5.14599609375, 5.5159912109375, 5.885986328125, 6.2559814453125, 6.6259765625, 6.9959716796875, 7.365966796875, 7.7359619140625, 8.10595703125, 8.4759521484375, 8.845947265625, 9.2159423828125, 9.5859375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 11.0, 20.0, 27.0, 24.0, 34.0, 61.0, 67.0, 81.0, 101.0, 85.0, 78.0, 86.0, 75.0, 80.0, 50.0, 38.0, 22.0, 14.0, 20.0, 10.0, 4.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.87109375, -1.82293701171875, -1.7747802734375, -1.72662353515625, -1.678466796875, -1.63031005859375, -1.5821533203125, -1.53399658203125, -1.48583984375, -1.43768310546875, -1.3895263671875, -1.34136962890625, -1.293212890625, -1.24505615234375, -1.1968994140625, -1.14874267578125, -1.1005859375, -1.05242919921875, -1.0042724609375, -0.95611572265625, -0.907958984375, -0.85980224609375, -0.8116455078125, -0.76348876953125, -0.71533203125, -0.66717529296875, -0.6190185546875, -0.57086181640625, -0.522705078125, -0.47454833984375, -0.4263916015625, -0.37823486328125, -0.330078125, -0.28192138671875, -0.2337646484375, -0.18560791015625, -0.137451171875, -0.08929443359375, -0.0411376953125, 0.00701904296875, 0.05517578125, 0.10333251953125, 0.1514892578125, 0.19964599609375, 0.247802734375, 0.29595947265625, 0.3441162109375, 0.39227294921875, 0.4404296875, 0.48858642578125, 0.5367431640625, 0.58489990234375, 0.633056640625, 0.68121337890625, 0.7293701171875, 0.77752685546875, 0.82568359375, 0.87384033203125, 0.9219970703125, 0.97015380859375, 1.018310546875, 1.06646728515625, 1.1146240234375, 1.16278076171875, 1.2109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 11.0, 11.0, 24.0, 40.0, 61.0, 98.0, 159.0, 231.0, 496.0, 929.0, 2079.0, 4648.0, 11175.0, 31728.0, 114240.0, 561352.0, 237333.0, 53903.0, 17406.0, 6702.0, 2965.0, 1374.0, 697.0, 328.0, 215.0, 134.0, 80.0, 39.0, 33.0, 12.0, 11.0, 8.0, 6.0, 5.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-3.3828125, -3.272705078125, -3.16259765625, -3.052490234375, -2.9423828125, -2.832275390625, -2.72216796875, -2.612060546875, -2.501953125, -2.391845703125, -2.28173828125, -2.171630859375, -2.0615234375, -1.951416015625, -1.84130859375, -1.731201171875, -1.62109375, -1.510986328125, -1.40087890625, -1.290771484375, -1.1806640625, -1.070556640625, -0.96044921875, -0.850341796875, -0.740234375, -0.630126953125, -0.52001953125, -0.409912109375, -0.2998046875, -0.189697265625, -0.07958984375, 0.030517578125, 0.140625, 0.250732421875, 0.36083984375, 0.470947265625, 0.5810546875, 0.691162109375, 0.80126953125, 0.911376953125, 1.021484375, 1.131591796875, 1.24169921875, 1.351806640625, 1.4619140625, 1.572021484375, 1.68212890625, 1.792236328125, 1.90234375, 2.012451171875, 2.12255859375, 2.232666015625, 2.3427734375, 2.452880859375, 2.56298828125, 2.673095703125, 2.783203125, 2.893310546875, 3.00341796875, 3.113525390625, 3.2236328125, 3.333740234375, 3.44384765625, 3.553955078125, 3.6640625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 3.0, 5.0, 5.0, 1.0, 11.0, 8.0, 15.0, 13.0, 16.0, 22.0, 19.0, 25.0, 21.0, 28.0, 28.0, 36.0, 37.0, 47.0, 45.0, 39.0, 42.0, 44.0, 38.0, 54.0, 58.0, 32.0, 34.0, 39.0, 24.0, 31.0, 35.0, 19.0, 13.0, 18.0, 23.0, 11.0, 14.0, 15.0, 7.0, 8.0, 8.0, 8.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.75390625, -3.65057373046875, -3.5472412109375, -3.44390869140625, -3.340576171875, -3.23724365234375, -3.1339111328125, -3.03057861328125, -2.92724609375, -2.82391357421875, -2.7205810546875, -2.61724853515625, -2.513916015625, -2.41058349609375, -2.3072509765625, -2.20391845703125, -2.1005859375, -1.99725341796875, -1.8939208984375, -1.79058837890625, -1.687255859375, -1.58392333984375, -1.4805908203125, -1.37725830078125, -1.27392578125, -1.17059326171875, -1.0672607421875, -0.96392822265625, -0.860595703125, -0.75726318359375, -0.6539306640625, -0.55059814453125, -0.447265625, -0.34393310546875, -0.2406005859375, -0.13726806640625, -0.033935546875, 0.06939697265625, 0.1727294921875, 0.27606201171875, 0.37939453125, 0.48272705078125, 0.5860595703125, 0.68939208984375, 0.792724609375, 0.89605712890625, 0.9993896484375, 1.10272216796875, 1.2060546875, 1.30938720703125, 1.4127197265625, 1.51605224609375, 1.619384765625, 1.72271728515625, 1.8260498046875, 1.92938232421875, 2.03271484375, 2.13604736328125, 2.2393798828125, 2.34271240234375, 2.446044921875, 2.54937744140625, 2.6527099609375, 2.75604248046875, 2.859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 8.0, 9.0, 9.0, 20.0, 33.0, 40.0, 73.0, 116.0, 201.0, 462.0, 1041.0, 2841.0, 9824.0, 63134.0, 887241.0, 68268.0, 10193.0, 2892.0, 1097.0, 499.0, 232.0, 119.0, 68.0, 42.0, 28.0, 15.0, 8.0, 6.0, 4.0, 10.0, 4.0, 6.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5234375, -4.402862548828125, -4.28228759765625, -4.161712646484375, -4.0411376953125, -3.920562744140625, -3.79998779296875, -3.679412841796875, -3.558837890625, -3.438262939453125, -3.31768798828125, -3.197113037109375, -3.0765380859375, -2.955963134765625, -2.83538818359375, -2.714813232421875, -2.59423828125, -2.473663330078125, -2.35308837890625, -2.232513427734375, -2.1119384765625, -1.991363525390625, -1.87078857421875, -1.750213623046875, -1.629638671875, -1.509063720703125, -1.38848876953125, -1.267913818359375, -1.1473388671875, -1.026763916015625, -0.90618896484375, -0.785614013671875, -0.6650390625, -0.544464111328125, -0.42388916015625, -0.303314208984375, -0.1827392578125, -0.062164306640625, 0.05841064453125, 0.178985595703125, 0.299560546875, 0.420135498046875, 0.54071044921875, 0.661285400390625, 0.7818603515625, 0.902435302734375, 1.02301025390625, 1.143585205078125, 1.26416015625, 1.384735107421875, 1.50531005859375, 1.625885009765625, 1.7464599609375, 1.867034912109375, 1.98760986328125, 2.108184814453125, 2.228759765625, 2.349334716796875, 2.46990966796875, 2.590484619140625, 2.7110595703125, 2.831634521484375, 2.95220947265625, 3.072784423828125, 3.193359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 7.0, 19.0, 25.0, 35.0, 78.0, 194.0, 349.0, 155.0, 63.0, 24.0, 13.0, 15.0, 8.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0010242462158203125, -0.001001652330160141, -0.0009790584444999695, -0.000956464558839798, -0.0009338706731796265, -0.000911276787519455, -0.0008886829018592834, -0.0008660890161991119, -0.0008434951305389404, -0.0008209012448787689, -0.0007983073592185974, -0.0007757134735584259, -0.0007531195878982544, -0.0007305257022380829, -0.0007079318165779114, -0.0006853379309177399, -0.0006627440452575684, -0.0006401501595973969, -0.0006175562739372253, -0.0005949623882770538, -0.0005723685026168823, -0.0005497746169567108, -0.0005271807312965393, -0.0005045868456363678, -0.0004819929599761963, -0.0004593990743160248, -0.00043680518865585327, -0.00041421130299568176, -0.00039161741733551025, -0.00036902353167533875, -0.00034642964601516724, -0.00032383576035499573, -0.0003012418746948242, -0.0002786479890346527, -0.0002560541033744812, -0.0002334602177143097, -0.00021086633205413818, -0.00018827244639396667, -0.00016567856073379517, -0.00014308467507362366, -0.00012049078941345215, -9.789690375328064e-05, -7.530301809310913e-05, -5.270913243293762e-05, -3.0115246772766113e-05, -7.5213611125946045e-06, 1.5072524547576904e-05, 3.766641020774841e-05, 6.026029586791992e-05, 8.285418152809143e-05, 0.00010544806718826294, 0.00012804195284843445, 0.00015063583850860596, 0.00017322972416877747, 0.00019582360982894897, 0.00021841749548912048, 0.000241011381149292, 0.0002636052668094635, 0.000286199152469635, 0.0003087930381298065, 0.00033138692378997803, 0.00035398080945014954, 0.00037657469511032104, 0.00039916858077049255, 0.00042176246643066406]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 5.0, 9.0, 17.0, 24.0, 28.0, 53.0, 105.0, 151.0, 331.0, 601.0, 1408.0, 3355.0, 11965.0, 153834.0, 844813.0, 23212.0, 5072.0, 1854.0, 771.0, 402.0, 214.0, 133.0, 67.0, 40.0, 29.0, 18.0, 15.0, 7.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.74609375, -5.599456787109375, -5.45281982421875, -5.306182861328125, -5.1595458984375, -5.012908935546875, -4.86627197265625, -4.719635009765625, -4.572998046875, -4.426361083984375, -4.27972412109375, -4.133087158203125, -3.9864501953125, -3.839813232421875, -3.69317626953125, -3.546539306640625, -3.39990234375, -3.253265380859375, -3.10662841796875, -2.959991455078125, -2.8133544921875, -2.666717529296875, -2.52008056640625, -2.373443603515625, -2.226806640625, -2.080169677734375, -1.93353271484375, -1.786895751953125, -1.6402587890625, -1.493621826171875, -1.34698486328125, -1.200347900390625, -1.0537109375, -0.907073974609375, -0.76043701171875, -0.613800048828125, -0.4671630859375, -0.320526123046875, -0.17388916015625, -0.027252197265625, 0.119384765625, 0.266021728515625, 0.41265869140625, 0.559295654296875, 0.7059326171875, 0.852569580078125, 0.99920654296875, 1.145843505859375, 1.29248046875, 1.439117431640625, 1.58575439453125, 1.732391357421875, 1.8790283203125, 2.025665283203125, 2.17230224609375, 2.318939208984375, 2.465576171875, 2.612213134765625, 2.75885009765625, 2.905487060546875, 3.0521240234375, 3.198760986328125, 3.34539794921875, 3.492034912109375, 3.638671875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 5.0, 9.0, 8.0, 8.0, 16.0, 23.0, 51.0, 67.0, 156.0, 261.0, 175.0, 80.0, 41.0, 30.0, 16.0, 13.0, 6.0, 5.0, 5.0, 4.0, 1.0, 5.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.080078125, -1.9920654296875, -1.904052734375, -1.8160400390625, -1.72802734375, -1.6400146484375, -1.552001953125, -1.4639892578125, -1.3759765625, -1.2879638671875, -1.199951171875, -1.1119384765625, -1.02392578125, -0.9359130859375, -0.847900390625, -0.7598876953125, -0.671875, -0.5838623046875, -0.495849609375, -0.4078369140625, -0.31982421875, -0.2318115234375, -0.143798828125, -0.0557861328125, 0.0322265625, 0.1202392578125, 0.208251953125, 0.2962646484375, 0.38427734375, 0.4722900390625, 0.560302734375, 0.6483154296875, 0.736328125, 0.8243408203125, 0.912353515625, 1.0003662109375, 1.08837890625, 1.1763916015625, 1.264404296875, 1.3524169921875, 1.4404296875, 1.5284423828125, 1.616455078125, 1.7044677734375, 1.79248046875, 1.8804931640625, 1.968505859375, 2.0565185546875, 2.14453125, 2.2325439453125, 2.320556640625, 2.4085693359375, 2.49658203125, 2.5845947265625, 2.672607421875, 2.7606201171875, 2.8486328125, 2.9366455078125, 3.024658203125, 3.1126708984375, 3.20068359375, 3.2886962890625, 3.376708984375, 3.4647216796875, 3.552734375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 15.0, 74.0, 199.0, 337.0, 218.0, 103.0, 32.0, 15.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.05762481689453, -81.14897155761719, -79.24031829833984, -77.3316650390625, -75.42301177978516, -73.51435852050781, -71.60570526123047, -69.69705200195312, -67.78840637207031, -65.87975311279297, -63.971099853515625, -62.06244659423828, -60.15379333496094, -58.245140075683594, -56.336490631103516, -54.42783737182617, -52.51918029785156, -50.61052703857422, -48.701873779296875, -46.79322052001953, -44.88456726074219, -42.975914001464844, -41.067264556884766, -39.15861129760742, -37.24995803833008, -35.341304779052734, -33.43265151977539, -31.52400016784668, -29.615346908569336, -27.706693649291992, -25.79804229736328, -23.889389038085938, -21.980735778808594, -20.07208251953125, -18.163429260253906, -16.254777908325195, -14.346124649047852, -12.437471389770508, -10.52881908416748, -8.620166778564453, -6.711513519287109, -4.802860736846924, -2.8942079544067383, -0.9855551719665527, 0.9230976104736328, 2.8317508697509766, 4.740403175354004, 6.649055480957031, 8.557708740234375, 10.466361999511719, 12.375014305114746, 14.283666610717773, 16.192319869995117, 18.10097312927246, 20.009624481201172, 21.918277740478516, 23.82693099975586, 25.735584259033203, 27.644237518310547, 29.552888870239258, 31.4615421295166, 33.37019348144531, 35.278846740722656, 37.1875, 39.096153259277344]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 2.0, 7.0, 7.0, 3.0, 8.0, 11.0, 7.0, 12.0, 22.0, 14.0, 17.0, 20.0, 22.0, 10.0, 16.0, 26.0, 40.0, 35.0, 39.0, 30.0, 38.0, 42.0, 31.0, 40.0, 29.0, 51.0, 38.0, 43.0, 29.0, 38.0, 35.0, 29.0, 31.0, 30.0, 23.0, 21.0, 20.0, 10.0, 22.0, 8.0, 10.0, 8.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-13.920467376708984, -13.482731819152832, -13.044995307922363, -12.607259750366211, -12.169523239135742, -11.73178768157959, -11.294052124023438, -10.856315612792969, -10.4185791015625, -9.980843544006348, -9.543107032775879, -9.105371475219727, -8.667634963989258, -8.229899406433105, -7.792163372039795, -7.354427337646484, -6.916691780090332, -6.4789557456970215, -6.041219711303711, -5.603484153747559, -5.16574764251709, -4.7280120849609375, -4.290276050567627, -3.8525400161743164, -3.414803981781006, -2.9770679473876953, -2.5393319129943848, -2.1015961170196533, -1.6638600826263428, -1.2261240482330322, -0.7883882522583008, -0.35065221786499023, 0.0870828628540039, 0.5248188376426697, 0.9625548124313354, 1.4002907276153564, 1.838026762008667, 2.2757627964019775, 2.713498592376709, 3.1512346267700195, 3.58897066116333, 4.026706695556641, 4.464442729949951, 4.902178764343262, 5.339914321899414, 5.777650833129883, 6.215386390686035, 6.653122425079346, 7.090858459472656, 7.528594493865967, 7.966330528259277, 8.40406608581543, 8.841802597045898, 9.27953815460205, 9.717273712158203, 10.155010223388672, 10.59274673461914, 11.030482292175293, 11.468218803405762, 11.905954360961914, 12.343690872192383, 12.781426429748535, 13.219161987304688, 13.656898498535156, 14.094634056091309]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 4.0, 3.0, 4.0, 6.0, 10.0, 5.0, 9.0, 17.0, 12.0, 15.0, 21.0, 28.0, 56.0, 47.0, 103.0, 132.0, 315.0, 743.0, 2148.0, 7209.0, 36555.0, 4038083.0, 91605.0, 11863.0, 3190.0, 1086.0, 479.0, 200.0, 122.0, 76.0, 37.0, 31.0, 23.0, 8.0, 14.0, 8.0, 4.0, 4.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-16.734375, -16.3126220703125, -15.890869140625, -15.4691162109375, -15.04736328125, -14.6256103515625, -14.203857421875, -13.7821044921875, -13.3603515625, -12.9385986328125, -12.516845703125, -12.0950927734375, -11.67333984375, -11.2515869140625, -10.829833984375, -10.4080810546875, -9.986328125, -9.5645751953125, -9.142822265625, -8.7210693359375, -8.29931640625, -7.8775634765625, -7.455810546875, -7.0340576171875, -6.6123046875, -6.1905517578125, -5.768798828125, -5.3470458984375, -4.92529296875, -4.5035400390625, -4.081787109375, -3.6600341796875, -3.23828125, -2.8165283203125, -2.394775390625, -1.9730224609375, -1.55126953125, -1.1295166015625, -0.707763671875, -0.2860107421875, 0.1357421875, 0.5574951171875, 0.979248046875, 1.4010009765625, 1.82275390625, 2.2445068359375, 2.666259765625, 3.0880126953125, 3.509765625, 3.9315185546875, 4.353271484375, 4.7750244140625, 5.19677734375, 5.6185302734375, 6.040283203125, 6.4620361328125, 6.8837890625, 7.3055419921875, 7.727294921875, 8.1490478515625, 8.57080078125, 8.9925537109375, 9.414306640625, 9.8360595703125, 10.2578125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 5.0, 5.0, 17.0, 16.0, 15.0, 29.0, 38.0, 47.0, 60.0, 74.0, 69.0, 91.0, 81.0, 68.0, 79.0, 73.0, 62.0, 51.0, 39.0, 20.0, 19.0, 12.0, 11.0, 11.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7470703125, -1.7003631591796875, -1.653656005859375, -1.6069488525390625, -1.56024169921875, -1.5135345458984375, -1.466827392578125, -1.4201202392578125, -1.3734130859375, -1.3267059326171875, -1.279998779296875, -1.2332916259765625, -1.18658447265625, -1.1398773193359375, -1.093170166015625, -1.0464630126953125, -0.999755859375, -0.9530487060546875, -0.906341552734375, -0.8596343994140625, -0.81292724609375, -0.7662200927734375, -0.719512939453125, -0.6728057861328125, -0.6260986328125, -0.5793914794921875, -0.532684326171875, -0.4859771728515625, -0.43927001953125, -0.3925628662109375, -0.345855712890625, -0.2991485595703125, -0.25244140625, -0.2057342529296875, -0.159027099609375, -0.1123199462890625, -0.06561279296875, -0.0189056396484375, 0.027801513671875, 0.0745086669921875, 0.1212158203125, 0.1679229736328125, 0.214630126953125, 0.2613372802734375, 0.30804443359375, 0.3547515869140625, 0.401458740234375, 0.4481658935546875, 0.494873046875, 0.5415802001953125, 0.588287353515625, 0.6349945068359375, 0.68170166015625, 0.7284088134765625, 0.775115966796875, 0.8218231201171875, 0.8685302734375, 0.9152374267578125, 0.961944580078125, 1.0086517333984375, 1.05535888671875, 1.1020660400390625, 1.148773193359375, 1.1954803466796875, 1.2421875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 1.0, 2.0, 6.0, 11.0, 14.0, 18.0, 28.0, 29.0, 45.0, 65.0, 110.0, 150.0, 189.0, 309.0, 443.0, 827.0, 1419.0, 2745.0, 5344.0, 12362.0, 34020.0, 163122.0, 3817841.0, 107365.0, 27148.0, 10289.0, 4641.0, 2305.0, 1338.0, 748.0, 440.0, 294.0, 180.0, 124.0, 78.0, 50.0, 50.0, 35.0, 28.0, 18.0, 16.0, 10.0, 4.0, 7.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.45703125, -5.27752685546875, -5.0980224609375, -4.91851806640625, -4.739013671875, -4.55950927734375, -4.3800048828125, -4.20050048828125, -4.02099609375, -3.84149169921875, -3.6619873046875, -3.48248291015625, -3.302978515625, -3.12347412109375, -2.9439697265625, -2.76446533203125, -2.5849609375, -2.40545654296875, -2.2259521484375, -2.04644775390625, -1.866943359375, -1.68743896484375, -1.5079345703125, -1.32843017578125, -1.14892578125, -0.96942138671875, -0.7899169921875, -0.61041259765625, -0.430908203125, -0.25140380859375, -0.0718994140625, 0.10760498046875, 0.287109375, 0.46661376953125, 0.6461181640625, 0.82562255859375, 1.005126953125, 1.18463134765625, 1.3641357421875, 1.54364013671875, 1.72314453125, 1.90264892578125, 2.0821533203125, 2.26165771484375, 2.441162109375, 2.62066650390625, 2.8001708984375, 2.97967529296875, 3.1591796875, 3.33868408203125, 3.5181884765625, 3.69769287109375, 3.877197265625, 4.05670166015625, 4.2362060546875, 4.41571044921875, 4.59521484375, 4.77471923828125, 4.9542236328125, 5.13372802734375, 5.313232421875, 5.49273681640625, 5.6722412109375, 5.85174560546875, 6.03125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 4.0, 7.0, 7.0, 5.0, 14.0, 23.0, 20.0, 30.0, 51.0, 111.0, 429.0, 2929.0, 190.0, 77.0, 53.0, 34.0, 18.0, 11.0, 11.0, 8.0, 9.0, 5.0, 2.0, 7.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.66015625, -2.580230712890625, -2.50030517578125, -2.420379638671875, -2.3404541015625, -2.260528564453125, -2.18060302734375, -2.100677490234375, -2.020751953125, -1.940826416015625, -1.86090087890625, -1.780975341796875, -1.7010498046875, -1.621124267578125, -1.54119873046875, -1.461273193359375, -1.38134765625, -1.301422119140625, -1.22149658203125, -1.141571044921875, -1.0616455078125, -0.981719970703125, -0.90179443359375, -0.821868896484375, -0.741943359375, -0.662017822265625, -0.58209228515625, -0.502166748046875, -0.4222412109375, -0.342315673828125, -0.26239013671875, -0.182464599609375, -0.1025390625, -0.022613525390625, 0.05731201171875, 0.137237548828125, 0.2171630859375, 0.297088623046875, 0.37701416015625, 0.456939697265625, 0.536865234375, 0.616790771484375, 0.69671630859375, 0.776641845703125, 0.8565673828125, 0.936492919921875, 1.01641845703125, 1.096343994140625, 1.17626953125, 1.256195068359375, 1.33612060546875, 1.416046142578125, 1.4959716796875, 1.575897216796875, 1.65582275390625, 1.735748291015625, 1.815673828125, 1.895599365234375, 1.97552490234375, 2.055450439453125, 2.1353759765625, 2.215301513671875, 2.29522705078125, 2.375152587890625, 2.455078125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 8.0, 12.0, 33.0, 61.0, 148.0, 262.0, 244.0, 126.0, 51.0, 24.0, 11.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.324113845825195, -23.756994247436523, -23.18987274169922, -22.622753143310547, -22.055631637573242, -21.48851203918457, -20.921390533447266, -20.354270935058594, -19.78714942932129, -19.220029830932617, -18.652908325195312, -18.08578872680664, -17.518667221069336, -16.951547622680664, -16.38442611694336, -15.817306518554688, -15.2501859664917, -14.683065414428711, -14.115944862365723, -13.548824310302734, -12.981703758239746, -12.414583206176758, -11.847463607788086, -11.280342102050781, -10.71322250366211, -10.146101951599121, -9.578981399536133, -9.011860847473145, -8.444740295410156, -7.877619743347168, -7.310499668121338, -6.74337911605835, -6.176258087158203, -5.609137535095215, -5.042016983032227, -4.474896430969238, -3.907776117324829, -3.340655565261841, -2.7735352516174316, -2.2064146995544434, -1.639294147491455, -1.0721735954284668, -0.5050531625747681, 0.062067270278930664, 0.629187822341919, 1.1963083744049072, 1.7634286880493164, 2.3305492401123047, 2.897669792175293, 3.4647903442382812, 4.0319108963012695, 4.599031448364258, 5.166152000427246, 5.733272552490234, 6.3003926277160645, 6.867513179779053, 7.434633731842041, 8.001753807067871, 8.56887435913086, 9.135994911193848, 9.703115463256836, 10.270236015319824, 10.837356567382812, 11.4044771194458, 11.971597671508789]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 3.0, 9.0, 11.0, 16.0, 14.0, 20.0, 31.0, 22.0, 35.0, 35.0, 41.0, 46.0, 42.0, 60.0, 66.0, 49.0, 59.0, 47.0, 53.0, 48.0, 62.0, 55.0, 35.0, 27.0, 14.0, 24.0, 20.0, 20.0, 10.0, 11.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.483158588409424, -6.265747547149658, -6.048336505889893, -5.830925464630127, -5.613514423370361, -5.396103858947754, -5.178692817687988, -4.961281776428223, -4.743870735168457, -4.526459693908691, -4.309048652648926, -4.09163761138916, -3.8742268085479736, -3.656815767288208, -3.4394047260284424, -3.221993923187256, -3.004582643508911, -2.7871716022491455, -2.56976056098938, -2.3523497581481934, -2.1349387168884277, -1.917527675628662, -1.7001166343688965, -1.4827057123184204, -1.2652946710586548, -1.0478836297988892, -0.8304727077484131, -0.6130616664886475, -0.3956506848335266, -0.17823970317840576, 0.03917133808135986, 0.25658226013183594, 0.47399330139160156, 0.6914042830467224, 0.9088152647018433, 1.1262263059616089, 1.343637228012085, 1.5610482692718506, 1.7784593105316162, 1.9958702325820923, 2.2132811546325684, 2.430692195892334, 2.6481032371520996, 2.8655142784118652, 3.0829250812530518, 3.3003361225128174, 3.517747163772583, 3.7351579666137695, 3.9525692462921143, 4.169980049133301, 4.387391090393066, 4.604802131652832, 4.822213172912598, 5.039624214172363, 5.257035255432129, 5.4744462966918945, 5.69185733795166, 5.909268379211426, 6.126679420471191, 6.344090461730957, 6.561501502990723, 6.778912544250488, 6.996323585510254, 7.213734149932861, 7.431145191192627]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 6.0, 8.0, 2.0, 4.0, 7.0, 10.0, 18.0, 16.0, 18.0, 39.0, 43.0, 80.0, 96.0, 165.0, 248.0, 484.0, 1021.0, 2342.0, 6329.0, 21104.0, 94924.0, 591379.0, 266460.0, 44881.0, 11693.0, 3909.0, 1564.0, 699.0, 372.0, 177.0, 123.0, 71.0, 74.0, 47.0, 31.0, 33.0, 16.0, 11.0, 15.0, 9.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.421875, -7.20208740234375, -6.9822998046875, -6.76251220703125, -6.542724609375, -6.32293701171875, -6.1031494140625, -5.88336181640625, -5.66357421875, -5.44378662109375, -5.2239990234375, -5.00421142578125, -4.784423828125, -4.56463623046875, -4.3448486328125, -4.12506103515625, -3.9052734375, -3.68548583984375, -3.4656982421875, -3.24591064453125, -3.026123046875, -2.80633544921875, -2.5865478515625, -2.36676025390625, -2.14697265625, -1.92718505859375, -1.7073974609375, -1.48760986328125, -1.267822265625, -1.04803466796875, -0.8282470703125, -0.60845947265625, -0.388671875, -0.16888427734375, 0.0509033203125, 0.27069091796875, 0.490478515625, 0.71026611328125, 0.9300537109375, 1.14984130859375, 1.36962890625, 1.58941650390625, 1.8092041015625, 2.02899169921875, 2.248779296875, 2.46856689453125, 2.6883544921875, 2.90814208984375, 3.1279296875, 3.34771728515625, 3.5675048828125, 3.78729248046875, 4.007080078125, 4.22686767578125, 4.4466552734375, 4.66644287109375, 4.88623046875, 5.10601806640625, 5.3258056640625, 5.54559326171875, 5.765380859375, 5.98516845703125, 6.2049560546875, 6.42474365234375, 6.64453125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 8.0, 10.0, 14.0, 15.0, 27.0, 36.0, 36.0, 48.0, 64.0, 86.0, 65.0, 89.0, 73.0, 65.0, 71.0, 65.0, 62.0, 45.0, 40.0, 22.0, 20.0, 14.0, 8.0, 6.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8291015625, -1.781097412109375, -1.73309326171875, -1.685089111328125, -1.6370849609375, -1.589080810546875, -1.54107666015625, -1.493072509765625, -1.445068359375, -1.397064208984375, -1.34906005859375, -1.301055908203125, -1.2530517578125, -1.205047607421875, -1.15704345703125, -1.109039306640625, -1.06103515625, -1.013031005859375, -0.96502685546875, -0.917022705078125, -0.8690185546875, -0.821014404296875, -0.77301025390625, -0.725006103515625, -0.677001953125, -0.628997802734375, -0.58099365234375, -0.532989501953125, -0.4849853515625, -0.436981201171875, -0.38897705078125, -0.340972900390625, -0.29296875, -0.244964599609375, -0.19696044921875, -0.148956298828125, -0.1009521484375, -0.052947998046875, -0.00494384765625, 0.043060302734375, 0.091064453125, 0.139068603515625, 0.18707275390625, 0.235076904296875, 0.2830810546875, 0.331085205078125, 0.37908935546875, 0.427093505859375, 0.47509765625, 0.523101806640625, 0.57110595703125, 0.619110107421875, 0.6671142578125, 0.715118408203125, 0.76312255859375, 0.811126708984375, 0.859130859375, 0.907135009765625, 0.95513916015625, 1.003143310546875, 1.0511474609375, 1.099151611328125, 1.14715576171875, 1.195159912109375, 1.2431640625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 7.0, 11.0, 8.0, 10.0, 14.0, 16.0, 20.0, 38.0, 63.0, 97.0, 143.0, 248.0, 510.0, 920.0, 1748.0, 3511.0, 7839.0, 18242.0, 49481.0, 166528.0, 511218.0, 194949.0, 55909.0, 20601.0, 8416.0, 3856.0, 1883.0, 979.0, 525.0, 286.0, 176.0, 101.0, 53.0, 44.0, 28.0, 21.0, 16.0, 13.0, 13.0, 3.0, 0.0, 4.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.949005126953125, -3.82769775390625, -3.706390380859375, -3.5850830078125, -3.463775634765625, -3.34246826171875, -3.221160888671875, -3.099853515625, -2.978546142578125, -2.85723876953125, -2.735931396484375, -2.6146240234375, -2.493316650390625, -2.37200927734375, -2.250701904296875, -2.12939453125, -2.008087158203125, -1.88677978515625, -1.765472412109375, -1.6441650390625, -1.522857666015625, -1.40155029296875, -1.280242919921875, -1.158935546875, -1.037628173828125, -0.91632080078125, -0.795013427734375, -0.6737060546875, -0.552398681640625, -0.43109130859375, -0.309783935546875, -0.1884765625, -0.067169189453125, 0.05413818359375, 0.175445556640625, 0.2967529296875, 0.418060302734375, 0.53936767578125, 0.660675048828125, 0.781982421875, 0.903289794921875, 1.02459716796875, 1.145904541015625, 1.2672119140625, 1.388519287109375, 1.50982666015625, 1.631134033203125, 1.75244140625, 1.873748779296875, 1.99505615234375, 2.116363525390625, 2.2376708984375, 2.358978271484375, 2.48028564453125, 2.601593017578125, 2.722900390625, 2.844207763671875, 2.96551513671875, 3.086822509765625, 3.2081298828125, 3.329437255859375, 3.45074462890625, 3.572052001953125, 3.693359375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 12.0, 10.0, 8.0, 14.0, 10.0, 16.0, 19.0, 32.0, 23.0, 28.0, 39.0, 50.0, 47.0, 38.0, 42.0, 52.0, 54.0, 49.0, 56.0, 45.0, 53.0, 45.0, 27.0, 31.0, 28.0, 25.0, 25.0, 19.0, 22.0, 11.0, 11.0, 16.0, 5.0, 4.0, 8.0, 4.0, 2.0, 1.0, 3.0, 4.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4765625, -4.3333740234375, -4.190185546875, -4.0469970703125, -3.90380859375, -3.7606201171875, -3.617431640625, -3.4742431640625, -3.3310546875, -3.1878662109375, -3.044677734375, -2.9014892578125, -2.75830078125, -2.6151123046875, -2.471923828125, -2.3287353515625, -2.185546875, -2.0423583984375, -1.899169921875, -1.7559814453125, -1.61279296875, -1.4696044921875, -1.326416015625, -1.1832275390625, -1.0400390625, -0.8968505859375, -0.753662109375, -0.6104736328125, -0.46728515625, -0.3240966796875, -0.180908203125, -0.0377197265625, 0.10546875, 0.2486572265625, 0.391845703125, 0.5350341796875, 0.67822265625, 0.8214111328125, 0.964599609375, 1.1077880859375, 1.2509765625, 1.3941650390625, 1.537353515625, 1.6805419921875, 1.82373046875, 1.9669189453125, 2.110107421875, 2.2532958984375, 2.396484375, 2.5396728515625, 2.682861328125, 2.8260498046875, 2.96923828125, 3.1124267578125, 3.255615234375, 3.3988037109375, 3.5419921875, 3.6851806640625, 3.828369140625, 3.9715576171875, 4.11474609375, 4.2579345703125, 4.401123046875, 4.5443115234375, 4.6875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 4.0, 3.0, 6.0, 8.0, 22.0, 10.0, 15.0, 28.0, 46.0, 64.0, 123.0, 192.0, 375.0, 684.0, 1636.0, 3951.0, 12443.0, 55162.0, 560452.0, 357627.0, 39715.0, 9815.0, 3358.0, 1443.0, 638.0, 283.0, 154.0, 105.0, 59.0, 32.0, 29.0, 20.0, 18.0, 12.0, 9.0, 3.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.025390625, -2.941131591796875, -2.85687255859375, -2.772613525390625, -2.6883544921875, -2.604095458984375, -2.51983642578125, -2.435577392578125, -2.351318359375, -2.267059326171875, -2.18280029296875, -2.098541259765625, -2.0142822265625, -1.930023193359375, -1.84576416015625, -1.761505126953125, -1.67724609375, -1.592987060546875, -1.50872802734375, -1.424468994140625, -1.3402099609375, -1.255950927734375, -1.17169189453125, -1.087432861328125, -1.003173828125, -0.918914794921875, -0.83465576171875, -0.750396728515625, -0.6661376953125, -0.581878662109375, -0.49761962890625, -0.413360595703125, -0.3291015625, -0.244842529296875, -0.16058349609375, -0.076324462890625, 0.0079345703125, 0.092193603515625, 0.17645263671875, 0.260711669921875, 0.344970703125, 0.429229736328125, 0.51348876953125, 0.597747802734375, 0.6820068359375, 0.766265869140625, 0.85052490234375, 0.934783935546875, 1.01904296875, 1.103302001953125, 1.18756103515625, 1.271820068359375, 1.3560791015625, 1.440338134765625, 1.52459716796875, 1.608856201171875, 1.693115234375, 1.777374267578125, 1.86163330078125, 1.945892333984375, 2.0301513671875, 2.114410400390625, 2.19866943359375, 2.282928466796875, 2.3671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 10.0, 11.0, 20.0, 42.0, 52.0, 81.0, 140.0, 209.0, 158.0, 94.0, 60.0, 42.0, 28.0, 11.0, 15.0, 8.0, 7.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005521774291992188, -0.0005362518131732941, -0.0005203261971473694, -0.0005044005811214447, -0.00048847496509552, -0.00047254934906959534, -0.00045662373304367065, -0.00044069811701774597, -0.0004247725009918213, -0.0004088468849658966, -0.0003929212689399719, -0.00037699565291404724, -0.00036107003688812256, -0.0003451444208621979, -0.0003292188048362732, -0.0003132931888103485, -0.00029736757278442383, -0.00028144195675849915, -0.00026551634073257446, -0.0002495907247066498, -0.0002336651086807251, -0.00021773949265480042, -0.00020181387662887573, -0.00018588826060295105, -0.00016996264457702637, -0.00015403702855110168, -0.000138111412525177, -0.00012218579649925232, -0.00010626018047332764, -9.033456444740295e-05, -7.440894842147827e-05, -5.848333239555359e-05, -4.2557716369628906e-05, -2.6632100343704224e-05, -1.0706484317779541e-05, 5.219131708145142e-06, 2.1144747734069824e-05, 3.707036375999451e-05, 5.299597978591919e-05, 6.892159581184387e-05, 8.484721183776855e-05, 0.00010077282786369324, 0.00011669844388961792, 0.0001326240599155426, 0.00014854967594146729, 0.00016447529196739197, 0.00018040090799331665, 0.00019632652401924133, 0.00021225214004516602, 0.0002281777560710907, 0.00024410337209701538, 0.00026002898812294006, 0.00027595460414886475, 0.00029188022017478943, 0.0003078058362007141, 0.0003237314522266388, 0.0003396570682525635, 0.00035558268427848816, 0.00037150830030441284, 0.0003874339163303375, 0.0004033595323562622, 0.0004192851483821869, 0.00043521076440811157, 0.00045113638043403625, 0.00046706199645996094]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 7.0, 20.0, 23.0, 29.0, 33.0, 51.0, 80.0, 112.0, 190.0, 277.0, 424.0, 701.0, 1078.0, 1998.0, 3555.0, 6961.0, 14763.0, 38492.0, 131167.0, 480257.0, 259164.0, 65748.0, 22644.0, 9644.0, 4713.0, 2534.0, 1488.0, 831.0, 558.0, 341.0, 232.0, 136.0, 100.0, 72.0, 41.0, 23.0, 18.0, 10.0, 14.0, 6.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3955078125, -1.34857177734375, -1.3016357421875, -1.25469970703125, -1.207763671875, -1.16082763671875, -1.1138916015625, -1.06695556640625, -1.02001953125, -0.97308349609375, -0.9261474609375, -0.87921142578125, -0.832275390625, -0.78533935546875, -0.7384033203125, -0.69146728515625, -0.64453125, -0.59759521484375, -0.5506591796875, -0.50372314453125, -0.456787109375, -0.40985107421875, -0.3629150390625, -0.31597900390625, -0.26904296875, -0.22210693359375, -0.1751708984375, -0.12823486328125, -0.081298828125, -0.03436279296875, 0.0125732421875, 0.05950927734375, 0.1064453125, 0.15338134765625, 0.2003173828125, 0.24725341796875, 0.294189453125, 0.34112548828125, 0.3880615234375, 0.43499755859375, 0.48193359375, 0.52886962890625, 0.5758056640625, 0.62274169921875, 0.669677734375, 0.71661376953125, 0.7635498046875, 0.81048583984375, 0.857421875, 0.90435791015625, 0.9512939453125, 0.99822998046875, 1.045166015625, 1.09210205078125, 1.1390380859375, 1.18597412109375, 1.23291015625, 1.27984619140625, 1.3267822265625, 1.37371826171875, 1.420654296875, 1.46759033203125, 1.5145263671875, 1.56146240234375, 1.6083984375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 2.0, 3.0, 6.0, 5.0, 8.0, 14.0, 14.0, 13.0, 32.0, 28.0, 29.0, 57.0, 75.0, 95.0, 81.0, 102.0, 88.0, 82.0, 51.0, 46.0, 34.0, 21.0, 27.0, 19.0, 13.0, 11.0, 11.0, 4.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7265625, -1.66583251953125, -1.6051025390625, -1.54437255859375, -1.483642578125, -1.42291259765625, -1.3621826171875, -1.30145263671875, -1.24072265625, -1.17999267578125, -1.1192626953125, -1.05853271484375, -0.997802734375, -0.93707275390625, -0.8763427734375, -0.81561279296875, -0.7548828125, -0.69415283203125, -0.6334228515625, -0.57269287109375, -0.511962890625, -0.45123291015625, -0.3905029296875, -0.32977294921875, -0.26904296875, -0.20831298828125, -0.1475830078125, -0.08685302734375, -0.026123046875, 0.03460693359375, 0.0953369140625, 0.15606689453125, 0.216796875, 0.27752685546875, 0.3382568359375, 0.39898681640625, 0.459716796875, 0.52044677734375, 0.5811767578125, 0.64190673828125, 0.70263671875, 0.76336669921875, 0.8240966796875, 0.88482666015625, 0.945556640625, 1.00628662109375, 1.0670166015625, 1.12774658203125, 1.1884765625, 1.24920654296875, 1.3099365234375, 1.37066650390625, 1.431396484375, 1.49212646484375, 1.5528564453125, 1.61358642578125, 1.67431640625, 1.73504638671875, 1.7957763671875, 1.85650634765625, 1.917236328125, 1.97796630859375, 2.0386962890625, 2.09942626953125, 2.16015625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 4.0, 11.0, 20.0, 29.0, 52.0, 79.0, 96.0, 133.0, 130.0, 137.0, 111.0, 70.0, 43.0, 22.0, 25.0, 13.0, 9.0, 7.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.897438049316406, -44.8162727355957, -43.735103607177734, -42.65393829345703, -41.57277297973633, -40.491607666015625, -39.410438537597656, -38.32927322387695, -37.24810791015625, -36.16694259643555, -35.08577346801758, -34.004608154296875, -32.92344284057617, -31.842275619506836, -30.7611083984375, -29.679943084716797, -28.598773956298828, -27.517606735229492, -26.43644142150879, -25.355274200439453, -24.27410888671875, -23.192941665649414, -22.111774444580078, -21.030609130859375, -19.94944190979004, -18.868274688720703, -17.787109375, -16.705942153930664, -15.624775886535645, -14.543609619140625, -13.462442398071289, -12.38127613067627, -11.300107955932617, -10.218941688537598, -9.137775421142578, -8.056608200073242, -6.975441932678223, -5.894275665283203, -4.813108921051025, -3.7319421768188477, -2.650775909423828, -1.5696094036102295, -0.48844289779663086, 0.5927236080169678, 1.6738901138305664, 2.755056381225586, 3.8362231254577637, 4.917389869689941, 5.998556137084961, 7.0797224044799805, 8.160888671875, 9.242055892944336, 10.323222160339355, 11.404388427734375, 12.485555648803711, 13.56672191619873, 14.64788818359375, 15.72905445098877, 16.81022071838379, 17.891387939453125, 18.972553253173828, 20.053720474243164, 21.1348876953125, 22.216053009033203, 23.29722023010254]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 8.0, 8.0, 9.0, 12.0, 9.0, 19.0, 23.0, 21.0, 26.0, 15.0, 26.0, 28.0, 28.0, 35.0, 23.0, 42.0, 30.0, 37.0, 37.0, 44.0, 41.0, 39.0, 32.0, 41.0, 33.0, 42.0, 33.0, 23.0, 23.0, 33.0, 24.0, 22.0, 19.0, 17.0, 15.0, 16.0, 11.0, 14.0, 12.0, 1.0, 5.0, 3.0, 3.0, 0.0, 3.0, 1.0, 6.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-20.260244369506836, -19.632579803466797, -19.004913330078125, -18.377246856689453, -17.749582290649414, -17.121917724609375, -16.494251251220703, -15.866585731506348, -15.238920211791992, -14.611254692077637, -13.983589172363281, -13.355923652648926, -12.72825813293457, -12.100592613220215, -11.47292709350586, -10.845261573791504, -10.217596054077148, -9.589930534362793, -8.962265014648438, -8.334599494934082, -7.706933975219727, -7.079268455505371, -6.451602935791016, -5.82393741607666, -5.196271896362305, -4.568606376647949, -3.9409408569335938, -3.3132753372192383, -2.685609817504883, -2.0579442977905273, -1.4302787780761719, -0.8026132583618164, -0.17494773864746094, 0.45271778106689453, 1.08038330078125, 1.7080488204956055, 2.335714340209961, 2.9633798599243164, 3.591045379638672, 4.218710899353027, 4.846376419067383, 5.474041938781738, 6.101707458496094, 6.729372978210449, 7.357038497924805, 7.98470401763916, 8.612369537353516, 9.240035057067871, 9.867700576782227, 10.495366096496582, 11.123031616210938, 11.750697135925293, 12.378362655639648, 13.006028175354004, 13.63369369506836, 14.261359214782715, 14.88902473449707, 15.516690254211426, 16.14435577392578, 16.772022247314453, 17.399686813354492, 18.02735137939453, 18.655017852783203, 19.282684326171875, 19.910348892211914]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 11.0, 6.0, 4.0, 7.0, 10.0, 12.0, 13.0, 19.0, 29.0, 37.0, 64.0, 90.0, 163.0, 344.0, 859.0, 2472.0, 8527.0, 47512.0, 3984588.0, 128450.0, 14845.0, 3898.0, 1292.0, 539.0, 227.0, 110.0, 52.0, 34.0, 22.0, 14.0, 12.0, 4.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.625, -14.2564697265625, -13.887939453125, -13.5194091796875, -13.15087890625, -12.7823486328125, -12.413818359375, -12.0452880859375, -11.6767578125, -11.3082275390625, -10.939697265625, -10.5711669921875, -10.20263671875, -9.8341064453125, -9.465576171875, -9.0970458984375, -8.728515625, -8.3599853515625, -7.991455078125, -7.6229248046875, -7.25439453125, -6.8858642578125, -6.517333984375, -6.1488037109375, -5.7802734375, -5.4117431640625, -5.043212890625, -4.6746826171875, -4.30615234375, -3.9376220703125, -3.569091796875, -3.2005615234375, -2.83203125, -2.4635009765625, -2.094970703125, -1.7264404296875, -1.35791015625, -0.9893798828125, -0.620849609375, -0.2523193359375, 0.1162109375, 0.4847412109375, 0.853271484375, 1.2218017578125, 1.59033203125, 1.9588623046875, 2.327392578125, 2.6959228515625, 3.064453125, 3.4329833984375, 3.801513671875, 4.1700439453125, 4.53857421875, 4.9071044921875, 5.275634765625, 5.6441650390625, 6.0126953125, 6.3812255859375, 6.749755859375, 7.1182861328125, 7.48681640625, 7.8553466796875, 8.223876953125, 8.5924072265625, 8.9609375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 11.0, 8.0, 8.0, 22.0, 27.0, 20.0, 36.0, 46.0, 47.0, 51.0, 63.0, 68.0, 60.0, 74.0, 68.0, 52.0, 62.0, 58.0, 47.0, 37.0, 24.0, 25.0, 23.0, 18.0, 17.0, 10.0, 6.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7607421875, -1.713623046875, -1.66650390625, -1.619384765625, -1.572265625, -1.525146484375, -1.47802734375, -1.430908203125, -1.3837890625, -1.336669921875, -1.28955078125, -1.242431640625, -1.1953125, -1.148193359375, -1.10107421875, -1.053955078125, -1.0068359375, -0.959716796875, -0.91259765625, -0.865478515625, -0.818359375, -0.771240234375, -0.72412109375, -0.677001953125, -0.6298828125, -0.582763671875, -0.53564453125, -0.488525390625, -0.44140625, -0.394287109375, -0.34716796875, -0.300048828125, -0.2529296875, -0.205810546875, -0.15869140625, -0.111572265625, -0.064453125, -0.017333984375, 0.02978515625, 0.076904296875, 0.1240234375, 0.171142578125, 0.21826171875, 0.265380859375, 0.3125, 0.359619140625, 0.40673828125, 0.453857421875, 0.5009765625, 0.548095703125, 0.59521484375, 0.642333984375, 0.689453125, 0.736572265625, 0.78369140625, 0.830810546875, 0.8779296875, 0.925048828125, 0.97216796875, 1.019287109375, 1.06640625, 1.113525390625, 1.16064453125, 1.207763671875, 1.2548828125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 2.0, 7.0, 12.0, 15.0, 15.0, 18.0, 27.0, 40.0, 56.0, 67.0, 100.0, 152.0, 234.0, 396.0, 626.0, 1023.0, 1924.0, 3742.0, 8030.0, 19312.0, 61909.0, 777065.0, 3205312.0, 74273.0, 22015.0, 8841.0, 4082.0, 1998.0, 1187.0, 628.0, 394.0, 269.0, 139.0, 105.0, 77.0, 48.0, 35.0, 39.0, 26.0, 13.0, 10.0, 8.0, 3.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.13671875, -5.93914794921875, -5.7415771484375, -5.54400634765625, -5.346435546875, -5.14886474609375, -4.9512939453125, -4.75372314453125, -4.55615234375, -4.35858154296875, -4.1610107421875, -3.96343994140625, -3.765869140625, -3.56829833984375, -3.3707275390625, -3.17315673828125, -2.9755859375, -2.77801513671875, -2.5804443359375, -2.38287353515625, -2.185302734375, -1.98773193359375, -1.7901611328125, -1.59259033203125, -1.39501953125, -1.19744873046875, -0.9998779296875, -0.80230712890625, -0.604736328125, -0.40716552734375, -0.2095947265625, -0.01202392578125, 0.185546875, 0.38311767578125, 0.5806884765625, 0.77825927734375, 0.975830078125, 1.17340087890625, 1.3709716796875, 1.56854248046875, 1.76611328125, 1.96368408203125, 2.1612548828125, 2.35882568359375, 2.556396484375, 2.75396728515625, 2.9515380859375, 3.14910888671875, 3.3466796875, 3.54425048828125, 3.7418212890625, 3.93939208984375, 4.136962890625, 4.33453369140625, 4.5321044921875, 4.72967529296875, 4.92724609375, 5.12481689453125, 5.3223876953125, 5.51995849609375, 5.717529296875, 5.91510009765625, 6.1126708984375, 6.31024169921875, 6.5078125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 3.0, 13.0, 10.0, 13.0, 23.0, 24.0, 35.0, 106.0, 240.0, 2818.0, 421.0, 127.0, 80.0, 40.0, 32.0, 22.0, 14.0, 13.0, 4.0, 9.0, 5.0, 9.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.79296875, -4.665771484375, -4.53857421875, -4.411376953125, -4.2841796875, -4.156982421875, -4.02978515625, -3.902587890625, -3.775390625, -3.648193359375, -3.52099609375, -3.393798828125, -3.2666015625, -3.139404296875, -3.01220703125, -2.885009765625, -2.7578125, -2.630615234375, -2.50341796875, -2.376220703125, -2.2490234375, -2.121826171875, -1.99462890625, -1.867431640625, -1.740234375, -1.613037109375, -1.48583984375, -1.358642578125, -1.2314453125, -1.104248046875, -0.97705078125, -0.849853515625, -0.72265625, -0.595458984375, -0.46826171875, -0.341064453125, -0.2138671875, -0.086669921875, 0.04052734375, 0.167724609375, 0.294921875, 0.422119140625, 0.54931640625, 0.676513671875, 0.8037109375, 0.930908203125, 1.05810546875, 1.185302734375, 1.3125, 1.439697265625, 1.56689453125, 1.694091796875, 1.8212890625, 1.948486328125, 2.07568359375, 2.202880859375, 2.330078125, 2.457275390625, 2.58447265625, 2.711669921875, 2.8388671875, 2.966064453125, 3.09326171875, 3.220458984375, 3.34765625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 19.0, 19.0, 40.0, 47.0, 67.0, 110.0, 146.0, 177.0, 136.0, 90.0, 54.0, 22.0, 17.0, 16.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.25238037109375, -11.67287826538086, -11.093375205993652, -10.513872146606445, -9.934370040893555, -9.354867935180664, -8.775364875793457, -8.19586181640625, -7.616359710693359, -7.0368571281433105, -6.457354545593262, -5.877851963043213, -5.298349380493164, -4.718846797943115, -4.139344215393066, -3.5598416328430176, -2.9803390502929688, -2.40083646774292, -1.821333885192871, -1.2418313026428223, -0.6623287200927734, -0.08282613754272461, 0.4966764450073242, 1.076179027557373, 1.6556816101074219, 2.2351841926574707, 2.8146867752075195, 3.3941893577575684, 3.973691940307617, 4.553194522857666, 5.132697105407715, 5.712199687957764, 6.291704177856445, 6.871206760406494, 7.450709342956543, 8.03021240234375, 8.60971450805664, 9.189216613769531, 9.768719673156738, 10.348222732543945, 10.927724838256836, 11.507226943969727, 12.086730003356934, 12.66623306274414, 13.245735168457031, 13.825237274169922, 14.404740333557129, 14.984243392944336, 15.563745498657227, 16.143247604370117, 16.72275161743164, 17.30225372314453, 17.881755828857422, 18.461257934570312, 19.040760040283203, 19.620264053344727, 20.199766159057617, 20.779268264770508, 21.35877227783203, 21.938274383544922, 22.517776489257812, 23.097278594970703, 23.676780700683594, 24.256284713745117, 24.835786819458008]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 7.0, 4.0, 3.0, 6.0, 10.0, 8.0, 13.0, 16.0, 23.0, 18.0, 21.0, 36.0, 26.0, 25.0, 38.0, 39.0, 33.0, 53.0, 39.0, 42.0, 40.0, 48.0, 41.0, 39.0, 30.0, 41.0, 29.0, 36.0, 41.0, 31.0, 25.0, 28.0, 17.0, 25.0, 11.0, 16.0, 11.0, 5.0, 8.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.516212463378906, -8.23979663848877, -7.963380813598633, -7.686964988708496, -7.410549163818359, -7.134133338928223, -6.857717990875244, -6.581302165985107, -6.304886341094971, -6.028470516204834, -5.752054691314697, -5.4756388664245605, -5.199223518371582, -4.922807693481445, -4.646391868591309, -4.369976043701172, -4.093560218811035, -3.8171443939208984, -3.5407285690307617, -3.264312982559204, -2.9878971576690674, -2.7114813327789307, -2.435065746307373, -2.1586499214172363, -1.8822340965270996, -1.605818271636963, -1.3294025659561157, -1.0529868602752686, -0.7765710353851318, -0.5001552104949951, -0.22373950481414795, 0.05267620086669922, 0.32909297943115234, 0.6055087447166443, 0.8819245100021362, 1.1583402156829834, 1.4347560405731201, 1.7111718654632568, 1.987587571144104, 2.264003276824951, 2.540419101715088, 2.8168349266052246, 3.0932507514953613, 3.369666337966919, 3.6460821628570557, 3.9224979877471924, 4.19891357421875, 4.475329399108887, 4.751745223999023, 5.02816104888916, 5.304576873779297, 5.580992698669434, 5.85740852355957, 6.133824348449707, 6.4102396965026855, 6.686655521392822, 6.963071346282959, 7.239487171173096, 7.515902996063232, 7.792318820953369, 8.068734169006348, 8.345149993896484, 8.621565818786621, 8.897981643676758, 9.174397468566895]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 6.0, 5.0, 1.0, 13.0, 14.0, 32.0, 46.0, 78.0, 163.0, 296.0, 717.0, 1808.0, 6168.0, 27666.0, 164463.0, 642326.0, 167212.0, 28067.0, 6296.0, 1821.0, 697.0, 290.0, 143.0, 83.0, 54.0, 28.0, 23.0, 15.0, 8.0, 10.0, 5.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.3125, -9.0345458984375, -8.756591796875, -8.4786376953125, -8.20068359375, -7.9227294921875, -7.644775390625, -7.3668212890625, -7.0888671875, -6.8109130859375, -6.532958984375, -6.2550048828125, -5.97705078125, -5.6990966796875, -5.421142578125, -5.1431884765625, -4.865234375, -4.5872802734375, -4.309326171875, -4.0313720703125, -3.75341796875, -3.4754638671875, -3.197509765625, -2.9195556640625, -2.6416015625, -2.3636474609375, -2.085693359375, -1.8077392578125, -1.52978515625, -1.2518310546875, -0.973876953125, -0.6959228515625, -0.41796875, -0.1400146484375, 0.137939453125, 0.4158935546875, 0.69384765625, 0.9718017578125, 1.249755859375, 1.5277099609375, 1.8056640625, 2.0836181640625, 2.361572265625, 2.6395263671875, 2.91748046875, 3.1954345703125, 3.473388671875, 3.7513427734375, 4.029296875, 4.3072509765625, 4.585205078125, 4.8631591796875, 5.14111328125, 5.4190673828125, 5.697021484375, 5.9749755859375, 6.2529296875, 6.5308837890625, 6.808837890625, 7.0867919921875, 7.36474609375, 7.6427001953125, 7.920654296875, 8.1986083984375, 8.4765625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 9.0, 4.0, 7.0, 7.0, 18.0, 20.0, 21.0, 34.0, 32.0, 36.0, 44.0, 58.0, 66.0, 57.0, 68.0, 75.0, 53.0, 60.0, 57.0, 37.0, 44.0, 37.0, 36.0, 30.0, 26.0, 19.0, 10.0, 16.0, 13.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7177734375, -1.6693572998046875, -1.620941162109375, -1.5725250244140625, -1.52410888671875, -1.4756927490234375, -1.427276611328125, -1.3788604736328125, -1.3304443359375, -1.2820281982421875, -1.233612060546875, -1.1851959228515625, -1.13677978515625, -1.0883636474609375, -1.039947509765625, -0.9915313720703125, -0.943115234375, -0.8946990966796875, -0.846282958984375, -0.7978668212890625, -0.74945068359375, -0.7010345458984375, -0.652618408203125, -0.6042022705078125, -0.5557861328125, -0.5073699951171875, -0.458953857421875, -0.4105377197265625, -0.36212158203125, -0.3137054443359375, -0.265289306640625, -0.2168731689453125, -0.16845703125, -0.1200408935546875, -0.071624755859375, -0.0232086181640625, 0.02520751953125, 0.0736236572265625, 0.122039794921875, 0.1704559326171875, 0.2188720703125, 0.2672882080078125, 0.315704345703125, 0.3641204833984375, 0.41253662109375, 0.4609527587890625, 0.509368896484375, 0.5577850341796875, 0.606201171875, 0.6546173095703125, 0.703033447265625, 0.7514495849609375, 0.79986572265625, 0.8482818603515625, 0.896697998046875, 0.9451141357421875, 0.9935302734375, 1.0419464111328125, 1.090362548828125, 1.1387786865234375, 1.18719482421875, 1.2356109619140625, 1.284027099609375, 1.3324432373046875, 1.380859375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 10.0, 15.0, 15.0, 14.0, 34.0, 45.0, 69.0, 111.0, 191.0, 320.0, 551.0, 1065.0, 2120.0, 4427.0, 10339.0, 26018.0, 74634.0, 266680.0, 455038.0, 135344.0, 42525.0, 16106.0, 6540.0, 3030.0, 1489.0, 762.0, 408.0, 211.0, 158.0, 66.0, 60.0, 42.0, 26.0, 19.0, 20.0, 12.0, 9.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-5.26171875, -5.10345458984375, -4.9451904296875, -4.78692626953125, -4.628662109375, -4.47039794921875, -4.3121337890625, -4.15386962890625, -3.99560546875, -3.83734130859375, -3.6790771484375, -3.52081298828125, -3.362548828125, -3.20428466796875, -3.0460205078125, -2.88775634765625, -2.7294921875, -2.57122802734375, -2.4129638671875, -2.25469970703125, -2.096435546875, -1.93817138671875, -1.7799072265625, -1.62164306640625, -1.46337890625, -1.30511474609375, -1.1468505859375, -0.98858642578125, -0.830322265625, -0.67205810546875, -0.5137939453125, -0.35552978515625, -0.197265625, -0.03900146484375, 0.1192626953125, 0.27752685546875, 0.435791015625, 0.59405517578125, 0.7523193359375, 0.91058349609375, 1.06884765625, 1.22711181640625, 1.3853759765625, 1.54364013671875, 1.701904296875, 1.86016845703125, 2.0184326171875, 2.17669677734375, 2.3349609375, 2.49322509765625, 2.6514892578125, 2.80975341796875, 2.968017578125, 3.12628173828125, 3.2845458984375, 3.44281005859375, 3.60107421875, 3.75933837890625, 3.9176025390625, 4.07586669921875, 4.234130859375, 4.39239501953125, 4.5506591796875, 4.70892333984375, 4.8671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 8.0, 7.0, 10.0, 12.0, 16.0, 10.0, 21.0, 25.0, 21.0, 19.0, 26.0, 26.0, 40.0, 44.0, 42.0, 52.0, 39.0, 48.0, 53.0, 46.0, 56.0, 45.0, 47.0, 38.0, 33.0, 24.0, 27.0, 31.0, 22.0, 22.0, 8.0, 13.0, 14.0, 9.0, 7.0, 7.0, 8.0, 3.0, 1.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.48828125, -5.2955322265625, -5.102783203125, -4.9100341796875, -4.71728515625, -4.5245361328125, -4.331787109375, -4.1390380859375, -3.9462890625, -3.7535400390625, -3.560791015625, -3.3680419921875, -3.17529296875, -2.9825439453125, -2.789794921875, -2.5970458984375, -2.404296875, -2.2115478515625, -2.018798828125, -1.8260498046875, -1.63330078125, -1.4405517578125, -1.247802734375, -1.0550537109375, -0.8623046875, -0.6695556640625, -0.476806640625, -0.2840576171875, -0.09130859375, 0.1014404296875, 0.294189453125, 0.4869384765625, 0.6796875, 0.8724365234375, 1.065185546875, 1.2579345703125, 1.45068359375, 1.6434326171875, 1.836181640625, 2.0289306640625, 2.2216796875, 2.4144287109375, 2.607177734375, 2.7999267578125, 2.99267578125, 3.1854248046875, 3.378173828125, 3.5709228515625, 3.763671875, 3.9564208984375, 4.149169921875, 4.3419189453125, 4.53466796875, 4.7274169921875, 4.920166015625, 5.1129150390625, 5.3056640625, 5.4984130859375, 5.691162109375, 5.8839111328125, 6.07666015625, 6.2694091796875, 6.462158203125, 6.6549072265625, 6.84765625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 6.0, 6.0, 12.0, 9.0, 13.0, 14.0, 33.0, 44.0, 38.0, 66.0, 115.0, 180.0, 293.0, 505.0, 1071.0, 2376.0, 6267.0, 20951.0, 106920.0, 668924.0, 195018.0, 30974.0, 8703.0, 3092.0, 1316.0, 660.0, 318.0, 211.0, 130.0, 85.0, 46.0, 46.0, 30.0, 20.0, 13.0, 16.0, 7.0, 8.0, 6.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.828125, -3.710845947265625, -3.59356689453125, -3.476287841796875, -3.3590087890625, -3.241729736328125, -3.12445068359375, -3.007171630859375, -2.889892578125, -2.772613525390625, -2.65533447265625, -2.538055419921875, -2.4207763671875, -2.303497314453125, -2.18621826171875, -2.068939208984375, -1.95166015625, -1.834381103515625, -1.71710205078125, -1.599822998046875, -1.4825439453125, -1.365264892578125, -1.24798583984375, -1.130706787109375, -1.013427734375, -0.896148681640625, -0.77886962890625, -0.661590576171875, -0.5443115234375, -0.427032470703125, -0.30975341796875, -0.192474365234375, -0.0751953125, 0.042083740234375, 0.15936279296875, 0.276641845703125, 0.3939208984375, 0.511199951171875, 0.62847900390625, 0.745758056640625, 0.863037109375, 0.980316162109375, 1.09759521484375, 1.214874267578125, 1.3321533203125, 1.449432373046875, 1.56671142578125, 1.683990478515625, 1.80126953125, 1.918548583984375, 2.03582763671875, 2.153106689453125, 2.2703857421875, 2.387664794921875, 2.50494384765625, 2.622222900390625, 2.739501953125, 2.856781005859375, 2.97406005859375, 3.091339111328125, 3.2086181640625, 3.325897216796875, 3.44317626953125, 3.560455322265625, 3.677734375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 10.0, 12.0, 24.0, 47.0, 79.0, 176.0, 218.0, 191.0, 105.0, 72.0, 33.0, 14.0, 8.0, 6.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001316070556640625, -0.0012836754322052002, -0.0012512803077697754, -0.0012188851833343506, -0.0011864900588989258, -0.001154094934463501, -0.0011216998100280762, -0.0010893046855926514, -0.0010569095611572266, -0.0010245144367218018, -0.000992119312286377, -0.0009597241878509521, -0.0009273290634155273, -0.0008949339389801025, -0.0008625388145446777, -0.0008301436901092529, -0.0007977485656738281, -0.0007653534412384033, -0.0007329583168029785, -0.0007005631923675537, -0.0006681680679321289, -0.0006357729434967041, -0.0006033778190612793, -0.0005709826946258545, -0.0005385875701904297, -0.0005061924457550049, -0.0004737973213195801, -0.0004414021968841553, -0.00040900707244873047, -0.00037661194801330566, -0.00034421682357788086, -0.00031182169914245605, -0.00027942657470703125, -0.00024703145027160645, -0.00021463632583618164, -0.00018224120140075684, -0.00014984607696533203, -0.00011745095252990723, -8.505582809448242e-05, -5.266070365905762e-05, -2.0265579223632812e-05, 1.2129545211791992e-05, 4.45246696472168e-05, 7.69197940826416e-05, 0.0001093149185180664, 0.0001417100429534912, 0.00017410516738891602, 0.00020650029182434082, 0.00023889541625976562, 0.00027129054069519043, 0.00030368566513061523, 0.00033608078956604004, 0.00036847591400146484, 0.00040087103843688965, 0.00043326616287231445, 0.00046566128730773926, 0.0004980564117431641, 0.0005304515361785889, 0.0005628466606140137, 0.0005952417850494385, 0.0006276369094848633, 0.0006600320339202881, 0.0006924271583557129, 0.0007248222827911377, 0.0007572174072265625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 11.0, 14.0, 15.0, 30.0, 45.0, 87.0, 168.0, 269.0, 518.0, 1171.0, 2629.0, 7074.0, 24345.0, 144566.0, 712564.0, 121969.0, 21876.0, 6562.0, 2521.0, 1037.0, 476.0, 254.0, 163.0, 94.0, 35.0, 28.0, 12.0, 9.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.2421875, -5.109344482421875, -4.97650146484375, -4.843658447265625, -4.7108154296875, -4.577972412109375, -4.44512939453125, -4.312286376953125, -4.179443359375, -4.046600341796875, -3.91375732421875, -3.780914306640625, -3.6480712890625, -3.515228271484375, -3.38238525390625, -3.249542236328125, -3.11669921875, -2.983856201171875, -2.85101318359375, -2.718170166015625, -2.5853271484375, -2.452484130859375, -2.31964111328125, -2.186798095703125, -2.053955078125, -1.921112060546875, -1.78826904296875, -1.655426025390625, -1.5225830078125, -1.389739990234375, -1.25689697265625, -1.124053955078125, -0.9912109375, -0.858367919921875, -0.72552490234375, -0.592681884765625, -0.4598388671875, -0.326995849609375, -0.19415283203125, -0.061309814453125, 0.071533203125, 0.204376220703125, 0.33721923828125, 0.470062255859375, 0.6029052734375, 0.735748291015625, 0.86859130859375, 1.001434326171875, 1.13427734375, 1.267120361328125, 1.39996337890625, 1.532806396484375, 1.6656494140625, 1.798492431640625, 1.93133544921875, 2.064178466796875, 2.197021484375, 2.329864501953125, 2.46270751953125, 2.595550537109375, 2.7283935546875, 2.861236572265625, 2.99407958984375, 3.126922607421875, 3.259765625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 3.0, 2.0, 10.0, 13.0, 10.0, 20.0, 24.0, 22.0, 41.0, 69.0, 109.0, 148.0, 148.0, 124.0, 70.0, 60.0, 27.0, 20.0, 14.0, 11.0, 9.0, 11.0, 9.0, 1.0, 5.0, 5.0, 0.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.623046875, -3.484832763671875, -3.34661865234375, -3.208404541015625, -3.0701904296875, -2.931976318359375, -2.79376220703125, -2.655548095703125, -2.517333984375, -2.379119873046875, -2.24090576171875, -2.102691650390625, -1.9644775390625, -1.826263427734375, -1.68804931640625, -1.549835205078125, -1.41162109375, -1.273406982421875, -1.13519287109375, -0.996978759765625, -0.8587646484375, -0.720550537109375, -0.58233642578125, -0.444122314453125, -0.305908203125, -0.167694091796875, -0.02947998046875, 0.108734130859375, 0.2469482421875, 0.385162353515625, 0.52337646484375, 0.661590576171875, 0.7998046875, 0.938018798828125, 1.07623291015625, 1.214447021484375, 1.3526611328125, 1.490875244140625, 1.62908935546875, 1.767303466796875, 1.905517578125, 2.043731689453125, 2.18194580078125, 2.320159912109375, 2.4583740234375, 2.596588134765625, 2.73480224609375, 2.873016357421875, 3.01123046875, 3.149444580078125, 3.28765869140625, 3.425872802734375, 3.5640869140625, 3.702301025390625, 3.84051513671875, 3.978729248046875, 4.116943359375, 4.255157470703125, 4.39337158203125, 4.531585693359375, 4.6697998046875, 4.808013916015625, 4.94622802734375, 5.084442138671875, 5.22265625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 20.0, 82.0, 249.0, 367.0, 186.0, 67.0, 25.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-225.08436584472656, -220.86749267578125, -216.65060424804688, -212.43373107910156, -208.21685791015625, -203.99996948242188, -199.78309631347656, -195.56622314453125, -191.34933471679688, -187.13246154785156, -182.9155731201172, -178.69869995117188, -174.48182678222656, -170.2649383544922, -166.04806518554688, -161.83119201660156, -157.61431884765625, -153.39744567871094, -149.18055725097656, -144.96368408203125, -140.74681091308594, -136.52992248535156, -132.31304931640625, -128.09617614746094, -123.87928771972656, -119.66240692138672, -115.4455337524414, -111.22865295410156, -107.01177215576172, -102.79489135742188, -98.57801818847656, -94.36113739013672, -90.14424896240234, -85.9273681640625, -81.71049499511719, -77.49361419677734, -73.2767333984375, -69.05986022949219, -64.84297943115234, -60.6260986328125, -56.40922164916992, -52.192344665527344, -47.9754638671875, -43.75858688354492, -39.541709899902344, -35.3248291015625, -31.107952117919922, -26.89107322692871, -22.6741943359375, -18.45731544494629, -14.240437507629395, -10.0235595703125, -5.806680679321289, -1.5898017883300781, 2.6270751953125, 6.843954086303711, 11.060832977294922, 15.277711868286133, 19.494590759277344, 23.711467742919922, 27.928346633911133, 32.145225524902344, 36.36210250854492, 40.5789794921875, 44.795860290527344]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 6.0, 3.0, 9.0, 12.0, 17.0, 14.0, 18.0, 25.0, 22.0, 34.0, 40.0, 40.0, 58.0, 52.0, 53.0, 51.0, 63.0, 57.0, 54.0, 61.0, 46.0, 52.0, 31.0, 37.0, 36.0, 23.0, 17.0, 18.0, 16.0, 10.0, 10.0, 9.0, 3.0, 2.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.235107421875, -39.83210372924805, -38.42909622192383, -37.026092529296875, -35.62308883666992, -34.2200813293457, -32.81707763671875, -31.414072036743164, -30.011066436767578, -28.608060836791992, -27.20505714416504, -25.802051544189453, -24.399045944213867, -22.99604034423828, -21.593036651611328, -20.190031051635742, -18.78702735900879, -17.384021759033203, -15.981017112731934, -14.578012466430664, -13.175006866455078, -11.772002220153809, -10.368997573852539, -8.965991973876953, -7.562987327575684, -6.159982204437256, -4.756977081298828, -3.3539724349975586, -1.9509673118591309, -0.5479621887207031, 0.8550424575805664, 2.2580480575561523, 3.661052703857422, 5.06405782699585, 6.467062950134277, 7.870067596435547, 9.273073196411133, 10.676077842712402, 12.079082489013672, 13.482088088989258, 14.885092735290527, 16.288097381591797, 17.691102981567383, 19.09410858154297, 20.497112274169922, 21.900117874145508, 23.303123474121094, 24.706127166748047, 26.109132766723633, 27.51213836669922, 28.915142059326172, 30.318147659301758, 31.721153259277344, 33.1241569519043, 34.52716064453125, 35.93016815185547, 37.33317184448242, 38.736175537109375, 40.139183044433594, 41.54218673706055, 42.9451904296875, 44.34819793701172, 45.75120162963867, 47.154205322265625, 48.557212829589844]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 11.0, 8.0, 9.0, 19.0, 31.0, 37.0, 52.0, 75.0, 133.0, 190.0, 314.0, 505.0, 784.0, 1538.0, 3576.0, 13073.0, 4101776.0, 59965.0, 6846.0, 2303.0, 1201.0, 674.0, 416.0, 250.0, 156.0, 116.0, 74.0, 54.0, 26.0, 22.0, 9.0, 7.0, 5.0, 7.0, 5.0, 3.0, 7.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-15.453125, -15.0546875, -14.65625, -14.2578125, -13.859375, -13.4609375, -13.0625, -12.6640625, -12.265625, -11.8671875, -11.46875, -11.0703125, -10.671875, -10.2734375, -9.875, -9.4765625, -9.078125, -8.6796875, -8.28125, -7.8828125, -7.484375, -7.0859375, -6.6875, -6.2890625, -5.890625, -5.4921875, -5.09375, -4.6953125, -4.296875, -3.8984375, -3.5, -3.1015625, -2.703125, -2.3046875, -1.90625, -1.5078125, -1.109375, -0.7109375, -0.3125, 0.0859375, 0.484375, 0.8828125, 1.28125, 1.6796875, 2.078125, 2.4765625, 2.875, 3.2734375, 3.671875, 4.0703125, 4.46875, 4.8671875, 5.265625, 5.6640625, 6.0625, 6.4609375, 6.859375, 7.2578125, 7.65625, 8.0546875, 8.453125, 8.8515625, 9.25, 9.6484375, 10.046875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 10.0, 5.0, 10.0, 11.0, 18.0, 24.0, 28.0, 33.0, 40.0, 41.0, 37.0, 39.0, 50.0, 67.0, 65.0, 59.0, 50.0, 62.0, 64.0, 44.0, 51.0, 39.0, 35.0, 25.0, 19.0, 13.0, 20.0, 8.0, 11.0, 3.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.00390625, -1.94525146484375, -1.8865966796875, -1.82794189453125, -1.769287109375, -1.71063232421875, -1.6519775390625, -1.59332275390625, -1.53466796875, -1.47601318359375, -1.4173583984375, -1.35870361328125, -1.300048828125, -1.24139404296875, -1.1827392578125, -1.12408447265625, -1.0654296875, -1.00677490234375, -0.9481201171875, -0.88946533203125, -0.830810546875, -0.77215576171875, -0.7135009765625, -0.65484619140625, -0.59619140625, -0.53753662109375, -0.4788818359375, -0.42022705078125, -0.361572265625, -0.30291748046875, -0.2442626953125, -0.18560791015625, -0.126953125, -0.06829833984375, -0.0096435546875, 0.04901123046875, 0.107666015625, 0.16632080078125, 0.2249755859375, 0.28363037109375, 0.34228515625, 0.40093994140625, 0.4595947265625, 0.51824951171875, 0.576904296875, 0.63555908203125, 0.6942138671875, 0.75286865234375, 0.8115234375, 0.87017822265625, 0.9288330078125, 0.98748779296875, 1.046142578125, 1.10479736328125, 1.1634521484375, 1.22210693359375, 1.28076171875, 1.33941650390625, 1.3980712890625, 1.45672607421875, 1.515380859375, 1.57403564453125, 1.6326904296875, 1.69134521484375, 1.75]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 3.0, 8.0, 6.0, 5.0, 17.0, 12.0, 27.0, 26.0, 51.0, 65.0, 88.0, 117.0, 160.0, 244.0, 296.0, 428.0, 579.0, 852.0, 1207.0, 1781.0, 2674.0, 4212.0, 7428.0, 16433.0, 66223.0, 4003701.0, 53721.0, 14761.0, 6982.0, 3927.0, 2557.0, 1618.0, 1134.0, 795.0, 588.0, 445.0, 280.0, 230.0, 154.0, 124.0, 93.0, 60.0, 46.0, 30.0, 31.0, 16.0, 14.0, 15.0, 11.0, 7.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.4296875, -5.24530029296875, -5.0609130859375, -4.87652587890625, -4.692138671875, -4.50775146484375, -4.3233642578125, -4.13897705078125, -3.95458984375, -3.77020263671875, -3.5858154296875, -3.40142822265625, -3.217041015625, -3.03265380859375, -2.8482666015625, -2.66387939453125, -2.4794921875, -2.29510498046875, -2.1107177734375, -1.92633056640625, -1.741943359375, -1.55755615234375, -1.3731689453125, -1.18878173828125, -1.00439453125, -0.82000732421875, -0.6356201171875, -0.45123291015625, -0.266845703125, -0.08245849609375, 0.1019287109375, 0.28631591796875, 0.470703125, 0.65509033203125, 0.8394775390625, 1.02386474609375, 1.208251953125, 1.39263916015625, 1.5770263671875, 1.76141357421875, 1.94580078125, 2.13018798828125, 2.3145751953125, 2.49896240234375, 2.683349609375, 2.86773681640625, 3.0521240234375, 3.23651123046875, 3.4208984375, 3.60528564453125, 3.7896728515625, 3.97406005859375, 4.158447265625, 4.34283447265625, 4.5272216796875, 4.71160888671875, 4.89599609375, 5.08038330078125, 5.2647705078125, 5.44915771484375, 5.633544921875, 5.81793212890625, 6.0023193359375, 6.18670654296875, 6.37109375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 5.0, 4.0, 2.0, 1.0, 3.0, 10.0, 7.0, 15.0, 23.0, 39.0, 225.0, 3527.0, 89.0, 38.0, 25.0, 12.0, 7.0, 8.0, 5.0, 4.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-1.6611328125, -1.612640380859375, -1.56414794921875, -1.515655517578125, -1.4671630859375, -1.418670654296875, -1.37017822265625, -1.321685791015625, -1.273193359375, -1.224700927734375, -1.17620849609375, -1.127716064453125, -1.0792236328125, -1.030731201171875, -0.98223876953125, -0.933746337890625, -0.88525390625, -0.836761474609375, -0.78826904296875, -0.739776611328125, -0.6912841796875, -0.642791748046875, -0.59429931640625, -0.545806884765625, -0.497314453125, -0.448822021484375, -0.40032958984375, -0.351837158203125, -0.3033447265625, -0.254852294921875, -0.20635986328125, -0.157867431640625, -0.109375, -0.060882568359375, -0.01239013671875, 0.036102294921875, 0.0845947265625, 0.133087158203125, 0.18157958984375, 0.230072021484375, 0.278564453125, 0.327056884765625, 0.37554931640625, 0.424041748046875, 0.4725341796875, 0.521026611328125, 0.56951904296875, 0.618011474609375, 0.66650390625, 0.714996337890625, 0.76348876953125, 0.811981201171875, 0.8604736328125, 0.908966064453125, 0.95745849609375, 1.005950927734375, 1.054443359375, 1.102935791015625, 1.15142822265625, 1.199920654296875, 1.2484130859375, 1.296905517578125, 1.34539794921875, 1.393890380859375, 1.4423828125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 9.0, 32.0, 96.0, 202.0, 276.0, 227.0, 108.0, 33.0, 17.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.639272689819336, -22.182661056518555, -21.726049423217773, -21.269437789916992, -20.81282615661621, -20.356212615966797, -19.899600982666016, -19.442989349365234, -18.986377716064453, -18.529766082763672, -18.07315444946289, -17.61654281616211, -17.159931182861328, -16.703319549560547, -16.246707916259766, -15.790095329284668, -15.333483695983887, -14.876872062683105, -14.420260429382324, -13.963647842407227, -13.507036209106445, -13.050424575805664, -12.593812942504883, -12.137201309204102, -11.68058967590332, -11.223978042602539, -10.767366409301758, -10.310754776000977, -9.854142189025879, -9.397530555725098, -8.940918922424316, -8.484307289123535, -8.027694702148438, -7.571083068847656, -7.114470958709717, -6.6578593254089355, -6.201247215270996, -5.744635581970215, -5.288023948669434, -4.831412315368652, -4.374800205230713, -3.9181883335113525, -3.461576461791992, -3.004964828491211, -2.5483529567718506, -2.0917410850524902, -1.635129451751709, -1.1785175800323486, -0.7219057083129883, -0.2652938961982727, 0.19131791591644287, 0.6479296684265137, 1.104541540145874, 1.5611534118652344, 2.0177650451660156, 2.474376916885376, 2.9309887886047363, 3.3876006603240967, 3.844212532043457, 4.300824165344238, 4.7574357986450195, 5.214047908782959, 5.67065954208374, 6.12727165222168, 6.583883285522461]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 0.0, 4.0, 2.0, 10.0, 9.0, 11.0, 16.0, 22.0, 21.0, 14.0, 15.0, 28.0, 30.0, 31.0, 34.0, 34.0, 40.0, 41.0, 48.0, 43.0, 55.0, 50.0, 45.0, 55.0, 51.0, 38.0, 34.0, 23.0, 29.0, 31.0, 21.0, 15.0, 22.0, 12.0, 15.0, 12.0, 11.0, 12.0, 3.0, 4.0, 7.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.6851954460144043, -3.5713894367218018, -3.45758318901062, -3.3437771797180176, -3.229970932006836, -3.1161649227142334, -3.002358913421631, -2.888552665710449, -2.7747466564178467, -2.660940647125244, -2.5471343994140625, -2.43332839012146, -2.3195221424102783, -2.205716133117676, -2.091909885406494, -1.9781038761138916, -1.8642977476119995, -1.7504916191101074, -1.6366854906082153, -1.5228793621063232, -1.4090733528137207, -1.2952672243118286, -1.1814610958099365, -1.067655086517334, -0.9538488984107971, -0.840042769908905, -0.7262367010116577, -0.6124305725097656, -0.4986244738101959, -0.3848183751106262, -0.27101224660873413, -0.15720617771148682, -0.04340004920959473, 0.07040605694055557, 0.18421216309070587, 0.29801827669143677, 0.41182437539100647, 0.5256304740905762, 0.6394366025924683, 0.7532426714897156, 0.8670487999916077, 0.9808549284934998, 1.094660997390747, 1.2084671258926392, 1.3222732543945312, 1.4360792636871338, 1.5498855113983154, 1.663691520690918, 1.77749764919281, 1.8913037776947021, 2.0051097869873047, 2.1189160346984863, 2.232722043991089, 2.3465280532836914, 2.460334300994873, 2.5741403102874756, 2.6879465579986572, 2.8017525672912598, 2.9155588150024414, 3.029364824295044, 3.1431710720062256, 3.256977081298828, 3.3707833290100098, 3.4845893383026123, 3.598395347595215]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 5.0, 10.0, 13.0, 17.0, 24.0, 35.0, 46.0, 77.0, 128.0, 180.0, 330.0, 570.0, 959.0, 1657.0, 2968.0, 5650.0, 11720.0, 26172.0, 62940.0, 160723.0, 346856.0, 252312.0, 99873.0, 40431.0, 17358.0, 8184.0, 4138.0, 2144.0, 1239.0, 696.0, 382.0, 267.0, 138.0, 101.0, 62.0, 45.0, 29.0, 29.0, 17.0, 9.0, 4.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-5.99609375, -5.828369140625, -5.66064453125, -5.492919921875, -5.3251953125, -5.157470703125, -4.98974609375, -4.822021484375, -4.654296875, -4.486572265625, -4.31884765625, -4.151123046875, -3.9833984375, -3.815673828125, -3.64794921875, -3.480224609375, -3.3125, -3.144775390625, -2.97705078125, -2.809326171875, -2.6416015625, -2.473876953125, -2.30615234375, -2.138427734375, -1.970703125, -1.802978515625, -1.63525390625, -1.467529296875, -1.2998046875, -1.132080078125, -0.96435546875, -0.796630859375, -0.62890625, -0.461181640625, -0.29345703125, -0.125732421875, 0.0419921875, 0.209716796875, 0.37744140625, 0.545166015625, 0.712890625, 0.880615234375, 1.04833984375, 1.216064453125, 1.3837890625, 1.551513671875, 1.71923828125, 1.886962890625, 2.0546875, 2.222412109375, 2.39013671875, 2.557861328125, 2.7255859375, 2.893310546875, 3.06103515625, 3.228759765625, 3.396484375, 3.564208984375, 3.73193359375, 3.899658203125, 4.0673828125, 4.235107421875, 4.40283203125, 4.570556640625, 4.73828125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 11.0, 4.0, 12.0, 12.0, 7.0, 14.0, 20.0, 17.0, 30.0, 31.0, 51.0, 43.0, 34.0, 50.0, 45.0, 50.0, 53.0, 65.0, 47.0, 62.0, 59.0, 50.0, 42.0, 37.0, 29.0, 36.0, 18.0, 21.0, 12.0, 9.0, 7.0, 7.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7802734375, -1.7207183837890625, -1.661163330078125, -1.6016082763671875, -1.54205322265625, -1.4824981689453125, -1.422943115234375, -1.3633880615234375, -1.3038330078125, -1.2442779541015625, -1.184722900390625, -1.1251678466796875, -1.06561279296875, -1.0060577392578125, -0.946502685546875, -0.8869476318359375, -0.827392578125, -0.7678375244140625, -0.708282470703125, -0.6487274169921875, -0.58917236328125, -0.5296173095703125, -0.470062255859375, -0.4105072021484375, -0.3509521484375, -0.2913970947265625, -0.231842041015625, -0.1722869873046875, -0.11273193359375, -0.0531768798828125, 0.006378173828125, 0.0659332275390625, 0.12548828125, 0.1850433349609375, 0.244598388671875, 0.3041534423828125, 0.36370849609375, 0.4232635498046875, 0.482818603515625, 0.5423736572265625, 0.6019287109375, 0.6614837646484375, 0.721038818359375, 0.7805938720703125, 0.84014892578125, 0.8997039794921875, 0.959259033203125, 1.0188140869140625, 1.078369140625, 1.1379241943359375, 1.197479248046875, 1.2570343017578125, 1.31658935546875, 1.3761444091796875, 1.435699462890625, 1.4952545166015625, 1.5548095703125, 1.6143646240234375, 1.673919677734375, 1.7334747314453125, 1.79302978515625, 1.8525848388671875, 1.912139892578125, 1.9716949462890625, 2.03125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 5.0, 3.0, 7.0, 7.0, 15.0, 18.0, 19.0, 39.0, 58.0, 76.0, 152.0, 175.0, 317.0, 576.0, 1162.0, 2609.0, 6148.0, 16854.0, 54773.0, 236089.0, 542910.0, 132317.0, 34177.0, 11491.0, 4482.0, 1963.0, 939.0, 429.0, 268.0, 157.0, 101.0, 61.0, 46.0, 30.0, 30.0, 17.0, 12.0, 7.0, 6.0, 5.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.27734375, -7.03729248046875, -6.7972412109375, -6.55718994140625, -6.317138671875, -6.07708740234375, -5.8370361328125, -5.59698486328125, -5.35693359375, -5.11688232421875, -4.8768310546875, -4.63677978515625, -4.396728515625, -4.15667724609375, -3.9166259765625, -3.67657470703125, -3.4365234375, -3.19647216796875, -2.9564208984375, -2.71636962890625, -2.476318359375, -2.23626708984375, -1.9962158203125, -1.75616455078125, -1.51611328125, -1.27606201171875, -1.0360107421875, -0.79595947265625, -0.555908203125, -0.31585693359375, -0.0758056640625, 0.16424560546875, 0.404296875, 0.64434814453125, 0.8843994140625, 1.12445068359375, 1.364501953125, 1.60455322265625, 1.8446044921875, 2.08465576171875, 2.32470703125, 2.56475830078125, 2.8048095703125, 3.04486083984375, 3.284912109375, 3.52496337890625, 3.7650146484375, 4.00506591796875, 4.2451171875, 4.48516845703125, 4.7252197265625, 4.96527099609375, 5.205322265625, 5.44537353515625, 5.6854248046875, 5.92547607421875, 6.16552734375, 6.40557861328125, 6.6456298828125, 6.88568115234375, 7.125732421875, 7.36578369140625, 7.6058349609375, 7.84588623046875, 8.0859375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 5.0, 0.0, 0.0, 2.0, 2.0, 8.0, 11.0, 3.0, 9.0, 9.0, 10.0, 30.0, 28.0, 27.0, 46.0, 57.0, 54.0, 64.0, 65.0, 75.0, 62.0, 63.0, 66.0, 54.0, 40.0, 42.0, 43.0, 29.0, 27.0, 21.0, 17.0, 11.0, 12.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1015625, -8.6771240234375, -8.252685546875, -7.8282470703125, -7.40380859375, -6.9793701171875, -6.554931640625, -6.1304931640625, -5.7060546875, -5.2816162109375, -4.857177734375, -4.4327392578125, -4.00830078125, -3.5838623046875, -3.159423828125, -2.7349853515625, -2.310546875, -1.8861083984375, -1.461669921875, -1.0372314453125, -0.61279296875, -0.1883544921875, 0.236083984375, 0.6605224609375, 1.0849609375, 1.5093994140625, 1.933837890625, 2.3582763671875, 2.78271484375, 3.2071533203125, 3.631591796875, 4.0560302734375, 4.48046875, 4.9049072265625, 5.329345703125, 5.7537841796875, 6.17822265625, 6.6026611328125, 7.027099609375, 7.4515380859375, 7.8759765625, 8.3004150390625, 8.724853515625, 9.1492919921875, 9.57373046875, 9.9981689453125, 10.422607421875, 10.8470458984375, 11.271484375, 11.6959228515625, 12.120361328125, 12.5447998046875, 12.96923828125, 13.3936767578125, 13.818115234375, 14.2425537109375, 14.6669921875, 15.0914306640625, 15.515869140625, 15.9403076171875, 16.36474609375, 16.7891845703125, 17.213623046875, 17.6380615234375, 18.0625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 6.0, 5.0, 4.0, 15.0, 22.0, 36.0, 57.0, 115.0, 267.0, 1150.0, 10152.0, 1002562.0, 31500.0, 1888.0, 419.0, 169.0, 85.0, 46.0, 20.0, 17.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.984375, -19.234375, -18.484375, -17.734375, -16.984375, -16.234375, -15.484375, -14.734375, -13.984375, -13.234375, -12.484375, -11.734375, -10.984375, -10.234375, -9.484375, -8.734375, -7.984375, -7.234375, -6.484375, -5.734375, -4.984375, -4.234375, -3.484375, -2.734375, -1.984375, -1.234375, -0.484375, 0.265625, 1.015625, 1.765625, 2.515625, 3.265625, 4.015625, 4.765625, 5.515625, 6.265625, 7.015625, 7.765625, 8.515625, 9.265625, 10.015625, 10.765625, 11.515625, 12.265625, 13.015625, 13.765625, 14.515625, 15.265625, 16.015625, 16.765625, 17.515625, 18.265625, 19.015625, 19.765625, 20.515625, 21.265625, 22.015625, 22.765625, 23.515625, 24.265625, 25.015625, 25.765625, 26.515625, 27.265625, 28.015625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 16.0, 7.0, 17.0, 28.0, 41.0, 58.0, 109.0, 137.0, 148.0, 143.0, 96.0, 78.0, 31.0, 32.0, 16.0, 9.0, 2.0, 7.0, 7.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0011081695556640625, -0.0010814517736434937, -0.0010547339916229248, -0.001028016209602356, -0.0010012984275817871, -0.0009745806455612183, -0.0009478628635406494, -0.0009211450815200806, -0.0008944272994995117, -0.0008677095174789429, -0.000840991735458374, -0.0008142739534378052, -0.0007875561714172363, -0.0007608383893966675, -0.0007341206073760986, -0.0007074028253555298, -0.0006806850433349609, -0.0006539672613143921, -0.0006272494792938232, -0.0006005316972732544, -0.0005738139152526855, -0.0005470961332321167, -0.0005203783512115479, -0.000493660569190979, -0.00046694278717041016, -0.0004402250051498413, -0.00041350722312927246, -0.0003867894411087036, -0.00036007165908813477, -0.0003333538770675659, -0.00030663609504699707, -0.0002799183130264282, -0.0002532005310058594, -0.00022648274898529053, -0.00019976496696472168, -0.00017304718494415283, -0.00014632940292358398, -0.00011961162090301514, -9.289383888244629e-05, -6.617605686187744e-05, -3.9458274841308594e-05, -1.2740492820739746e-05, 1.3977289199829102e-05, 4.069507122039795e-05, 6.74128532409668e-05, 9.413063526153564e-05, 0.00012084841728210449, 0.00014756619930267334, 0.0001742839813232422, 0.00020100176334381104, 0.00022771954536437988, 0.00025443732738494873, 0.0002811551094055176, 0.0003078728914260864, 0.0003345906734466553, 0.0003613084554672241, 0.00038802623748779297, 0.0004147440195083618, 0.00044146180152893066, 0.0004681795835494995, 0.0004948973655700684, 0.0005216151475906372, 0.0005483329296112061, 0.0005750507116317749, 0.0006017684936523438]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 11.0, 15.0, 29.0, 45.0, 96.0, 205.0, 529.0, 1372.0, 4733.0, 36193.0, 893134.0, 101272.0, 7584.0, 2024.0, 765.0, 294.0, 128.0, 51.0, 21.0, 13.0, 11.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.6171875, -11.27197265625, -10.9267578125, -10.58154296875, -10.236328125, -9.89111328125, -9.5458984375, -9.20068359375, -8.85546875, -8.51025390625, -8.1650390625, -7.81982421875, -7.474609375, -7.12939453125, -6.7841796875, -6.43896484375, -6.09375, -5.74853515625, -5.4033203125, -5.05810546875, -4.712890625, -4.36767578125, -4.0224609375, -3.67724609375, -3.33203125, -2.98681640625, -2.6416015625, -2.29638671875, -1.951171875, -1.60595703125, -1.2607421875, -0.91552734375, -0.5703125, -0.22509765625, 0.1201171875, 0.46533203125, 0.810546875, 1.15576171875, 1.5009765625, 1.84619140625, 2.19140625, 2.53662109375, 2.8818359375, 3.22705078125, 3.572265625, 3.91748046875, 4.2626953125, 4.60791015625, 4.953125, 5.29833984375, 5.6435546875, 5.98876953125, 6.333984375, 6.67919921875, 7.0244140625, 7.36962890625, 7.71484375, 8.06005859375, 8.4052734375, 8.75048828125, 9.095703125, 9.44091796875, 9.7861328125, 10.13134765625, 10.4765625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 11.0, 10.0, 19.0, 30.0, 74.0, 130.0, 213.0, 225.0, 122.0, 66.0, 30.0, 21.0, 8.0, 10.0, 2.0, 7.0, 6.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5078125, -11.1221923828125, -10.736572265625, -10.3509521484375, -9.96533203125, -9.5797119140625, -9.194091796875, -8.8084716796875, -8.4228515625, -8.0372314453125, -7.651611328125, -7.2659912109375, -6.88037109375, -6.4947509765625, -6.109130859375, -5.7235107421875, -5.337890625, -4.9522705078125, -4.566650390625, -4.1810302734375, -3.79541015625, -3.4097900390625, -3.024169921875, -2.6385498046875, -2.2529296875, -1.8673095703125, -1.481689453125, -1.0960693359375, -0.71044921875, -0.3248291015625, 0.060791015625, 0.4464111328125, 0.83203125, 1.2176513671875, 1.603271484375, 1.9888916015625, 2.37451171875, 2.7601318359375, 3.145751953125, 3.5313720703125, 3.9169921875, 4.3026123046875, 4.688232421875, 5.0738525390625, 5.45947265625, 5.8450927734375, 6.230712890625, 6.6163330078125, 7.001953125, 7.3875732421875, 7.773193359375, 8.1588134765625, 8.54443359375, 8.9300537109375, 9.315673828125, 9.7012939453125, 10.0869140625, 10.4725341796875, 10.858154296875, 11.2437744140625, 11.62939453125, 12.0150146484375, 12.400634765625, 12.7862548828125, 13.171875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 8.0, 16.0, 27.0, 44.0, 71.0, 121.0, 198.0, 202.0, 136.0, 84.0, 50.0, 23.0, 11.0, 9.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.56695556640625, -157.62384033203125, -153.6807098388672, -149.7375946044922, -145.79446411132812, -141.85134887695312, -137.90823364257812, -133.96510314941406, -130.02198791503906, -126.07886505126953, -122.1357421875, -118.192626953125, -114.24950408935547, -110.30638122558594, -106.3632583618164, -102.42013549804688, -98.47701263427734, -94.53388977050781, -90.59076690673828, -86.64764404296875, -82.70452880859375, -78.76140594482422, -74.81828308105469, -70.87516021728516, -66.93203735351562, -62.988914489746094, -59.04579544067383, -55.1026725769043, -51.15955352783203, -47.2164306640625, -43.27330780029297, -39.33018493652344, -35.38706970214844, -31.44394874572754, -27.50082778930664, -23.55770492553711, -19.61458396911621, -15.671463012695312, -11.728340148925781, -7.785219192504883, -3.8420982360839844, 0.10102319717407227, 4.044144630432129, 7.987266540527344, 11.930387496948242, 15.87350845336914, 19.816631317138672, 23.75975227355957, 27.70287322998047, 31.645994186401367, 35.589115142822266, 39.5322380065918, 43.47535705566406, 47.418479919433594, 51.361602783203125, 55.304725646972656, 59.24784469604492, 63.19096755981445, 67.13408660888672, 71.07720947265625, 75.02033233642578, 78.96345520019531, 82.90657043457031, 86.84969329833984, 90.79281616210938]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 7.0, 4.0, 9.0, 8.0, 10.0, 16.0, 19.0, 20.0, 27.0, 21.0, 30.0, 37.0, 39.0, 59.0, 49.0, 59.0, 41.0, 50.0, 57.0, 66.0, 41.0, 40.0, 41.0, 37.0, 24.0, 31.0, 26.0, 21.0, 22.0, 12.0, 16.0, 15.0, 9.0, 9.0, 8.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.79658508300781, -64.80411529541016, -62.81165313720703, -60.819183349609375, -58.826717376708984, -56.834251403808594, -54.8417854309082, -52.84931945800781, -50.856849670410156, -48.864383697509766, -46.871917724609375, -44.87944793701172, -42.88698196411133, -40.89451599121094, -38.90205001831055, -36.909584045410156, -34.917118072509766, -32.924652099609375, -30.93218421936035, -28.93971824645996, -26.947250366210938, -24.954784393310547, -22.962318420410156, -20.969852447509766, -18.977384567260742, -16.98491859436035, -14.992450714111328, -12.999984741210938, -11.00751781463623, -9.015050888061523, -7.022584915161133, -5.030117988586426, -3.0376548767089844, -1.0451881885528564, 0.9472784996032715, 2.9397449493408203, 4.932211875915527, 6.924678802490234, 8.917144775390625, 10.909611701965332, 12.902078628540039, 14.894545555114746, 16.887012481689453, 18.879478454589844, 20.871944427490234, 22.864412307739258, 24.85687828063965, 26.849346160888672, 28.841812133789062, 30.834278106689453, 32.826744079589844, 34.8192138671875, 36.81167984008789, 38.80414581298828, 40.79661178588867, 42.78907775878906, 44.78154754638672, 46.77401351928711, 48.7664794921875, 50.758949279785156, 52.75141525268555, 54.74388122558594, 56.73634719848633, 58.72881317138672, 60.72127914428711]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 3.0, 7.0, 1.0, 11.0, 13.0, 18.0, 21.0, 37.0, 54.0, 81.0, 148.0, 213.0, 479.0, 1095.0, 3102.0, 14801.0, 4131848.0, 34851.0, 4874.0, 1425.0, 552.0, 286.0, 139.0, 80.0, 34.0, 38.0, 21.0, 9.0, 15.0, 8.0, 4.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.234375, -23.5732421875, -22.912109375, -22.2509765625, -21.58984375, -20.9287109375, -20.267578125, -19.6064453125, -18.9453125, -18.2841796875, -17.623046875, -16.9619140625, -16.30078125, -15.6396484375, -14.978515625, -14.3173828125, -13.65625, -12.9951171875, -12.333984375, -11.6728515625, -11.01171875, -10.3505859375, -9.689453125, -9.0283203125, -8.3671875, -7.7060546875, -7.044921875, -6.3837890625, -5.72265625, -5.0615234375, -4.400390625, -3.7392578125, -3.078125, -2.4169921875, -1.755859375, -1.0947265625, -0.43359375, 0.2275390625, 0.888671875, 1.5498046875, 2.2109375, 2.8720703125, 3.533203125, 4.1943359375, 4.85546875, 5.5166015625, 6.177734375, 6.8388671875, 7.5, 8.1611328125, 8.822265625, 9.4833984375, 10.14453125, 10.8056640625, 11.466796875, 12.1279296875, 12.7890625, 13.4501953125, 14.111328125, 14.7724609375, 15.43359375, 16.0947265625, 16.755859375, 17.4169921875, 18.078125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 5.0, 4.0, 3.0, 4.0, 0.0, 5.0, 4.0, 7.0, 9.0, 18.0, 12.0, 16.0, 16.0, 33.0, 33.0, 43.0, 39.0, 57.0, 61.0, 69.0, 79.0, 50.0, 56.0, 69.0, 52.0, 45.0, 31.0, 42.0, 33.0, 28.0, 19.0, 21.0, 4.0, 8.0, 10.0, 7.0, 7.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.943359375, -2.863616943359375, -2.78387451171875, -2.704132080078125, -2.6243896484375, -2.544647216796875, -2.46490478515625, -2.385162353515625, -2.305419921875, -2.225677490234375, -2.14593505859375, -2.066192626953125, -1.9864501953125, -1.906707763671875, -1.82696533203125, -1.747222900390625, -1.66748046875, -1.587738037109375, -1.50799560546875, -1.428253173828125, -1.3485107421875, -1.268768310546875, -1.18902587890625, -1.109283447265625, -1.029541015625, -0.949798583984375, -0.87005615234375, -0.790313720703125, -0.7105712890625, -0.630828857421875, -0.55108642578125, -0.471343994140625, -0.3916015625, -0.311859130859375, -0.23211669921875, -0.152374267578125, -0.0726318359375, 0.007110595703125, 0.08685302734375, 0.166595458984375, 0.246337890625, 0.326080322265625, 0.40582275390625, 0.485565185546875, 0.5653076171875, 0.645050048828125, 0.72479248046875, 0.804534912109375, 0.88427734375, 0.964019775390625, 1.04376220703125, 1.123504638671875, 1.2032470703125, 1.282989501953125, 1.36273193359375, 1.442474365234375, 1.522216796875, 1.601959228515625, 1.68170166015625, 1.761444091796875, 1.8411865234375, 1.920928955078125, 2.00067138671875, 2.080413818359375, 2.16015625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 7.0, 4.0, 8.0, 9.0, 9.0, 13.0, 19.0, 27.0, 34.0, 58.0, 54.0, 67.0, 94.0, 123.0, 171.0, 241.0, 279.0, 439.0, 586.0, 902.0, 1245.0, 2144.0, 3376.0, 6464.0, 14350.0, 51175.0, 3920379.0, 147577.0, 23570.0, 8789.0, 4341.0, 2555.0, 1611.0, 1006.0, 680.0, 483.0, 324.0, 242.0, 208.0, 121.0, 99.0, 99.0, 73.0, 55.0, 49.0, 32.0, 22.0, 17.0, 24.0, 7.0, 10.0, 4.0, 3.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0], "bins": [-10.265625, -9.9420166015625, -9.618408203125, -9.2947998046875, -8.97119140625, -8.6475830078125, -8.323974609375, -8.0003662109375, -7.6767578125, -7.3531494140625, -7.029541015625, -6.7059326171875, -6.38232421875, -6.0587158203125, -5.735107421875, -5.4114990234375, -5.087890625, -4.7642822265625, -4.440673828125, -4.1170654296875, -3.79345703125, -3.4698486328125, -3.146240234375, -2.8226318359375, -2.4990234375, -2.1754150390625, -1.851806640625, -1.5281982421875, -1.20458984375, -0.8809814453125, -0.557373046875, -0.2337646484375, 0.08984375, 0.4134521484375, 0.737060546875, 1.0606689453125, 1.38427734375, 1.7078857421875, 2.031494140625, 2.3551025390625, 2.6787109375, 3.0023193359375, 3.325927734375, 3.6495361328125, 3.97314453125, 4.2967529296875, 4.620361328125, 4.9439697265625, 5.267578125, 5.5911865234375, 5.914794921875, 6.2384033203125, 6.56201171875, 6.8856201171875, 7.209228515625, 7.5328369140625, 7.8564453125, 8.1800537109375, 8.503662109375, 8.8272705078125, 9.15087890625, 9.4744873046875, 9.798095703125, 10.1217041015625, 10.4453125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 5.0, 3.0, 1.0, 3.0, 8.0, 13.0, 16.0, 29.0, 52.0, 173.0, 3371.0, 240.0, 64.0, 32.0, 18.0, 9.0, 8.0, 5.0, 9.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.1953125, -4.08648681640625, -3.9776611328125, -3.86883544921875, -3.760009765625, -3.65118408203125, -3.5423583984375, -3.43353271484375, -3.32470703125, -3.21588134765625, -3.1070556640625, -2.99822998046875, -2.889404296875, -2.78057861328125, -2.6717529296875, -2.56292724609375, -2.4541015625, -2.34527587890625, -2.2364501953125, -2.12762451171875, -2.018798828125, -1.90997314453125, -1.8011474609375, -1.69232177734375, -1.58349609375, -1.47467041015625, -1.3658447265625, -1.25701904296875, -1.148193359375, -1.03936767578125, -0.9305419921875, -0.82171630859375, -0.712890625, -0.60406494140625, -0.4952392578125, -0.38641357421875, -0.277587890625, -0.16876220703125, -0.0599365234375, 0.04888916015625, 0.15771484375, 0.26654052734375, 0.3753662109375, 0.48419189453125, 0.593017578125, 0.70184326171875, 0.8106689453125, 0.91949462890625, 1.0283203125, 1.13714599609375, 1.2459716796875, 1.35479736328125, 1.463623046875, 1.57244873046875, 1.6812744140625, 1.79010009765625, 1.89892578125, 2.00775146484375, 2.1165771484375, 2.22540283203125, 2.334228515625, 2.44305419921875, 2.5518798828125, 2.66070556640625, 2.76953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 8.0, 10.0, 30.0, 41.0, 58.0, 90.0, 143.0, 191.0, 160.0, 125.0, 77.0, 29.0, 20.0, 8.0, 9.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.60069465637207, -27.964872360229492, -27.32904815673828, -26.693225860595703, -26.057403564453125, -25.421579360961914, -24.785757064819336, -24.149932861328125, -23.514110565185547, -22.87828826904297, -22.242464065551758, -21.60664176940918, -20.9708194732666, -20.33499526977539, -19.699172973632812, -19.063350677490234, -18.427528381347656, -17.791706085205078, -17.155881881713867, -16.52005958557129, -15.884236335754395, -15.2484130859375, -14.612590789794922, -13.976767539978027, -13.340944290161133, -12.705121040344238, -12.06929874420166, -11.433475494384766, -10.797652244567871, -10.161828994750977, -9.526006698608398, -8.890183448791504, -8.25436019897461, -7.618537425994873, -6.9827141761779785, -6.346891403198242, -5.711068153381348, -5.075245380401611, -4.439422607421875, -3.8035993576049805, -3.167776584625244, -2.5319535732269287, -1.8961306810379028, -1.260307788848877, -0.6244847774505615, 0.011338233947753906, 0.6471610069274902, 1.2829842567443848, 1.918807029724121, 2.5546300411224365, 3.190453052520752, 3.8262758255004883, 4.462099075317383, 5.097921848297119, 5.7337446212768555, 6.36956787109375, 7.005390644073486, 7.641213417053223, 8.277036666870117, 8.912858963012695, 9.54868221282959, 10.184505462646484, 10.820327758789062, 11.456151962280273, 12.091974258422852]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 5.0, 2.0, 8.0, 6.0, 13.0, 8.0, 17.0, 8.0, 17.0, 27.0, 26.0, 23.0, 22.0, 39.0, 39.0, 46.0, 43.0, 38.0, 37.0, 31.0, 56.0, 44.0, 45.0, 37.0, 37.0, 30.0, 40.0, 22.0, 36.0, 31.0, 20.0, 23.0, 25.0, 14.0, 20.0, 20.0, 6.0, 5.0, 8.0, 9.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.977933883666992, -6.733251094818115, -6.488568305969238, -6.243885517120361, -5.999202728271484, -5.754519939422607, -5.5098371505737305, -5.265154838562012, -5.020471572875977, -4.7757887840271, -4.531105995178223, -4.286423206329346, -4.041740417480469, -3.797057628631592, -3.552375078201294, -3.307692289352417, -3.063009738922119, -2.818326950073242, -2.5736441612243652, -2.3289613723754883, -2.0842785835266113, -1.839595913887024, -1.5949132442474365, -1.3502304553985596, -1.1055476665496826, -0.8608648777008057, -0.6161821484565735, -0.3714994192123413, -0.12681663036346436, 0.1178661584854126, 0.362548828125, 0.607231616973877, 0.8519144058227539, 1.0965971946716309, 1.3412799835205078, 1.5859626531600952, 1.8306454420089722, 2.0753283500671387, 2.3200109004974365, 2.5646936893463135, 2.8093764781951904, 3.0540592670440674, 3.2987420558929443, 3.543424606323242, 3.788107395172119, 4.032790184020996, 4.277472972869873, 4.52215576171875, 4.766838550567627, 5.011521339416504, 5.256204128265381, 5.500886917114258, 5.745569705963135, 5.990252494812012, 6.2349348068237305, 6.479618072509766, 6.724300384521484, 6.968983173370361, 7.213665962219238, 7.458348751068115, 7.703031539916992, 7.947714328765869, 8.192397117614746, 8.437079429626465, 8.6817626953125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 9.0, 7.0, 17.0, 13.0, 28.0, 38.0, 43.0, 90.0, 121.0, 165.0, 316.0, 460.0, 853.0, 1482.0, 2908.0, 5766.0, 12194.0, 27774.0, 68676.0, 194655.0, 408165.0, 201181.0, 70299.0, 28286.0, 12450.0, 5829.0, 3032.0, 1585.0, 817.0, 473.0, 295.0, 191.0, 117.0, 69.0, 50.0, 22.0, 26.0, 17.0, 12.0, 12.0, 6.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.89453125, -6.69476318359375, -6.4949951171875, -6.29522705078125, -6.095458984375, -5.89569091796875, -5.6959228515625, -5.49615478515625, -5.29638671875, -5.09661865234375, -4.8968505859375, -4.69708251953125, -4.497314453125, -4.29754638671875, -4.0977783203125, -3.89801025390625, -3.6982421875, -3.49847412109375, -3.2987060546875, -3.09893798828125, -2.899169921875, -2.69940185546875, -2.4996337890625, -2.29986572265625, -2.10009765625, -1.90032958984375, -1.7005615234375, -1.50079345703125, -1.301025390625, -1.10125732421875, -0.9014892578125, -0.70172119140625, -0.501953125, -0.30218505859375, -0.1024169921875, 0.09735107421875, 0.297119140625, 0.49688720703125, 0.6966552734375, 0.89642333984375, 1.09619140625, 1.29595947265625, 1.4957275390625, 1.69549560546875, 1.895263671875, 2.09503173828125, 2.2947998046875, 2.49456787109375, 2.6943359375, 2.89410400390625, 3.0938720703125, 3.29364013671875, 3.493408203125, 3.69317626953125, 3.8929443359375, 4.09271240234375, 4.29248046875, 4.49224853515625, 4.6920166015625, 4.89178466796875, 5.091552734375, 5.29132080078125, 5.4910888671875, 5.69085693359375, 5.890625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 8.0, 4.0, 10.0, 12.0, 17.0, 14.0, 31.0, 27.0, 28.0, 39.0, 53.0, 50.0, 53.0, 56.0, 72.0, 75.0, 68.0, 61.0, 63.0, 42.0, 37.0, 24.0, 21.0, 31.0, 20.0, 15.0, 14.0, 15.0, 6.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.89453125, -2.808990478515625, -2.72344970703125, -2.637908935546875, -2.5523681640625, -2.466827392578125, -2.38128662109375, -2.295745849609375, -2.210205078125, -2.124664306640625, -2.03912353515625, -1.953582763671875, -1.8680419921875, -1.782501220703125, -1.69696044921875, -1.611419677734375, -1.52587890625, -1.440338134765625, -1.35479736328125, -1.269256591796875, -1.1837158203125, -1.098175048828125, -1.01263427734375, -0.927093505859375, -0.841552734375, -0.756011962890625, -0.67047119140625, -0.584930419921875, -0.4993896484375, -0.413848876953125, -0.32830810546875, -0.242767333984375, -0.1572265625, -0.071685791015625, 0.01385498046875, 0.099395751953125, 0.1849365234375, 0.270477294921875, 0.35601806640625, 0.441558837890625, 0.527099609375, 0.612640380859375, 0.69818115234375, 0.783721923828125, 0.8692626953125, 0.954803466796875, 1.04034423828125, 1.125885009765625, 1.21142578125, 1.296966552734375, 1.38250732421875, 1.468048095703125, 1.5535888671875, 1.639129638671875, 1.72467041015625, 1.810211181640625, 1.895751953125, 1.981292724609375, 2.06683349609375, 2.152374267578125, 2.2379150390625, 2.323455810546875, 2.40899658203125, 2.494537353515625, 2.580078125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 7.0, 13.0, 9.0, 15.0, 35.0, 48.0, 83.0, 124.0, 308.0, 761.0, 2046.0, 7790.0, 41056.0, 460571.0, 481695.0, 42445.0, 8032.0, 2150.0, 680.0, 291.0, 134.0, 84.0, 60.0, 29.0, 35.0, 11.0, 14.0, 10.0, 5.0, 1.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-19.703125, -19.22265625, -18.7421875, -18.26171875, -17.78125, -17.30078125, -16.8203125, -16.33984375, -15.859375, -15.37890625, -14.8984375, -14.41796875, -13.9375, -13.45703125, -12.9765625, -12.49609375, -12.015625, -11.53515625, -11.0546875, -10.57421875, -10.09375, -9.61328125, -9.1328125, -8.65234375, -8.171875, -7.69140625, -7.2109375, -6.73046875, -6.25, -5.76953125, -5.2890625, -4.80859375, -4.328125, -3.84765625, -3.3671875, -2.88671875, -2.40625, -1.92578125, -1.4453125, -0.96484375, -0.484375, -0.00390625, 0.4765625, 0.95703125, 1.4375, 1.91796875, 2.3984375, 2.87890625, 3.359375, 3.83984375, 4.3203125, 4.80078125, 5.28125, 5.76171875, 6.2421875, 6.72265625, 7.203125, 7.68359375, 8.1640625, 8.64453125, 9.125, 9.60546875, 10.0859375, 10.56640625, 11.046875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 6.0, 5.0, 6.0, 8.0, 21.0, 13.0, 17.0, 20.0, 23.0, 26.0, 27.0, 33.0, 27.0, 53.0, 50.0, 47.0, 59.0, 40.0, 51.0, 42.0, 36.0, 43.0, 41.0, 54.0, 39.0, 36.0, 27.0, 17.0, 23.0, 25.0, 13.0, 13.0, 10.0, 6.0, 9.0, 9.0, 4.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4453125, -12.058837890625, -11.67236328125, -11.285888671875, -10.8994140625, -10.512939453125, -10.12646484375, -9.739990234375, -9.353515625, -8.967041015625, -8.58056640625, -8.194091796875, -7.8076171875, -7.421142578125, -7.03466796875, -6.648193359375, -6.26171875, -5.875244140625, -5.48876953125, -5.102294921875, -4.7158203125, -4.329345703125, -3.94287109375, -3.556396484375, -3.169921875, -2.783447265625, -2.39697265625, -2.010498046875, -1.6240234375, -1.237548828125, -0.85107421875, -0.464599609375, -0.078125, 0.308349609375, 0.69482421875, 1.081298828125, 1.4677734375, 1.854248046875, 2.24072265625, 2.627197265625, 3.013671875, 3.400146484375, 3.78662109375, 4.173095703125, 4.5595703125, 4.946044921875, 5.33251953125, 5.718994140625, 6.10546875, 6.491943359375, 6.87841796875, 7.264892578125, 7.6513671875, 8.037841796875, 8.42431640625, 8.810791015625, 9.197265625, 9.583740234375, 9.97021484375, 10.356689453125, 10.7431640625, 11.129638671875, 11.51611328125, 11.902587890625, 12.2890625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 0.0, 5.0, 9.0, 9.0, 11.0, 21.0, 24.0, 43.0, 42.0, 90.0, 116.0, 182.0, 294.0, 586.0, 1190.0, 3218.0, 13153.0, 116395.0, 811553.0, 85442.0, 10849.0, 2955.0, 1143.0, 490.0, 267.0, 179.0, 87.0, 59.0, 37.0, 29.0, 31.0, 8.0, 13.0, 8.0, 7.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3671875, -8.11700439453125, -7.8668212890625, -7.61663818359375, -7.366455078125, -7.11627197265625, -6.8660888671875, -6.61590576171875, -6.36572265625, -6.11553955078125, -5.8653564453125, -5.61517333984375, -5.364990234375, -5.11480712890625, -4.8646240234375, -4.61444091796875, -4.3642578125, -4.11407470703125, -3.8638916015625, -3.61370849609375, -3.363525390625, -3.11334228515625, -2.8631591796875, -2.61297607421875, -2.36279296875, -2.11260986328125, -1.8624267578125, -1.61224365234375, -1.362060546875, -1.11187744140625, -0.8616943359375, -0.61151123046875, -0.361328125, -0.11114501953125, 0.1390380859375, 0.38922119140625, 0.639404296875, 0.88958740234375, 1.1397705078125, 1.38995361328125, 1.64013671875, 1.89031982421875, 2.1405029296875, 2.39068603515625, 2.640869140625, 2.89105224609375, 3.1412353515625, 3.39141845703125, 3.6416015625, 3.89178466796875, 4.1419677734375, 4.39215087890625, 4.642333984375, 4.89251708984375, 5.1427001953125, 5.39288330078125, 5.64306640625, 5.89324951171875, 6.1434326171875, 6.39361572265625, 6.643798828125, 6.89398193359375, 7.1441650390625, 7.39434814453125, 7.64453125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 5.0, 5.0, 12.0, 22.0, 22.0, 25.0, 37.0, 64.0, 90.0, 98.0, 124.0, 112.0, 100.0, 94.0, 60.0, 34.0, 21.0, 22.0, 17.0, 11.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0011615753173828125, -0.0011324509978294373, -0.001103326678276062, -0.0010742023587226868, -0.0010450780391693115, -0.0010159537196159363, -0.000986829400062561, -0.0009577050805091858, -0.0009285807609558105, -0.0008994564414024353, -0.0008703321218490601, -0.0008412078022956848, -0.0008120834827423096, -0.0007829591631889343, -0.0007538348436355591, -0.0007247105240821838, -0.0006955862045288086, -0.0006664618849754333, -0.0006373375654220581, -0.0006082132458686829, -0.0005790889263153076, -0.0005499646067619324, -0.0005208402872085571, -0.0004917159676551819, -0.00046259164810180664, -0.0004334673285484314, -0.00040434300899505615, -0.0003752186894416809, -0.00034609436988830566, -0.0003169700503349304, -0.0002878457307815552, -0.00025872141122817993, -0.0002295970916748047, -0.00020047277212142944, -0.0001713484525680542, -0.00014222413301467896, -0.00011309981346130371, -8.397549390792847e-05, -5.485117435455322e-05, -2.572685480117798e-05, 3.3974647521972656e-06, 3.252178430557251e-05, 6.164610385894775e-05, 9.0770423412323e-05, 0.00011989474296569824, 0.00014901906251907349, 0.00017814338207244873, 0.00020726770162582397, 0.00023639202117919922, 0.00026551634073257446, 0.0002946406602859497, 0.00032376497983932495, 0.0003528892993927002, 0.00038201361894607544, 0.0004111379384994507, 0.00044026225805282593, 0.00046938657760620117, 0.0004985108971595764, 0.0005276352167129517, 0.0005567595362663269, 0.0005858838558197021, 0.0006150081753730774, 0.0006441324949264526, 0.0006732568144798279, 0.0007023811340332031]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 6.0, 5.0, 14.0, 12.0, 28.0, 38.0, 59.0, 121.0, 202.0, 408.0, 841.0, 2146.0, 6469.0, 34596.0, 630993.0, 341956.0, 22387.0, 4983.0, 1795.0, 740.0, 303.0, 153.0, 108.0, 58.0, 46.0, 28.0, 19.0, 18.0, 4.0, 2.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.7421875, -7.4742431640625, -7.206298828125, -6.9383544921875, -6.67041015625, -6.4024658203125, -6.134521484375, -5.8665771484375, -5.5986328125, -5.3306884765625, -5.062744140625, -4.7947998046875, -4.52685546875, -4.2589111328125, -3.990966796875, -3.7230224609375, -3.455078125, -3.1871337890625, -2.919189453125, -2.6512451171875, -2.38330078125, -2.1153564453125, -1.847412109375, -1.5794677734375, -1.3115234375, -1.0435791015625, -0.775634765625, -0.5076904296875, -0.23974609375, 0.0281982421875, 0.296142578125, 0.5640869140625, 0.83203125, 1.0999755859375, 1.367919921875, 1.6358642578125, 1.90380859375, 2.1717529296875, 2.439697265625, 2.7076416015625, 2.9755859375, 3.2435302734375, 3.511474609375, 3.7794189453125, 4.04736328125, 4.3153076171875, 4.583251953125, 4.8511962890625, 5.119140625, 5.3870849609375, 5.655029296875, 5.9229736328125, 6.19091796875, 6.4588623046875, 6.726806640625, 6.9947509765625, 7.2626953125, 7.5306396484375, 7.798583984375, 8.0665283203125, 8.33447265625, 8.6024169921875, 8.870361328125, 9.1383056640625, 9.40625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 0.0, 4.0, 3.0, 6.0, 10.0, 10.0, 16.0, 16.0, 26.0, 27.0, 40.0, 64.0, 68.0, 102.0, 101.0, 87.0, 94.0, 79.0, 61.0, 44.0, 40.0, 20.0, 31.0, 14.0, 11.0, 7.0, 3.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.8359375, -6.6517333984375, -6.467529296875, -6.2833251953125, -6.09912109375, -5.9149169921875, -5.730712890625, -5.5465087890625, -5.3623046875, -5.1781005859375, -4.993896484375, -4.8096923828125, -4.62548828125, -4.4412841796875, -4.257080078125, -4.0728759765625, -3.888671875, -3.7044677734375, -3.520263671875, -3.3360595703125, -3.15185546875, -2.9676513671875, -2.783447265625, -2.5992431640625, -2.4150390625, -2.2308349609375, -2.046630859375, -1.8624267578125, -1.67822265625, -1.4940185546875, -1.309814453125, -1.1256103515625, -0.94140625, -0.7572021484375, -0.572998046875, -0.3887939453125, -0.20458984375, -0.0203857421875, 0.163818359375, 0.3480224609375, 0.5322265625, 0.7164306640625, 0.900634765625, 1.0848388671875, 1.26904296875, 1.4532470703125, 1.637451171875, 1.8216552734375, 2.005859375, 2.1900634765625, 2.374267578125, 2.5584716796875, 2.74267578125, 2.9268798828125, 3.111083984375, 3.2952880859375, 3.4794921875, 3.6636962890625, 3.847900390625, 4.0321044921875, 4.21630859375, 4.4005126953125, 4.584716796875, 4.7689208984375, 4.953125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 12.0, 24.0, 67.0, 105.0, 212.0, 249.0, 169.0, 92.0, 42.0, 21.0, 5.0, 5.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-189.49513244628906, -184.24549865722656, -178.99588012695312, -173.74624633789062, -168.4966278076172, -163.2469940185547, -157.99737548828125, -152.74774169921875, -147.49810791015625, -142.24847412109375, -136.9988555908203, -131.7492218017578, -126.49960327148438, -121.24996948242188, -116.0003433227539, -110.75071716308594, -105.5010986328125, -100.25147247314453, -95.00184631347656, -89.7522201538086, -84.50259399414062, -79.25296020507812, -74.00333404541016, -68.75370788574219, -63.50408172607422, -58.25445556640625, -53.00482940673828, -47.75519943237305, -42.50557327270508, -37.25594711303711, -32.006317138671875, -26.756690979003906, -21.507080078125, -16.25745391845703, -11.00782585144043, -5.7581987380981445, -0.5085716247558594, 4.741054534912109, 9.990682601928711, 15.240310668945312, 20.48993682861328, 25.73956298828125, 30.98919105529785, 36.23881912231445, 41.48844528198242, 46.73807144165039, 51.987701416015625, 57.237327575683594, 62.48695373535156, 67.73657989501953, 72.9862060546875, 78.23583221435547, 83.48545837402344, 88.73509216308594, 93.9847183227539, 99.23434448242188, 104.48397064208984, 109.73359680175781, 114.98322296142578, 120.23284912109375, 125.48248291015625, 130.7321014404297, 135.9817352294922, 141.23135375976562, 146.48098754882812]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 4.0, 6.0, 4.0, 9.0, 13.0, 15.0, 15.0, 21.0, 19.0, 23.0, 21.0, 18.0, 42.0, 33.0, 48.0, 41.0, 49.0, 43.0, 49.0, 55.0, 48.0, 55.0, 49.0, 33.0, 41.0, 33.0, 37.0, 37.0, 25.0, 24.0, 12.0, 19.0, 14.0, 8.0, 12.0, 3.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.035037994384766, -58.16160583496094, -56.288177490234375, -54.41474533081055, -52.541316986083984, -50.667884826660156, -48.794456481933594, -46.921024322509766, -45.04759216308594, -43.17416000366211, -41.30073165893555, -39.42729949951172, -37.553871154785156, -35.68043899536133, -33.8070068359375, -31.933578491210938, -30.060150146484375, -28.18671989440918, -26.313289642333984, -24.439857482910156, -22.566429138183594, -20.692996978759766, -18.81956672668457, -16.946136474609375, -15.07270622253418, -13.199275970458984, -11.325845718383789, -9.452414512634277, -7.578984260559082, -5.705554008483887, -3.832122802734375, -1.9586925506591797, -0.08525848388671875, 1.7881720066070557, 3.66160249710083, 5.535033226013184, 7.408463478088379, 9.281893730163574, 11.155324935913086, 13.028755187988281, 14.902185440063477, 16.775615692138672, 18.649045944213867, 20.522476196289062, 22.39590835571289, 24.269336700439453, 26.14276885986328, 28.016199111938477, 29.889629364013672, 31.763059616088867, 33.63648986816406, 35.50992202758789, 37.38335037231445, 39.25678253173828, 41.130210876464844, 43.00364303588867, 44.8770751953125, 46.75050735473633, 48.62393569946289, 50.49736785888672, 52.37079620361328, 54.24422836303711, 56.11766052246094, 57.9910888671875, 59.86451721191406]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 11.0, 8.0, 13.0, 24.0, 31.0, 71.0, 140.0, 281.0, 680.0, 2494.0, 45764.0, 4139747.0, 3503.0, 880.0, 313.0, 142.0, 75.0, 43.0, 23.0, 12.0, 11.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.78125, -52.533203125, -51.28515625, -50.037109375, -48.7890625, -47.541015625, -46.29296875, -45.044921875, -43.796875, -42.548828125, -41.30078125, -40.052734375, -38.8046875, -37.556640625, -36.30859375, -35.060546875, -33.8125, -32.564453125, -31.31640625, -30.068359375, -28.8203125, -27.572265625, -26.32421875, -25.076171875, -23.828125, -22.580078125, -21.33203125, -20.083984375, -18.8359375, -17.587890625, -16.33984375, -15.091796875, -13.84375, -12.595703125, -11.34765625, -10.099609375, -8.8515625, -7.603515625, -6.35546875, -5.107421875, -3.859375, -2.611328125, -1.36328125, -0.115234375, 1.1328125, 2.380859375, 3.62890625, 4.876953125, 6.125, 7.373046875, 8.62109375, 9.869140625, 11.1171875, 12.365234375, 13.61328125, 14.861328125, 16.109375, 17.357421875, 18.60546875, 19.853515625, 21.1015625, 22.349609375, 23.59765625, 24.845703125, 26.09375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 4.0, 7.0, 5.0, 8.0, 9.0, 10.0, 11.0, 23.0, 20.0, 37.0, 52.0, 59.0, 59.0, 63.0, 82.0, 67.0, 75.0, 66.0, 66.0, 66.0, 60.0, 19.0, 24.0, 17.0, 22.0, 25.0, 10.0, 5.0, 12.0, 7.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.947265625, -3.833465576171875, -3.71966552734375, -3.605865478515625, -3.4920654296875, -3.378265380859375, -3.26446533203125, -3.150665283203125, -3.036865234375, -2.923065185546875, -2.80926513671875, -2.695465087890625, -2.5816650390625, -2.467864990234375, -2.35406494140625, -2.240264892578125, -2.12646484375, -2.012664794921875, -1.89886474609375, -1.785064697265625, -1.6712646484375, -1.557464599609375, -1.44366455078125, -1.329864501953125, -1.216064453125, -1.102264404296875, -0.98846435546875, -0.874664306640625, -0.7608642578125, -0.647064208984375, -0.53326416015625, -0.419464111328125, -0.3056640625, -0.191864013671875, -0.07806396484375, 0.035736083984375, 0.1495361328125, 0.263336181640625, 0.37713623046875, 0.490936279296875, 0.604736328125, 0.718536376953125, 0.83233642578125, 0.946136474609375, 1.0599365234375, 1.173736572265625, 1.28753662109375, 1.401336669921875, 1.51513671875, 1.628936767578125, 1.74273681640625, 1.856536865234375, 1.9703369140625, 2.084136962890625, 2.19793701171875, 2.311737060546875, 2.425537109375, 2.539337158203125, 2.65313720703125, 2.766937255859375, 2.8807373046875, 2.994537353515625, 3.10833740234375, 3.222137451171875, 3.3359375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 4.0, 7.0, 12.0, 17.0, 23.0, 23.0, 42.0, 36.0, 51.0, 102.0, 123.0, 178.0, 222.0, 319.0, 449.0, 636.0, 853.0, 1327.0, 1953.0, 3427.0, 6679.0, 18890.0, 3973290.0, 156936.0, 14272.0, 5597.0, 2923.0, 1740.0, 1135.0, 831.0, 643.0, 419.0, 285.0, 206.0, 165.0, 117.0, 93.0, 74.0, 57.0, 38.0, 27.0, 16.0, 18.0, 7.0, 4.0, 4.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.515625, -12.1351318359375, -11.754638671875, -11.3741455078125, -10.99365234375, -10.6131591796875, -10.232666015625, -9.8521728515625, -9.4716796875, -9.0911865234375, -8.710693359375, -8.3302001953125, -7.94970703125, -7.5692138671875, -7.188720703125, -6.8082275390625, -6.427734375, -6.0472412109375, -5.666748046875, -5.2862548828125, -4.90576171875, -4.5252685546875, -4.144775390625, -3.7642822265625, -3.3837890625, -3.0032958984375, -2.622802734375, -2.2423095703125, -1.86181640625, -1.4813232421875, -1.100830078125, -0.7203369140625, -0.33984375, 0.0406494140625, 0.421142578125, 0.8016357421875, 1.18212890625, 1.5626220703125, 1.943115234375, 2.3236083984375, 2.7041015625, 3.0845947265625, 3.465087890625, 3.8455810546875, 4.22607421875, 4.6065673828125, 4.987060546875, 5.3675537109375, 5.748046875, 6.1285400390625, 6.509033203125, 6.8895263671875, 7.27001953125, 7.6505126953125, 8.031005859375, 8.4114990234375, 8.7919921875, 9.1724853515625, 9.552978515625, 9.9334716796875, 10.31396484375, 10.6944580078125, 11.074951171875, 11.4554443359375, 11.8359375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 7.0, 4.0, 13.0, 15.0, 14.0, 65.0, 3606.0, 240.0, 47.0, 15.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.248046875, -3.14593505859375, -3.0438232421875, -2.94171142578125, -2.839599609375, -2.73748779296875, -2.6353759765625, -2.53326416015625, -2.43115234375, -2.32904052734375, -2.2269287109375, -2.12481689453125, -2.022705078125, -1.92059326171875, -1.8184814453125, -1.71636962890625, -1.6142578125, -1.51214599609375, -1.4100341796875, -1.30792236328125, -1.205810546875, -1.10369873046875, -1.0015869140625, -0.89947509765625, -0.79736328125, -0.69525146484375, -0.5931396484375, -0.49102783203125, -0.388916015625, -0.28680419921875, -0.1846923828125, -0.08258056640625, 0.01953125, 0.12164306640625, 0.2237548828125, 0.32586669921875, 0.427978515625, 0.53009033203125, 0.6322021484375, 0.73431396484375, 0.83642578125, 0.93853759765625, 1.0406494140625, 1.14276123046875, 1.244873046875, 1.34698486328125, 1.4490966796875, 1.55120849609375, 1.6533203125, 1.75543212890625, 1.8575439453125, 1.95965576171875, 2.061767578125, 2.16387939453125, 2.2659912109375, 2.36810302734375, 2.47021484375, 2.57232666015625, 2.6744384765625, 2.77655029296875, 2.878662109375, 2.98077392578125, 3.0828857421875, 3.18499755859375, 3.287109375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 10.0, 16.0, 9.0, 25.0, 53.0, 63.0, 97.0, 143.0, 164.0, 161.0, 107.0, 69.0, 37.0, 25.0, 10.0, 8.0, 2.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.264812469482422, -17.76633644104004, -17.267860412597656, -16.769384384155273, -16.270906448364258, -15.772430419921875, -15.273954391479492, -14.77547836303711, -14.277002334594727, -13.778526306152344, -13.280049324035645, -12.781573295593262, -12.283097267150879, -11.78462028503418, -11.286144256591797, -10.787668228149414, -10.289192199707031, -9.790716171264648, -9.29223918914795, -8.793763160705566, -8.295287132263184, -7.796810626983643, -7.298334121704102, -6.799858093261719, -6.3013811111450195, -5.8029046058654785, -5.304428577423096, -4.805952072143555, -4.307476043701172, -3.808999538421631, -3.310523271560669, -2.812047004699707, -2.313570976257324, -1.8150947093963623, -1.3166184425354004, -0.8181420564651489, -0.319665789604187, 0.17881059646606445, 0.6772868633270264, 1.1757631301879883, 1.6742393970489502, 2.172715663909912, 2.671191930770874, 3.169668197631836, 3.668144702911377, 4.166621208190918, 4.665097236633301, 5.163573265075684, 5.662049770355225, 6.160526275634766, 6.659002304077148, 7.1574788093566895, 7.655954837799072, 8.154431343078613, 8.652907371520996, 9.151384353637695, 9.649860382080078, 10.148336410522461, 10.64681339263916, 11.145289421081543, 11.643765449523926, 12.142242431640625, 12.640718460083008, 13.13919448852539, 13.637670516967773]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 7.0, 1.0, 5.0, 3.0, 9.0, 7.0, 9.0, 7.0, 15.0, 14.0, 16.0, 20.0, 31.0, 29.0, 34.0, 44.0, 45.0, 33.0, 44.0, 43.0, 43.0, 42.0, 41.0, 44.0, 49.0, 37.0, 33.0, 40.0, 45.0, 30.0, 26.0, 25.0, 23.0, 21.0, 14.0, 12.0, 16.0, 10.0, 6.0, 9.0, 9.0, 5.0, 4.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.868834495544434, -5.685405731201172, -5.50197696685791, -5.318548202514648, -5.135119438171387, -4.951690673828125, -4.768261909484863, -4.584833145141602, -4.40140438079834, -4.217975616455078, -4.034546852111816, -3.8511180877685547, -3.667689323425293, -3.4842605590820312, -3.3008315563201904, -3.1174027919769287, -2.933973789215088, -2.750545024871826, -2.5671162605285645, -2.3836874961853027, -2.200258731842041, -2.0168299674987793, -1.8334009647369385, -1.6499722003936768, -1.466543436050415, -1.2831146717071533, -1.0996859073638916, -0.9162570238113403, -0.7328282594680786, -0.5493994951248169, -0.3659706115722656, -0.1825418472290039, 0.0008864402770996094, 0.18431523442268372, 0.3677440285682678, 0.5511728525161743, 0.734601616859436, 0.9180303812026978, 1.101459264755249, 1.2848880290985107, 1.4683167934417725, 1.6517455577850342, 1.835174322128296, 2.0186033248901367, 2.2020320892333984, 2.38546085357666, 2.568889617919922, 2.7523183822631836, 2.9357471466064453, 3.119175910949707, 3.3026046752929688, 3.4860334396362305, 3.669462203979492, 3.852890968322754, 4.036319732666016, 4.219748497009277, 4.403177261352539, 4.586606025695801, 4.7700347900390625, 4.953463554382324, 5.136892318725586, 5.320321083068848, 5.503749847412109, 5.687178611755371, 5.870607852935791]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 7.0, 21.0, 22.0, 31.0, 41.0, 79.0, 114.0, 172.0, 328.0, 501.0, 1028.0, 2097.0, 4898.0, 13427.0, 46217.0, 215392.0, 564336.0, 147565.0, 33723.0, 10617.0, 4025.0, 1771.0, 901.0, 478.0, 278.0, 174.0, 98.0, 65.0, 40.0, 25.0, 19.0, 12.0, 9.0, 4.0, 9.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.640625, -9.3233642578125, -9.006103515625, -8.6888427734375, -8.37158203125, -8.0543212890625, -7.737060546875, -7.4197998046875, -7.1025390625, -6.7852783203125, -6.468017578125, -6.1507568359375, -5.83349609375, -5.5162353515625, -5.198974609375, -4.8817138671875, -4.564453125, -4.2471923828125, -3.929931640625, -3.6126708984375, -3.29541015625, -2.9781494140625, -2.660888671875, -2.3436279296875, -2.0263671875, -1.7091064453125, -1.391845703125, -1.0745849609375, -0.75732421875, -0.4400634765625, -0.122802734375, 0.1944580078125, 0.51171875, 0.8289794921875, 1.146240234375, 1.4635009765625, 1.78076171875, 2.0980224609375, 2.415283203125, 2.7325439453125, 3.0498046875, 3.3670654296875, 3.684326171875, 4.0015869140625, 4.31884765625, 4.6361083984375, 4.953369140625, 5.2706298828125, 5.587890625, 5.9051513671875, 6.222412109375, 6.5396728515625, 6.85693359375, 7.1741943359375, 7.491455078125, 7.8087158203125, 8.1259765625, 8.4432373046875, 8.760498046875, 9.0777587890625, 9.39501953125, 9.7122802734375, 10.029541015625, 10.3468017578125, 10.6640625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 9.0, 7.0, 6.0, 9.0, 15.0, 13.0, 17.0, 27.0, 36.0, 52.0, 55.0, 67.0, 68.0, 51.0, 69.0, 75.0, 69.0, 62.0, 54.0, 56.0, 41.0, 29.0, 25.0, 20.0, 18.0, 12.0, 8.0, 11.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.56640625, -4.44580078125, -4.3251953125, -4.20458984375, -4.083984375, -3.96337890625, -3.8427734375, -3.72216796875, -3.6015625, -3.48095703125, -3.3603515625, -3.23974609375, -3.119140625, -2.99853515625, -2.8779296875, -2.75732421875, -2.63671875, -2.51611328125, -2.3955078125, -2.27490234375, -2.154296875, -2.03369140625, -1.9130859375, -1.79248046875, -1.671875, -1.55126953125, -1.4306640625, -1.31005859375, -1.189453125, -1.06884765625, -0.9482421875, -0.82763671875, -0.70703125, -0.58642578125, -0.4658203125, -0.34521484375, -0.224609375, -0.10400390625, 0.0166015625, 0.13720703125, 0.2578125, 0.37841796875, 0.4990234375, 0.61962890625, 0.740234375, 0.86083984375, 0.9814453125, 1.10205078125, 1.22265625, 1.34326171875, 1.4638671875, 1.58447265625, 1.705078125, 1.82568359375, 1.9462890625, 2.06689453125, 2.1875, 2.30810546875, 2.4287109375, 2.54931640625, 2.669921875, 2.79052734375, 2.9111328125, 3.03173828125, 3.15234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 5.0, 13.0, 13.0, 28.0, 27.0, 38.0, 56.0, 86.0, 163.0, 291.0, 555.0, 1410.0, 4467.0, 19493.0, 154886.0, 737583.0, 108463.0, 15120.0, 3600.0, 1142.0, 483.0, 232.0, 123.0, 88.0, 52.0, 42.0, 23.0, 24.0, 11.0, 10.0, 5.0, 5.0, 1.0, 3.0, 3.0, 0.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.125, -15.6697998046875, -15.214599609375, -14.7593994140625, -14.30419921875, -13.8489990234375, -13.393798828125, -12.9385986328125, -12.4833984375, -12.0281982421875, -11.572998046875, -11.1177978515625, -10.66259765625, -10.2073974609375, -9.752197265625, -9.2969970703125, -8.841796875, -8.3865966796875, -7.931396484375, -7.4761962890625, -7.02099609375, -6.5657958984375, -6.110595703125, -5.6553955078125, -5.2001953125, -4.7449951171875, -4.289794921875, -3.8345947265625, -3.37939453125, -2.9241943359375, -2.468994140625, -2.0137939453125, -1.55859375, -1.1033935546875, -0.648193359375, -0.1929931640625, 0.26220703125, 0.7174072265625, 1.172607421875, 1.6278076171875, 2.0830078125, 2.5382080078125, 2.993408203125, 3.4486083984375, 3.90380859375, 4.3590087890625, 4.814208984375, 5.2694091796875, 5.724609375, 6.1798095703125, 6.635009765625, 7.0902099609375, 7.54541015625, 8.0006103515625, 8.455810546875, 8.9110107421875, 9.3662109375, 9.8214111328125, 10.276611328125, 10.7318115234375, 11.18701171875, 11.6422119140625, 12.097412109375, 12.5526123046875, 13.0078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 11.0, 6.0, 5.0, 10.0, 16.0, 15.0, 19.0, 18.0, 19.0, 33.0, 35.0, 41.0, 26.0, 35.0, 42.0, 48.0, 43.0, 53.0, 49.0, 57.0, 52.0, 38.0, 31.0, 35.0, 39.0, 44.0, 25.0, 38.0, 25.0, 19.0, 8.0, 16.0, 2.0, 12.0, 10.0, 2.0, 2.0, 7.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.359375, -12.899169921875, -12.43896484375, -11.978759765625, -11.5185546875, -11.058349609375, -10.59814453125, -10.137939453125, -9.677734375, -9.217529296875, -8.75732421875, -8.297119140625, -7.8369140625, -7.376708984375, -6.91650390625, -6.456298828125, -5.99609375, -5.535888671875, -5.07568359375, -4.615478515625, -4.1552734375, -3.695068359375, -3.23486328125, -2.774658203125, -2.314453125, -1.854248046875, -1.39404296875, -0.933837890625, -0.4736328125, -0.013427734375, 0.44677734375, 0.906982421875, 1.3671875, 1.827392578125, 2.28759765625, 2.747802734375, 3.2080078125, 3.668212890625, 4.12841796875, 4.588623046875, 5.048828125, 5.509033203125, 5.96923828125, 6.429443359375, 6.8896484375, 7.349853515625, 7.81005859375, 8.270263671875, 8.73046875, 9.190673828125, 9.65087890625, 10.111083984375, 10.5712890625, 11.031494140625, 11.49169921875, 11.951904296875, 12.412109375, 12.872314453125, 13.33251953125, 13.792724609375, 14.2529296875, 14.713134765625, 15.17333984375, 15.633544921875, 16.09375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 10.0, 9.0, 10.0, 18.0, 44.0, 49.0, 89.0, 168.0, 375.0, 1292.0, 11516.0, 912388.0, 117803.0, 3574.0, 701.0, 248.0, 109.0, 46.0, 42.0, 15.0, 16.0, 5.0, 8.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8515625, -14.3690185546875, -13.886474609375, -13.4039306640625, -12.92138671875, -12.4388427734375, -11.956298828125, -11.4737548828125, -10.9912109375, -10.5086669921875, -10.026123046875, -9.5435791015625, -9.06103515625, -8.5784912109375, -8.095947265625, -7.6134033203125, -7.130859375, -6.6483154296875, -6.165771484375, -5.6832275390625, -5.20068359375, -4.7181396484375, -4.235595703125, -3.7530517578125, -3.2705078125, -2.7879638671875, -2.305419921875, -1.8228759765625, -1.34033203125, -0.8577880859375, -0.375244140625, 0.1072998046875, 0.58984375, 1.0723876953125, 1.554931640625, 2.0374755859375, 2.52001953125, 3.0025634765625, 3.485107421875, 3.9676513671875, 4.4501953125, 4.9327392578125, 5.415283203125, 5.8978271484375, 6.38037109375, 6.8629150390625, 7.345458984375, 7.8280029296875, 8.310546875, 8.7930908203125, 9.275634765625, 9.7581787109375, 10.24072265625, 10.7232666015625, 11.205810546875, 11.6883544921875, 12.1708984375, 12.6534423828125, 13.135986328125, 13.6185302734375, 14.10107421875, 14.5836181640625, 15.066162109375, 15.5487060546875, 16.03125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 8.0, 8.0, 12.0, 20.0, 26.0, 38.0, 60.0, 69.0, 118.0, 146.0, 147.0, 103.0, 90.0, 47.0, 27.0, 24.0, 18.0, 17.0, 11.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00070953369140625, -0.0006800591945648193, -0.0006505846977233887, -0.000621110200881958, -0.0005916357040405273, -0.0005621612071990967, -0.000532686710357666, -0.0005032122135162354, -0.0004737377166748047, -0.000444263219833374, -0.00041478872299194336, -0.0003853142261505127, -0.00035583972930908203, -0.00032636523246765137, -0.0002968907356262207, -0.00026741623878479004, -0.00023794174194335938, -0.0002084672451019287, -0.00017899274826049805, -0.00014951825141906738, -0.00012004375457763672, -9.056925773620605e-05, -6.109476089477539e-05, -3.1620264053344727e-05, -2.1457672119140625e-06, 2.73287296295166e-05, 5.6803226470947266e-05, 8.627772331237793e-05, 0.0001157522201538086, 0.00014522671699523926, 0.00017470121383666992, 0.00020417571067810059, 0.00023365020751953125, 0.0002631247043609619, 0.0002925992012023926, 0.00032207369804382324, 0.0003515481948852539, 0.00038102269172668457, 0.00041049718856811523, 0.0004399716854095459, 0.00046944618225097656, 0.0004989206790924072, 0.0005283951759338379, 0.0005578696727752686, 0.0005873441696166992, 0.0006168186664581299, 0.0006462931632995605, 0.0006757676601409912, 0.0007052421569824219, 0.0007347166538238525, 0.0007641911506652832, 0.0007936656475067139, 0.0008231401443481445, 0.0008526146411895752, 0.0008820891380310059, 0.0009115636348724365, 0.0009410381317138672, 0.0009705126285552979, 0.0009999871253967285, 0.0010294616222381592, 0.0010589361190795898, 0.0010884106159210205, 0.0011178851127624512, 0.0011473596096038818, 0.0011768341064453125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 8.0, 11.0, 19.0, 17.0, 50.0, 68.0, 108.0, 173.0, 367.0, 835.0, 2784.0, 15000.0, 229812.0, 754321.0, 37396.0, 5172.0, 1364.0, 508.0, 223.0, 124.0, 66.0, 48.0, 28.0, 17.0, 11.0, 11.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.453125, -7.1888427734375, -6.924560546875, -6.6602783203125, -6.39599609375, -6.1317138671875, -5.867431640625, -5.6031494140625, -5.3388671875, -5.0745849609375, -4.810302734375, -4.5460205078125, -4.28173828125, -4.0174560546875, -3.753173828125, -3.4888916015625, -3.224609375, -2.9603271484375, -2.696044921875, -2.4317626953125, -2.16748046875, -1.9031982421875, -1.638916015625, -1.3746337890625, -1.1103515625, -0.8460693359375, -0.581787109375, -0.3175048828125, -0.05322265625, 0.2110595703125, 0.475341796875, 0.7396240234375, 1.00390625, 1.2681884765625, 1.532470703125, 1.7967529296875, 2.06103515625, 2.3253173828125, 2.589599609375, 2.8538818359375, 3.1181640625, 3.3824462890625, 3.646728515625, 3.9110107421875, 4.17529296875, 4.4395751953125, 4.703857421875, 4.9681396484375, 5.232421875, 5.4967041015625, 5.760986328125, 6.0252685546875, 6.28955078125, 6.5538330078125, 6.818115234375, 7.0823974609375, 7.3466796875, 7.6109619140625, 7.875244140625, 8.1395263671875, 8.40380859375, 8.6680908203125, 8.932373046875, 9.1966552734375, 9.4609375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 7.0, 13.0, 23.0, 22.0, 28.0, 55.0, 85.0, 129.0, 146.0, 174.0, 92.0, 67.0, 56.0, 39.0, 19.0, 16.0, 12.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-12.265625, -11.9852294921875, -11.704833984375, -11.4244384765625, -11.14404296875, -10.8636474609375, -10.583251953125, -10.3028564453125, -10.0224609375, -9.7420654296875, -9.461669921875, -9.1812744140625, -8.90087890625, -8.6204833984375, -8.340087890625, -8.0596923828125, -7.779296875, -7.4989013671875, -7.218505859375, -6.9381103515625, -6.65771484375, -6.3773193359375, -6.096923828125, -5.8165283203125, -5.5361328125, -5.2557373046875, -4.975341796875, -4.6949462890625, -4.41455078125, -4.1341552734375, -3.853759765625, -3.5733642578125, -3.29296875, -3.0125732421875, -2.732177734375, -2.4517822265625, -2.17138671875, -1.8909912109375, -1.610595703125, -1.3302001953125, -1.0498046875, -0.7694091796875, -0.489013671875, -0.2086181640625, 0.07177734375, 0.3521728515625, 0.632568359375, 0.9129638671875, 1.193359375, 1.4737548828125, 1.754150390625, 2.0345458984375, 2.31494140625, 2.5953369140625, 2.875732421875, 3.1561279296875, 3.4365234375, 3.7169189453125, 3.997314453125, 4.2777099609375, 4.55810546875, 4.8385009765625, 5.118896484375, 5.3992919921875, 5.6796875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 7.0, 18.0, 47.0, 279.0, 436.0, 173.0, 45.0, 9.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.34608459472656, -76.08837890625, -66.8306655883789, -57.57295608520508, -48.31524658203125, -39.05753707885742, -29.799827575683594, -20.5421142578125, -11.284408569335938, -2.0266990661621094, 7.231010437011719, 16.488719940185547, 25.746429443359375, 35.0041389465332, 44.26184844970703, 53.519561767578125, 62.77726745605469, 72.03497314453125, 81.29268646240234, 90.55039978027344, 99.80810546875, 109.06581115722656, 118.32352447509766, 127.58123779296875, 136.8389434814453, 146.09664916992188, 155.3543701171875, 164.61207580566406, 173.86978149414062, 183.1274871826172, 192.38519287109375, 201.64291381835938, 210.900634765625, 220.15834045410156, 229.41604614257812, 238.67376708984375, 247.9314727783203, 257.1891784667969, 266.4468994140625, 275.70458984375, 284.9623107910156, 294.22003173828125, 303.47772216796875, 312.7354431152344, 321.9931640625, 331.2508544921875, 340.5085754394531, 349.76629638671875, 359.02398681640625, 368.2817077636719, 377.5393981933594, 386.797119140625, 396.0548095703125, 405.3125305175781, 414.57025146484375, 423.82794189453125, 433.0856628417969, 442.3433837890625, 451.60107421875, 460.8587951660156, 470.11651611328125, 479.37420654296875, 488.6319274902344, 497.8896484375, 507.1473388671875]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 3.0, 6.0, 5.0, 6.0, 11.0, 6.0, 13.0, 16.0, 20.0, 18.0, 16.0, 17.0, 20.0, 22.0, 34.0, 22.0, 38.0, 45.0, 36.0, 35.0, 46.0, 50.0, 35.0, 31.0, 45.0, 45.0, 48.0, 34.0, 32.0, 28.0, 28.0, 36.0, 18.0, 17.0, 20.0, 18.0, 11.0, 15.0, 13.0, 6.0, 9.0, 9.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0], "bins": [-64.68049621582031, -62.86137771606445, -61.04225540161133, -59.22313690185547, -57.404014587402344, -55.584896087646484, -53.765777587890625, -51.9466552734375, -50.12753677368164, -48.30841827392578, -46.489295959472656, -44.6701774597168, -42.85105895996094, -41.03193664550781, -39.21281814575195, -37.393699645996094, -35.57457733154297, -33.75545883178711, -31.936336517333984, -30.117218017578125, -28.298097610473633, -26.47897720336914, -24.65985870361328, -22.84073829650879, -21.021617889404297, -19.202497482299805, -17.383377075195312, -15.564258575439453, -13.745138168334961, -11.926017761230469, -10.106898307800293, -8.287778854370117, -6.468658447265625, -4.649538516998291, -2.830418586730957, -1.011298656463623, 0.8078212738037109, 2.626941680908203, 4.446061134338379, 6.265180587768555, 8.084300994873047, 9.903421401977539, 11.722540855407715, 13.54166030883789, 15.360780715942383, 17.179901123046875, 18.999019622802734, 20.818140029907227, 22.63726043701172, 24.45638084411621, 26.275501251220703, 28.094619750976562, 29.913740158081055, 31.732860565185547, 33.551979064941406, 35.37110137939453, 37.19021987915039, 39.00933837890625, 40.828460693359375, 42.647579193115234, 44.466697692871094, 46.28582000732422, 48.10493850708008, 49.92405700683594, 51.74317932128906]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 7.0, 7.0, 18.0, 20.0, 48.0, 71.0, 120.0, 255.0, 518.0, 1223.0, 4968.0, 4084158.0, 97152.0, 3818.0, 1052.0, 404.0, 199.0, 106.0, 57.0, 34.0, 15.0, 9.0, 7.0, 5.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-42.8125, -41.837646484375, -40.86279296875, -39.887939453125, -38.9130859375, -37.938232421875, -36.96337890625, -35.988525390625, -35.013671875, -34.038818359375, -33.06396484375, -32.089111328125, -31.1142578125, -30.139404296875, -29.16455078125, -28.189697265625, -27.21484375, -26.239990234375, -25.26513671875, -24.290283203125, -23.3154296875, -22.340576171875, -21.36572265625, -20.390869140625, -19.416015625, -18.441162109375, -17.46630859375, -16.491455078125, -15.5166015625, -14.541748046875, -13.56689453125, -12.592041015625, -11.6171875, -10.642333984375, -9.66748046875, -8.692626953125, -7.7177734375, -6.742919921875, -5.76806640625, -4.793212890625, -3.818359375, -2.843505859375, -1.86865234375, -0.893798828125, 0.0810546875, 1.055908203125, 2.03076171875, 3.005615234375, 3.98046875, 4.955322265625, 5.93017578125, 6.905029296875, 7.8798828125, 8.854736328125, 9.82958984375, 10.804443359375, 11.779296875, 12.754150390625, 13.72900390625, 14.703857421875, 15.6787109375, 16.653564453125, 17.62841796875, 18.603271484375, 19.578125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 5.0, 5.0, 5.0, 4.0, 6.0, 8.0, 9.0, 13.0, 16.0, 23.0, 24.0, 34.0, 47.0, 57.0, 49.0, 62.0, 59.0, 72.0, 67.0, 74.0, 63.0, 48.0, 50.0, 51.0, 37.0, 30.0, 18.0, 12.0, 9.0, 12.0, 9.0, 5.0, 4.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.603515625, -3.49700927734375, -3.3905029296875, -3.28399658203125, -3.177490234375, -3.07098388671875, -2.9644775390625, -2.85797119140625, -2.75146484375, -2.64495849609375, -2.5384521484375, -2.43194580078125, -2.325439453125, -2.21893310546875, -2.1124267578125, -2.00592041015625, -1.8994140625, -1.79290771484375, -1.6864013671875, -1.57989501953125, -1.473388671875, -1.36688232421875, -1.2603759765625, -1.15386962890625, -1.04736328125, -0.94085693359375, -0.8343505859375, -0.72784423828125, -0.621337890625, -0.51483154296875, -0.4083251953125, -0.30181884765625, -0.1953125, -0.08880615234375, 0.0177001953125, 0.12420654296875, 0.230712890625, 0.33721923828125, 0.4437255859375, 0.55023193359375, 0.65673828125, 0.76324462890625, 0.8697509765625, 0.97625732421875, 1.082763671875, 1.18927001953125, 1.2957763671875, 1.40228271484375, 1.5087890625, 1.61529541015625, 1.7218017578125, 1.82830810546875, 1.934814453125, 2.04132080078125, 2.1478271484375, 2.25433349609375, 2.36083984375, 2.46734619140625, 2.5738525390625, 2.68035888671875, 2.786865234375, 2.89337158203125, 2.9998779296875, 3.10638427734375, 3.212890625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 6.0, 24.0, 21.0, 28.0, 57.0, 58.0, 106.0, 166.0, 220.0, 393.0, 628.0, 1057.0, 1901.0, 3485.0, 6726.0, 13618.0, 40896.0, 3926265.0, 155373.0, 22511.0, 9383.0, 4979.0, 2610.0, 1548.0, 798.0, 559.0, 304.0, 173.0, 113.0, 81.0, 64.0, 31.0, 27.0, 31.0, 10.0, 9.0, 5.0, 3.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1328125, -9.8236083984375, -9.514404296875, -9.2052001953125, -8.89599609375, -8.5867919921875, -8.277587890625, -7.9683837890625, -7.6591796875, -7.3499755859375, -7.040771484375, -6.7315673828125, -6.42236328125, -6.1131591796875, -5.803955078125, -5.4947509765625, -5.185546875, -4.8763427734375, -4.567138671875, -4.2579345703125, -3.94873046875, -3.6395263671875, -3.330322265625, -3.0211181640625, -2.7119140625, -2.4027099609375, -2.093505859375, -1.7843017578125, -1.47509765625, -1.1658935546875, -0.856689453125, -0.5474853515625, -0.23828125, 0.0709228515625, 0.380126953125, 0.6893310546875, 0.99853515625, 1.3077392578125, 1.616943359375, 1.9261474609375, 2.2353515625, 2.5445556640625, 2.853759765625, 3.1629638671875, 3.47216796875, 3.7813720703125, 4.090576171875, 4.3997802734375, 4.708984375, 5.0181884765625, 5.327392578125, 5.6365966796875, 5.94580078125, 6.2550048828125, 6.564208984375, 6.8734130859375, 7.1826171875, 7.4918212890625, 7.801025390625, 8.1102294921875, 8.41943359375, 8.7286376953125, 9.037841796875, 9.3470458984375, 9.65625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 3.0, 6.0, 3.0, 4.0, 11.0, 7.0, 9.0, 10.0, 15.0, 12.0, 35.0, 88.0, 792.0, 2821.0, 121.0, 41.0, 28.0, 13.0, 13.0, 6.0, 5.0, 3.0, 3.0, 3.0, 7.0, 5.0, 1.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28515625, -4.1375732421875, -3.989990234375, -3.8424072265625, -3.69482421875, -3.5472412109375, -3.399658203125, -3.2520751953125, -3.1044921875, -2.9569091796875, -2.809326171875, -2.6617431640625, -2.51416015625, -2.3665771484375, -2.218994140625, -2.0714111328125, -1.923828125, -1.7762451171875, -1.628662109375, -1.4810791015625, -1.33349609375, -1.1859130859375, -1.038330078125, -0.8907470703125, -0.7431640625, -0.5955810546875, -0.447998046875, -0.3004150390625, -0.15283203125, -0.0052490234375, 0.142333984375, 0.2899169921875, 0.4375, 0.5850830078125, 0.732666015625, 0.8802490234375, 1.02783203125, 1.1754150390625, 1.322998046875, 1.4705810546875, 1.6181640625, 1.7657470703125, 1.913330078125, 2.0609130859375, 2.20849609375, 2.3560791015625, 2.503662109375, 2.6512451171875, 2.798828125, 2.9464111328125, 3.093994140625, 3.2415771484375, 3.38916015625, 3.5367431640625, 3.684326171875, 3.8319091796875, 3.9794921875, 4.1270751953125, 4.274658203125, 4.4222412109375, 4.56982421875, 4.7174072265625, 4.864990234375, 5.0125732421875, 5.16015625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 9.0, 23.0, 48.0, 88.0, 172.0, 236.0, 205.0, 126.0, 51.0, 18.0, 10.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.96001434326172, -44.80512619018555, -43.65024185180664, -42.49535369873047, -41.3404655456543, -40.185577392578125, -39.03069305419922, -37.87580490112305, -36.720916748046875, -35.5660285949707, -34.4111442565918, -33.256256103515625, -32.10136795043945, -30.946481704711914, -29.791595458984375, -28.636707305908203, -27.481822967529297, -26.326936721801758, -25.172048568725586, -24.017162322998047, -22.862274169921875, -21.707387924194336, -20.552501678466797, -19.397613525390625, -18.242727279663086, -17.087841033935547, -15.932952880859375, -14.778066635131836, -13.62317943572998, -12.468292236328125, -11.313405990600586, -10.15851879119873, -9.00363540649414, -7.848748207092285, -6.693861484527588, -5.538974761962891, -4.384087562561035, -3.2292003631591797, -2.0743136405944824, -0.9194269180297852, 0.2354602813720703, 1.3903472423553467, 2.545234203338623, 3.7001211643218994, 4.855008125305176, 6.009895324707031, 7.1647820472717285, 8.319668769836426, 9.474555969238281, 10.629443168640137, 11.784330368041992, 12.939216613769531, 14.094103813171387, 15.248991012573242, 16.40387725830078, 17.558765411376953, 18.713651657104492, 19.86853790283203, 21.023426055908203, 22.178312301635742, 23.33319854736328, 24.488086700439453, 25.642972946166992, 26.79785919189453, 27.952747344970703]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 10.0, 10.0, 11.0, 10.0, 12.0, 26.0, 28.0, 35.0, 29.0, 43.0, 49.0, 59.0, 44.0, 55.0, 61.0, 57.0, 65.0, 54.0, 45.0, 47.0, 36.0, 42.0, 28.0, 38.0, 18.0, 16.0, 22.0, 9.0, 9.0, 7.0, 4.0, 11.0, 3.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.56656265258789, -11.110664367675781, -10.654765129089355, -10.198866844177246, -9.742968559265137, -9.287069320678711, -8.831171035766602, -8.375272750854492, -7.919373989105225, -7.463475227355957, -7.007576942443848, -6.55167818069458, -6.0957794189453125, -5.639881134033203, -5.1839823722839355, -4.728083610534668, -4.272185325622559, -3.81628680229187, -3.3603882789611816, -2.904489517211914, -2.4485909938812256, -1.992692470550537, -1.5367937088012695, -1.080895185470581, -0.6249966621398926, -0.16909807920455933, 0.2868005037307739, 0.742699146270752, 1.1985976696014404, 1.654496192932129, 2.1103949546813965, 2.566293478012085, 3.0221920013427734, 3.478090524673462, 3.9339890480041504, 4.389887809753418, 4.845786094665527, 5.301684856414795, 5.7575836181640625, 6.213481903076172, 6.6693806648254395, 7.125279426574707, 7.581177711486816, 8.037076950073242, 8.492975234985352, 8.948873519897461, 9.40477180480957, 9.860671043395996, 10.316569328308105, 10.772467613220215, 11.22836685180664, 11.68426513671875, 12.14016342163086, 12.596061706542969, 13.051960945129395, 13.507859230041504, 13.96375846862793, 14.419656753540039, 14.875555992126465, 15.331454277038574, 15.787352561950684, 16.24325180053711, 16.69915008544922, 17.155048370361328, 17.610946655273438]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 8.0, 14.0, 26.0, 47.0, 91.0, 172.0, 469.0, 1263.0, 4493.0, 18780.0, 112637.0, 642259.0, 225274.0, 32893.0, 7020.0, 2016.0, 607.0, 272.0, 100.0, 49.0, 29.0, 15.0, 6.0, 11.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4140625, -8.0257568359375, -7.637451171875, -7.2491455078125, -6.86083984375, -6.4725341796875, -6.084228515625, -5.6959228515625, -5.3076171875, -4.9193115234375, -4.531005859375, -4.1427001953125, -3.75439453125, -3.3660888671875, -2.977783203125, -2.5894775390625, -2.201171875, -1.8128662109375, -1.424560546875, -1.0362548828125, -0.64794921875, -0.2596435546875, 0.128662109375, 0.5169677734375, 0.9052734375, 1.2935791015625, 1.681884765625, 2.0701904296875, 2.45849609375, 2.8468017578125, 3.235107421875, 3.6234130859375, 4.01171875, 4.4000244140625, 4.788330078125, 5.1766357421875, 5.56494140625, 5.9532470703125, 6.341552734375, 6.7298583984375, 7.1181640625, 7.5064697265625, 7.894775390625, 8.2830810546875, 8.67138671875, 9.0596923828125, 9.447998046875, 9.8363037109375, 10.224609375, 10.6129150390625, 11.001220703125, 11.3895263671875, 11.77783203125, 12.1661376953125, 12.554443359375, 12.9427490234375, 13.3310546875, 13.7193603515625, 14.107666015625, 14.4959716796875, 14.88427734375, 15.2725830078125, 15.660888671875, 16.0491943359375, 16.4375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 11.0, 3.0, 8.0, 9.0, 7.0, 11.0, 23.0, 27.0, 25.0, 47.0, 35.0, 61.0, 39.0, 54.0, 67.0, 75.0, 79.0, 47.0, 60.0, 53.0, 44.0, 46.0, 33.0, 36.0, 17.0, 17.0, 9.0, 16.0, 8.0, 8.0, 3.0, 6.0, 2.0, 5.0, 2.0, 0.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2421875, -3.13330078125, -3.0244140625, -2.91552734375, -2.806640625, -2.69775390625, -2.5888671875, -2.47998046875, -2.37109375, -2.26220703125, -2.1533203125, -2.04443359375, -1.935546875, -1.82666015625, -1.7177734375, -1.60888671875, -1.5, -1.39111328125, -1.2822265625, -1.17333984375, -1.064453125, -0.95556640625, -0.8466796875, -0.73779296875, -0.62890625, -0.52001953125, -0.4111328125, -0.30224609375, -0.193359375, -0.08447265625, 0.0244140625, 0.13330078125, 0.2421875, 0.35107421875, 0.4599609375, 0.56884765625, 0.677734375, 0.78662109375, 0.8955078125, 1.00439453125, 1.11328125, 1.22216796875, 1.3310546875, 1.43994140625, 1.548828125, 1.65771484375, 1.7666015625, 1.87548828125, 1.984375, 2.09326171875, 2.2021484375, 2.31103515625, 2.419921875, 2.52880859375, 2.6376953125, 2.74658203125, 2.85546875, 2.96435546875, 3.0732421875, 3.18212890625, 3.291015625, 3.39990234375, 3.5087890625, 3.61767578125, 3.7265625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 5.0, 12.0, 13.0, 14.0, 17.0, 31.0, 42.0, 54.0, 106.0, 170.0, 310.0, 578.0, 1252.0, 3514.0, 12748.0, 70121.0, 598147.0, 310463.0, 38422.0, 8046.0, 2407.0, 982.0, 436.0, 244.0, 139.0, 75.0, 68.0, 44.0, 37.0, 14.0, 9.0, 7.0, 9.0, 7.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3125, -10.9456787109375, -10.578857421875, -10.2120361328125, -9.84521484375, -9.4783935546875, -9.111572265625, -8.7447509765625, -8.3779296875, -8.0111083984375, -7.644287109375, -7.2774658203125, -6.91064453125, -6.5438232421875, -6.177001953125, -5.8101806640625, -5.443359375, -5.0765380859375, -4.709716796875, -4.3428955078125, -3.97607421875, -3.6092529296875, -3.242431640625, -2.8756103515625, -2.5087890625, -2.1419677734375, -1.775146484375, -1.4083251953125, -1.04150390625, -0.6746826171875, -0.307861328125, 0.0589599609375, 0.42578125, 0.7926025390625, 1.159423828125, 1.5262451171875, 1.89306640625, 2.2598876953125, 2.626708984375, 2.9935302734375, 3.3603515625, 3.7271728515625, 4.093994140625, 4.4608154296875, 4.82763671875, 5.1944580078125, 5.561279296875, 5.9281005859375, 6.294921875, 6.6617431640625, 7.028564453125, 7.3953857421875, 7.76220703125, 8.1290283203125, 8.495849609375, 8.8626708984375, 9.2294921875, 9.5963134765625, 9.963134765625, 10.3299560546875, 10.69677734375, 11.0635986328125, 11.430419921875, 11.7972412109375, 12.1640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 6.0, 7.0, 7.0, 8.0, 11.0, 7.0, 13.0, 19.0, 16.0, 17.0, 25.0, 18.0, 36.0, 30.0, 39.0, 35.0, 30.0, 44.0, 51.0, 55.0, 37.0, 58.0, 41.0, 57.0, 36.0, 33.0, 46.0, 32.0, 33.0, 23.0, 21.0, 18.0, 16.0, 17.0, 10.0, 13.0, 11.0, 6.0, 8.0, 2.0, 6.0, 1.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-13.3359375, -12.9610595703125, -12.586181640625, -12.2113037109375, -11.83642578125, -11.4615478515625, -11.086669921875, -10.7117919921875, -10.3369140625, -9.9620361328125, -9.587158203125, -9.2122802734375, -8.83740234375, -8.4625244140625, -8.087646484375, -7.7127685546875, -7.337890625, -6.9630126953125, -6.588134765625, -6.2132568359375, -5.83837890625, -5.4635009765625, -5.088623046875, -4.7137451171875, -4.3388671875, -3.9639892578125, -3.589111328125, -3.2142333984375, -2.83935546875, -2.4644775390625, -2.089599609375, -1.7147216796875, -1.33984375, -0.9649658203125, -0.590087890625, -0.2152099609375, 0.15966796875, 0.5345458984375, 0.909423828125, 1.2843017578125, 1.6591796875, 2.0340576171875, 2.408935546875, 2.7838134765625, 3.15869140625, 3.5335693359375, 3.908447265625, 4.2833251953125, 4.658203125, 5.0330810546875, 5.407958984375, 5.7828369140625, 6.15771484375, 6.5325927734375, 6.907470703125, 7.2823486328125, 7.6572265625, 8.0321044921875, 8.406982421875, 8.7818603515625, 9.15673828125, 9.5316162109375, 9.906494140625, 10.2813720703125, 10.65625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 11.0, 6.0, 12.0, 24.0, 29.0, 45.0, 57.0, 99.0, 188.0, 376.0, 781.0, 2478.0, 18574.0, 797596.0, 217309.0, 8045.0, 1612.0, 628.0, 263.0, 159.0, 90.0, 55.0, 36.0, 20.0, 12.0, 6.0, 4.0, 5.0, 2.0, 7.0, 4.0, 4.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.66015625, -7.41168212890625, -7.1632080078125, -6.91473388671875, -6.666259765625, -6.41778564453125, -6.1693115234375, -5.92083740234375, -5.67236328125, -5.42388916015625, -5.1754150390625, -4.92694091796875, -4.678466796875, -4.42999267578125, -4.1815185546875, -3.93304443359375, -3.6845703125, -3.43609619140625, -3.1876220703125, -2.93914794921875, -2.690673828125, -2.44219970703125, -2.1937255859375, -1.94525146484375, -1.69677734375, -1.44830322265625, -1.1998291015625, -0.95135498046875, -0.702880859375, -0.45440673828125, -0.2059326171875, 0.04254150390625, 0.291015625, 0.53948974609375, 0.7879638671875, 1.03643798828125, 1.284912109375, 1.53338623046875, 1.7818603515625, 2.03033447265625, 2.27880859375, 2.52728271484375, 2.7757568359375, 3.02423095703125, 3.272705078125, 3.52117919921875, 3.7696533203125, 4.01812744140625, 4.2666015625, 4.51507568359375, 4.7635498046875, 5.01202392578125, 5.260498046875, 5.50897216796875, 5.7574462890625, 6.00592041015625, 6.25439453125, 6.50286865234375, 6.7513427734375, 6.99981689453125, 7.248291015625, 7.49676513671875, 7.7452392578125, 7.99371337890625, 8.2421875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 7.0, 5.0, 11.0, 16.0, 13.0, 24.0, 35.0, 48.0, 48.0, 62.0, 81.0, 99.0, 116.0, 83.0, 83.0, 67.0, 54.0, 40.0, 39.0, 28.0, 11.0, 10.0, 5.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008020401000976562, -0.000781819224357605, -0.0007615983486175537, -0.0007413774728775024, -0.0007211565971374512, -0.0007009357213973999, -0.0006807148456573486, -0.0006604939699172974, -0.0006402730941772461, -0.0006200522184371948, -0.0005998313426971436, -0.0005796104669570923, -0.000559389591217041, -0.0005391687154769897, -0.0005189478397369385, -0.0004987269639968872, -0.00047850608825683594, -0.00045828521251678467, -0.0004380643367767334, -0.00041784346103668213, -0.00039762258529663086, -0.0003774017095565796, -0.0003571808338165283, -0.00033695995807647705, -0.0003167390823364258, -0.0002965182065963745, -0.00027629733085632324, -0.00025607645511627197, -0.0002358555793762207, -0.00021563470363616943, -0.00019541382789611816, -0.0001751929521560669, -0.00015497207641601562, -0.00013475120067596436, -0.00011453032493591309, -9.430944919586182e-05, -7.408857345581055e-05, -5.386769771575928e-05, -3.364682197570801e-05, -1.3425946235656738e-05, 6.794929504394531e-06, 2.70158052444458e-05, 4.723668098449707e-05, 6.745755672454834e-05, 8.767843246459961e-05, 0.00010789930820465088, 0.00012812018394470215, 0.00014834105968475342, 0.0001685619354248047, 0.00018878281116485596, 0.00020900368690490723, 0.0002292245626449585, 0.00024944543838500977, 0.00026966631412506104, 0.0002898871898651123, 0.0003101080656051636, 0.00033032894134521484, 0.0003505498170852661, 0.0003707706928253174, 0.00039099156856536865, 0.0004112124443054199, 0.0004314333200454712, 0.00045165419578552246, 0.00047187507152557373, 0.000492095947265625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 9.0, 15.0, 29.0, 30.0, 62.0, 116.0, 163.0, 386.0, 1010.0, 3463.0, 21982.0, 601215.0, 398751.0, 16866.0, 2796.0, 890.0, 383.0, 146.0, 77.0, 50.0, 33.0, 26.0, 6.0, 9.0, 6.0, 7.0, 1.0, 5.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0], "bins": [-9.0546875, -8.83880615234375, -8.6229248046875, -8.40704345703125, -8.191162109375, -7.97528076171875, -7.7593994140625, -7.54351806640625, -7.32763671875, -7.11175537109375, -6.8958740234375, -6.67999267578125, -6.464111328125, -6.24822998046875, -6.0323486328125, -5.81646728515625, -5.6005859375, -5.38470458984375, -5.1688232421875, -4.95294189453125, -4.737060546875, -4.52117919921875, -4.3052978515625, -4.08941650390625, -3.87353515625, -3.65765380859375, -3.4417724609375, -3.22589111328125, -3.010009765625, -2.79412841796875, -2.5782470703125, -2.36236572265625, -2.146484375, -1.93060302734375, -1.7147216796875, -1.49884033203125, -1.282958984375, -1.06707763671875, -0.8511962890625, -0.63531494140625, -0.41943359375, -0.20355224609375, 0.0123291015625, 0.22821044921875, 0.444091796875, 0.65997314453125, 0.8758544921875, 1.09173583984375, 1.3076171875, 1.52349853515625, 1.7393798828125, 1.95526123046875, 2.171142578125, 2.38702392578125, 2.6029052734375, 2.81878662109375, 3.03466796875, 3.25054931640625, 3.4664306640625, 3.68231201171875, 3.898193359375, 4.11407470703125, 4.3299560546875, 4.54583740234375, 4.76171875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 15.0, 23.0, 40.0, 70.0, 109.0, 158.0, 187.0, 139.0, 95.0, 66.0, 34.0, 11.0, 14.0, 11.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.7421875, -10.49493408203125, -10.2476806640625, -10.00042724609375, -9.753173828125, -9.50592041015625, -9.2586669921875, -9.01141357421875, -8.76416015625, -8.51690673828125, -8.2696533203125, -8.02239990234375, -7.775146484375, -7.52789306640625, -7.2806396484375, -7.03338623046875, -6.7861328125, -6.53887939453125, -6.2916259765625, -6.04437255859375, -5.797119140625, -5.54986572265625, -5.3026123046875, -5.05535888671875, -4.80810546875, -4.56085205078125, -4.3135986328125, -4.06634521484375, -3.819091796875, -3.57183837890625, -3.3245849609375, -3.07733154296875, -2.830078125, -2.58282470703125, -2.3355712890625, -2.08831787109375, -1.841064453125, -1.59381103515625, -1.3465576171875, -1.09930419921875, -0.85205078125, -0.60479736328125, -0.3575439453125, -0.11029052734375, 0.136962890625, 0.38421630859375, 0.6314697265625, 0.87872314453125, 1.1259765625, 1.37322998046875, 1.6204833984375, 1.86773681640625, 2.114990234375, 2.36224365234375, 2.6094970703125, 2.85675048828125, 3.10400390625, 3.35125732421875, 3.5985107421875, 3.84576416015625, 4.093017578125, 4.34027099609375, 4.5875244140625, 4.83477783203125, 5.08203125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 0.0, 3.0, 9.0, 19.0, 23.0, 48.0, 96.0, 174.0, 230.0, 188.0, 112.0, 58.0, 26.0, 10.0, 10.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.55062484741211, -42.87131118774414, -39.19200134277344, -35.51268768310547, -31.833375930786133, -28.154064178466797, -24.474750518798828, -20.795438766479492, -17.116127014160156, -13.43681526184082, -9.757502555847168, -6.078189849853516, -2.3988780975341797, 1.2804336547851562, 4.959747314453125, 8.639059066772461, 12.318370819091797, 15.997682571411133, 19.67699432373047, 23.356307983398438, 27.035619735717773, 30.71493148803711, 34.39424514770508, 38.07355499267578, 41.75286865234375, 45.43218231201172, 49.11149215698242, 52.79080581665039, 56.470115661621094, 60.14942932128906, 63.82874298095703, 67.508056640625, 71.18736267089844, 74.8666763305664, 78.54598999023438, 82.22529602050781, 85.90460968017578, 89.58392333984375, 93.26323699951172, 96.94255065917969, 100.62185668945312, 104.3011703491211, 107.98048400878906, 111.6597900390625, 115.33910369873047, 119.01841735839844, 122.6977310180664, 126.37704467773438, 130.05636596679688, 133.7356719970703, 137.4149932861328, 141.09429931640625, 144.77362060546875, 148.4529266357422, 152.13223266601562, 155.81155395507812, 159.49085998535156, 163.170166015625, 166.8494873046875, 170.52879333496094, 174.20811462402344, 177.88742065429688, 181.56674194335938, 185.2460479736328, 188.92535400390625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 12.0, 11.0, 12.0, 13.0, 19.0, 21.0, 32.0, 29.0, 48.0, 48.0, 49.0, 56.0, 48.0, 59.0, 55.0, 57.0, 58.0, 61.0, 51.0, 40.0, 33.0, 37.0, 33.0, 30.0, 19.0, 20.0, 8.0, 7.0, 6.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-60.157470703125, -57.98529815673828, -55.8131217956543, -53.64094924926758, -51.468772888183594, -49.296600341796875, -47.124427795410156, -44.95225524902344, -42.78007888793945, -40.607906341552734, -38.43572998046875, -36.26355743408203, -34.09138488769531, -31.919208526611328, -29.74703598022461, -27.574861526489258, -25.402687072753906, -23.230512619018555, -21.058338165283203, -18.886165618896484, -16.713991165161133, -14.541816711425781, -12.369643211364746, -10.197469711303711, -8.02529525756836, -5.853121280670166, -3.6809473037719727, -1.5087733268737793, 0.6634006500244141, 2.8355751037597656, 5.007748603820801, 7.179922103881836, 9.352096557617188, 11.524271011352539, 13.696444511413574, 15.86861801147461, 18.04079246520996, 20.212966918945312, 22.38513946533203, 24.557313919067383, 26.729488372802734, 28.901662826538086, 31.073837280273438, 33.246009826660156, 35.418182373046875, 37.59035873413086, 39.76253128051758, 41.93470764160156, 44.10688018798828, 46.279052734375, 48.451229095458984, 50.6234016418457, 52.79557800292969, 54.967750549316406, 57.139923095703125, 59.312095642089844, 61.48427200317383, 63.65644454956055, 65.82862091064453, 68.00079345703125, 70.17296600341797, 72.34513854980469, 74.51731872558594, 76.68949127197266, 78.86166381835938]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 9.0, 8.0, 7.0, 14.0, 23.0, 31.0, 44.0, 64.0, 122.0, 230.0, 520.0, 1415.0, 4756.0, 20186.0, 172647.0, 3870601.0, 102783.0, 14670.0, 3834.0, 1219.0, 501.0, 247.0, 121.0, 66.0, 48.0, 27.0, 25.0, 21.0, 17.0, 2.0, 7.0, 5.0, 1.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5390625, -7.2027587890625, -6.866455078125, -6.5301513671875, -6.19384765625, -5.8575439453125, -5.521240234375, -5.1849365234375, -4.8486328125, -4.5123291015625, -4.176025390625, -3.8397216796875, -3.50341796875, -3.1671142578125, -2.830810546875, -2.4945068359375, -2.158203125, -1.8218994140625, -1.485595703125, -1.1492919921875, -0.81298828125, -0.4766845703125, -0.140380859375, 0.1959228515625, 0.5322265625, 0.8685302734375, 1.204833984375, 1.5411376953125, 1.87744140625, 2.2137451171875, 2.550048828125, 2.8863525390625, 3.22265625, 3.5589599609375, 3.895263671875, 4.2315673828125, 4.56787109375, 4.9041748046875, 5.240478515625, 5.5767822265625, 5.9130859375, 6.2493896484375, 6.585693359375, 6.9219970703125, 7.25830078125, 7.5946044921875, 7.930908203125, 8.2672119140625, 8.603515625, 8.9398193359375, 9.276123046875, 9.6124267578125, 9.94873046875, 10.2850341796875, 10.621337890625, 10.9576416015625, 11.2939453125, 11.6302490234375, 11.966552734375, 12.3028564453125, 12.63916015625, 12.9754638671875, 13.311767578125, 13.6480712890625, 13.984375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 11.0, 19.0, 28.0, 51.0, 92.0, 95.0, 95.0, 110.0, 123.0, 103.0, 92.0, 69.0, 53.0, 28.0, 15.0, 8.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.884765625, -3.699371337890625, -3.51397705078125, -3.328582763671875, -3.1431884765625, -2.957794189453125, -2.77239990234375, -2.587005615234375, -2.401611328125, -2.216217041015625, -2.03082275390625, -1.845428466796875, -1.6600341796875, -1.474639892578125, -1.28924560546875, -1.103851318359375, -0.91845703125, -0.733062744140625, -0.54766845703125, -0.362274169921875, -0.1768798828125, 0.008514404296875, 0.19390869140625, 0.379302978515625, 0.564697265625, 0.750091552734375, 0.93548583984375, 1.120880126953125, 1.3062744140625, 1.491668701171875, 1.67706298828125, 1.862457275390625, 2.0478515625, 2.233245849609375, 2.41864013671875, 2.604034423828125, 2.7894287109375, 2.974822998046875, 3.16021728515625, 3.345611572265625, 3.531005859375, 3.716400146484375, 3.90179443359375, 4.087188720703125, 4.2725830078125, 4.457977294921875, 4.64337158203125, 4.828765869140625, 5.01416015625, 5.199554443359375, 5.38494873046875, 5.570343017578125, 5.7557373046875, 5.941131591796875, 6.12652587890625, 6.311920166015625, 6.497314453125, 6.682708740234375, 6.86810302734375, 7.053497314453125, 7.2388916015625, 7.424285888671875, 7.60968017578125, 7.795074462890625, 7.98046875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 4.0, 11.0, 8.0, 11.0, 24.0, 30.0, 42.0, 69.0, 147.0, 262.0, 459.0, 960.0, 2151.0, 6049.0, 20371.0, 95416.0, 3246476.0, 744294.0, 56254.0, 13537.0, 4277.0, 1710.0, 776.0, 360.0, 215.0, 124.0, 68.0, 50.0, 37.0, 24.0, 16.0, 9.0, 11.0, 7.0, 7.0, 3.0, 2.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4296875, -7.142333984375, -6.85498046875, -6.567626953125, -6.2802734375, -5.992919921875, -5.70556640625, -5.418212890625, -5.130859375, -4.843505859375, -4.55615234375, -4.268798828125, -3.9814453125, -3.694091796875, -3.40673828125, -3.119384765625, -2.83203125, -2.544677734375, -2.25732421875, -1.969970703125, -1.6826171875, -1.395263671875, -1.10791015625, -0.820556640625, -0.533203125, -0.245849609375, 0.04150390625, 0.328857421875, 0.6162109375, 0.903564453125, 1.19091796875, 1.478271484375, 1.765625, 2.052978515625, 2.34033203125, 2.627685546875, 2.9150390625, 3.202392578125, 3.48974609375, 3.777099609375, 4.064453125, 4.351806640625, 4.63916015625, 4.926513671875, 5.2138671875, 5.501220703125, 5.78857421875, 6.075927734375, 6.36328125, 6.650634765625, 6.93798828125, 7.225341796875, 7.5126953125, 7.800048828125, 8.08740234375, 8.374755859375, 8.662109375, 8.949462890625, 9.23681640625, 9.524169921875, 9.8115234375, 10.098876953125, 10.38623046875, 10.673583984375, 10.9609375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 2.0, 11.0, 8.0, 13.0, 14.0, 24.0, 37.0, 54.0, 77.0, 116.0, 247.0, 728.0, 1584.0, 650.0, 205.0, 111.0, 55.0, 42.0, 22.0, 20.0, 12.0, 8.0, 9.0, 8.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.98828125, -7.66168212890625, -7.3350830078125, -7.00848388671875, -6.681884765625, -6.35528564453125, -6.0286865234375, -5.70208740234375, -5.37548828125, -5.04888916015625, -4.7222900390625, -4.39569091796875, -4.069091796875, -3.74249267578125, -3.4158935546875, -3.08929443359375, -2.7626953125, -2.43609619140625, -2.1094970703125, -1.78289794921875, -1.456298828125, -1.12969970703125, -0.8031005859375, -0.47650146484375, -0.14990234375, 0.17669677734375, 0.5032958984375, 0.82989501953125, 1.156494140625, 1.48309326171875, 1.8096923828125, 2.13629150390625, 2.462890625, 2.78948974609375, 3.1160888671875, 3.44268798828125, 3.769287109375, 4.09588623046875, 4.4224853515625, 4.74908447265625, 5.07568359375, 5.40228271484375, 5.7288818359375, 6.05548095703125, 6.382080078125, 6.70867919921875, 7.0352783203125, 7.36187744140625, 7.6884765625, 8.01507568359375, 8.3416748046875, 8.66827392578125, 8.994873046875, 9.32147216796875, 9.6480712890625, 9.97467041015625, 10.30126953125, 10.62786865234375, 10.9544677734375, 11.28106689453125, 11.607666015625, 11.93426513671875, 12.2608642578125, 12.58746337890625, 12.9140625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 10.0, 7.0, 13.0, 28.0, 36.0, 90.0, 173.0, 237.0, 200.0, 107.0, 51.0, 27.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.2810287475586, -101.19893646240234, -98.11685180664062, -95.03475952148438, -91.95267486572266, -88.8705825805664, -85.78849792480469, -82.70640563964844, -79.62431335449219, -76.54222106933594, -73.46013641357422, -70.37804412841797, -67.29595947265625, -64.2138671875, -61.131778717041016, -58.04969024658203, -54.96760559082031, -51.88551712036133, -48.803428649902344, -45.721336364746094, -42.639251708984375, -39.557159423828125, -36.47507095336914, -33.392982482910156, -30.310894012451172, -27.228805541992188, -24.146717071533203, -21.064626693725586, -17.9825382232666, -14.900449752807617, -11.818359375, -8.736270904541016, -5.6541748046875, -2.5720858573913574, 0.5100030899047852, 3.592092514038086, 6.67418098449707, 9.756269454956055, 12.838359832763672, 15.920448303222656, 19.00253677368164, 22.084625244140625, 25.16671371459961, 28.248804092407227, 31.33089256286621, 34.41297912597656, 37.49507141113281, 40.5771598815918, 43.65924835205078, 46.741336822509766, 49.82342529296875, 52.905517578125, 55.98760223388672, 59.06969451904297, 62.15178298950195, 65.23387145996094, 68.31596374511719, 71.39805603027344, 74.48014068603516, 77.5622329711914, 80.64431762695312, 83.72640991210938, 86.80850219726562, 89.89058685302734, 92.97267150878906]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 1.0, 7.0, 5.0, 10.0, 11.0, 11.0, 11.0, 20.0, 31.0, 28.0, 36.0, 37.0, 55.0, 53.0, 53.0, 41.0, 59.0, 50.0, 56.0, 41.0, 45.0, 46.0, 47.0, 43.0, 38.0, 30.0, 23.0, 39.0, 22.0, 23.0, 12.0, 4.0, 6.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.659873962402344, -41.1981315612793, -39.736385345458984, -38.27464294433594, -36.812896728515625, -35.35115432739258, -33.889408111572266, -32.42766571044922, -30.965919494628906, -29.504175186157227, -28.042430877685547, -26.580686569213867, -25.118942260742188, -23.657197952270508, -22.195453643798828, -20.73371124267578, -19.2719669342041, -17.810222625732422, -16.348478317260742, -14.886734008789062, -13.424989700317383, -11.963245391845703, -10.50150203704834, -9.03975772857666, -7.5780134201049805, -6.116269111633301, -4.654524803161621, -3.1927809715270996, -1.73103666305542, -0.26929235458374023, 1.1924514770507812, 2.654195785522461, 4.115940093994141, 5.57768440246582, 7.0394287109375, 8.50117301940918, 9.96291732788086, 11.424661636352539, 12.886404991149902, 14.348149299621582, 15.809893608093262, 17.271636962890625, 18.733381271362305, 20.195125579833984, 21.656869888305664, 23.118614196777344, 24.580358505249023, 26.042102813720703, 27.503847122192383, 28.965591430664062, 30.427335739135742, 31.889080047607422, 33.35082244873047, 34.81256866455078, 36.27431106567383, 37.73605728149414, 39.19779968261719, 40.659542083740234, 42.12128829956055, 43.583030700683594, 45.044776916503906, 46.50651931762695, 47.968265533447266, 49.43000793457031, 50.891754150390625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 9.0, 6.0, 13.0, 12.0, 23.0, 28.0, 56.0, 84.0, 137.0, 232.0, 358.0, 645.0, 1200.0, 2365.0, 4960.0, 11105.0, 27430.0, 71735.0, 199896.0, 406447.0, 200985.0, 72188.0, 27349.0, 11045.0, 5026.0, 2391.0, 1236.0, 622.0, 388.0, 222.0, 129.0, 84.0, 47.0, 33.0, 30.0, 5.0, 9.0, 8.0, 5.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.96875, -5.79058837890625, -5.6124267578125, -5.43426513671875, -5.256103515625, -5.07794189453125, -4.8997802734375, -4.72161865234375, -4.54345703125, -4.36529541015625, -4.1871337890625, -4.00897216796875, -3.830810546875, -3.65264892578125, -3.4744873046875, -3.29632568359375, -3.1181640625, -2.94000244140625, -2.7618408203125, -2.58367919921875, -2.405517578125, -2.22735595703125, -2.0491943359375, -1.87103271484375, -1.69287109375, -1.51470947265625, -1.3365478515625, -1.15838623046875, -0.980224609375, -0.80206298828125, -0.6239013671875, -0.44573974609375, -0.267578125, -0.08941650390625, 0.0887451171875, 0.26690673828125, 0.445068359375, 0.62322998046875, 0.8013916015625, 0.97955322265625, 1.15771484375, 1.33587646484375, 1.5140380859375, 1.69219970703125, 1.870361328125, 2.04852294921875, 2.2266845703125, 2.40484619140625, 2.5830078125, 2.76116943359375, 2.9393310546875, 3.11749267578125, 3.295654296875, 3.47381591796875, 3.6519775390625, 3.83013916015625, 4.00830078125, 4.18646240234375, 4.3646240234375, 4.54278564453125, 4.720947265625, 4.89910888671875, 5.0772705078125, 5.25543212890625, 5.43359375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 16.0, 9.0, 14.0, 24.0, 23.0, 44.0, 25.0, 42.0, 47.0, 51.0, 71.0, 69.0, 66.0, 53.0, 58.0, 56.0, 62.0, 61.0, 41.0, 37.0, 29.0, 18.0, 22.0, 18.0, 9.0, 9.0, 7.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6796875, -2.5723876953125, -2.465087890625, -2.3577880859375, -2.25048828125, -2.1431884765625, -2.035888671875, -1.9285888671875, -1.8212890625, -1.7139892578125, -1.606689453125, -1.4993896484375, -1.39208984375, -1.2847900390625, -1.177490234375, -1.0701904296875, -0.962890625, -0.8555908203125, -0.748291015625, -0.6409912109375, -0.53369140625, -0.4263916015625, -0.319091796875, -0.2117919921875, -0.1044921875, 0.0028076171875, 0.110107421875, 0.2174072265625, 0.32470703125, 0.4320068359375, 0.539306640625, 0.6466064453125, 0.75390625, 0.8612060546875, 0.968505859375, 1.0758056640625, 1.18310546875, 1.2904052734375, 1.397705078125, 1.5050048828125, 1.6123046875, 1.7196044921875, 1.826904296875, 1.9342041015625, 2.04150390625, 2.1488037109375, 2.256103515625, 2.3634033203125, 2.470703125, 2.5780029296875, 2.685302734375, 2.7926025390625, 2.89990234375, 3.0072021484375, 3.114501953125, 3.2218017578125, 3.3291015625, 3.4364013671875, 3.543701171875, 3.6510009765625, 3.75830078125, 3.8656005859375, 3.972900390625, 4.0802001953125, 4.1875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 9.0, 7.0, 19.0, 22.0, 32.0, 37.0, 59.0, 86.0, 155.0, 242.0, 364.0, 649.0, 1190.0, 2459.0, 6882.0, 26061.0, 157826.0, 686275.0, 132465.0, 22858.0, 5983.0, 2241.0, 1082.0, 572.0, 353.0, 229.0, 124.0, 76.0, 54.0, 40.0, 28.0, 22.0, 11.0, 10.0, 6.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.78125, -9.4888916015625, -9.196533203125, -8.9041748046875, -8.61181640625, -8.3194580078125, -8.027099609375, -7.7347412109375, -7.4423828125, -7.1500244140625, -6.857666015625, -6.5653076171875, -6.27294921875, -5.9805908203125, -5.688232421875, -5.3958740234375, -5.103515625, -4.8111572265625, -4.518798828125, -4.2264404296875, -3.93408203125, -3.6417236328125, -3.349365234375, -3.0570068359375, -2.7646484375, -2.4722900390625, -2.179931640625, -1.8875732421875, -1.59521484375, -1.3028564453125, -1.010498046875, -0.7181396484375, -0.42578125, -0.1334228515625, 0.158935546875, 0.4512939453125, 0.74365234375, 1.0360107421875, 1.328369140625, 1.6207275390625, 1.9130859375, 2.2054443359375, 2.497802734375, 2.7901611328125, 3.08251953125, 3.3748779296875, 3.667236328125, 3.9595947265625, 4.251953125, 4.5443115234375, 4.836669921875, 5.1290283203125, 5.42138671875, 5.7137451171875, 6.006103515625, 6.2984619140625, 6.5908203125, 6.8831787109375, 7.175537109375, 7.4678955078125, 7.76025390625, 8.0526123046875, 8.344970703125, 8.6373291015625, 8.9296875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 2.0, 1.0, 5.0, 9.0, 11.0, 9.0, 14.0, 18.0, 20.0, 27.0, 29.0, 30.0, 23.0, 41.0, 45.0, 51.0, 58.0, 54.0, 52.0, 42.0, 55.0, 57.0, 55.0, 45.0, 38.0, 28.0, 38.0, 29.0, 19.0, 22.0, 11.0, 11.0, 15.0, 8.0, 13.0, 4.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.2723388671875, -9.880615234375, -9.4888916015625, -9.09716796875, -8.7054443359375, -8.313720703125, -7.9219970703125, -7.5302734375, -7.1385498046875, -6.746826171875, -6.3551025390625, -5.96337890625, -5.5716552734375, -5.179931640625, -4.7882080078125, -4.396484375, -4.0047607421875, -3.613037109375, -3.2213134765625, -2.82958984375, -2.4378662109375, -2.046142578125, -1.6544189453125, -1.2626953125, -0.8709716796875, -0.479248046875, -0.0875244140625, 0.30419921875, 0.6959228515625, 1.087646484375, 1.4793701171875, 1.87109375, 2.2628173828125, 2.654541015625, 3.0462646484375, 3.43798828125, 3.8297119140625, 4.221435546875, 4.6131591796875, 5.0048828125, 5.3966064453125, 5.788330078125, 6.1800537109375, 6.57177734375, 6.9635009765625, 7.355224609375, 7.7469482421875, 8.138671875, 8.5303955078125, 8.922119140625, 9.3138427734375, 9.70556640625, 10.0972900390625, 10.489013671875, 10.8807373046875, 11.2724609375, 11.6641845703125, 12.055908203125, 12.4476318359375, 12.83935546875, 13.2310791015625, 13.622802734375, 14.0145263671875, 14.40625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 3.0, 5.0, 12.0, 12.0, 22.0, 21.0, 38.0, 64.0, 101.0, 198.0, 350.0, 718.0, 2063.0, 7927.0, 57870.0, 780844.0, 176598.0, 16249.0, 3282.0, 1106.0, 490.0, 243.0, 120.0, 91.0, 34.0, 25.0, 19.0, 11.0, 10.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.12109375, -4.9776611328125, -4.834228515625, -4.6907958984375, -4.54736328125, -4.4039306640625, -4.260498046875, -4.1170654296875, -3.9736328125, -3.8302001953125, -3.686767578125, -3.5433349609375, -3.39990234375, -3.2564697265625, -3.113037109375, -2.9696044921875, -2.826171875, -2.6827392578125, -2.539306640625, -2.3958740234375, -2.25244140625, -2.1090087890625, -1.965576171875, -1.8221435546875, -1.6787109375, -1.5352783203125, -1.391845703125, -1.2484130859375, -1.10498046875, -0.9615478515625, -0.818115234375, -0.6746826171875, -0.53125, -0.3878173828125, -0.244384765625, -0.1009521484375, 0.04248046875, 0.1859130859375, 0.329345703125, 0.4727783203125, 0.6162109375, 0.7596435546875, 0.903076171875, 1.0465087890625, 1.18994140625, 1.3333740234375, 1.476806640625, 1.6202392578125, 1.763671875, 1.9071044921875, 2.050537109375, 2.1939697265625, 2.33740234375, 2.4808349609375, 2.624267578125, 2.7677001953125, 2.9111328125, 3.0545654296875, 3.197998046875, 3.3414306640625, 3.48486328125, 3.6282958984375, 3.771728515625, 3.9151611328125, 4.05859375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 3.0, 11.0, 3.0, 5.0, 7.0, 12.0, 13.0, 22.0, 27.0, 29.0, 42.0, 62.0, 66.0, 81.0, 94.0, 102.0, 85.0, 68.0, 56.0, 51.0, 32.0, 30.0, 23.0, 12.0, 11.0, 10.0, 12.0, 8.0, 7.0, 2.0, 1.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0006971359252929688, -0.0006788335740566254, -0.000660531222820282, -0.0006422288715839386, -0.0006239265203475952, -0.0006056241691112518, -0.0005873218178749084, -0.0005690194666385651, -0.0005507171154022217, -0.0005324147641658783, -0.0005141124129295349, -0.0004958100616931915, -0.00047750771045684814, -0.00045920535922050476, -0.0004409030079841614, -0.000422600656747818, -0.0004042983055114746, -0.0003859959542751312, -0.00036769360303878784, -0.00034939125180244446, -0.0003310889005661011, -0.0003127865493297577, -0.0002944841980934143, -0.0002761818468570709, -0.00025787949562072754, -0.00023957714438438416, -0.00022127479314804077, -0.0002029724419116974, -0.000184670090675354, -0.00016636773943901062, -0.00014806538820266724, -0.00012976303696632385, -0.00011146068572998047, -9.315833449363708e-05, -7.48559832572937e-05, -5.655363202095032e-05, -3.8251280784606934e-05, -1.994892954826355e-05, -1.646578311920166e-06, 1.6655772924423218e-05, 3.49581241607666e-05, 5.3260475397109985e-05, 7.156282663345337e-05, 8.986517786979675e-05, 0.00010816752910614014, 0.00012646988034248352, 0.0001447722315788269, 0.0001630745828151703, 0.00018137693405151367, 0.00019967928528785706, 0.00021798163652420044, 0.00023628398776054382, 0.0002545863389968872, 0.0002728886902332306, 0.000291191041469574, 0.00030949339270591736, 0.00032779574394226074, 0.0003460980951786041, 0.0003644004464149475, 0.0003827027976512909, 0.0004010051488876343, 0.00041930750012397766, 0.00043760985136032104, 0.00045591220259666443, 0.0004742145538330078]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 6.0, 3.0, 5.0, 7.0, 11.0, 15.0, 23.0, 33.0, 60.0, 128.0, 214.0, 406.0, 960.0, 2871.0, 12059.0, 101226.0, 804268.0, 108709.0, 12569.0, 2959.0, 1066.0, 422.0, 212.0, 131.0, 69.0, 44.0, 19.0, 17.0, 7.0, 9.0, 6.0, 6.0, 3.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.4796142578125, -4.345947265625, -4.2122802734375, -4.07861328125, -3.9449462890625, -3.811279296875, -3.6776123046875, -3.5439453125, -3.4102783203125, -3.276611328125, -3.1429443359375, -3.00927734375, -2.8756103515625, -2.741943359375, -2.6082763671875, -2.474609375, -2.3409423828125, -2.207275390625, -2.0736083984375, -1.93994140625, -1.8062744140625, -1.672607421875, -1.5389404296875, -1.4052734375, -1.2716064453125, -1.137939453125, -1.0042724609375, -0.87060546875, -0.7369384765625, -0.603271484375, -0.4696044921875, -0.3359375, -0.2022705078125, -0.068603515625, 0.0650634765625, 0.19873046875, 0.3323974609375, 0.466064453125, 0.5997314453125, 0.7333984375, 0.8670654296875, 1.000732421875, 1.1343994140625, 1.26806640625, 1.4017333984375, 1.535400390625, 1.6690673828125, 1.802734375, 1.9364013671875, 2.070068359375, 2.2037353515625, 2.33740234375, 2.4710693359375, 2.604736328125, 2.7384033203125, 2.8720703125, 3.0057373046875, 3.139404296875, 3.2730712890625, 3.40673828125, 3.5404052734375, 3.674072265625, 3.8077392578125, 3.94140625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 12.0, 8.0, 8.0, 5.0, 11.0, 25.0, 22.0, 29.0, 37.0, 50.0, 63.0, 67.0, 83.0, 99.0, 77.0, 67.0, 67.0, 64.0, 35.0, 37.0, 28.0, 22.0, 14.0, 20.0, 13.0, 10.0, 4.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.365234375, -3.251861572265625, -3.13848876953125, -3.025115966796875, -2.9117431640625, -2.798370361328125, -2.68499755859375, -2.571624755859375, -2.458251953125, -2.344879150390625, -2.23150634765625, -2.118133544921875, -2.0047607421875, -1.891387939453125, -1.77801513671875, -1.664642333984375, -1.55126953125, -1.437896728515625, -1.32452392578125, -1.211151123046875, -1.0977783203125, -0.984405517578125, -0.87103271484375, -0.757659912109375, -0.644287109375, -0.530914306640625, -0.41754150390625, -0.304168701171875, -0.1907958984375, -0.077423095703125, 0.03594970703125, 0.149322509765625, 0.2626953125, 0.376068115234375, 0.48944091796875, 0.602813720703125, 0.7161865234375, 0.829559326171875, 0.94293212890625, 1.056304931640625, 1.169677734375, 1.283050537109375, 1.39642333984375, 1.509796142578125, 1.6231689453125, 1.736541748046875, 1.84991455078125, 1.963287353515625, 2.07666015625, 2.190032958984375, 2.30340576171875, 2.416778564453125, 2.5301513671875, 2.643524169921875, 2.75689697265625, 2.870269775390625, 2.983642578125, 3.097015380859375, 3.21038818359375, 3.323760986328125, 3.4371337890625, 3.550506591796875, 3.66387939453125, 3.777252197265625, 3.890625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 10.0, 21.0, 59.0, 142.0, 294.0, 245.0, 134.0, 53.0, 19.0, 6.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.8255844116211, -77.13379669189453, -73.44200897216797, -69.7502212524414, -66.05843353271484, -62.36664581298828, -58.67485427856445, -54.98306655883789, -51.29127883911133, -47.599491119384766, -43.9077033996582, -40.215911865234375, -36.52412414550781, -32.83233642578125, -29.140548706054688, -25.448760986328125, -21.756973266601562, -18.065185546875, -14.373396873474121, -10.681608200073242, -6.98982048034668, -3.298032760620117, 0.3937568664550781, 4.085544586181641, 7.777332305908203, 11.469120025634766, 15.160908699035645, 18.852697372436523, 22.544485092163086, 26.23627281188965, 29.928062438964844, 33.619850158691406, 37.31163024902344, 41.00341796875, 44.69520568847656, 48.386993408203125, 52.07878112792969, 55.77056884765625, 59.46236038208008, 63.15414810180664, 66.84593200683594, 70.5377197265625, 74.22950744628906, 77.92129516601562, 81.61308288574219, 85.30487060546875, 88.99665832519531, 92.68844604492188, 96.38024139404297, 100.07202911376953, 103.7638168334961, 107.45560455322266, 111.14739227294922, 114.83917999267578, 118.53097534179688, 122.22276306152344, 125.91455078125, 129.60633850097656, 133.29812622070312, 136.9899139404297, 140.68170166015625, 144.3734893798828, 148.06527709960938, 151.75706481933594, 155.4488525390625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 6.0, 12.0, 13.0, 18.0, 15.0, 30.0, 39.0, 47.0, 45.0, 50.0, 67.0, 81.0, 95.0, 86.0, 69.0, 57.0, 56.0, 46.0, 28.0, 32.0, 26.0, 17.0, 18.0, 15.0, 11.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.80537414550781, -81.68424224853516, -79.56311798095703, -77.44198608398438, -75.32085418701172, -73.19972229003906, -71.07859802246094, -68.95746612548828, -66.83633422851562, -64.71520233154297, -62.59407424926758, -60.47294616699219, -58.35181427001953, -56.23068618774414, -54.10955810546875, -51.988426208496094, -49.86730194091797, -47.74617385864258, -45.62504196166992, -43.50391387939453, -41.382781982421875, -39.261653900146484, -37.140525817871094, -35.01939392089844, -32.89826583862305, -30.777135848999023, -28.656005859375, -26.53487777709961, -24.413747787475586, -22.292617797851562, -20.171489715576172, -18.05035972595215, -15.929237365722656, -13.808107376098633, -11.686978340148926, -9.565849304199219, -7.444719314575195, -5.323589324951172, -3.202460289001465, -1.0813312530517578, 1.0397987365722656, 3.160928249359131, 5.282057762145996, 7.403187274932861, 9.524316787719727, 11.64544677734375, 13.766575813293457, 15.887704849243164, 18.008834838867188, 20.12996482849121, 22.251094818115234, 24.372222900390625, 26.49335289001465, 28.614482879638672, 30.735610961914062, 32.85674285888672, 34.97787094116211, 37.0989990234375, 39.220130920410156, 41.34125900268555, 43.46238708496094, 45.583518981933594, 47.704647064208984, 49.825775146484375, 51.94690704345703]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 7.0, 9.0, 15.0, 15.0, 13.0, 27.0, 39.0, 62.0, 84.0, 154.0, 246.0, 533.0, 1909.0, 10233.0, 221264.0, 3922615.0, 31313.0, 4014.0, 988.0, 314.0, 166.0, 75.0, 45.0, 39.0, 24.0, 16.0, 11.0, 13.0, 4.0, 3.0, 5.0, 2.0, 3.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.90625, -11.468994140625, -11.03173828125, -10.594482421875, -10.1572265625, -9.719970703125, -9.28271484375, -8.845458984375, -8.408203125, -7.970947265625, -7.53369140625, -7.096435546875, -6.6591796875, -6.221923828125, -5.78466796875, -5.347412109375, -4.91015625, -4.472900390625, -4.03564453125, -3.598388671875, -3.1611328125, -2.723876953125, -2.28662109375, -1.849365234375, -1.412109375, -0.974853515625, -0.53759765625, -0.100341796875, 0.3369140625, 0.774169921875, 1.21142578125, 1.648681640625, 2.0859375, 2.523193359375, 2.96044921875, 3.397705078125, 3.8349609375, 4.272216796875, 4.70947265625, 5.146728515625, 5.583984375, 6.021240234375, 6.45849609375, 6.895751953125, 7.3330078125, 7.770263671875, 8.20751953125, 8.644775390625, 9.08203125, 9.519287109375, 9.95654296875, 10.393798828125, 10.8310546875, 11.268310546875, 11.70556640625, 12.142822265625, 12.580078125, 13.017333984375, 13.45458984375, 13.891845703125, 14.3291015625, 14.766357421875, 15.20361328125, 15.640869140625, 16.078125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 6.0, 18.0, 21.0, 35.0, 55.0, 68.0, 79.0, 105.0, 88.0, 88.0, 103.0, 93.0, 62.0, 54.0, 34.0, 43.0, 23.0, 13.0, 7.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.37109375, -7.21484375, -7.05859375, -6.90234375, -6.74609375, -6.58984375, -6.43359375, -6.27734375, -6.12109375, -5.96484375, -5.80859375, -5.65234375, -5.49609375, -5.33984375, -5.18359375, -5.02734375, -4.87109375, -4.71484375, -4.55859375, -4.40234375, -4.24609375, -4.08984375, -3.93359375, -3.77734375, -3.62109375, -3.46484375, -3.30859375, -3.15234375, -2.99609375, -2.83984375, -2.68359375, -2.52734375, -2.37109375, -2.21484375, -2.05859375, -1.90234375, -1.74609375, -1.58984375, -1.43359375, -1.27734375, -1.12109375, -0.96484375, -0.80859375, -0.65234375, -0.49609375, -0.33984375, -0.18359375, -0.02734375, 0.12890625, 0.28515625, 0.44140625, 0.59765625, 0.75390625, 0.91015625, 1.06640625, 1.22265625, 1.37890625, 1.53515625, 1.69140625, 1.84765625, 2.00390625, 2.16015625, 2.31640625, 2.47265625, 2.62890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 5.0, 9.0, 11.0, 16.0, 17.0, 36.0, 65.0, 114.0, 209.0, 421.0, 947.0, 1970.0, 4483.0, 11180.0, 30235.0, 116562.0, 2621217.0, 1282348.0, 85756.0, 23408.0, 8729.0, 3540.0, 1552.0, 708.0, 318.0, 182.0, 103.0, 38.0, 45.0, 20.0, 16.0, 12.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4453125, -5.2633056640625, -5.081298828125, -4.8992919921875, -4.71728515625, -4.5352783203125, -4.353271484375, -4.1712646484375, -3.9892578125, -3.8072509765625, -3.625244140625, -3.4432373046875, -3.26123046875, -3.0792236328125, -2.897216796875, -2.7152099609375, -2.533203125, -2.3511962890625, -2.169189453125, -1.9871826171875, -1.80517578125, -1.6231689453125, -1.441162109375, -1.2591552734375, -1.0771484375, -0.8951416015625, -0.713134765625, -0.5311279296875, -0.34912109375, -0.1671142578125, 0.014892578125, 0.1968994140625, 0.37890625, 0.5609130859375, 0.742919921875, 0.9249267578125, 1.10693359375, 1.2889404296875, 1.470947265625, 1.6529541015625, 1.8349609375, 2.0169677734375, 2.198974609375, 2.3809814453125, 2.56298828125, 2.7449951171875, 2.927001953125, 3.1090087890625, 3.291015625, 3.4730224609375, 3.655029296875, 3.8370361328125, 4.01904296875, 4.2010498046875, 4.383056640625, 4.5650634765625, 4.7470703125, 4.9290771484375, 5.111083984375, 5.2930908203125, 5.47509765625, 5.6571044921875, 5.839111328125, 6.0211181640625, 6.203125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 6.0, 5.0, 8.0, 4.0, 11.0, 21.0, 18.0, 22.0, 20.0, 50.0, 44.0, 77.0, 118.0, 212.0, 448.0, 999.0, 958.0, 449.0, 200.0, 154.0, 72.0, 50.0, 32.0, 17.0, 13.0, 5.0, 12.0, 5.0, 7.0, 5.0, 6.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.64453125, -5.46246337890625, -5.2803955078125, -5.09832763671875, -4.916259765625, -4.73419189453125, -4.5521240234375, -4.37005615234375, -4.18798828125, -4.00592041015625, -3.8238525390625, -3.64178466796875, -3.459716796875, -3.27764892578125, -3.0955810546875, -2.91351318359375, -2.7314453125, -2.54937744140625, -2.3673095703125, -2.18524169921875, -2.003173828125, -1.82110595703125, -1.6390380859375, -1.45697021484375, -1.27490234375, -1.09283447265625, -0.9107666015625, -0.72869873046875, -0.546630859375, -0.36456298828125, -0.1824951171875, -0.00042724609375, 0.181640625, 0.36370849609375, 0.5457763671875, 0.72784423828125, 0.909912109375, 1.09197998046875, 1.2740478515625, 1.45611572265625, 1.63818359375, 1.82025146484375, 2.0023193359375, 2.18438720703125, 2.366455078125, 2.54852294921875, 2.7305908203125, 2.91265869140625, 3.0947265625, 3.27679443359375, 3.4588623046875, 3.64093017578125, 3.822998046875, 4.00506591796875, 4.1871337890625, 4.36920166015625, 4.55126953125, 4.73333740234375, 4.9154052734375, 5.09747314453125, 5.279541015625, 5.46160888671875, 5.6436767578125, 5.82574462890625, 6.0078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 12.0, 7.0, 15.0, 50.0, 150.0, 276.0, 250.0, 161.0, 35.0, 15.0, 8.0, 2.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.70965576171875, -100.08948516845703, -97.46932220458984, -94.84915161132812, -92.22898864746094, -89.60881805419922, -86.9886474609375, -84.36848449707031, -81.7483139038086, -79.12814331054688, -76.50798034667969, -73.88780975341797, -71.26763916015625, -68.64747619628906, -66.02730560302734, -63.40713882446289, -60.78697204589844, -58.166805267333984, -55.54663848876953, -52.92646789550781, -50.30630111694336, -47.686134338378906, -45.06596374511719, -42.445796966552734, -39.82563018798828, -37.20546340942383, -34.585296630859375, -31.965126037597656, -29.344959259033203, -26.72479248046875, -24.104623794555664, -21.484455108642578, -18.864295959472656, -16.244129180908203, -13.623960494995117, -11.003792762756348, -8.383625030517578, -5.763457298278809, -3.143289566040039, -0.5231208801269531, 2.0970458984375, 4.7172136306762695, 7.337381362915039, 9.957549095153809, 12.577716827392578, 15.197884559631348, 17.818052291870117, 20.438220977783203, 23.058387756347656, 25.67855453491211, 28.298723220825195, 30.91889190673828, 33.539058685302734, 36.15922546386719, 38.779396057128906, 41.39956283569336, 44.01972961425781, 46.639896392822266, 49.26006317138672, 51.88023376464844, 54.50040054321289, 57.120567321777344, 59.74073791503906, 62.360904693603516, 64.98107147216797]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 6.0, 2.0, 7.0, 18.0, 15.0, 18.0, 23.0, 35.0, 48.0, 38.0, 54.0, 61.0, 61.0, 73.0, 65.0, 64.0, 55.0, 51.0, 60.0, 56.0, 42.0, 41.0, 22.0, 23.0, 22.0, 13.0, 12.0, 10.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.1634521484375, -44.91395568847656, -43.664459228515625, -42.41495895385742, -41.165462493896484, -39.91596603393555, -38.666465759277344, -37.416969299316406, -36.16747283935547, -34.91797637939453, -33.668479919433594, -32.41897964477539, -31.169483184814453, -29.919986724853516, -28.670488357543945, -27.420989990234375, -26.171493530273438, -24.9219970703125, -23.67249870300293, -22.42300033569336, -21.173503875732422, -19.924007415771484, -18.674509048461914, -17.425010681152344, -16.175514221191406, -14.926016807556152, -13.676519393920898, -12.427021980285645, -11.17752456665039, -9.928027153015137, -8.678529739379883, -7.429032325744629, -6.179534912109375, -4.930037498474121, -3.680540084838867, -2.4310426712036133, -1.1815452575683594, 0.06795215606689453, 1.3174495697021484, 2.5669469833374023, 3.8164443969726562, 5.06594181060791, 6.315439224243164, 7.564936637878418, 8.814434051513672, 10.063931465148926, 11.31342887878418, 12.562926292419434, 13.812423706054688, 15.061921119689941, 16.311418533325195, 17.560916900634766, 18.810413360595703, 20.05990982055664, 21.30940818786621, 22.55890655517578, 23.80840301513672, 25.057899475097656, 26.307397842407227, 27.556896209716797, 28.806392669677734, 30.055889129638672, 31.305387496948242, 32.55488586425781, 33.80438232421875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 6.0, 4.0, 7.0, 12.0, 20.0, 30.0, 34.0, 49.0, 98.0, 132.0, 221.0, 352.0, 651.0, 1063.0, 1959.0, 3707.0, 7069.0, 14741.0, 32462.0, 75728.0, 192327.0, 384120.0, 194358.0, 76276.0, 32673.0, 15038.0, 7057.0, 3727.0, 1965.0, 1078.0, 625.0, 361.0, 215.0, 140.0, 76.0, 46.0, 38.0, 33.0, 20.0, 12.0, 5.0, 8.0, 9.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.45703125, -4.30596923828125, -4.1549072265625, -4.00384521484375, -3.852783203125, -3.70172119140625, -3.5506591796875, -3.39959716796875, -3.24853515625, -3.09747314453125, -2.9464111328125, -2.79534912109375, -2.644287109375, -2.49322509765625, -2.3421630859375, -2.19110107421875, -2.0400390625, -1.88897705078125, -1.7379150390625, -1.58685302734375, -1.435791015625, -1.28472900390625, -1.1336669921875, -0.98260498046875, -0.83154296875, -0.68048095703125, -0.5294189453125, -0.37835693359375, -0.227294921875, -0.07623291015625, 0.0748291015625, 0.22589111328125, 0.376953125, 0.52801513671875, 0.6790771484375, 0.83013916015625, 0.981201171875, 1.13226318359375, 1.2833251953125, 1.43438720703125, 1.58544921875, 1.73651123046875, 1.8875732421875, 2.03863525390625, 2.189697265625, 2.34075927734375, 2.4918212890625, 2.64288330078125, 2.7939453125, 2.94500732421875, 3.0960693359375, 3.24713134765625, 3.398193359375, 3.54925537109375, 3.7003173828125, 3.85137939453125, 4.00244140625, 4.15350341796875, 4.3045654296875, 4.45562744140625, 4.606689453125, 4.75775146484375, 4.9088134765625, 5.05987548828125, 5.2109375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 12.0, 15.0, 18.0, 28.0, 28.0, 37.0, 42.0, 52.0, 53.0, 54.0, 50.0, 51.0, 62.0, 64.0, 49.0, 49.0, 61.0, 48.0, 28.0, 40.0, 31.0, 27.0, 26.0, 18.0, 11.0, 13.0, 3.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.16796875, -4.0679931640625, -3.968017578125, -3.8680419921875, -3.76806640625, -3.6680908203125, -3.568115234375, -3.4681396484375, -3.3681640625, -3.2681884765625, -3.168212890625, -3.0682373046875, -2.96826171875, -2.8682861328125, -2.768310546875, -2.6683349609375, -2.568359375, -2.4683837890625, -2.368408203125, -2.2684326171875, -2.16845703125, -2.0684814453125, -1.968505859375, -1.8685302734375, -1.7685546875, -1.6685791015625, -1.568603515625, -1.4686279296875, -1.36865234375, -1.2686767578125, -1.168701171875, -1.0687255859375, -0.96875, -0.8687744140625, -0.768798828125, -0.6688232421875, -0.56884765625, -0.4688720703125, -0.368896484375, -0.2689208984375, -0.1689453125, -0.0689697265625, 0.031005859375, 0.1309814453125, 0.23095703125, 0.3309326171875, 0.430908203125, 0.5308837890625, 0.630859375, 0.7308349609375, 0.830810546875, 0.9307861328125, 1.03076171875, 1.1307373046875, 1.230712890625, 1.3306884765625, 1.4306640625, 1.5306396484375, 1.630615234375, 1.7305908203125, 1.83056640625, 1.9305419921875, 2.030517578125, 2.1304931640625, 2.23046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 4.0, 4.0, 4.0, 8.0, 11.0, 13.0, 16.0, 30.0, 35.0, 73.0, 133.0, 223.0, 600.0, 1705.0, 6711.0, 46955.0, 683045.0, 278784.0, 23894.0, 4179.0, 1191.0, 487.0, 192.0, 114.0, 53.0, 36.0, 18.0, 7.0, 9.0, 6.0, 5.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-17.234375, -16.822509765625, -16.41064453125, -15.998779296875, -15.5869140625, -15.175048828125, -14.76318359375, -14.351318359375, -13.939453125, -13.527587890625, -13.11572265625, -12.703857421875, -12.2919921875, -11.880126953125, -11.46826171875, -11.056396484375, -10.64453125, -10.232666015625, -9.82080078125, -9.408935546875, -8.9970703125, -8.585205078125, -8.17333984375, -7.761474609375, -7.349609375, -6.937744140625, -6.52587890625, -6.114013671875, -5.7021484375, -5.290283203125, -4.87841796875, -4.466552734375, -4.0546875, -3.642822265625, -3.23095703125, -2.819091796875, -2.4072265625, -1.995361328125, -1.58349609375, -1.171630859375, -0.759765625, -0.347900390625, 0.06396484375, 0.475830078125, 0.8876953125, 1.299560546875, 1.71142578125, 2.123291015625, 2.53515625, 2.947021484375, 3.35888671875, 3.770751953125, 4.1826171875, 4.594482421875, 5.00634765625, 5.418212890625, 5.830078125, 6.241943359375, 6.65380859375, 7.065673828125, 7.4775390625, 7.889404296875, 8.30126953125, 8.713134765625, 9.125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 2.0, 4.0, 4.0, 3.0, 7.0, 9.0, 10.0, 13.0, 16.0, 15.0, 34.0, 27.0, 28.0, 37.0, 48.0, 32.0, 42.0, 48.0, 65.0, 55.0, 57.0, 56.0, 53.0, 40.0, 41.0, 25.0, 34.0, 33.0, 33.0, 29.0, 24.0, 14.0, 14.0, 7.0, 8.0, 4.0, 6.0, 4.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.609375, -10.2681884765625, -9.927001953125, -9.5858154296875, -9.24462890625, -8.9034423828125, -8.562255859375, -8.2210693359375, -7.8798828125, -7.5386962890625, -7.197509765625, -6.8563232421875, -6.51513671875, -6.1739501953125, -5.832763671875, -5.4915771484375, -5.150390625, -4.8092041015625, -4.468017578125, -4.1268310546875, -3.78564453125, -3.4444580078125, -3.103271484375, -2.7620849609375, -2.4208984375, -2.0797119140625, -1.738525390625, -1.3973388671875, -1.05615234375, -0.7149658203125, -0.373779296875, -0.0325927734375, 0.30859375, 0.6497802734375, 0.990966796875, 1.3321533203125, 1.67333984375, 2.0145263671875, 2.355712890625, 2.6968994140625, 3.0380859375, 3.3792724609375, 3.720458984375, 4.0616455078125, 4.40283203125, 4.7440185546875, 5.085205078125, 5.4263916015625, 5.767578125, 6.1087646484375, 6.449951171875, 6.7911376953125, 7.13232421875, 7.4735107421875, 7.814697265625, 8.1558837890625, 8.4970703125, 8.8382568359375, 9.179443359375, 9.5206298828125, 9.86181640625, 10.2030029296875, 10.544189453125, 10.8853759765625, 11.2265625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 14.0, 9.0, 24.0, 41.0, 50.0, 93.0, 181.0, 448.0, 1416.0, 8536.0, 724529.0, 304932.0, 6261.0, 1234.0, 393.0, 156.0, 85.0, 55.0, 32.0, 23.0, 12.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8125, -8.51806640625, -8.2236328125, -7.92919921875, -7.634765625, -7.34033203125, -7.0458984375, -6.75146484375, -6.45703125, -6.16259765625, -5.8681640625, -5.57373046875, -5.279296875, -4.98486328125, -4.6904296875, -4.39599609375, -4.1015625, -3.80712890625, -3.5126953125, -3.21826171875, -2.923828125, -2.62939453125, -2.3349609375, -2.04052734375, -1.74609375, -1.45166015625, -1.1572265625, -0.86279296875, -0.568359375, -0.27392578125, 0.0205078125, 0.31494140625, 0.609375, 0.90380859375, 1.1982421875, 1.49267578125, 1.787109375, 2.08154296875, 2.3759765625, 2.67041015625, 2.96484375, 3.25927734375, 3.5537109375, 3.84814453125, 4.142578125, 4.43701171875, 4.7314453125, 5.02587890625, 5.3203125, 5.61474609375, 5.9091796875, 6.20361328125, 6.498046875, 6.79248046875, 7.0869140625, 7.38134765625, 7.67578125, 7.97021484375, 8.2646484375, 8.55908203125, 8.853515625, 9.14794921875, 9.4423828125, 9.73681640625, 10.03125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 8.0, 9.0, 23.0, 44.0, 125.0, 304.0, 275.0, 127.0, 54.0, 23.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021839141845703125, -0.002117753028869629, -0.0020515918731689453, -0.0019854307174682617, -0.0019192695617675781, -0.0018531084060668945, -0.001786947250366211, -0.0017207860946655273, -0.0016546249389648438, -0.0015884637832641602, -0.0015223026275634766, -0.001456141471862793, -0.0013899803161621094, -0.0013238191604614258, -0.0012576580047607422, -0.0011914968490600586, -0.001125335693359375, -0.0010591745376586914, -0.0009930133819580078, -0.0009268522262573242, -0.0008606910705566406, -0.000794529914855957, -0.0007283687591552734, -0.0006622076034545898, -0.0005960464477539062, -0.0005298852920532227, -0.00046372413635253906, -0.00039756298065185547, -0.0003314018249511719, -0.0002652406692504883, -0.0001990795135498047, -0.0001329183578491211, -6.67572021484375e-05, -5.960464477539062e-07, 6.556510925292969e-05, 0.00013172626495361328, 0.00019788742065429688, 0.00026404857635498047, 0.00033020973205566406, 0.00039637088775634766, 0.00046253204345703125, 0.0005286931991577148, 0.0005948543548583984, 0.000661015510559082, 0.0007271766662597656, 0.0007933378219604492, 0.0008594989776611328, 0.0009256601333618164, 0.0009918212890625, 0.0010579824447631836, 0.0011241436004638672, 0.0011903047561645508, 0.0012564659118652344, 0.001322627067565918, 0.0013887882232666016, 0.0014549493789672852, 0.0015211105346679688, 0.0015872716903686523, 0.001653432846069336, 0.0017195940017700195, 0.0017857551574707031, 0.0018519163131713867, 0.0019180774688720703, 0.001984238624572754, 0.0020503997802734375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 9.0, 14.0, 23.0, 48.0, 104.0, 214.0, 610.0, 2685.0, 28948.0, 944713.0, 65908.0, 3969.0, 785.0, 268.0, 111.0, 62.0, 24.0, 24.0, 14.0, 7.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.59765625, -5.36053466796875, -5.1234130859375, -4.88629150390625, -4.649169921875, -4.41204833984375, -4.1749267578125, -3.93780517578125, -3.70068359375, -3.46356201171875, -3.2264404296875, -2.98931884765625, -2.752197265625, -2.51507568359375, -2.2779541015625, -2.04083251953125, -1.8037109375, -1.56658935546875, -1.3294677734375, -1.09234619140625, -0.855224609375, -0.61810302734375, -0.3809814453125, -0.14385986328125, 0.09326171875, 0.33038330078125, 0.5675048828125, 0.80462646484375, 1.041748046875, 1.27886962890625, 1.5159912109375, 1.75311279296875, 1.990234375, 2.22735595703125, 2.4644775390625, 2.70159912109375, 2.938720703125, 3.17584228515625, 3.4129638671875, 3.65008544921875, 3.88720703125, 4.12432861328125, 4.3614501953125, 4.59857177734375, 4.835693359375, 5.07281494140625, 5.3099365234375, 5.54705810546875, 5.7841796875, 6.02130126953125, 6.2584228515625, 6.49554443359375, 6.732666015625, 6.96978759765625, 7.2069091796875, 7.44403076171875, 7.68115234375, 7.91827392578125, 8.1553955078125, 8.39251708984375, 8.629638671875, 8.86676025390625, 9.1038818359375, 9.34100341796875, 9.578125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 6.0, 2.0, 2.0, 5.0, 10.0, 16.0, 25.0, 27.0, 64.0, 86.0, 144.0, 173.0, 155.0, 110.0, 74.0, 42.0, 26.0, 12.0, 8.0, 8.0, 1.0, 7.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.89453125, -7.704833984375, -7.51513671875, -7.325439453125, -7.1357421875, -6.946044921875, -6.75634765625, -6.566650390625, -6.376953125, -6.187255859375, -5.99755859375, -5.807861328125, -5.6181640625, -5.428466796875, -5.23876953125, -5.049072265625, -4.859375, -4.669677734375, -4.47998046875, -4.290283203125, -4.1005859375, -3.910888671875, -3.72119140625, -3.531494140625, -3.341796875, -3.152099609375, -2.96240234375, -2.772705078125, -2.5830078125, -2.393310546875, -2.20361328125, -2.013916015625, -1.82421875, -1.634521484375, -1.44482421875, -1.255126953125, -1.0654296875, -0.875732421875, -0.68603515625, -0.496337890625, -0.306640625, -0.116943359375, 0.07275390625, 0.262451171875, 0.4521484375, 0.641845703125, 0.83154296875, 1.021240234375, 1.2109375, 1.400634765625, 1.59033203125, 1.780029296875, 1.9697265625, 2.159423828125, 2.34912109375, 2.538818359375, 2.728515625, 2.918212890625, 3.10791015625, 3.297607421875, 3.4873046875, 3.677001953125, 3.86669921875, 4.056396484375, 4.24609375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 6.0, 7.0, 18.0, 35.0, 56.0, 131.0, 219.0, 209.0, 133.0, 74.0, 44.0, 34.0, 11.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.428253173828125, -54.912776947021484, -52.397300720214844, -49.8818244934082, -47.36634826660156, -44.85087203979492, -42.33539581298828, -39.81991958618164, -37.304443359375, -34.78896713256836, -32.27349090576172, -29.758014678955078, -27.242538452148438, -24.727062225341797, -22.211585998535156, -19.696109771728516, -17.180633544921875, -14.665157318115234, -12.149681091308594, -9.634204864501953, -7.1187286376953125, -4.603252410888672, -2.0877761840820312, 0.4277000427246094, 2.94317626953125, 5.458652496337891, 7.974128723144531, 10.489604949951172, 13.005081176757812, 15.520557403564453, 18.036033630371094, 20.551509857177734, 23.066986083984375, 25.582462310791016, 28.097938537597656, 30.613414764404297, 33.12889099121094, 35.64436721801758, 38.15984344482422, 40.67531967163086, 43.1907958984375, 45.70627212524414, 48.22174835205078, 50.73722457885742, 53.25270080566406, 55.7681770324707, 58.283653259277344, 60.799129486083984, 63.314605712890625, 65.830078125, 68.3455581665039, 70.86103820800781, 73.37651062011719, 75.89198303222656, 78.40746307373047, 80.92294311523438, 83.43841552734375, 85.95388793945312, 88.46936798095703, 90.98484802246094, 93.50032043457031, 96.01579284667969, 98.5312728881836, 101.0467529296875, 103.56222534179688]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 8.0, 5.0, 11.0, 6.0, 13.0, 15.0, 19.0, 22.0, 18.0, 28.0, 24.0, 32.0, 36.0, 29.0, 30.0, 38.0, 48.0, 43.0, 65.0, 51.0, 45.0, 43.0, 41.0, 41.0, 47.0, 36.0, 41.0, 22.0, 17.0, 14.0, 20.0, 13.0, 18.0, 10.0, 7.0, 6.0, 5.0, 6.0, 5.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-44.51716232299805, -43.176795959472656, -41.83642578125, -40.49605941772461, -39.15569305419922, -37.81532287597656, -36.47495651245117, -35.13459014892578, -33.794219970703125, -32.453853607177734, -31.113483428955078, -29.773117065429688, -28.432748794555664, -27.09238052368164, -25.75201416015625, -24.411645889282227, -23.071277618408203, -21.73090934753418, -20.390541076660156, -19.050174713134766, -17.709806442260742, -16.36943817138672, -15.029070854187012, -13.688703536987305, -12.348335266113281, -11.007966995239258, -9.66759967803955, -8.327232360839844, -6.98686408996582, -5.646496295928955, -4.30612850189209, -2.965761184692383, -1.625396728515625, -0.28502893447875977, 1.0553388595581055, 2.3957066535949707, 3.736074447631836, 5.076442241668701, 6.416810035705566, 7.757177352905273, 9.097545623779297, 10.43791389465332, 11.778281211853027, 13.118648529052734, 14.459016799926758, 15.799385070800781, 17.139751434326172, 18.480119705200195, 19.82048797607422, 21.160856246948242, 22.501224517822266, 23.841590881347656, 25.18195915222168, 26.522327423095703, 27.862693786621094, 29.203062057495117, 30.54343032836914, 31.883798599243164, 33.22416687011719, 34.56453323364258, 35.90489959716797, 37.245269775390625, 38.585636138916016, 39.926002502441406, 41.26637268066406]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 9.0, 7.0, 8.0, 17.0, 23.0, 31.0, 26.0, 72.0, 97.0, 137.0, 274.0, 542.0, 1373.0, 4228.0, 17865.0, 137991.0, 3441790.0, 541490.0, 37580.0, 7118.0, 2042.0, 765.0, 337.0, 168.0, 115.0, 62.0, 29.0, 23.0, 17.0, 7.0, 10.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.4765625, -7.2728271484375, -7.069091796875, -6.8653564453125, -6.66162109375, -6.4578857421875, -6.254150390625, -6.0504150390625, -5.8466796875, -5.6429443359375, -5.439208984375, -5.2354736328125, -5.03173828125, -4.8280029296875, -4.624267578125, -4.4205322265625, -4.216796875, -4.0130615234375, -3.809326171875, -3.6055908203125, -3.40185546875, -3.1981201171875, -2.994384765625, -2.7906494140625, -2.5869140625, -2.3831787109375, -2.179443359375, -1.9757080078125, -1.77197265625, -1.5682373046875, -1.364501953125, -1.1607666015625, -0.95703125, -0.7532958984375, -0.549560546875, -0.3458251953125, -0.14208984375, 0.0616455078125, 0.265380859375, 0.4691162109375, 0.6728515625, 0.8765869140625, 1.080322265625, 1.2840576171875, 1.48779296875, 1.6915283203125, 1.895263671875, 2.0989990234375, 2.302734375, 2.5064697265625, 2.710205078125, 2.9139404296875, 3.11767578125, 3.3214111328125, 3.525146484375, 3.7288818359375, 3.9326171875, 4.1363525390625, 4.340087890625, 4.5438232421875, 4.74755859375, 4.9512939453125, 5.155029296875, 5.3587646484375, 5.5625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 7.0, 10.0, 5.0, 13.0, 16.0, 17.0, 27.0, 33.0, 32.0, 31.0, 42.0, 34.0, 44.0, 48.0, 39.0, 41.0, 59.0, 49.0, 62.0, 46.0, 37.0, 50.0, 42.0, 42.0, 35.0, 14.0, 23.0, 16.0, 18.0, 13.0, 11.0, 16.0, 10.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.751953125, -2.6784210205078125, -2.604888916015625, -2.5313568115234375, -2.45782470703125, -2.3842926025390625, -2.310760498046875, -2.2372283935546875, -2.1636962890625, -2.0901641845703125, -2.016632080078125, -1.9430999755859375, -1.86956787109375, -1.7960357666015625, -1.722503662109375, -1.6489715576171875, -1.575439453125, -1.5019073486328125, -1.428375244140625, -1.3548431396484375, -1.28131103515625, -1.2077789306640625, -1.134246826171875, -1.0607147216796875, -0.9871826171875, -0.9136505126953125, -0.840118408203125, -0.7665863037109375, -0.69305419921875, -0.6195220947265625, -0.545989990234375, -0.4724578857421875, -0.39892578125, -0.3253936767578125, -0.251861572265625, -0.1783294677734375, -0.10479736328125, -0.0312652587890625, 0.042266845703125, 0.1157989501953125, 0.1893310546875, 0.2628631591796875, 0.336395263671875, 0.4099273681640625, 0.48345947265625, 0.5569915771484375, 0.630523681640625, 0.7040557861328125, 0.777587890625, 0.8511199951171875, 0.924652099609375, 0.9981842041015625, 1.07171630859375, 1.1452484130859375, 1.218780517578125, 1.2923126220703125, 1.3658447265625, 1.4393768310546875, 1.512908935546875, 1.5864410400390625, 1.65997314453125, 1.7335052490234375, 1.807037353515625, 1.8805694580078125, 1.9541015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 3.0, 12.0, 17.0, 30.0, 35.0, 53.0, 91.0, 170.0, 325.0, 622.0, 1508.0, 4054.0, 14799.0, 82807.0, 2314445.0, 1679478.0, 74498.0, 14643.0, 4132.0, 1430.0, 552.0, 256.0, 127.0, 77.0, 39.0, 24.0, 25.0, 9.0, 7.0, 0.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.49609375, -5.26678466796875, -5.0374755859375, -4.80816650390625, -4.578857421875, -4.34954833984375, -4.1202392578125, -3.89093017578125, -3.66162109375, -3.43231201171875, -3.2030029296875, -2.97369384765625, -2.744384765625, -2.51507568359375, -2.2857666015625, -2.05645751953125, -1.8271484375, -1.59783935546875, -1.3685302734375, -1.13922119140625, -0.909912109375, -0.68060302734375, -0.4512939453125, -0.22198486328125, 0.00732421875, 0.23663330078125, 0.4659423828125, 0.69525146484375, 0.924560546875, 1.15386962890625, 1.3831787109375, 1.61248779296875, 1.841796875, 2.07110595703125, 2.3004150390625, 2.52972412109375, 2.759033203125, 2.98834228515625, 3.2176513671875, 3.44696044921875, 3.67626953125, 3.90557861328125, 4.1348876953125, 4.36419677734375, 4.593505859375, 4.82281494140625, 5.0521240234375, 5.28143310546875, 5.5107421875, 5.74005126953125, 5.9693603515625, 6.19866943359375, 6.427978515625, 6.65728759765625, 6.8865966796875, 7.11590576171875, 7.34521484375, 7.57452392578125, 7.8038330078125, 8.03314208984375, 8.262451171875, 8.49176025390625, 8.7210693359375, 8.95037841796875, 9.1796875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 7.0, 10.0, 15.0, 16.0, 42.0, 43.0, 69.0, 89.0, 133.0, 245.0, 491.0, 1022.0, 889.0, 395.0, 184.0, 123.0, 83.0, 53.0, 40.0, 22.0, 20.0, 20.0, 13.0, 5.0, 12.0, 4.0, 3.0, 2.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.5078125, -8.28277587890625, -8.0577392578125, -7.83270263671875, -7.607666015625, -7.38262939453125, -7.1575927734375, -6.93255615234375, -6.70751953125, -6.48248291015625, -6.2574462890625, -6.03240966796875, -5.807373046875, -5.58233642578125, -5.3572998046875, -5.13226318359375, -4.9072265625, -4.68218994140625, -4.4571533203125, -4.23211669921875, -4.007080078125, -3.78204345703125, -3.5570068359375, -3.33197021484375, -3.10693359375, -2.88189697265625, -2.6568603515625, -2.43182373046875, -2.206787109375, -1.98175048828125, -1.7567138671875, -1.53167724609375, -1.306640625, -1.08160400390625, -0.8565673828125, -0.63153076171875, -0.406494140625, -0.18145751953125, 0.0435791015625, 0.26861572265625, 0.49365234375, 0.71868896484375, 0.9437255859375, 1.16876220703125, 1.393798828125, 1.61883544921875, 1.8438720703125, 2.06890869140625, 2.2939453125, 2.51898193359375, 2.7440185546875, 2.96905517578125, 3.194091796875, 3.41912841796875, 3.6441650390625, 3.86920166015625, 4.09423828125, 4.31927490234375, 4.5443115234375, 4.76934814453125, 4.994384765625, 5.21942138671875, 5.4444580078125, 5.66949462890625, 5.89453125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 15.0, 24.0, 82.0, 191.0, 330.0, 229.0, 75.0, 23.0, 12.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-117.02490997314453, -113.55226135253906, -110.0796127319336, -106.60696411132812, -103.13431549072266, -99.66166687011719, -96.18901824951172, -92.71636962890625, -89.24372100830078, -85.77107238769531, -82.29842376708984, -78.82577514648438, -75.3531265258789, -71.88047790527344, -68.40782928466797, -64.9351806640625, -61.462528228759766, -57.9898796081543, -54.51723098754883, -51.04458236694336, -47.57193374633789, -44.099281311035156, -40.62663269042969, -37.15398406982422, -33.68133544921875, -30.20868682861328, -26.736038208007812, -23.263389587402344, -19.790740966796875, -16.318090438842773, -12.845441818237305, -9.372793197631836, -5.900146484375, -2.427497625350952, 1.0451512336730957, 4.517800331115723, 7.990448951721191, 11.463098526000977, 14.935747146606445, 18.408395767211914, 21.881044387817383, 25.35369300842285, 28.82634162902832, 32.29899215698242, 35.77164077758789, 39.24428939819336, 42.71693801879883, 46.1895866394043, 49.662235260009766, 53.134883880615234, 56.6075325012207, 60.08018112182617, 63.55282974243164, 67.02548217773438, 70.49813079833984, 73.97077941894531, 77.44342803955078, 80.91607666015625, 84.38872528076172, 87.86137390136719, 91.33402252197266, 94.80667114257812, 98.2793197631836, 101.75196838378906, 105.22461700439453]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 2.0, 7.0, 10.0, 4.0, 4.0, 6.0, 7.0, 15.0, 13.0, 16.0, 25.0, 29.0, 37.0, 24.0, 41.0, 31.0, 57.0, 61.0, 56.0, 57.0, 50.0, 50.0, 47.0, 53.0, 38.0, 40.0, 36.0, 30.0, 30.0, 29.0, 14.0, 17.0, 18.0, 20.0, 9.0, 8.0, 3.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.60093688964844, -33.525184631347656, -32.449432373046875, -31.373676300048828, -30.297924041748047, -29.222171783447266, -28.14641761779785, -27.070663452148438, -25.994911193847656, -24.919158935546875, -23.84340476989746, -22.767650604248047, -21.691898345947266, -20.616146087646484, -19.54039192199707, -18.464637756347656, -17.388885498046875, -16.313133239746094, -15.23737907409668, -14.161625862121582, -13.085872650146484, -12.010119438171387, -10.934366226196289, -9.858613014221191, -8.782859802246094, -7.707106590270996, -6.631353378295898, -5.555600166320801, -4.479846954345703, -3.4040937423706055, -2.328340530395508, -1.2525873184204102, -0.1768341064453125, 0.8989191055297852, 1.9746723175048828, 3.0504255294799805, 4.126178741455078, 5.201931953430176, 6.277685165405273, 7.353438377380371, 8.429191589355469, 9.504944801330566, 10.580698013305664, 11.656451225280762, 12.73220443725586, 13.807957649230957, 14.883710861206055, 15.959464073181152, 17.03521728515625, 18.11096954345703, 19.186723709106445, 20.26247787475586, 21.33823013305664, 22.413982391357422, 23.489736557006836, 24.56549072265625, 25.64124298095703, 26.716995239257812, 27.792749404907227, 28.86850357055664, 29.944255828857422, 31.020008087158203, 32.09576416015625, 33.17151641845703, 34.24726867675781]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 8.0, 11.0, 11.0, 16.0, 31.0, 62.0, 65.0, 133.0, 265.0, 405.0, 903.0, 1924.0, 4605.0, 11090.0, 28385.0, 75346.0, 194819.0, 380616.0, 213410.0, 83325.0, 31603.0, 12332.0, 4955.0, 2147.0, 985.0, 500.0, 234.0, 128.0, 86.0, 60.0, 31.0, 19.0, 13.0, 15.0, 6.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8984375, -4.75244140625, -4.6064453125, -4.46044921875, -4.314453125, -4.16845703125, -4.0224609375, -3.87646484375, -3.73046875, -3.58447265625, -3.4384765625, -3.29248046875, -3.146484375, -3.00048828125, -2.8544921875, -2.70849609375, -2.5625, -2.41650390625, -2.2705078125, -2.12451171875, -1.978515625, -1.83251953125, -1.6865234375, -1.54052734375, -1.39453125, -1.24853515625, -1.1025390625, -0.95654296875, -0.810546875, -0.66455078125, -0.5185546875, -0.37255859375, -0.2265625, -0.08056640625, 0.0654296875, 0.21142578125, 0.357421875, 0.50341796875, 0.6494140625, 0.79541015625, 0.94140625, 1.08740234375, 1.2333984375, 1.37939453125, 1.525390625, 1.67138671875, 1.8173828125, 1.96337890625, 2.109375, 2.25537109375, 2.4013671875, 2.54736328125, 2.693359375, 2.83935546875, 2.9853515625, 3.13134765625, 3.27734375, 3.42333984375, 3.5693359375, 3.71533203125, 3.861328125, 4.00732421875, 4.1533203125, 4.29931640625, 4.4453125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 6.0, 4.0, 6.0, 12.0, 10.0, 14.0, 17.0, 20.0, 18.0, 28.0, 32.0, 32.0, 33.0, 40.0, 32.0, 41.0, 31.0, 40.0, 56.0, 43.0, 40.0, 36.0, 36.0, 33.0, 40.0, 41.0, 30.0, 26.0, 29.0, 19.0, 17.0, 26.0, 21.0, 20.0, 20.0, 17.0, 10.0, 8.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.361328125, -2.296875, -2.232421875, -2.16796875, -2.103515625, -2.0390625, -1.974609375, -1.91015625, -1.845703125, -1.78125, -1.716796875, -1.65234375, -1.587890625, -1.5234375, -1.458984375, -1.39453125, -1.330078125, -1.265625, -1.201171875, -1.13671875, -1.072265625, -1.0078125, -0.943359375, -0.87890625, -0.814453125, -0.75, -0.685546875, -0.62109375, -0.556640625, -0.4921875, -0.427734375, -0.36328125, -0.298828125, -0.234375, -0.169921875, -0.10546875, -0.041015625, 0.0234375, 0.087890625, 0.15234375, 0.216796875, 0.28125, 0.345703125, 0.41015625, 0.474609375, 0.5390625, 0.603515625, 0.66796875, 0.732421875, 0.796875, 0.861328125, 0.92578125, 0.990234375, 1.0546875, 1.119140625, 1.18359375, 1.248046875, 1.3125, 1.376953125, 1.44140625, 1.505859375, 1.5703125, 1.634765625, 1.69921875, 1.763671875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 3.0, 11.0, 14.0, 26.0, 28.0, 28.0, 49.0, 53.0, 75.0, 94.0, 126.0, 175.0, 223.0, 403.0, 586.0, 955.0, 1581.0, 3227.0, 9017.0, 35099.0, 190668.0, 647998.0, 120773.0, 24080.0, 6707.0, 2704.0, 1333.0, 812.0, 505.0, 359.0, 256.0, 158.0, 125.0, 82.0, 61.0, 47.0, 28.0, 24.0, 11.0, 9.0, 5.0, 6.0, 3.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.8203125, -6.59576416015625, -6.3712158203125, -6.14666748046875, -5.922119140625, -5.69757080078125, -5.4730224609375, -5.24847412109375, -5.02392578125, -4.79937744140625, -4.5748291015625, -4.35028076171875, -4.125732421875, -3.90118408203125, -3.6766357421875, -3.45208740234375, -3.2275390625, -3.00299072265625, -2.7784423828125, -2.55389404296875, -2.329345703125, -2.10479736328125, -1.8802490234375, -1.65570068359375, -1.43115234375, -1.20660400390625, -0.9820556640625, -0.75750732421875, -0.532958984375, -0.30841064453125, -0.0838623046875, 0.14068603515625, 0.365234375, 0.58978271484375, 0.8143310546875, 1.03887939453125, 1.263427734375, 1.48797607421875, 1.7125244140625, 1.93707275390625, 2.16162109375, 2.38616943359375, 2.6107177734375, 2.83526611328125, 3.059814453125, 3.28436279296875, 3.5089111328125, 3.73345947265625, 3.9580078125, 4.18255615234375, 4.4071044921875, 4.63165283203125, 4.856201171875, 5.08074951171875, 5.3052978515625, 5.52984619140625, 5.75439453125, 5.97894287109375, 6.2034912109375, 6.42803955078125, 6.652587890625, 6.87713623046875, 7.1016845703125, 7.32623291015625, 7.55078125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 7.0, 7.0, 14.0, 16.0, 12.0, 16.0, 15.0, 18.0, 32.0, 27.0, 30.0, 37.0, 34.0, 43.0, 52.0, 40.0, 31.0, 35.0, 46.0, 53.0, 46.0, 36.0, 44.0, 37.0, 35.0, 36.0, 15.0, 26.0, 26.0, 21.0, 13.0, 16.0, 16.0, 15.0, 13.0, 6.0, 3.0, 5.0, 9.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5390625, -9.2373046875, -8.935546875, -8.6337890625, -8.33203125, -8.0302734375, -7.728515625, -7.4267578125, -7.125, -6.8232421875, -6.521484375, -6.2197265625, -5.91796875, -5.6162109375, -5.314453125, -5.0126953125, -4.7109375, -4.4091796875, -4.107421875, -3.8056640625, -3.50390625, -3.2021484375, -2.900390625, -2.5986328125, -2.296875, -1.9951171875, -1.693359375, -1.3916015625, -1.08984375, -0.7880859375, -0.486328125, -0.1845703125, 0.1171875, 0.4189453125, 0.720703125, 1.0224609375, 1.32421875, 1.6259765625, 1.927734375, 2.2294921875, 2.53125, 2.8330078125, 3.134765625, 3.4365234375, 3.73828125, 4.0400390625, 4.341796875, 4.6435546875, 4.9453125, 5.2470703125, 5.548828125, 5.8505859375, 6.15234375, 6.4541015625, 6.755859375, 7.0576171875, 7.359375, 7.6611328125, 7.962890625, 8.2646484375, 8.56640625, 8.8681640625, 9.169921875, 9.4716796875, 9.7734375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 5.0, 4.0, 15.0, 11.0, 10.0, 13.0, 30.0, 45.0, 55.0, 63.0, 104.0, 187.0, 302.0, 550.0, 1152.0, 2484.0, 6705.0, 26663.0, 271036.0, 675863.0, 47316.0, 9557.0, 3270.0, 1471.0, 664.0, 358.0, 187.0, 143.0, 91.0, 46.0, 37.0, 17.0, 24.0, 16.0, 15.0, 13.0, 10.0, 10.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.525390625, -2.438751220703125, -2.35211181640625, -2.265472412109375, -2.1788330078125, -2.092193603515625, -2.00555419921875, -1.918914794921875, -1.832275390625, -1.745635986328125, -1.65899658203125, -1.572357177734375, -1.4857177734375, -1.399078369140625, -1.31243896484375, -1.225799560546875, -1.13916015625, -1.052520751953125, -0.96588134765625, -0.879241943359375, -0.7926025390625, -0.705963134765625, -0.61932373046875, -0.532684326171875, -0.446044921875, -0.359405517578125, -0.27276611328125, -0.186126708984375, -0.0994873046875, -0.012847900390625, 0.07379150390625, 0.160430908203125, 0.2470703125, 0.333709716796875, 0.42034912109375, 0.506988525390625, 0.5936279296875, 0.680267333984375, 0.76690673828125, 0.853546142578125, 0.940185546875, 1.026824951171875, 1.11346435546875, 1.200103759765625, 1.2867431640625, 1.373382568359375, 1.46002197265625, 1.546661376953125, 1.63330078125, 1.719940185546875, 1.80657958984375, 1.893218994140625, 1.9798583984375, 2.066497802734375, 2.15313720703125, 2.239776611328125, 2.326416015625, 2.413055419921875, 2.49969482421875, 2.586334228515625, 2.6729736328125, 2.759613037109375, 2.84625244140625, 2.932891845703125, 3.01953125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 6.0, 4.0, 7.0, 10.0, 5.0, 21.0, 29.0, 68.0, 76.0, 137.0, 199.0, 140.0, 99.0, 60.0, 43.0, 20.0, 20.0, 11.0, 15.0, 2.0, 10.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009512901306152344, -0.0009212866425514221, -0.0008912831544876099, -0.0008612796664237976, -0.0008312761783599854, -0.0008012726902961731, -0.0007712692022323608, -0.0007412657141685486, -0.0007112622261047363, -0.0006812587380409241, -0.0006512552499771118, -0.0006212517619132996, -0.0005912482738494873, -0.000561244785785675, -0.0005312412977218628, -0.0005012378096580505, -0.0004712343215942383, -0.000441230833530426, -0.00041122734546661377, -0.0003812238574028015, -0.00035122036933898926, -0.000321216881275177, -0.00029121339321136475, -0.0002612099051475525, -0.00023120641708374023, -0.00020120292901992798, -0.00017119944095611572, -0.00014119595289230347, -0.00011119246482849121, -8.118897676467896e-05, -5.11854887008667e-05, -2.1182000637054443e-05, 8.821487426757812e-06, 3.882497549057007e-05, 6.882846355438232e-05, 9.883195161819458e-05, 0.00012883543968200684, 0.0001588389277458191, 0.00018884241580963135, 0.0002188459038734436, 0.00024884939193725586, 0.0002788528800010681, 0.00030885636806488037, 0.0003388598561286926, 0.0003688633441925049, 0.00039886683225631714, 0.0004288703203201294, 0.00045887380838394165, 0.0004888772964477539, 0.0005188807845115662, 0.0005488842725753784, 0.0005788877606391907, 0.0006088912487030029, 0.0006388947367668152, 0.0006688982248306274, 0.0006989017128944397, 0.000728905200958252, 0.0007589086890220642, 0.0007889121770858765, 0.0008189156651496887, 0.000848919153213501, 0.0008789226412773132, 0.0009089261293411255, 0.0009389296174049377, 0.00096893310546875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 9.0, 8.0, 14.0, 18.0, 28.0, 63.0, 98.0, 158.0, 339.0, 895.0, 2470.0, 11107.0, 141754.0, 847102.0, 36272.0, 5434.0, 1583.0, 605.0, 280.0, 140.0, 69.0, 48.0, 25.0, 17.0, 9.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.5390625, -4.420501708984375, -4.30194091796875, -4.183380126953125, -4.0648193359375, -3.946258544921875, -3.82769775390625, -3.709136962890625, -3.590576171875, -3.472015380859375, -3.35345458984375, -3.234893798828125, -3.1163330078125, -2.997772216796875, -2.87921142578125, -2.760650634765625, -2.64208984375, -2.523529052734375, -2.40496826171875, -2.286407470703125, -2.1678466796875, -2.049285888671875, -1.93072509765625, -1.812164306640625, -1.693603515625, -1.575042724609375, -1.45648193359375, -1.337921142578125, -1.2193603515625, -1.100799560546875, -0.98223876953125, -0.863677978515625, -0.7451171875, -0.626556396484375, -0.50799560546875, -0.389434814453125, -0.2708740234375, -0.152313232421875, -0.03375244140625, 0.084808349609375, 0.203369140625, 0.321929931640625, 0.44049072265625, 0.559051513671875, 0.6776123046875, 0.796173095703125, 0.91473388671875, 1.033294677734375, 1.15185546875, 1.270416259765625, 1.38897705078125, 1.507537841796875, 1.6260986328125, 1.744659423828125, 1.86322021484375, 1.981781005859375, 2.100341796875, 2.218902587890625, 2.33746337890625, 2.456024169921875, 2.5745849609375, 2.693145751953125, 2.81170654296875, 2.930267333984375, 3.048828125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 12.0, 11.0, 8.0, 14.0, 20.0, 43.0, 45.0, 51.0, 62.0, 63.0, 92.0, 89.0, 92.0, 72.0, 49.0, 56.0, 42.0, 37.0, 36.0, 19.0, 17.0, 15.0, 6.0, 5.0, 5.0, 4.0, 0.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03125, -1.96014404296875, -1.8890380859375, -1.81793212890625, -1.746826171875, -1.67572021484375, -1.6046142578125, -1.53350830078125, -1.46240234375, -1.39129638671875, -1.3201904296875, -1.24908447265625, -1.177978515625, -1.10687255859375, -1.0357666015625, -0.96466064453125, -0.8935546875, -0.82244873046875, -0.7513427734375, -0.68023681640625, -0.609130859375, -0.53802490234375, -0.4669189453125, -0.39581298828125, -0.32470703125, -0.25360107421875, -0.1824951171875, -0.11138916015625, -0.040283203125, 0.03082275390625, 0.1019287109375, 0.17303466796875, 0.244140625, 0.31524658203125, 0.3863525390625, 0.45745849609375, 0.528564453125, 0.59967041015625, 0.6707763671875, 0.74188232421875, 0.81298828125, 0.88409423828125, 0.9552001953125, 1.02630615234375, 1.097412109375, 1.16851806640625, 1.2396240234375, 1.31072998046875, 1.3818359375, 1.45294189453125, 1.5240478515625, 1.59515380859375, 1.666259765625, 1.73736572265625, 1.8084716796875, 1.87957763671875, 1.95068359375, 2.02178955078125, 2.0928955078125, 2.16400146484375, 2.235107421875, 2.30621337890625, 2.3773193359375, 2.44842529296875, 2.51953125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 7.0, 16.0, 33.0, 41.0, 77.0, 113.0, 180.0, 171.0, 130.0, 93.0, 45.0, 27.0, 18.0, 10.0, 6.0, 7.0, 3.0, 2.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-51.031551361083984, -49.385169982910156, -47.73878860473633, -46.0924072265625, -44.446022033691406, -42.79964065551758, -41.15325927734375, -39.50687789916992, -37.860496520996094, -36.214115142822266, -34.56773376464844, -32.921348571777344, -31.27496910095215, -29.628585815429688, -27.98220443725586, -26.33582305908203, -24.68943977355957, -23.043058395385742, -21.39667510986328, -19.750293731689453, -18.103912353515625, -16.457530975341797, -14.811147689819336, -13.164766311645508, -11.518383979797363, -9.872001647949219, -8.22562026977539, -6.579237937927246, -4.93285608291626, -3.2864742279052734, -1.640091896057129, 0.006289482116699219, 1.6526718139648438, 3.29905366897583, 4.945435523986816, 6.591817855834961, 8.238199234008789, 9.884581565856934, 11.530963897705078, 13.177345275878906, 14.82372760772705, 16.470109939575195, 18.116491317749023, 19.762874603271484, 21.409255981445312, 23.05563735961914, 24.70201873779297, 26.348400115966797, 27.994783401489258, 29.641164779663086, 31.287548065185547, 32.933929443359375, 34.5803108215332, 36.22669219970703, 37.873077392578125, 39.51945495605469, 41.16584014892578, 42.81222152709961, 44.45860290527344, 46.10498809814453, 47.75136947631836, 49.39775085449219, 51.044132232666016, 52.690513610839844, 54.33689498901367]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 11.0, 11.0, 3.0, 7.0, 13.0, 10.0, 15.0, 19.0, 23.0, 27.0, 19.0, 28.0, 26.0, 33.0, 33.0, 29.0, 38.0, 44.0, 62.0, 74.0, 72.0, 48.0, 41.0, 34.0, 32.0, 30.0, 40.0, 24.0, 26.0, 16.0, 13.0, 26.0, 11.0, 8.0, 8.0, 8.0, 7.0, 6.0, 10.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.02223205566406, -32.83033752441406, -31.638442993164062, -30.44654655456543, -29.25465202331543, -28.06275749206543, -26.870861053466797, -25.678966522216797, -24.487071990966797, -23.295177459716797, -22.103282928466797, -20.911386489868164, -19.719491958618164, -18.527597427368164, -17.33570098876953, -16.14380645751953, -14.951911926269531, -13.760017395019531, -12.568121910095215, -11.376226425170898, -10.184331893920898, -8.992437362670898, -7.800541877746582, -6.608646392822266, -5.416751861572266, -4.224856853485107, -3.032961845397949, -1.841066837310791, -0.6491718292236328, 0.5427231788635254, 1.7346181869506836, 2.926513671875, 4.118404388427734, 5.310299396514893, 6.502194404602051, 7.694089412689209, 8.885984420776367, 10.077878952026367, 11.269774436950684, 12.461669921875, 13.653564453125, 14.845458984375, 16.037353515625, 17.229249954223633, 18.421144485473633, 19.613039016723633, 20.804935455322266, 21.996829986572266, 23.188724517822266, 24.380619049072266, 25.572513580322266, 26.7644100189209, 27.9563045501709, 29.1481990814209, 30.34009552001953, 31.53199005126953, 32.72388458251953, 33.91577911376953, 35.10767364501953, 36.29956817626953, 37.49146270751953, 38.6833610534668, 39.8752555847168, 41.0671501159668, 42.2590446472168]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 2.0, 5.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 9.0, 8.0, 12.0, 17.0, 16.0, 27.0, 46.0, 51.0, 80.0, 171.0, 314.0, 609.0, 1525.0, 3810.0, 11193.0, 43563.0, 391369.0, 3148358.0, 518841.0, 52754.0, 13908.0, 4459.0, 1670.0, 735.0, 315.0, 172.0, 90.0, 53.0, 28.0, 19.0, 13.0, 7.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.06640625, -4.94146728515625, -4.8165283203125, -4.69158935546875, -4.566650390625, -4.44171142578125, -4.3167724609375, -4.19183349609375, -4.06689453125, -3.94195556640625, -3.8170166015625, -3.69207763671875, -3.567138671875, -3.44219970703125, -3.3172607421875, -3.19232177734375, -3.0673828125, -2.94244384765625, -2.8175048828125, -2.69256591796875, -2.567626953125, -2.44268798828125, -2.3177490234375, -2.19281005859375, -2.06787109375, -1.94293212890625, -1.8179931640625, -1.69305419921875, -1.568115234375, -1.44317626953125, -1.3182373046875, -1.19329833984375, -1.068359375, -0.94342041015625, -0.8184814453125, -0.69354248046875, -0.568603515625, -0.44366455078125, -0.3187255859375, -0.19378662109375, -0.06884765625, 0.05609130859375, 0.1810302734375, 0.30596923828125, 0.430908203125, 0.55584716796875, 0.6807861328125, 0.80572509765625, 0.9306640625, 1.05560302734375, 1.1805419921875, 1.30548095703125, 1.430419921875, 1.55535888671875, 1.6802978515625, 1.80523681640625, 1.93017578125, 2.05511474609375, 2.1800537109375, 2.30499267578125, 2.429931640625, 2.55487060546875, 2.6798095703125, 2.80474853515625, 2.9296875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 8.0, 6.0, 11.0, 16.0, 21.0, 23.0, 29.0, 49.0, 56.0, 50.0, 51.0, 62.0, 70.0, 78.0, 53.0, 61.0, 71.0, 56.0, 59.0, 57.0, 20.0, 24.0, 27.0, 11.0, 12.0, 13.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.34375, -4.2392578125, -4.134765625, -4.0302734375, -3.92578125, -3.8212890625, -3.716796875, -3.6123046875, -3.5078125, -3.4033203125, -3.298828125, -3.1943359375, -3.08984375, -2.9853515625, -2.880859375, -2.7763671875, -2.671875, -2.5673828125, -2.462890625, -2.3583984375, -2.25390625, -2.1494140625, -2.044921875, -1.9404296875, -1.8359375, -1.7314453125, -1.626953125, -1.5224609375, -1.41796875, -1.3134765625, -1.208984375, -1.1044921875, -1.0, -0.8955078125, -0.791015625, -0.6865234375, -0.58203125, -0.4775390625, -0.373046875, -0.2685546875, -0.1640625, -0.0595703125, 0.044921875, 0.1494140625, 0.25390625, 0.3583984375, 0.462890625, 0.5673828125, 0.671875, 0.7763671875, 0.880859375, 0.9853515625, 1.08984375, 1.1943359375, 1.298828125, 1.4033203125, 1.5078125, 1.6123046875, 1.716796875, 1.8212890625, 1.92578125, 2.0302734375, 2.134765625, 2.2392578125, 2.34375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 6.0, 14.0, 13.0, 24.0, 39.0, 52.0, 77.0, 90.0, 186.0, 305.0, 723.0, 2132.0, 10438.0, 100929.0, 3781255.0, 272394.0, 19792.0, 3887.0, 1120.0, 467.0, 154.0, 86.0, 51.0, 25.0, 8.0, 8.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3125, -8.0498046875, -7.787109375, -7.5244140625, -7.26171875, -6.9990234375, -6.736328125, -6.4736328125, -6.2109375, -5.9482421875, -5.685546875, -5.4228515625, -5.16015625, -4.8974609375, -4.634765625, -4.3720703125, -4.109375, -3.8466796875, -3.583984375, -3.3212890625, -3.05859375, -2.7958984375, -2.533203125, -2.2705078125, -2.0078125, -1.7451171875, -1.482421875, -1.2197265625, -0.95703125, -0.6943359375, -0.431640625, -0.1689453125, 0.09375, 0.3564453125, 0.619140625, 0.8818359375, 1.14453125, 1.4072265625, 1.669921875, 1.9326171875, 2.1953125, 2.4580078125, 2.720703125, 2.9833984375, 3.24609375, 3.5087890625, 3.771484375, 4.0341796875, 4.296875, 4.5595703125, 4.822265625, 5.0849609375, 5.34765625, 5.6103515625, 5.873046875, 6.1357421875, 6.3984375, 6.6611328125, 6.923828125, 7.1865234375, 7.44921875, 7.7119140625, 7.974609375, 8.2373046875, 8.5]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 12.0, 20.0, 27.0, 42.0, 67.0, 132.0, 273.0, 735.0, 1298.0, 746.0, 347.0, 141.0, 78.0, 43.0, 45.0, 19.0, 9.0, 10.0, 9.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.8046875, -10.544677734375, -10.28466796875, -10.024658203125, -9.7646484375, -9.504638671875, -9.24462890625, -8.984619140625, -8.724609375, -8.464599609375, -8.20458984375, -7.944580078125, -7.6845703125, -7.424560546875, -7.16455078125, -6.904541015625, -6.64453125, -6.384521484375, -6.12451171875, -5.864501953125, -5.6044921875, -5.344482421875, -5.08447265625, -4.824462890625, -4.564453125, -4.304443359375, -4.04443359375, -3.784423828125, -3.5244140625, -3.264404296875, -3.00439453125, -2.744384765625, -2.484375, -2.224365234375, -1.96435546875, -1.704345703125, -1.4443359375, -1.184326171875, -0.92431640625, -0.664306640625, -0.404296875, -0.144287109375, 0.11572265625, 0.375732421875, 0.6357421875, 0.895751953125, 1.15576171875, 1.415771484375, 1.67578125, 1.935791015625, 2.19580078125, 2.455810546875, 2.7158203125, 2.975830078125, 3.23583984375, 3.495849609375, 3.755859375, 4.015869140625, 4.27587890625, 4.535888671875, 4.7958984375, 5.055908203125, 5.31591796875, 5.575927734375, 5.8359375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 10.0, 22.0, 55.0, 128.0, 275.0, 249.0, 129.0, 70.0, 25.0, 13.0, 8.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.22256469726562, -69.8890151977539, -67.55547332763672, -65.221923828125, -62.88837814331055, -60.554832458496094, -58.221282958984375, -55.88773727416992, -53.55419158935547, -51.220645904541016, -48.88710021972656, -46.553550720214844, -44.22000503540039, -41.88645935058594, -39.55290985107422, -37.219364166259766, -34.88581848144531, -32.55227279663086, -30.218725204467773, -27.885177612304688, -25.551631927490234, -23.21808624267578, -20.884538650512695, -18.55099105834961, -16.217445373535156, -13.883898735046387, -11.550352096557617, -9.216805458068848, -6.883258819580078, -4.549712181091309, -2.216165542602539, 0.11738204956054688, 2.450927734375, 4.7844743728637695, 7.118021011352539, 9.451567649841309, 11.785114288330078, 14.118660926818848, 16.452207565307617, 18.785755157470703, 21.119300842285156, 23.45284652709961, 25.786394119262695, 28.11994171142578, 30.453487396240234, 32.78703308105469, 35.120582580566406, 37.45412826538086, 39.78767395019531, 42.121219635009766, 44.45476531982422, 46.78831481933594, 49.12186050415039, 51.455406188964844, 53.78895568847656, 56.122501373291016, 58.45604705810547, 60.78959274291992, 63.123138427734375, 65.4566879272461, 67.79023742675781, 70.123779296875, 72.45732879638672, 74.79087829589844, 77.12442016601562]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 6.0, 6.0, 10.0, 9.0, 9.0, 20.0, 13.0, 16.0, 27.0, 24.0, 30.0, 24.0, 38.0, 53.0, 39.0, 42.0, 48.0, 57.0, 67.0, 51.0, 45.0, 46.0, 54.0, 37.0, 33.0, 30.0, 32.0, 27.0, 24.0, 17.0, 15.0, 19.0, 10.0, 7.0, 4.0, 5.0, 5.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.07762908935547, -30.16109275817871, -29.24455451965332, -28.328018188476562, -27.411479949951172, -26.494943618774414, -25.578407287597656, -24.661869049072266, -23.745330810546875, -22.828794479370117, -21.912256240844727, -20.99571990966797, -20.079181671142578, -19.16264533996582, -18.246109008789062, -17.329570770263672, -16.413034439086914, -15.49649715423584, -14.579959869384766, -13.663423538208008, -12.746885299682617, -11.83034896850586, -10.913811683654785, -9.997274398803711, -9.080737113952637, -8.164199829101562, -7.247662544250488, -6.331125736236572, -5.414588451385498, -4.498051166534424, -3.581514358520508, -2.6649770736694336, -1.7484397888183594, -0.8319026231765747, 0.08463454246520996, 1.001171588897705, 1.9177088737487793, 2.8342461585998535, 3.7507829666137695, 4.667320251464844, 5.583857536315918, 6.500394821166992, 7.416932106018066, 8.33346939086914, 9.250005722045898, 10.166543960571289, 11.083080291748047, 11.999617576599121, 12.916154861450195, 13.83269214630127, 14.749229431152344, 15.665765762329102, 16.582304000854492, 17.49884033203125, 18.41537857055664, 19.3319149017334, 20.248451232910156, 21.164987564086914, 22.081525802612305, 22.998062133789062, 23.914600372314453, 24.83113670349121, 25.74767303466797, 26.66421127319336, 27.58074951171875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 14.0, 11.0, 22.0, 43.0, 53.0, 93.0, 183.0, 320.0, 626.0, 1448.0, 3273.0, 8488.0, 24083.0, 74022.0, 246198.0, 448098.0, 162993.0, 50713.0, 17040.0, 6107.0, 2480.0, 1087.0, 510.0, 253.0, 157.0, 77.0, 48.0, 37.0, 23.0, 15.0, 6.0, 10.0, 9.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.96484375, -4.79559326171875, -4.6263427734375, -4.45709228515625, -4.287841796875, -4.11859130859375, -3.9493408203125, -3.78009033203125, -3.61083984375, -3.44158935546875, -3.2723388671875, -3.10308837890625, -2.933837890625, -2.76458740234375, -2.5953369140625, -2.42608642578125, -2.2568359375, -2.08758544921875, -1.9183349609375, -1.74908447265625, -1.579833984375, -1.41058349609375, -1.2413330078125, -1.07208251953125, -0.90283203125, -0.73358154296875, -0.5643310546875, -0.39508056640625, -0.225830078125, -0.05657958984375, 0.1126708984375, 0.28192138671875, 0.451171875, 0.62042236328125, 0.7896728515625, 0.95892333984375, 1.128173828125, 1.29742431640625, 1.4666748046875, 1.63592529296875, 1.80517578125, 1.97442626953125, 2.1436767578125, 2.31292724609375, 2.482177734375, 2.65142822265625, 2.8206787109375, 2.98992919921875, 3.1591796875, 3.32843017578125, 3.4976806640625, 3.66693115234375, 3.836181640625, 4.00543212890625, 4.1746826171875, 4.34393310546875, 4.51318359375, 4.68243408203125, 4.8516845703125, 5.02093505859375, 5.190185546875, 5.35943603515625, 5.5286865234375, 5.69793701171875, 5.8671875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 9.0, 1.0, 6.0, 9.0, 10.0, 11.0, 22.0, 17.0, 14.0, 23.0, 26.0, 30.0, 32.0, 33.0, 48.0, 45.0, 46.0, 46.0, 65.0, 44.0, 45.0, 54.0, 62.0, 44.0, 37.0, 44.0, 19.0, 30.0, 30.0, 24.0, 17.0, 15.0, 15.0, 12.0, 10.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.5078125, -2.43206787109375, -2.3563232421875, -2.28057861328125, -2.204833984375, -2.12908935546875, -2.0533447265625, -1.97760009765625, -1.90185546875, -1.82611083984375, -1.7503662109375, -1.67462158203125, -1.598876953125, -1.52313232421875, -1.4473876953125, -1.37164306640625, -1.2958984375, -1.22015380859375, -1.1444091796875, -1.06866455078125, -0.992919921875, -0.91717529296875, -0.8414306640625, -0.76568603515625, -0.68994140625, -0.61419677734375, -0.5384521484375, -0.46270751953125, -0.386962890625, -0.31121826171875, -0.2354736328125, -0.15972900390625, -0.083984375, -0.00823974609375, 0.0675048828125, 0.14324951171875, 0.218994140625, 0.29473876953125, 0.3704833984375, 0.44622802734375, 0.52197265625, 0.59771728515625, 0.6734619140625, 0.74920654296875, 0.824951171875, 0.90069580078125, 0.9764404296875, 1.05218505859375, 1.1279296875, 1.20367431640625, 1.2794189453125, 1.35516357421875, 1.430908203125, 1.50665283203125, 1.5823974609375, 1.65814208984375, 1.73388671875, 1.80963134765625, 1.8853759765625, 1.96112060546875, 2.036865234375, 2.11260986328125, 2.1883544921875, 2.26409912109375, 2.33984375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 0.0, 6.0, 2.0, 1.0, 3.0, 3.0, 7.0, 4.0, 6.0, 5.0, 10.0, 21.0, 23.0, 33.0, 35.0, 50.0, 67.0, 100.0, 171.0, 241.0, 448.0, 782.0, 1808.0, 5072.0, 23253.0, 187452.0, 723556.0, 86263.0, 12546.0, 3461.0, 1413.0, 657.0, 358.0, 253.0, 134.0, 109.0, 56.0, 45.0, 34.0, 25.0, 10.0, 9.0, 13.0, 6.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.5546875, -8.2725830078125, -7.990478515625, -7.7083740234375, -7.42626953125, -7.1441650390625, -6.862060546875, -6.5799560546875, -6.2978515625, -6.0157470703125, -5.733642578125, -5.4515380859375, -5.16943359375, -4.8873291015625, -4.605224609375, -4.3231201171875, -4.041015625, -3.7589111328125, -3.476806640625, -3.1947021484375, -2.91259765625, -2.6304931640625, -2.348388671875, -2.0662841796875, -1.7841796875, -1.5020751953125, -1.219970703125, -0.9378662109375, -0.65576171875, -0.3736572265625, -0.091552734375, 0.1905517578125, 0.47265625, 0.7547607421875, 1.036865234375, 1.3189697265625, 1.60107421875, 1.8831787109375, 2.165283203125, 2.4473876953125, 2.7294921875, 3.0115966796875, 3.293701171875, 3.5758056640625, 3.85791015625, 4.1400146484375, 4.422119140625, 4.7042236328125, 4.986328125, 5.2684326171875, 5.550537109375, 5.8326416015625, 6.11474609375, 6.3968505859375, 6.678955078125, 6.9610595703125, 7.2431640625, 7.5252685546875, 7.807373046875, 8.0894775390625, 8.37158203125, 8.6536865234375, 8.935791015625, 9.2178955078125, 9.5]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 3.0, 17.0, 4.0, 14.0, 13.0, 9.0, 19.0, 21.0, 28.0, 41.0, 44.0, 57.0, 45.0, 50.0, 58.0, 69.0, 71.0, 52.0, 52.0, 42.0, 54.0, 46.0, 43.0, 32.0, 25.0, 22.0, 15.0, 23.0, 13.0, 6.0, 6.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.0859375, -12.7550048828125, -12.424072265625, -12.0931396484375, -11.76220703125, -11.4312744140625, -11.100341796875, -10.7694091796875, -10.4384765625, -10.1075439453125, -9.776611328125, -9.4456787109375, -9.11474609375, -8.7838134765625, -8.452880859375, -8.1219482421875, -7.791015625, -7.4600830078125, -7.129150390625, -6.7982177734375, -6.46728515625, -6.1363525390625, -5.805419921875, -5.4744873046875, -5.1435546875, -4.8126220703125, -4.481689453125, -4.1507568359375, -3.81982421875, -3.4888916015625, -3.157958984375, -2.8270263671875, -2.49609375, -2.1651611328125, -1.834228515625, -1.5032958984375, -1.17236328125, -0.8414306640625, -0.510498046875, -0.1795654296875, 0.1513671875, 0.4822998046875, 0.813232421875, 1.1441650390625, 1.47509765625, 1.8060302734375, 2.136962890625, 2.4678955078125, 2.798828125, 3.1297607421875, 3.460693359375, 3.7916259765625, 4.12255859375, 4.4534912109375, 4.784423828125, 5.1153564453125, 5.4462890625, 5.7772216796875, 6.108154296875, 6.4390869140625, 6.77001953125, 7.1009521484375, 7.431884765625, 7.7628173828125, 8.09375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 3.0, 6.0, 8.0, 17.0, 26.0, 37.0, 57.0, 96.0, 199.0, 334.0, 753.0, 2236.0, 9302.0, 66224.0, 707834.0, 229751.0, 24632.0, 4589.0, 1353.0, 521.0, 223.0, 152.0, 65.0, 51.0, 32.0, 11.0, 13.0, 8.0, 1.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.50390625, -2.42974853515625, -2.3555908203125, -2.28143310546875, -2.207275390625, -2.13311767578125, -2.0589599609375, -1.98480224609375, -1.91064453125, -1.83648681640625, -1.7623291015625, -1.68817138671875, -1.614013671875, -1.53985595703125, -1.4656982421875, -1.39154052734375, -1.3173828125, -1.24322509765625, -1.1690673828125, -1.09490966796875, -1.020751953125, -0.94659423828125, -0.8724365234375, -0.79827880859375, -0.72412109375, -0.64996337890625, -0.5758056640625, -0.50164794921875, -0.427490234375, -0.35333251953125, -0.2791748046875, -0.20501708984375, -0.130859375, -0.05670166015625, 0.0174560546875, 0.09161376953125, 0.165771484375, 0.23992919921875, 0.3140869140625, 0.38824462890625, 0.46240234375, 0.53656005859375, 0.6107177734375, 0.68487548828125, 0.759033203125, 0.83319091796875, 0.9073486328125, 0.98150634765625, 1.0556640625, 1.12982177734375, 1.2039794921875, 1.27813720703125, 1.352294921875, 1.42645263671875, 1.5006103515625, 1.57476806640625, 1.64892578125, 1.72308349609375, 1.7972412109375, 1.87139892578125, 1.945556640625, 2.01971435546875, 2.0938720703125, 2.16802978515625, 2.2421875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 2.0, 6.0, 7.0, 5.0, 9.0, 13.0, 9.0, 18.0, 17.0, 19.0, 20.0, 34.0, 34.0, 47.0, 56.0, 83.0, 73.0, 80.0, 79.0, 77.0, 74.0, 41.0, 41.0, 24.0, 19.0, 19.0, 18.0, 10.0, 8.0, 15.0, 5.0, 9.0, 8.0, 5.0, 4.0, 2.0, 1.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00042724609375, -0.0004131719470024109, -0.0003990978002548218, -0.00038502365350723267, -0.00037094950675964355, -0.00035687536001205444, -0.00034280121326446533, -0.0003287270665168762, -0.0003146529197692871, -0.000300578773021698, -0.0002865046262741089, -0.0002724304795265198, -0.00025835633277893066, -0.00024428218603134155, -0.00023020803928375244, -0.00021613389253616333, -0.00020205974578857422, -0.0001879855990409851, -0.000173911452293396, -0.00015983730554580688, -0.00014576315879821777, -0.00013168901205062866, -0.00011761486530303955, -0.00010354071855545044, -8.946657180786133e-05, -7.539242506027222e-05, -6.13182783126831e-05, -4.7244131565093994e-05, -3.316998481750488e-05, -1.909583806991577e-05, -5.02169132232666e-06, 9.052455425262451e-06, 2.3126602172851562e-05, 3.7200748920440674e-05, 5.1274895668029785e-05, 6.53490424156189e-05, 7.942318916320801e-05, 9.349733591079712e-05, 0.00010757148265838623, 0.00012164562940597534, 0.00013571977615356445, 0.00014979392290115356, 0.00016386806964874268, 0.0001779422163963318, 0.0001920163631439209, 0.00020609050989151, 0.00022016465663909912, 0.00023423880338668823, 0.00024831295013427734, 0.00026238709688186646, 0.00027646124362945557, 0.0002905353903770447, 0.0003046095371246338, 0.0003186836838722229, 0.000332757830619812, 0.0003468319773674011, 0.00036090612411499023, 0.00037498027086257935, 0.00038905441761016846, 0.00040312856435775757, 0.0004172027111053467, 0.0004312768578529358, 0.0004453510046005249, 0.000459425151348114, 0.0004734992980957031]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 13.0, 20.0, 41.0, 87.0, 211.0, 715.0, 3185.0, 48161.0, 927427.0, 63745.0, 3720.0, 803.0, 284.0, 80.0, 29.0, 19.0, 6.0, 7.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62890625, -2.5068359375, -2.384765625, -2.2626953125, -2.140625, -2.0185546875, -1.896484375, -1.7744140625, -1.65234375, -1.5302734375, -1.408203125, -1.2861328125, -1.1640625, -1.0419921875, -0.919921875, -0.7978515625, -0.67578125, -0.5537109375, -0.431640625, -0.3095703125, -0.1875, -0.0654296875, 0.056640625, 0.1787109375, 0.30078125, 0.4228515625, 0.544921875, 0.6669921875, 0.7890625, 0.9111328125, 1.033203125, 1.1552734375, 1.27734375, 1.3994140625, 1.521484375, 1.6435546875, 1.765625, 1.8876953125, 2.009765625, 2.1318359375, 2.25390625, 2.3759765625, 2.498046875, 2.6201171875, 2.7421875, 2.8642578125, 2.986328125, 3.1083984375, 3.23046875, 3.3525390625, 3.474609375, 3.5966796875, 3.71875, 3.8408203125, 3.962890625, 4.0849609375, 4.20703125, 4.3291015625, 4.451171875, 4.5732421875, 4.6953125, 4.8173828125, 4.939453125, 5.0615234375, 5.18359375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 17.0, 17.0, 19.0, 18.0, 26.0, 41.0, 25.0, 46.0, 51.0, 55.0, 50.0, 58.0, 67.0, 60.0, 72.0, 51.0, 46.0, 56.0, 42.0, 25.0, 30.0, 22.0, 23.0, 13.0, 12.0, 5.0, 10.0, 10.0, 4.0, 7.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0419921875, -0.99627685546875, -0.9505615234375, -0.90484619140625, -0.859130859375, -0.81341552734375, -0.7677001953125, -0.72198486328125, -0.67626953125, -0.63055419921875, -0.5848388671875, -0.53912353515625, -0.493408203125, -0.44769287109375, -0.4019775390625, -0.35626220703125, -0.310546875, -0.26483154296875, -0.2191162109375, -0.17340087890625, -0.127685546875, -0.08197021484375, -0.0362548828125, 0.00946044921875, 0.05517578125, 0.10089111328125, 0.1466064453125, 0.19232177734375, 0.238037109375, 0.28375244140625, 0.3294677734375, 0.37518310546875, 0.4208984375, 0.46661376953125, 0.5123291015625, 0.55804443359375, 0.603759765625, 0.64947509765625, 0.6951904296875, 0.74090576171875, 0.78662109375, 0.83233642578125, 0.8780517578125, 0.92376708984375, 0.969482421875, 1.01519775390625, 1.0609130859375, 1.10662841796875, 1.15234375, 1.19805908203125, 1.2437744140625, 1.28948974609375, 1.335205078125, 1.38092041015625, 1.4266357421875, 1.47235107421875, 1.51806640625, 1.56378173828125, 1.6094970703125, 1.65521240234375, 1.700927734375, 1.74664306640625, 1.7923583984375, 1.83807373046875, 1.8837890625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 9.0, 31.0, 102.0, 375.0, 298.0, 118.0, 35.0, 16.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.57394409179688, -61.31277084350586, -58.05160140991211, -54.790428161621094, -51.529258728027344, -48.26808547973633, -45.00691223144531, -41.74574279785156, -38.48456954956055, -35.22339630126953, -31.96222686767578, -28.701053619384766, -25.439882278442383, -22.1787109375, -18.917537689208984, -15.656366348266602, -12.395195007324219, -9.134023666381836, -5.872851371765137, -2.6116790771484375, 0.6494922637939453, 3.910663604736328, 7.171836853027344, 10.433008193969727, 13.69417953491211, 16.955350875854492, 20.216522216796875, 23.47769546508789, 26.738866806030273, 30.000038146972656, 33.26121139526367, 36.52238464355469, 39.78355407714844, 43.04472732543945, 46.3058967590332, 49.56707000732422, 52.82823944091797, 56.089412689208984, 59.3505859375, 62.61175537109375, 65.8729248046875, 69.13409423828125, 72.39527130126953, 75.65644073486328, 78.91761016845703, 82.17878723144531, 85.43995666503906, 88.70112609863281, 91.9623031616211, 95.22347259521484, 98.48464965820312, 101.74581909179688, 105.00698852539062, 108.26815795898438, 111.52933502197266, 114.7905044555664, 118.05168151855469, 121.31285095214844, 124.57402801513672, 127.83519744873047, 131.09637451171875, 134.3575439453125, 137.61871337890625, 140.8798828125, 144.14105224609375]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 4.0, 2.0, 5.0, 1.0, 8.0, 9.0, 9.0, 9.0, 12.0, 17.0, 14.0, 16.0, 12.0, 19.0, 35.0, 18.0, 31.0, 30.0, 39.0, 46.0, 46.0, 73.0, 70.0, 63.0, 56.0, 43.0, 41.0, 34.0, 37.0, 21.0, 22.0, 21.0, 19.0, 17.0, 19.0, 8.0, 9.0, 14.0, 7.0, 12.0, 9.0, 10.0, 3.0, 6.0, 6.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.876930236816406, -33.84788131713867, -32.81883239746094, -31.78978729248047, -30.760738372802734, -29.731689453125, -28.7026424407959, -27.673595428466797, -26.644546508789062, -25.615497589111328, -24.586450576782227, -23.557403564453125, -22.52835464477539, -21.499305725097656, -20.470258712768555, -19.441211700439453, -18.41216278076172, -17.383113861083984, -16.354066848754883, -15.325018882751465, -14.295970916748047, -13.266922950744629, -12.237874984741211, -11.208827018737793, -10.179779052734375, -9.150731086730957, -8.121683120727539, -7.092635154724121, -6.063587188720703, -5.034539222717285, -4.005491256713867, -2.976443290710449, -1.947397232055664, -0.9183492660522461, 0.11069869995117188, 1.1397466659545898, 2.168794631958008, 3.197842597961426, 4.226890563964844, 5.255938529968262, 6.28498649597168, 7.314034461975098, 8.343082427978516, 9.372130393981934, 10.401178359985352, 11.43022632598877, 12.459274291992188, 13.488322257995605, 14.517370223999023, 15.546418190002441, 16.57546615600586, 17.604515075683594, 18.633562088012695, 19.662609100341797, 20.69165802001953, 21.720706939697266, 22.749753952026367, 23.77880096435547, 24.807849884033203, 25.836898803710938, 26.86594581604004, 27.89499282836914, 28.924041748046875, 29.95309066772461, 30.98213768005371]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 12.0, 12.0, 5.0, 13.0, 11.0, 38.0, 57.0, 107.0, 261.0, 546.0, 1885.0, 9168.0, 97411.0, 3435140.0, 619677.0, 24588.0, 3721.0, 911.0, 374.0, 156.0, 90.0, 48.0, 15.0, 10.0, 10.0, 7.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.43359375, -7.2510986328125, -7.068603515625, -6.8861083984375, -6.70361328125, -6.5211181640625, -6.338623046875, -6.1561279296875, -5.9736328125, -5.7911376953125, -5.608642578125, -5.4261474609375, -5.24365234375, -5.0611572265625, -4.878662109375, -4.6961669921875, -4.513671875, -4.3311767578125, -4.148681640625, -3.9661865234375, -3.78369140625, -3.6011962890625, -3.418701171875, -3.2362060546875, -3.0537109375, -2.8712158203125, -2.688720703125, -2.5062255859375, -2.32373046875, -2.1412353515625, -1.958740234375, -1.7762451171875, -1.59375, -1.4112548828125, -1.228759765625, -1.0462646484375, -0.86376953125, -0.6812744140625, -0.498779296875, -0.3162841796875, -0.1337890625, 0.0487060546875, 0.231201171875, 0.4136962890625, 0.59619140625, 0.7786865234375, 0.961181640625, 1.1436767578125, 1.326171875, 1.5086669921875, 1.691162109375, 1.8736572265625, 2.05615234375, 2.2386474609375, 2.421142578125, 2.6036376953125, 2.7861328125, 2.9686279296875, 3.151123046875, 3.3336181640625, 3.51611328125, 3.6986083984375, 3.881103515625, 4.0635986328125, 4.24609375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 2.0, 7.0, 7.0, 17.0, 16.0, 16.0, 21.0, 26.0, 36.0, 27.0, 35.0, 43.0, 29.0, 47.0, 49.0, 49.0, 59.0, 60.0, 49.0, 45.0, 49.0, 55.0, 42.0, 29.0, 29.0, 28.0, 29.0, 24.0, 19.0, 13.0, 13.0, 9.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.48828125, -2.417266845703125, -2.34625244140625, -2.275238037109375, -2.2042236328125, -2.133209228515625, -2.06219482421875, -1.991180419921875, -1.920166015625, -1.849151611328125, -1.77813720703125, -1.707122802734375, -1.6361083984375, -1.565093994140625, -1.49407958984375, -1.423065185546875, -1.35205078125, -1.281036376953125, -1.21002197265625, -1.139007568359375, -1.0679931640625, -0.996978759765625, -0.92596435546875, -0.854949951171875, -0.783935546875, -0.712921142578125, -0.64190673828125, -0.570892333984375, -0.4998779296875, -0.428863525390625, -0.35784912109375, -0.286834716796875, -0.2158203125, -0.144805908203125, -0.07379150390625, -0.002777099609375, 0.0682373046875, 0.139251708984375, 0.21026611328125, 0.281280517578125, 0.352294921875, 0.423309326171875, 0.49432373046875, 0.565338134765625, 0.6363525390625, 0.707366943359375, 0.77838134765625, 0.849395751953125, 0.92041015625, 0.991424560546875, 1.06243896484375, 1.133453369140625, 1.2044677734375, 1.275482177734375, 1.34649658203125, 1.417510986328125, 1.488525390625, 1.559539794921875, 1.63055419921875, 1.701568603515625, 1.7725830078125, 1.843597412109375, 1.91461181640625, 1.985626220703125, 2.056640625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 5.0, 9.0, 7.0, 15.0, 17.0, 21.0, 37.0, 59.0, 71.0, 135.0, 168.0, 322.0, 602.0, 1319.0, 3105.0, 9084.0, 36312.0, 307519.0, 3554973.0, 237992.0, 30193.0, 7652.0, 2469.0, 988.0, 457.0, 240.0, 146.0, 100.0, 55.0, 59.0, 38.0, 25.0, 22.0, 13.0, 7.0, 8.0, 10.0, 7.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.83203125, -4.68316650390625, -4.5343017578125, -4.38543701171875, -4.236572265625, -4.08770751953125, -3.9388427734375, -3.78997802734375, -3.64111328125, -3.49224853515625, -3.3433837890625, -3.19451904296875, -3.045654296875, -2.89678955078125, -2.7479248046875, -2.59906005859375, -2.4501953125, -2.30133056640625, -2.1524658203125, -2.00360107421875, -1.854736328125, -1.70587158203125, -1.5570068359375, -1.40814208984375, -1.25927734375, -1.11041259765625, -0.9615478515625, -0.81268310546875, -0.663818359375, -0.51495361328125, -0.3660888671875, -0.21722412109375, -0.068359375, 0.08050537109375, 0.2293701171875, 0.37823486328125, 0.527099609375, 0.67596435546875, 0.8248291015625, 0.97369384765625, 1.12255859375, 1.27142333984375, 1.4202880859375, 1.56915283203125, 1.718017578125, 1.86688232421875, 2.0157470703125, 2.16461181640625, 2.3134765625, 2.46234130859375, 2.6112060546875, 2.76007080078125, 2.908935546875, 3.05780029296875, 3.2066650390625, 3.35552978515625, 3.50439453125, 3.65325927734375, 3.8021240234375, 3.95098876953125, 4.099853515625, 4.24871826171875, 4.3975830078125, 4.54644775390625, 4.6953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 4.0, 3.0, 2.0, 10.0, 3.0, 1.0, 14.0, 13.0, 9.0, 29.0, 34.0, 33.0, 54.0, 58.0, 99.0, 184.0, 312.0, 513.0, 833.0, 728.0, 422.0, 253.0, 151.0, 99.0, 55.0, 38.0, 35.0, 18.0, 27.0, 10.0, 10.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71875, -4.5833740234375, -4.447998046875, -4.3126220703125, -4.17724609375, -4.0418701171875, -3.906494140625, -3.7711181640625, -3.6357421875, -3.5003662109375, -3.364990234375, -3.2296142578125, -3.09423828125, -2.9588623046875, -2.823486328125, -2.6881103515625, -2.552734375, -2.4173583984375, -2.281982421875, -2.1466064453125, -2.01123046875, -1.8758544921875, -1.740478515625, -1.6051025390625, -1.4697265625, -1.3343505859375, -1.198974609375, -1.0635986328125, -0.92822265625, -0.7928466796875, -0.657470703125, -0.5220947265625, -0.38671875, -0.2513427734375, -0.115966796875, 0.0194091796875, 0.15478515625, 0.2901611328125, 0.425537109375, 0.5609130859375, 0.6962890625, 0.8316650390625, 0.967041015625, 1.1024169921875, 1.23779296875, 1.3731689453125, 1.508544921875, 1.6439208984375, 1.779296875, 1.9146728515625, 2.050048828125, 2.1854248046875, 2.32080078125, 2.4561767578125, 2.591552734375, 2.7269287109375, 2.8623046875, 2.9976806640625, 3.133056640625, 3.2684326171875, 3.40380859375, 3.5391845703125, 3.674560546875, 3.8099365234375, 3.9453125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 8.0, 7.0, 19.0, 26.0, 57.0, 139.0, 212.0, 237.0, 155.0, 70.0, 30.0, 11.0, 9.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-66.54733276367188, -65.01029968261719, -63.473262786865234, -61.93622970581055, -60.399192810058594, -58.862159729003906, -57.32512283325195, -55.788089752197266, -54.25105285644531, -52.714019775390625, -51.17698287963867, -49.639949798583984, -48.10291290283203, -46.565879821777344, -45.02884292602539, -43.4918098449707, -41.95477294921875, -40.41773986816406, -38.88070297241211, -37.34366989135742, -35.80663299560547, -34.26959991455078, -32.73256301879883, -31.19552993774414, -29.658496856689453, -28.121461868286133, -26.584426879882812, -25.047391891479492, -23.510356903076172, -21.97332191467285, -20.43628692626953, -18.899253845214844, -17.362218856811523, -15.825183868408203, -14.288148880004883, -12.751113891601562, -11.214078903198242, -9.677043914794922, -8.140009880065918, -6.602974891662598, -5.065939903259277, -3.528904914855957, -1.9918701648712158, -0.4548354148864746, 1.0821995735168457, 2.619234561920166, 4.156269073486328, 5.693304061889648, 7.230339050292969, 8.767374038696289, 10.30440902709961, 11.84144401550293, 13.37847900390625, 14.91551399230957, 16.45254898071289, 17.989582061767578, 19.52661895751953, 21.06365394592285, 22.600688934326172, 24.137723922729492, 25.674758911132812, 27.211793899536133, 28.748828887939453, 30.28586196899414, 31.82289695739746]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 7.0, 16.0, 13.0, 10.0, 24.0, 32.0, 20.0, 39.0, 51.0, 65.0, 56.0, 53.0, 59.0, 70.0, 64.0, 54.0, 48.0, 56.0, 40.0, 42.0, 29.0, 35.0, 26.0, 27.0, 14.0, 9.0, 7.0, 10.0, 7.0, 5.0, 9.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.269634246826172, -26.519567489624023, -25.769500732421875, -25.01943588256836, -24.26936912536621, -23.519302368164062, -22.769235610961914, -22.019168853759766, -21.26910400390625, -20.5190372467041, -19.768970489501953, -19.018905639648438, -18.26883888244629, -17.51877212524414, -16.768705368041992, -16.018638610839844, -15.268571853637695, -14.518505096435547, -13.768439292907715, -13.018372535705566, -12.268306732177734, -11.518239974975586, -10.768173217773438, -10.018106460571289, -9.268040657043457, -8.517973899841309, -7.767908096313477, -7.017841339111328, -6.267775058746338, -5.517708778381348, -4.767642021179199, -4.017575740814209, -3.2675113677978516, -2.5174450874328613, -1.767378568649292, -1.0173120498657227, -0.2672457695007324, 0.4828205108642578, 1.2328872680664062, 1.9829535484313965, 2.7330198287963867, 3.483086109161377, 4.233152389526367, 4.983219146728516, 5.733285427093506, 6.483351707458496, 7.2334184646606445, 7.983484745025635, 8.733551025390625, 9.483617782592773, 10.233683586120605, 10.983750343322754, 11.733816146850586, 12.483882904052734, 13.233949661254883, 13.984016418457031, 14.734082221984863, 15.484148979187012, 16.234214782714844, 16.984281539916992, 17.73434829711914, 18.484413146972656, 19.234481811523438, 19.984546661376953, 20.7346134185791]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 6.0, 11.0, 13.0, 17.0, 14.0, 33.0, 34.0, 81.0, 95.0, 158.0, 234.0, 358.0, 597.0, 1059.0, 1845.0, 3230.0, 6724.0, 13715.0, 31389.0, 74660.0, 171750.0, 297995.0, 241279.0, 114721.0, 47844.0, 20543.0, 9562.0, 4682.0, 2449.0, 1326.0, 797.0, 470.0, 292.0, 188.0, 125.0, 89.0, 52.0, 26.0, 27.0, 25.0, 13.0, 10.0, 4.0, 5.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0], "bins": [-3.12890625, -3.03619384765625, -2.9434814453125, -2.85076904296875, -2.758056640625, -2.66534423828125, -2.5726318359375, -2.47991943359375, -2.38720703125, -2.29449462890625, -2.2017822265625, -2.10906982421875, -2.016357421875, -1.92364501953125, -1.8309326171875, -1.73822021484375, -1.6455078125, -1.55279541015625, -1.4600830078125, -1.36737060546875, -1.274658203125, -1.18194580078125, -1.0892333984375, -0.99652099609375, -0.90380859375, -0.81109619140625, -0.7183837890625, -0.62567138671875, -0.532958984375, -0.44024658203125, -0.3475341796875, -0.25482177734375, -0.162109375, -0.06939697265625, 0.0233154296875, 0.11602783203125, 0.208740234375, 0.30145263671875, 0.3941650390625, 0.48687744140625, 0.57958984375, 0.67230224609375, 0.7650146484375, 0.85772705078125, 0.950439453125, 1.04315185546875, 1.1358642578125, 1.22857666015625, 1.3212890625, 1.41400146484375, 1.5067138671875, 1.59942626953125, 1.692138671875, 1.78485107421875, 1.8775634765625, 1.97027587890625, 2.06298828125, 2.15570068359375, 2.2484130859375, 2.34112548828125, 2.433837890625, 2.52655029296875, 2.6192626953125, 2.71197509765625, 2.8046875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 8.0, 3.0, 17.0, 13.0, 17.0, 25.0, 22.0, 32.0, 28.0, 45.0, 37.0, 30.0, 35.0, 49.0, 51.0, 45.0, 57.0, 44.0, 52.0, 49.0, 53.0, 37.0, 45.0, 33.0, 40.0, 32.0, 22.0, 22.0, 13.0, 9.0, 8.0, 12.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.478515625, -2.406524658203125, -2.33453369140625, -2.262542724609375, -2.1905517578125, -2.118560791015625, -2.04656982421875, -1.974578857421875, -1.902587890625, -1.830596923828125, -1.75860595703125, -1.686614990234375, -1.6146240234375, -1.542633056640625, -1.47064208984375, -1.398651123046875, -1.32666015625, -1.254669189453125, -1.18267822265625, -1.110687255859375, -1.0386962890625, -0.966705322265625, -0.89471435546875, -0.822723388671875, -0.750732421875, -0.678741455078125, -0.60675048828125, -0.534759521484375, -0.4627685546875, -0.390777587890625, -0.31878662109375, -0.246795654296875, -0.1748046875, -0.102813720703125, -0.03082275390625, 0.041168212890625, 0.1131591796875, 0.185150146484375, 0.25714111328125, 0.329132080078125, 0.401123046875, 0.473114013671875, 0.54510498046875, 0.617095947265625, 0.6890869140625, 0.761077880859375, 0.83306884765625, 0.905059814453125, 0.97705078125, 1.049041748046875, 1.12103271484375, 1.193023681640625, 1.2650146484375, 1.337005615234375, 1.40899658203125, 1.480987548828125, 1.552978515625, 1.624969482421875, 1.69696044921875, 1.768951416015625, 1.8409423828125, 1.912933349609375, 1.98492431640625, 2.056915283203125, 2.12890625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 10.0, 5.0, 16.0, 9.0, 7.0, 9.0, 19.0, 26.0, 44.0, 41.0, 60.0, 81.0, 165.0, 335.0, 844.0, 2362.0, 9133.0, 48273.0, 336074.0, 573438.0, 61725.0, 11240.0, 2769.0, 934.0, 354.0, 197.0, 107.0, 56.0, 43.0, 39.0, 29.0, 18.0, 18.0, 12.0, 9.0, 11.0, 8.0, 8.0, 10.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90625, -5.70306396484375, -5.4998779296875, -5.29669189453125, -5.093505859375, -4.89031982421875, -4.6871337890625, -4.48394775390625, -4.28076171875, -4.07757568359375, -3.8743896484375, -3.67120361328125, -3.468017578125, -3.26483154296875, -3.0616455078125, -2.85845947265625, -2.6552734375, -2.45208740234375, -2.2489013671875, -2.04571533203125, -1.842529296875, -1.63934326171875, -1.4361572265625, -1.23297119140625, -1.02978515625, -0.82659912109375, -0.6234130859375, -0.42022705078125, -0.217041015625, -0.01385498046875, 0.1893310546875, 0.39251708984375, 0.595703125, 0.79888916015625, 1.0020751953125, 1.20526123046875, 1.408447265625, 1.61163330078125, 1.8148193359375, 2.01800537109375, 2.22119140625, 2.42437744140625, 2.6275634765625, 2.83074951171875, 3.033935546875, 3.23712158203125, 3.4403076171875, 3.64349365234375, 3.8466796875, 4.04986572265625, 4.2530517578125, 4.45623779296875, 4.659423828125, 4.86260986328125, 5.0657958984375, 5.26898193359375, 5.47216796875, 5.67535400390625, 5.8785400390625, 6.08172607421875, 6.284912109375, 6.48809814453125, 6.6912841796875, 6.89447021484375, 7.09765625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 3.0, 8.0, 3.0, 3.0, 8.0, 7.0, 15.0, 9.0, 12.0, 21.0, 21.0, 29.0, 31.0, 31.0, 35.0, 45.0, 55.0, 39.0, 44.0, 41.0, 39.0, 53.0, 59.0, 37.0, 43.0, 36.0, 39.0, 33.0, 30.0, 33.0, 24.0, 17.0, 14.0, 12.0, 13.0, 14.0, 5.0, 12.0, 3.0, 6.0, 1.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.09765625, -5.887451171875, -5.67724609375, -5.467041015625, -5.2568359375, -5.046630859375, -4.83642578125, -4.626220703125, -4.416015625, -4.205810546875, -3.99560546875, -3.785400390625, -3.5751953125, -3.364990234375, -3.15478515625, -2.944580078125, -2.734375, -2.524169921875, -2.31396484375, -2.103759765625, -1.8935546875, -1.683349609375, -1.47314453125, -1.262939453125, -1.052734375, -0.842529296875, -0.63232421875, -0.422119140625, -0.2119140625, -0.001708984375, 0.20849609375, 0.418701171875, 0.62890625, 0.839111328125, 1.04931640625, 1.259521484375, 1.4697265625, 1.679931640625, 1.89013671875, 2.100341796875, 2.310546875, 2.520751953125, 2.73095703125, 2.941162109375, 3.1513671875, 3.361572265625, 3.57177734375, 3.781982421875, 3.9921875, 4.202392578125, 4.41259765625, 4.622802734375, 4.8330078125, 5.043212890625, 5.25341796875, 5.463623046875, 5.673828125, 5.884033203125, 6.09423828125, 6.304443359375, 6.5146484375, 6.724853515625, 6.93505859375, 7.145263671875, 7.35546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 8.0, 18.0, 21.0, 31.0, 47.0, 110.0, 254.0, 758.0, 3155.0, 22904.0, 338482.0, 645935.0, 31303.0, 4062.0, 945.0, 260.0, 119.0, 45.0, 29.0, 21.0, 13.0, 8.0, 5.0, 7.0, 8.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.9921875, -2.9068603515625, -2.821533203125, -2.7362060546875, -2.65087890625, -2.5655517578125, -2.480224609375, -2.3948974609375, -2.3095703125, -2.2242431640625, -2.138916015625, -2.0535888671875, -1.96826171875, -1.8829345703125, -1.797607421875, -1.7122802734375, -1.626953125, -1.5416259765625, -1.456298828125, -1.3709716796875, -1.28564453125, -1.2003173828125, -1.114990234375, -1.0296630859375, -0.9443359375, -0.8590087890625, -0.773681640625, -0.6883544921875, -0.60302734375, -0.5177001953125, -0.432373046875, -0.3470458984375, -0.26171875, -0.1763916015625, -0.091064453125, -0.0057373046875, 0.07958984375, 0.1649169921875, 0.250244140625, 0.3355712890625, 0.4208984375, 0.5062255859375, 0.591552734375, 0.6768798828125, 0.76220703125, 0.8475341796875, 0.932861328125, 1.0181884765625, 1.103515625, 1.1888427734375, 1.274169921875, 1.3594970703125, 1.44482421875, 1.5301513671875, 1.615478515625, 1.7008056640625, 1.7861328125, 1.8714599609375, 1.956787109375, 2.0421142578125, 2.12744140625, 2.2127685546875, 2.298095703125, 2.3834228515625, 2.46875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 7.0, 4.0, 1.0, 8.0, 13.0, 9.0, 18.0, 19.0, 21.0, 37.0, 58.0, 52.0, 75.0, 83.0, 78.0, 87.0, 71.0, 75.0, 62.0, 50.0, 24.0, 34.0, 26.0, 18.0, 15.0, 13.0, 9.0, 9.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036454200744628906, -0.0003500916063785553, -0.00033564120531082153, -0.00032119080424308777, -0.000306740403175354, -0.00029229000210762024, -0.0002778396010398865, -0.0002633891999721527, -0.00024893879890441895, -0.00023448839783668518, -0.00022003799676895142, -0.00020558759570121765, -0.0001911371946334839, -0.00017668679356575012, -0.00016223639249801636, -0.0001477859914302826, -0.00013333559036254883, -0.00011888518929481506, -0.0001044347882270813, -8.998438715934753e-05, -7.553398609161377e-05, -6.108358502388e-05, -4.663318395614624e-05, -3.2182782888412476e-05, -1.773238182067871e-05, -3.2819807529449463e-06, 1.1168420314788818e-05, 2.5618821382522583e-05, 4.006922245025635e-05, 5.451962351799011e-05, 6.897002458572388e-05, 8.342042565345764e-05, 9.78708267211914e-05, 0.00011232122778892517, 0.00012677162885665894, 0.0001412220299243927, 0.00015567243099212646, 0.00017012283205986023, 0.000184573233127594, 0.00019902363419532776, 0.00021347403526306152, 0.0002279244363307953, 0.00024237483739852905, 0.0002568252384662628, 0.0002712756395339966, 0.00028572604060173035, 0.0003001764416694641, 0.0003146268427371979, 0.00032907724380493164, 0.0003435276448726654, 0.00035797804594039917, 0.00037242844700813293, 0.0003868788480758667, 0.00040132924914360046, 0.00041577965021133423, 0.000430230051279068, 0.00044468045234680176, 0.0004591308534145355, 0.0004735812544822693, 0.00048803165555000305, 0.0005024820566177368, 0.0005169324576854706, 0.0005313828587532043, 0.0005458332598209381, 0.0005602836608886719]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 8.0, 5.0, 9.0, 14.0, 21.0, 34.0, 24.0, 48.0, 95.0, 144.0, 293.0, 538.0, 1253.0, 3270.0, 12021.0, 61173.0, 526390.0, 369669.0, 56161.0, 11631.0, 3267.0, 1267.0, 554.0, 250.0, 138.0, 93.0, 63.0, 36.0, 26.0, 13.0, 12.0, 5.0, 9.0, 5.0, 5.0, 3.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.263671875, -1.20867919921875, -1.1536865234375, -1.09869384765625, -1.043701171875, -0.98870849609375, -0.9337158203125, -0.87872314453125, -0.82373046875, -0.76873779296875, -0.7137451171875, -0.65875244140625, -0.603759765625, -0.54876708984375, -0.4937744140625, -0.43878173828125, -0.3837890625, -0.32879638671875, -0.2738037109375, -0.21881103515625, -0.163818359375, -0.10882568359375, -0.0538330078125, 0.00115966796875, 0.05615234375, 0.11114501953125, 0.1661376953125, 0.22113037109375, 0.276123046875, 0.33111572265625, 0.3861083984375, 0.44110107421875, 0.49609375, 0.55108642578125, 0.6060791015625, 0.66107177734375, 0.716064453125, 0.77105712890625, 0.8260498046875, 0.88104248046875, 0.93603515625, 0.99102783203125, 1.0460205078125, 1.10101318359375, 1.156005859375, 1.21099853515625, 1.2659912109375, 1.32098388671875, 1.3759765625, 1.43096923828125, 1.4859619140625, 1.54095458984375, 1.595947265625, 1.65093994140625, 1.7059326171875, 1.76092529296875, 1.81591796875, 1.87091064453125, 1.9259033203125, 1.98089599609375, 2.035888671875, 2.09088134765625, 2.1458740234375, 2.20086669921875, 2.255859375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 8.0, 15.0, 19.0, 29.0, 42.0, 60.0, 89.0, 94.0, 122.0, 99.0, 113.0, 81.0, 60.0, 47.0, 38.0, 26.0, 13.0, 8.0, 12.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8134765625, -1.7393646240234375, -1.665252685546875, -1.5911407470703125, -1.51702880859375, -1.4429168701171875, -1.368804931640625, -1.2946929931640625, -1.2205810546875, -1.1464691162109375, -1.072357177734375, -0.9982452392578125, -0.92413330078125, -0.8500213623046875, -0.775909423828125, -0.7017974853515625, -0.627685546875, -0.5535736083984375, -0.479461669921875, -0.4053497314453125, -0.33123779296875, -0.2571258544921875, -0.183013916015625, -0.1089019775390625, -0.0347900390625, 0.0393218994140625, 0.113433837890625, 0.1875457763671875, 0.26165771484375, 0.3357696533203125, 0.409881591796875, 0.4839935302734375, 0.55810546875, 0.6322174072265625, 0.706329345703125, 0.7804412841796875, 0.85455322265625, 0.9286651611328125, 1.002777099609375, 1.0768890380859375, 1.1510009765625, 1.2251129150390625, 1.299224853515625, 1.3733367919921875, 1.44744873046875, 1.5215606689453125, 1.595672607421875, 1.6697845458984375, 1.743896484375, 1.8180084228515625, 1.892120361328125, 1.9662322998046875, 2.04034423828125, 2.1144561767578125, 2.188568115234375, 2.2626800537109375, 2.3367919921875, 2.4109039306640625, 2.485015869140625, 2.5591278076171875, 2.63323974609375, 2.7073516845703125, 2.781463623046875, 2.8555755615234375, 2.9296875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 3.0, 5.0, 3.0, 7.0, 9.0, 11.0, 18.0, 38.0, 46.0, 100.0, 140.0, 234.0, 130.0, 84.0, 63.0, 37.0, 30.0, 16.0, 7.0, 6.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.138591766357422, -23.064472198486328, -21.9903507232666, -20.916229248046875, -19.84210968017578, -18.767990112304688, -17.69386863708496, -16.619747161865234, -15.54562759399414, -14.47150707244873, -13.39738655090332, -12.32326602935791, -11.2491455078125, -10.17502498626709, -9.10090446472168, -8.02678394317627, -6.952663421630859, -5.878542900085449, -4.804422378540039, -3.730301856994629, -2.6561813354492188, -1.5820608139038086, -0.5079402923583984, 0.5661802291870117, 1.6403007507324219, 2.714421272277832, 3.788541793823242, 4.862662315368652, 5.9367828369140625, 7.010903358459473, 8.085023880004883, 9.159144401550293, 10.233261108398438, 11.307381629943848, 12.381502151489258, 13.455622673034668, 14.529743194580078, 15.603863716125488, 16.6779842376709, 17.752105712890625, 18.82622528076172, 19.900344848632812, 20.97446632385254, 22.048587799072266, 23.12270736694336, 24.196826934814453, 25.27094841003418, 26.345069885253906, 27.419189453125, 28.493309020996094, 29.56743049621582, 30.641551971435547, 31.71567153930664, 32.789791107177734, 33.863914489746094, 34.93803405761719, 36.01215362548828, 37.086273193359375, 38.16039276123047, 39.23451614379883, 40.30863571166992, 41.382755279541016, 42.456878662109375, 43.53099822998047, 44.60511779785156]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 2.0, 2.0, 8.0, 11.0, 13.0, 11.0, 18.0, 16.0, 6.0, 17.0, 11.0, 18.0, 28.0, 26.0, 17.0, 29.0, 35.0, 28.0, 37.0, 61.0, 58.0, 78.0, 69.0, 60.0, 51.0, 30.0, 34.0, 32.0, 19.0, 34.0, 15.0, 19.0, 16.0, 10.0, 8.0, 13.0, 16.0, 8.0, 5.0, 13.0, 3.0, 4.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.756919860839844, -25.931365966796875, -25.105810165405273, -24.280256271362305, -23.454700469970703, -22.629146575927734, -21.803592681884766, -20.978036880493164, -20.152481079101562, -19.326927185058594, -18.501371383666992, -17.675817489624023, -16.850261688232422, -16.024707794189453, -15.199152946472168, -14.373598098754883, -13.548044204711914, -12.722489356994629, -11.896934509277344, -11.071380615234375, -10.245824813842773, -9.420270919799805, -8.59471607208252, -7.769161224365234, -6.943606376647949, -6.118051528930664, -5.292496681213379, -4.466942310333252, -3.641387462615967, -2.8158326148986816, -1.9902782440185547, -1.1647233963012695, -0.3391685485839844, 0.48638617992401123, 1.3119409084320068, 2.137495517730713, 2.963050365447998, 3.788605213165283, 4.61415958404541, 5.439714431762695, 6.2652692794799805, 7.090824127197266, 7.916378974914551, 8.741933822631836, 9.567487716674805, 10.393043518066406, 11.218597412109375, 12.04415225982666, 12.869707107543945, 13.69526195526123, 14.520816802978516, 15.346370697021484, 16.171926498413086, 16.997480392456055, 17.823036193847656, 18.648590087890625, 19.474143981933594, 20.299697875976562, 21.125253677368164, 21.950807571411133, 22.776363372802734, 23.601917266845703, 24.427471160888672, 25.253026962280273, 26.078582763671875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 6.0, 1.0, 4.0, 5.0, 4.0, 8.0, 7.0, 16.0, 19.0, 25.0, 42.0, 58.0, 100.0, 136.0, 299.0, 563.0, 1229.0, 3537.0, 12279.0, 92444.0, 2439006.0, 1559680.0, 68187.0, 11159.0, 3118.0, 1149.0, 534.0, 276.0, 140.0, 89.0, 43.0, 43.0, 22.0, 18.0, 13.0, 10.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-5.4296875, -5.300201416015625, -5.17071533203125, -5.041229248046875, -4.9117431640625, -4.782257080078125, -4.65277099609375, -4.523284912109375, -4.393798828125, -4.264312744140625, -4.13482666015625, -4.005340576171875, -3.8758544921875, -3.746368408203125, -3.61688232421875, -3.487396240234375, -3.35791015625, -3.228424072265625, -3.09893798828125, -2.969451904296875, -2.8399658203125, -2.710479736328125, -2.58099365234375, -2.451507568359375, -2.322021484375, -2.192535400390625, -2.06304931640625, -1.933563232421875, -1.8040771484375, -1.674591064453125, -1.54510498046875, -1.415618896484375, -1.2861328125, -1.156646728515625, -1.02716064453125, -0.897674560546875, -0.7681884765625, -0.638702392578125, -0.50921630859375, -0.379730224609375, -0.250244140625, -0.120758056640625, 0.00872802734375, 0.138214111328125, 0.2677001953125, 0.397186279296875, 0.52667236328125, 0.656158447265625, 0.78564453125, 0.915130615234375, 1.04461669921875, 1.174102783203125, 1.3035888671875, 1.433074951171875, 1.56256103515625, 1.692047119140625, 1.821533203125, 1.951019287109375, 2.08050537109375, 2.209991455078125, 2.3394775390625, 2.468963623046875, 2.59844970703125, 2.727935791015625, 2.857421875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 3.0, 5.0, 11.0, 10.0, 12.0, 18.0, 21.0, 29.0, 30.0, 33.0, 51.0, 38.0, 49.0, 39.0, 31.0, 46.0, 61.0, 49.0, 58.0, 55.0, 55.0, 58.0, 38.0, 45.0, 31.0, 30.0, 24.0, 8.0, 24.0, 11.0, 9.0, 5.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4765625, -2.405242919921875, -2.33392333984375, -2.262603759765625, -2.1912841796875, -2.119964599609375, -2.04864501953125, -1.977325439453125, -1.906005859375, -1.834686279296875, -1.76336669921875, -1.692047119140625, -1.6207275390625, -1.549407958984375, -1.47808837890625, -1.406768798828125, -1.33544921875, -1.264129638671875, -1.19281005859375, -1.121490478515625, -1.0501708984375, -0.978851318359375, -0.90753173828125, -0.836212158203125, -0.764892578125, -0.693572998046875, -0.62225341796875, -0.550933837890625, -0.4796142578125, -0.408294677734375, -0.33697509765625, -0.265655517578125, -0.1943359375, -0.123016357421875, -0.05169677734375, 0.019622802734375, 0.0909423828125, 0.162261962890625, 0.23358154296875, 0.304901123046875, 0.376220703125, 0.447540283203125, 0.51885986328125, 0.590179443359375, 0.6614990234375, 0.732818603515625, 0.80413818359375, 0.875457763671875, 0.94677734375, 1.018096923828125, 1.08941650390625, 1.160736083984375, 1.2320556640625, 1.303375244140625, 1.37469482421875, 1.446014404296875, 1.517333984375, 1.588653564453125, 1.65997314453125, 1.731292724609375, 1.8026123046875, 1.873931884765625, 1.94525146484375, 2.016571044921875, 2.087890625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 9.0, 12.0, 24.0, 35.0, 56.0, 111.0, 229.0, 544.0, 2629.0, 38200.0, 4063786.0, 83900.0, 3665.0, 606.0, 220.0, 105.0, 56.0, 38.0, 27.0, 17.0, 3.0, 6.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9609375, -9.612548828125, -9.26416015625, -8.915771484375, -8.5673828125, -8.218994140625, -7.87060546875, -7.522216796875, -7.173828125, -6.825439453125, -6.47705078125, -6.128662109375, -5.7802734375, -5.431884765625, -5.08349609375, -4.735107421875, -4.38671875, -4.038330078125, -3.68994140625, -3.341552734375, -2.9931640625, -2.644775390625, -2.29638671875, -1.947998046875, -1.599609375, -1.251220703125, -0.90283203125, -0.554443359375, -0.2060546875, 0.142333984375, 0.49072265625, 0.839111328125, 1.1875, 1.535888671875, 1.88427734375, 2.232666015625, 2.5810546875, 2.929443359375, 3.27783203125, 3.626220703125, 3.974609375, 4.322998046875, 4.67138671875, 5.019775390625, 5.3681640625, 5.716552734375, 6.06494140625, 6.413330078125, 6.76171875, 7.110107421875, 7.45849609375, 7.806884765625, 8.1552734375, 8.503662109375, 8.85205078125, 9.200439453125, 9.548828125, 9.897216796875, 10.24560546875, 10.593994140625, 10.9423828125, 11.290771484375, 11.63916015625, 11.987548828125, 12.3359375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 7.0, 10.0, 17.0, 18.0, 32.0, 54.0, 112.0, 192.0, 459.0, 1036.0, 1095.0, 534.0, 232.0, 96.0, 71.0, 25.0, 24.0, 20.0, 11.0, 9.0, 5.0, 2.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.1484375, -7.96759033203125, -7.7867431640625, -7.60589599609375, -7.425048828125, -7.24420166015625, -7.0633544921875, -6.88250732421875, -6.70166015625, -6.52081298828125, -6.3399658203125, -6.15911865234375, -5.978271484375, -5.79742431640625, -5.6165771484375, -5.43572998046875, -5.2548828125, -5.07403564453125, -4.8931884765625, -4.71234130859375, -4.531494140625, -4.35064697265625, -4.1697998046875, -3.98895263671875, -3.80810546875, -3.62725830078125, -3.4464111328125, -3.26556396484375, -3.084716796875, -2.90386962890625, -2.7230224609375, -2.54217529296875, -2.361328125, -2.18048095703125, -1.9996337890625, -1.81878662109375, -1.637939453125, -1.45709228515625, -1.2762451171875, -1.09539794921875, -0.91455078125, -0.73370361328125, -0.5528564453125, -0.37200927734375, -0.191162109375, -0.01031494140625, 0.1705322265625, 0.35137939453125, 0.5322265625, 0.71307373046875, 0.8939208984375, 1.07476806640625, 1.255615234375, 1.43646240234375, 1.6173095703125, 1.79815673828125, 1.97900390625, 2.15985107421875, 2.3406982421875, 2.52154541015625, 2.702392578125, 2.88323974609375, 3.0640869140625, 3.24493408203125, 3.42578125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 25.0, 88.0, 355.0, 396.0, 96.0, 34.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.89376449584961, -50.90268325805664, -47.91160202026367, -44.9205207824707, -41.929439544677734, -38.938358306884766, -35.9472770690918, -32.95619583129883, -29.96511459350586, -26.97403335571289, -23.982952117919922, -20.991870880126953, -18.000789642333984, -15.009708404541016, -12.018627166748047, -9.027545928955078, -6.036464691162109, -3.0453834533691406, -0.054302215576171875, 2.936779022216797, 5.927860260009766, 8.918941497802734, 11.910022735595703, 14.901103973388672, 17.89218521118164, 20.88326644897461, 23.874347686767578, 26.865428924560547, 29.856510162353516, 32.847591400146484, 35.83867263793945, 38.82975387573242, 41.820831298828125, 44.811912536621094, 47.80299377441406, 50.79407501220703, 53.78515625, 56.77623748779297, 59.76731872558594, 62.758399963378906, 65.74948120117188, 68.74056243896484, 71.73164367675781, 74.72272491455078, 77.71380615234375, 80.70488739013672, 83.69596862792969, 86.68704986572266, 89.67813110351562, 92.6692123413086, 95.66029357910156, 98.65137481689453, 101.6424560546875, 104.63353729248047, 107.62461853027344, 110.6156997680664, 113.60678100585938, 116.59786224365234, 119.58894348144531, 122.58002471923828, 125.57110595703125, 128.56219482421875, 131.5532684326172, 134.54434204101562, 137.53543090820312]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 6.0, 4.0, 4.0, 7.0, 8.0, 8.0, 17.0, 19.0, 13.0, 22.0, 22.0, 29.0, 20.0, 29.0, 32.0, 31.0, 37.0, 35.0, 50.0, 49.0, 40.0, 50.0, 52.0, 48.0, 41.0, 45.0, 41.0, 22.0, 27.0, 30.0, 25.0, 19.0, 19.0, 16.0, 17.0, 16.0, 13.0, 7.0, 7.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.770204544067383, -16.2814998626709, -15.792797088623047, -15.304093360900879, -14.815389633178711, -14.326684951782227, -13.837981224060059, -13.34927749633789, -12.860573768615723, -12.371870040893555, -11.883166313171387, -11.394462585449219, -10.905757904052734, -10.417055130004883, -9.928350448608398, -9.43964672088623, -8.950942993164062, -8.462239265441895, -7.973535537719727, -7.4848313331604, -6.996127605438232, -6.5074238777160645, -6.018719673156738, -5.53001594543457, -5.041312217712402, -4.552608489990234, -4.063904762268066, -3.5752005577087402, -3.0864968299865723, -2.5977931022644043, -2.1090891361236572, -1.6203851699829102, -1.1316814422607422, -0.6429775953292847, -0.15427374839782715, 0.33443009853363037, 0.8231339454650879, 1.3118376731872559, 1.800541639328003, 2.28924560546875, 2.777949333190918, 3.266653060913086, 3.755357027053833, 4.24406099319458, 4.732764720916748, 5.221468448638916, 5.710172653198242, 6.19887638092041, 6.687580108642578, 7.176283836364746, 7.664987564086914, 8.153691291809082, 8.64239501953125, 9.131099700927734, 9.619803428649902, 10.10850715637207, 10.597210884094238, 11.085914611816406, 11.574618339538574, 12.063322067260742, 12.552026748657227, 13.040729522705078, 13.529434204101562, 14.01813793182373, 14.506841659545898]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 6.0, 9.0, 17.0, 22.0, 26.0, 39.0, 87.0, 109.0, 185.0, 291.0, 528.0, 932.0, 1686.0, 3393.0, 6872.0, 15279.0, 37109.0, 94123.0, 247677.0, 362401.0, 167365.0, 63470.0, 25371.0, 10956.0, 4951.0, 2448.0, 1365.0, 729.0, 406.0, 264.0, 172.0, 88.0, 57.0, 37.0, 18.0, 21.0, 16.0, 3.0, 12.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.220703125, -3.12396240234375, -3.0272216796875, -2.93048095703125, -2.833740234375, -2.73699951171875, -2.6402587890625, -2.54351806640625, -2.44677734375, -2.35003662109375, -2.2532958984375, -2.15655517578125, -2.059814453125, -1.96307373046875, -1.8663330078125, -1.76959228515625, -1.6728515625, -1.57611083984375, -1.4793701171875, -1.38262939453125, -1.285888671875, -1.18914794921875, -1.0924072265625, -0.99566650390625, -0.89892578125, -0.80218505859375, -0.7054443359375, -0.60870361328125, -0.511962890625, -0.41522216796875, -0.3184814453125, -0.22174072265625, -0.125, -0.02825927734375, 0.0684814453125, 0.16522216796875, 0.261962890625, 0.35870361328125, 0.4554443359375, 0.55218505859375, 0.64892578125, 0.74566650390625, 0.8424072265625, 0.93914794921875, 1.035888671875, 1.13262939453125, 1.2293701171875, 1.32611083984375, 1.4228515625, 1.51959228515625, 1.6163330078125, 1.71307373046875, 1.809814453125, 1.90655517578125, 2.0032958984375, 2.10003662109375, 2.19677734375, 2.29351806640625, 2.3902587890625, 2.48699951171875, 2.583740234375, 2.68048095703125, 2.7772216796875, 2.87396240234375, 2.970703125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 8.0, 14.0, 18.0, 16.0, 19.0, 30.0, 25.0, 40.0, 42.0, 50.0, 49.0, 41.0, 44.0, 51.0, 58.0, 61.0, 51.0, 58.0, 41.0, 54.0, 55.0, 30.0, 29.0, 32.0, 16.0, 14.0, 15.0, 7.0, 10.0, 1.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.654296875, -2.57916259765625, -2.5040283203125, -2.42889404296875, -2.353759765625, -2.27862548828125, -2.2034912109375, -2.12835693359375, -2.05322265625, -1.97808837890625, -1.9029541015625, -1.82781982421875, -1.752685546875, -1.67755126953125, -1.6024169921875, -1.52728271484375, -1.4521484375, -1.37701416015625, -1.3018798828125, -1.22674560546875, -1.151611328125, -1.07647705078125, -1.0013427734375, -0.92620849609375, -0.85107421875, -0.77593994140625, -0.7008056640625, -0.62567138671875, -0.550537109375, -0.47540283203125, -0.4002685546875, -0.32513427734375, -0.25, -0.17486572265625, -0.0997314453125, -0.02459716796875, 0.050537109375, 0.12567138671875, 0.2008056640625, 0.27593994140625, 0.35107421875, 0.42620849609375, 0.5013427734375, 0.57647705078125, 0.651611328125, 0.72674560546875, 0.8018798828125, 0.87701416015625, 0.9521484375, 1.02728271484375, 1.1024169921875, 1.17755126953125, 1.252685546875, 1.32781982421875, 1.4029541015625, 1.47808837890625, 1.55322265625, 1.62835693359375, 1.7034912109375, 1.77862548828125, 1.853759765625, 1.92889404296875, 2.0040283203125, 2.07916259765625, 2.154296875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 9.0, 10.0, 17.0, 11.0, 23.0, 39.0, 52.0, 76.0, 133.0, 210.0, 316.0, 584.0, 1179.0, 2846.0, 10319.0, 55768.0, 642580.0, 285686.0, 36795.0, 7467.0, 2155.0, 887.0, 482.0, 306.0, 172.0, 126.0, 64.0, 78.0, 38.0, 37.0, 18.0, 15.0, 11.0, 6.0, 7.0, 11.0, 7.0, 5.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.0859375, -5.89508056640625, -5.7042236328125, -5.51336669921875, -5.322509765625, -5.13165283203125, -4.9407958984375, -4.74993896484375, -4.55908203125, -4.36822509765625, -4.1773681640625, -3.98651123046875, -3.795654296875, -3.60479736328125, -3.4139404296875, -3.22308349609375, -3.0322265625, -2.84136962890625, -2.6505126953125, -2.45965576171875, -2.268798828125, -2.07794189453125, -1.8870849609375, -1.69622802734375, -1.50537109375, -1.31451416015625, -1.1236572265625, -0.93280029296875, -0.741943359375, -0.55108642578125, -0.3602294921875, -0.16937255859375, 0.021484375, 0.21234130859375, 0.4031982421875, 0.59405517578125, 0.784912109375, 0.97576904296875, 1.1666259765625, 1.35748291015625, 1.54833984375, 1.73919677734375, 1.9300537109375, 2.12091064453125, 2.311767578125, 2.50262451171875, 2.6934814453125, 2.88433837890625, 3.0751953125, 3.26605224609375, 3.4569091796875, 3.64776611328125, 3.838623046875, 4.02947998046875, 4.2203369140625, 4.41119384765625, 4.60205078125, 4.79290771484375, 4.9837646484375, 5.17462158203125, 5.365478515625, 5.55633544921875, 5.7471923828125, 5.93804931640625, 6.12890625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 6.0, 3.0, 5.0, 8.0, 14.0, 13.0, 20.0, 19.0, 22.0, 24.0, 25.0, 36.0, 38.0, 39.0, 41.0, 54.0, 42.0, 52.0, 49.0, 55.0, 50.0, 45.0, 31.0, 35.0, 31.0, 36.0, 39.0, 22.0, 34.0, 20.0, 17.0, 15.0, 11.0, 7.0, 9.0, 11.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.4375, -6.229248046875, -6.02099609375, -5.812744140625, -5.6044921875, -5.396240234375, -5.18798828125, -4.979736328125, -4.771484375, -4.563232421875, -4.35498046875, -4.146728515625, -3.9384765625, -3.730224609375, -3.52197265625, -3.313720703125, -3.10546875, -2.897216796875, -2.68896484375, -2.480712890625, -2.2724609375, -2.064208984375, -1.85595703125, -1.647705078125, -1.439453125, -1.231201171875, -1.02294921875, -0.814697265625, -0.6064453125, -0.398193359375, -0.18994140625, 0.018310546875, 0.2265625, 0.434814453125, 0.64306640625, 0.851318359375, 1.0595703125, 1.267822265625, 1.47607421875, 1.684326171875, 1.892578125, 2.100830078125, 2.30908203125, 2.517333984375, 2.7255859375, 2.933837890625, 3.14208984375, 3.350341796875, 3.55859375, 3.766845703125, 3.97509765625, 4.183349609375, 4.3916015625, 4.599853515625, 4.80810546875, 5.016357421875, 5.224609375, 5.432861328125, 5.64111328125, 5.849365234375, 6.0576171875, 6.265869140625, 6.47412109375, 6.682373046875, 6.890625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 9.0, 11.0, 12.0, 20.0, 30.0, 42.0, 69.0, 97.0, 143.0, 269.0, 578.0, 1257.0, 3236.0, 10550.0, 40918.0, 219564.0, 661394.0, 82879.0, 18673.0, 5155.0, 1889.0, 780.0, 388.0, 240.0, 125.0, 75.0, 58.0, 23.0, 22.0, 9.0, 15.0, 7.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4990234375, -1.4564666748046875, -1.413909912109375, -1.3713531494140625, -1.32879638671875, -1.2862396240234375, -1.243682861328125, -1.2011260986328125, -1.1585693359375, -1.1160125732421875, -1.073455810546875, -1.0308990478515625, -0.98834228515625, -0.9457855224609375, -0.903228759765625, -0.8606719970703125, -0.818115234375, -0.7755584716796875, -0.733001708984375, -0.6904449462890625, -0.64788818359375, -0.6053314208984375, -0.562774658203125, -0.5202178955078125, -0.4776611328125, -0.4351043701171875, -0.392547607421875, -0.3499908447265625, -0.30743408203125, -0.2648773193359375, -0.222320556640625, -0.1797637939453125, -0.13720703125, -0.0946502685546875, -0.052093505859375, -0.0095367431640625, 0.03302001953125, 0.0755767822265625, 0.118133544921875, 0.1606903076171875, 0.2032470703125, 0.2458038330078125, 0.288360595703125, 0.3309173583984375, 0.37347412109375, 0.4160308837890625, 0.458587646484375, 0.5011444091796875, 0.543701171875, 0.5862579345703125, 0.628814697265625, 0.6713714599609375, 0.71392822265625, 0.7564849853515625, 0.799041748046875, 0.8415985107421875, 0.8841552734375, 0.9267120361328125, 0.969268798828125, 1.0118255615234375, 1.05438232421875, 1.0969390869140625, 1.139495849609375, 1.1820526123046875, 1.224609375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 10.0, 13.0, 10.0, 14.0, 17.0, 24.0, 26.0, 40.0, 39.0, 66.0, 64.0, 89.0, 77.0, 82.0, 98.0, 77.0, 48.0, 49.0, 25.0, 35.0, 16.0, 12.0, 14.0, 8.0, 11.0, 4.0, 7.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000293731689453125, -0.00028191879391670227, -0.00027010589838027954, -0.0002582930028438568, -0.0002464801073074341, -0.00023466721177101135, -0.00022285431623458862, -0.0002110414206981659, -0.00019922852516174316, -0.00018741562962532043, -0.0001756027340888977, -0.00016378983855247498, -0.00015197694301605225, -0.00014016404747962952, -0.0001283511519432068, -0.00011653825640678406, -0.00010472536087036133, -9.29124653339386e-05, -8.109956979751587e-05, -6.928667426109314e-05, -5.747377872467041e-05, -4.566088318824768e-05, -3.384798765182495e-05, -2.203509211540222e-05, -1.0222196578979492e-05, 1.5906989574432373e-06, 1.3403594493865967e-05, 2.5216490030288696e-05, 3.7029385566711426e-05, 4.8842281103134155e-05, 6.0655176639556885e-05, 7.246807217597961e-05, 8.428096771240234e-05, 9.609386324882507e-05, 0.0001079067587852478, 0.00011971965432167053, 0.00013153254985809326, 0.000143345445394516, 0.00015515834093093872, 0.00016697123646736145, 0.00017878413200378418, 0.0001905970275402069, 0.00020240992307662964, 0.00021422281861305237, 0.0002260357141494751, 0.00023784860968589783, 0.00024966150522232056, 0.0002614744007587433, 0.000273287296295166, 0.00028510019183158875, 0.0002969130873680115, 0.0003087259829044342, 0.00032053887844085693, 0.00033235177397727966, 0.0003441646695137024, 0.0003559775650501251, 0.00036779046058654785, 0.0003796033561229706, 0.0003914162516593933, 0.00040322914719581604, 0.00041504204273223877, 0.0004268549382686615, 0.00043866783380508423, 0.00045048072934150696, 0.0004622936248779297]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 6.0, 11.0, 14.0, 12.0, 26.0, 36.0, 64.0, 72.0, 131.0, 204.0, 328.0, 638.0, 1346.0, 3176.0, 9318.0, 33069.0, 156495.0, 682980.0, 120653.0, 26780.0, 7788.0, 2770.0, 1253.0, 602.0, 284.0, 167.0, 91.0, 77.0, 55.0, 40.0, 25.0, 7.0, 10.0, 8.0, 7.0, 4.0, 3.0, 5.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.4345703125, -1.394073486328125, -1.35357666015625, -1.313079833984375, -1.2725830078125, -1.232086181640625, -1.19158935546875, -1.151092529296875, -1.110595703125, -1.070098876953125, -1.02960205078125, -0.989105224609375, -0.9486083984375, -0.908111572265625, -0.86761474609375, -0.827117919921875, -0.78662109375, -0.746124267578125, -0.70562744140625, -0.665130615234375, -0.6246337890625, -0.584136962890625, -0.54364013671875, -0.503143310546875, -0.462646484375, -0.422149658203125, -0.38165283203125, -0.341156005859375, -0.3006591796875, -0.260162353515625, -0.21966552734375, -0.179168701171875, -0.138671875, -0.098175048828125, -0.05767822265625, -0.017181396484375, 0.0233154296875, 0.063812255859375, 0.10430908203125, 0.144805908203125, 0.185302734375, 0.225799560546875, 0.26629638671875, 0.306793212890625, 0.3472900390625, 0.387786865234375, 0.42828369140625, 0.468780517578125, 0.50927734375, 0.549774169921875, 0.59027099609375, 0.630767822265625, 0.6712646484375, 0.711761474609375, 0.75225830078125, 0.792755126953125, 0.833251953125, 0.873748779296875, 0.91424560546875, 0.954742431640625, 0.9952392578125, 1.035736083984375, 1.07623291015625, 1.116729736328125, 1.1572265625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 12.0, 8.0, 15.0, 12.0, 22.0, 24.0, 43.0, 40.0, 61.0, 94.0, 117.0, 104.0, 101.0, 88.0, 63.0, 52.0, 32.0, 27.0, 28.0, 10.0, 5.0, 8.0, 10.0, 4.0, 9.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3974609375, -1.3499755859375, -1.302490234375, -1.2550048828125, -1.20751953125, -1.1600341796875, -1.112548828125, -1.0650634765625, -1.017578125, -0.9700927734375, -0.922607421875, -0.8751220703125, -0.82763671875, -0.7801513671875, -0.732666015625, -0.6851806640625, -0.6376953125, -0.5902099609375, -0.542724609375, -0.4952392578125, -0.44775390625, -0.4002685546875, -0.352783203125, -0.3052978515625, -0.2578125, -0.2103271484375, -0.162841796875, -0.1153564453125, -0.06787109375, -0.0203857421875, 0.027099609375, 0.0745849609375, 0.1220703125, 0.1695556640625, 0.217041015625, 0.2645263671875, 0.31201171875, 0.3594970703125, 0.406982421875, 0.4544677734375, 0.501953125, 0.5494384765625, 0.596923828125, 0.6444091796875, 0.69189453125, 0.7393798828125, 0.786865234375, 0.8343505859375, 0.8818359375, 0.9293212890625, 0.976806640625, 1.0242919921875, 1.07177734375, 1.1192626953125, 1.166748046875, 1.2142333984375, 1.26171875, 1.3092041015625, 1.356689453125, 1.4041748046875, 1.45166015625, 1.4991455078125, 1.546630859375, 1.5941162109375, 1.6416015625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 11.0, 19.0, 51.0, 154.0, 417.0, 202.0, 90.0, 38.0, 12.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.793182373046875, -34.68589782714844, -32.57861328125, -30.471332550048828, -28.36404800415039, -26.256763458251953, -24.14948081970215, -22.042198181152344, -19.934913635253906, -17.82762908935547, -15.720346450805664, -13.613062858581543, -11.505779266357422, -9.3984956741333, -7.29121208190918, -5.183928489685059, -3.0766448974609375, -0.9693613052368164, 1.1379222869873047, 3.245205879211426, 5.352489471435547, 7.459773063659668, 9.567056655883789, 11.67434024810791, 13.781623840332031, 15.888907432556152, 17.996191024780273, 20.103473663330078, 22.210758209228516, 24.318042755126953, 26.425325393676758, 28.532608032226562, 30.639892578125, 32.74717712402344, 34.854461669921875, 36.96174240112305, 39.069026947021484, 41.17631149291992, 43.283592224121094, 45.39087677001953, 47.49816131591797, 49.605445861816406, 51.712730407714844, 53.820011138916016, 55.92729568481445, 58.03458023071289, 60.14186096191406, 62.2491455078125, 64.35643005371094, 66.46371459960938, 68.57099914550781, 70.67828369140625, 72.78556823730469, 74.8928451538086, 77.00012969970703, 79.10741424560547, 81.2146987915039, 83.32198333740234, 85.42926788330078, 87.53655242919922, 89.64382934570312, 91.75111389160156, 93.8583984375, 95.96568298339844, 98.07296752929688]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 4.0, 4.0, 5.0, 8.0, 11.0, 14.0, 13.0, 10.0, 25.0, 17.0, 17.0, 17.0, 20.0, 28.0, 32.0, 46.0, 42.0, 66.0, 104.0, 94.0, 67.0, 50.0, 32.0, 32.0, 33.0, 26.0, 21.0, 20.0, 23.0, 23.0, 13.0, 12.0, 12.0, 16.0, 17.0, 8.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-31.447511672973633, -30.556249618530273, -29.664987564086914, -28.773725509643555, -27.882461547851562, -26.991199493408203, -26.099937438964844, -25.208675384521484, -24.317413330078125, -23.426151275634766, -22.534889221191406, -21.643627166748047, -20.752365112304688, -19.861103057861328, -18.969839096069336, -18.078577041625977, -17.187314987182617, -16.296052932739258, -15.404790878295898, -14.513527870178223, -13.622265815734863, -12.731003761291504, -11.839740753173828, -10.948478698730469, -10.05721664428711, -9.16595458984375, -8.27469253540039, -7.383429527282715, -6.4921674728393555, -5.600905418395996, -4.7096428871154785, -3.818380355834961, -2.9271163940429688, -2.0358541011810303, -1.1445918083190918, -0.2533295154571533, 0.6379327774047852, 1.5291948318481445, 2.420457363128662, 3.3117198944091797, 4.202981948852539, 5.094244003295898, 5.985506534576416, 6.876769065856934, 7.768031120300293, 8.659293174743652, 9.550556182861328, 10.441818237304688, 11.333080291748047, 12.224342346191406, 13.115604400634766, 14.006867408752441, 14.8981294631958, 15.78939151763916, 16.680654525756836, 17.571916580200195, 18.463178634643555, 19.354440689086914, 20.245702743530273, 21.136964797973633, 22.028228759765625, 22.919490814208984, 23.810752868652344, 24.702014923095703, 25.593276977539062]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 3.0, 11.0, 12.0, 13.0, 26.0, 33.0, 52.0, 84.0, 154.0, 265.0, 573.0, 1276.0, 3131.0, 9517.0, 41679.0, 393486.0, 2860709.0, 784722.0, 74952.0, 15611.0, 4813.0, 1728.0, 689.0, 337.0, 163.0, 93.0, 43.0, 36.0, 26.0, 17.0, 6.0, 4.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.17578125, -4.0704345703125, -3.965087890625, -3.8597412109375, -3.75439453125, -3.6490478515625, -3.543701171875, -3.4383544921875, -3.3330078125, -3.2276611328125, -3.122314453125, -3.0169677734375, -2.91162109375, -2.8062744140625, -2.700927734375, -2.5955810546875, -2.490234375, -2.3848876953125, -2.279541015625, -2.1741943359375, -2.06884765625, -1.9635009765625, -1.858154296875, -1.7528076171875, -1.6474609375, -1.5421142578125, -1.436767578125, -1.3314208984375, -1.22607421875, -1.1207275390625, -1.015380859375, -0.9100341796875, -0.8046875, -0.6993408203125, -0.593994140625, -0.4886474609375, -0.38330078125, -0.2779541015625, -0.172607421875, -0.0672607421875, 0.0380859375, 0.1434326171875, 0.248779296875, 0.3541259765625, 0.45947265625, 0.5648193359375, 0.670166015625, 0.7755126953125, 0.880859375, 0.9862060546875, 1.091552734375, 1.1968994140625, 1.30224609375, 1.4075927734375, 1.512939453125, 1.6182861328125, 1.7236328125, 1.8289794921875, 1.934326171875, 2.0396728515625, 2.14501953125, 2.2503662109375, 2.355712890625, 2.4610595703125, 2.56640625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 2.0, 10.0, 12.0, 9.0, 15.0, 18.0, 21.0, 26.0, 33.0, 50.0, 37.0, 45.0, 49.0, 44.0, 42.0, 48.0, 70.0, 59.0, 52.0, 49.0, 48.0, 37.0, 38.0, 40.0, 30.0, 25.0, 18.0, 17.0, 12.0, 13.0, 7.0, 5.0, 4.0, 2.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.669921875, -2.6013641357421875, -2.532806396484375, -2.4642486572265625, -2.39569091796875, -2.3271331787109375, -2.258575439453125, -2.1900177001953125, -2.1214599609375, -2.0529022216796875, -1.984344482421875, -1.9157867431640625, -1.84722900390625, -1.7786712646484375, -1.710113525390625, -1.6415557861328125, -1.572998046875, -1.5044403076171875, -1.435882568359375, -1.3673248291015625, -1.29876708984375, -1.2302093505859375, -1.161651611328125, -1.0930938720703125, -1.0245361328125, -0.9559783935546875, -0.887420654296875, -0.8188629150390625, -0.75030517578125, -0.6817474365234375, -0.613189697265625, -0.5446319580078125, -0.47607421875, -0.4075164794921875, -0.338958740234375, -0.2704010009765625, -0.20184326171875, -0.1332855224609375, -0.064727783203125, 0.0038299560546875, 0.0723876953125, 0.1409454345703125, 0.209503173828125, 0.2780609130859375, 0.34661865234375, 0.4151763916015625, 0.483734130859375, 0.5522918701171875, 0.620849609375, 0.6894073486328125, 0.757965087890625, 0.8265228271484375, 0.89508056640625, 0.9636383056640625, 1.032196044921875, 1.1007537841796875, 1.1693115234375, 1.2378692626953125, 1.306427001953125, 1.3749847412109375, 1.44354248046875, 1.5121002197265625, 1.580657958984375, 1.6492156982421875, 1.7177734375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 1.0, 4.0, 2.0, 5.0, 15.0, 17.0, 34.0, 67.0, 99.0, 182.0, 469.0, 1486.0, 10113.0, 1423508.0, 2743348.0, 12301.0, 1658.0, 545.0, 196.0, 109.0, 52.0, 29.0, 16.0, 8.0, 7.0, 6.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.890625, -9.537841796875, -9.18505859375, -8.832275390625, -8.4794921875, -8.126708984375, -7.77392578125, -7.421142578125, -7.068359375, -6.715576171875, -6.36279296875, -6.010009765625, -5.6572265625, -5.304443359375, -4.95166015625, -4.598876953125, -4.24609375, -3.893310546875, -3.54052734375, -3.187744140625, -2.8349609375, -2.482177734375, -2.12939453125, -1.776611328125, -1.423828125, -1.071044921875, -0.71826171875, -0.365478515625, -0.0126953125, 0.340087890625, 0.69287109375, 1.045654296875, 1.3984375, 1.751220703125, 2.10400390625, 2.456787109375, 2.8095703125, 3.162353515625, 3.51513671875, 3.867919921875, 4.220703125, 4.573486328125, 4.92626953125, 5.279052734375, 5.6318359375, 5.984619140625, 6.33740234375, 6.690185546875, 7.04296875, 7.395751953125, 7.74853515625, 8.101318359375, 8.4541015625, 8.806884765625, 9.15966796875, 9.512451171875, 9.865234375, 10.218017578125, 10.57080078125, 10.923583984375, 11.2763671875, 11.629150390625, 11.98193359375, 12.334716796875, 12.6875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 9.0, 3.0, 10.0, 9.0, 12.0, 21.0, 33.0, 55.0, 106.0, 195.0, 457.0, 988.0, 1101.0, 545.0, 251.0, 128.0, 43.0, 41.0, 28.0, 11.0, 10.0, 10.0, 7.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.96875, -8.75567626953125, -8.5426025390625, -8.32952880859375, -8.116455078125, -7.90338134765625, -7.6903076171875, -7.47723388671875, -7.26416015625, -7.05108642578125, -6.8380126953125, -6.62493896484375, -6.411865234375, -6.19879150390625, -5.9857177734375, -5.77264404296875, -5.5595703125, -5.34649658203125, -5.1334228515625, -4.92034912109375, -4.707275390625, -4.49420166015625, -4.2811279296875, -4.06805419921875, -3.85498046875, -3.64190673828125, -3.4288330078125, -3.21575927734375, -3.002685546875, -2.78961181640625, -2.5765380859375, -2.36346435546875, -2.150390625, -1.93731689453125, -1.7242431640625, -1.51116943359375, -1.298095703125, -1.08502197265625, -0.8719482421875, -0.65887451171875, -0.44580078125, -0.23272705078125, -0.0196533203125, 0.19342041015625, 0.406494140625, 0.61956787109375, 0.8326416015625, 1.04571533203125, 1.2587890625, 1.47186279296875, 1.6849365234375, 1.89801025390625, 2.111083984375, 2.32415771484375, 2.5372314453125, 2.75030517578125, 2.96337890625, 3.17645263671875, 3.3895263671875, 3.60260009765625, 3.815673828125, 4.02874755859375, 4.2418212890625, 4.45489501953125, 4.66796875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 14.0, 27.0, 50.0, 102.0, 206.0, 241.0, 183.0, 86.0, 35.0, 20.0, 9.0, 7.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.060401916503906, -34.367637634277344, -32.67487716674805, -30.982112884521484, -29.289350509643555, -27.596588134765625, -25.903823852539062, -24.211061477661133, -22.518299102783203, -20.825536727905273, -19.13277244567871, -17.44001007080078, -15.747247695922852, -14.054484367370605, -12.36172103881836, -10.66895866394043, -8.976194381713867, -7.283431529998779, -5.590668678283691, -3.8979053497314453, -2.2051424980163574, -0.5123796463012695, 1.1803836822509766, 2.8731460571289062, 4.565909385681152, 6.25867223739624, 7.951435089111328, 9.644198417663574, 11.33696174621582, 13.02972412109375, 14.722487449645996, 16.41524887084961, 18.108013153076172, 19.8007755279541, 21.493539810180664, 23.186302185058594, 24.879064559936523, 26.571826934814453, 28.264591217041016, 29.957353591918945, 31.650115966796875, 33.34288024902344, 35.035640716552734, 36.7284049987793, 38.42116928100586, 40.113929748535156, 41.80669403076172, 43.49945831298828, 45.192222595214844, 46.884986877441406, 48.5777473449707, 50.270511627197266, 51.96327590942383, 53.656036376953125, 55.34880065917969, 57.04156494140625, 58.73432540893555, 60.42708969116211, 62.119850158691406, 63.81261444091797, 65.50537872314453, 67.1981430053711, 68.89089965820312, 70.58366394042969, 72.27642822265625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 7.0, 9.0, 14.0, 15.0, 14.0, 17.0, 22.0, 24.0, 21.0, 27.0, 44.0, 39.0, 46.0, 55.0, 68.0, 54.0, 38.0, 43.0, 46.0, 51.0, 55.0, 49.0, 43.0, 28.0, 24.0, 17.0, 21.0, 19.0, 18.0, 18.0, 12.0, 10.0, 3.0, 6.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.67736053466797, -21.046173095703125, -20.41498565673828, -19.783798217773438, -19.152610778808594, -18.52142333984375, -17.890235900878906, -17.259050369262695, -16.62786293029785, -15.996675491333008, -15.365488052368164, -14.73430061340332, -14.103114128112793, -13.47192668914795, -12.840739250183105, -12.209552764892578, -11.578364372253418, -10.947176933288574, -10.31598949432373, -9.684803009033203, -9.05361557006836, -8.422428131103516, -7.791240692138672, -7.160053730010986, -6.528866291046143, -5.897678852081299, -5.266491889953613, -4.6353044509887695, -4.004117012023926, -3.3729300498962402, -2.7417426109313965, -2.110555648803711, -1.4793682098388672, -0.8481809496879578, -0.21699368953704834, 0.41419363021850586, 1.0453808307647705, 1.6765680313110352, 2.307755470275879, 2.9389424324035645, 3.570129871368408, 4.201317310333252, 4.8325042724609375, 5.463691711425781, 6.094879150390625, 6.7260661125183105, 7.357253551483154, 7.98844051361084, 8.619627952575684, 9.250815391540527, 9.882002830505371, 10.513189315795898, 11.144376754760742, 11.775564193725586, 12.40675163269043, 13.037939071655273, 13.669126510620117, 14.300313949584961, 14.931501388549805, 15.562688827514648, 16.193876266479492, 16.825061798095703, 17.456249237060547, 18.08743667602539, 18.718624114990234]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 9.0, 7.0, 17.0, 16.0, 28.0, 39.0, 87.0, 119.0, 163.0, 294.0, 610.0, 1132.0, 2327.0, 5475.0, 13610.0, 39737.0, 140063.0, 476652.0, 262550.0, 69019.0, 21739.0, 8170.0, 3336.0, 1555.0, 789.0, 446.0, 209.0, 120.0, 86.0, 57.0, 23.0, 18.0, 16.0, 11.0, 7.0, 6.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.07421875, -4.9281005859375, -4.781982421875, -4.6358642578125, -4.48974609375, -4.3436279296875, -4.197509765625, -4.0513916015625, -3.9052734375, -3.7591552734375, -3.613037109375, -3.4669189453125, -3.32080078125, -3.1746826171875, -3.028564453125, -2.8824462890625, -2.736328125, -2.5902099609375, -2.444091796875, -2.2979736328125, -2.15185546875, -2.0057373046875, -1.859619140625, -1.7135009765625, -1.5673828125, -1.4212646484375, -1.275146484375, -1.1290283203125, -0.98291015625, -0.8367919921875, -0.690673828125, -0.5445556640625, -0.3984375, -0.2523193359375, -0.106201171875, 0.0399169921875, 0.18603515625, 0.3321533203125, 0.478271484375, 0.6243896484375, 0.7705078125, 0.9166259765625, 1.062744140625, 1.2088623046875, 1.35498046875, 1.5010986328125, 1.647216796875, 1.7933349609375, 1.939453125, 2.0855712890625, 2.231689453125, 2.3778076171875, 2.52392578125, 2.6700439453125, 2.816162109375, 2.9622802734375, 3.1083984375, 3.2545166015625, 3.400634765625, 3.5467529296875, 3.69287109375, 3.8389892578125, 3.985107421875, 4.1312255859375, 4.27734375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 11.0, 7.0, 8.0, 22.0, 23.0, 19.0, 30.0, 43.0, 34.0, 46.0, 33.0, 43.0, 46.0, 57.0, 41.0, 56.0, 71.0, 53.0, 47.0, 44.0, 49.0, 39.0, 39.0, 25.0, 29.0, 18.0, 12.0, 10.0, 9.0, 6.0, 6.0, 6.0, 3.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0], "bins": [-2.947265625, -2.8737030029296875, -2.800140380859375, -2.7265777587890625, -2.65301513671875, -2.5794525146484375, -2.505889892578125, -2.4323272705078125, -2.3587646484375, -2.2852020263671875, -2.211639404296875, -2.1380767822265625, -2.06451416015625, -1.9909515380859375, -1.917388916015625, -1.8438262939453125, -1.770263671875, -1.6967010498046875, -1.623138427734375, -1.5495758056640625, -1.47601318359375, -1.4024505615234375, -1.328887939453125, -1.2553253173828125, -1.1817626953125, -1.1082000732421875, -1.034637451171875, -0.9610748291015625, -0.88751220703125, -0.8139495849609375, -0.740386962890625, -0.6668243408203125, -0.59326171875, -0.5196990966796875, -0.446136474609375, -0.3725738525390625, -0.29901123046875, -0.2254486083984375, -0.151885986328125, -0.0783233642578125, -0.0047607421875, 0.0688018798828125, 0.142364501953125, 0.2159271240234375, 0.28948974609375, 0.3630523681640625, 0.436614990234375, 0.5101776123046875, 0.583740234375, 0.6573028564453125, 0.730865478515625, 0.8044281005859375, 0.87799072265625, 0.9515533447265625, 1.025115966796875, 1.0986785888671875, 1.1722412109375, 1.2458038330078125, 1.319366455078125, 1.3929290771484375, 1.46649169921875, 1.5400543212890625, 1.613616943359375, 1.6871795654296875, 1.7607421875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 6.0, 5.0, 12.0, 11.0, 21.0, 21.0, 22.0, 46.0, 52.0, 114.0, 153.0, 280.0, 475.0, 909.0, 2020.0, 6633.0, 50993.0, 841448.0, 127707.0, 12193.0, 2855.0, 1138.0, 597.0, 320.0, 193.0, 107.0, 75.0, 38.0, 35.0, 23.0, 15.0, 6.0, 7.0, 4.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2890625, -8.02734375, -7.765625, -7.50390625, -7.2421875, -6.98046875, -6.71875, -6.45703125, -6.1953125, -5.93359375, -5.671875, -5.41015625, -5.1484375, -4.88671875, -4.625, -4.36328125, -4.1015625, -3.83984375, -3.578125, -3.31640625, -3.0546875, -2.79296875, -2.53125, -2.26953125, -2.0078125, -1.74609375, -1.484375, -1.22265625, -0.9609375, -0.69921875, -0.4375, -0.17578125, 0.0859375, 0.34765625, 0.609375, 0.87109375, 1.1328125, 1.39453125, 1.65625, 1.91796875, 2.1796875, 2.44140625, 2.703125, 2.96484375, 3.2265625, 3.48828125, 3.75, 4.01171875, 4.2734375, 4.53515625, 4.796875, 5.05859375, 5.3203125, 5.58203125, 5.84375, 6.10546875, 6.3671875, 6.62890625, 6.890625, 7.15234375, 7.4140625, 7.67578125, 7.9375, 8.19921875, 8.4609375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 6.0, 9.0, 19.0, 16.0, 34.0, 29.0, 36.0, 41.0, 56.0, 40.0, 54.0, 69.0, 85.0, 90.0, 74.0, 54.0, 59.0, 43.0, 45.0, 34.0, 21.0, 25.0, 19.0, 16.0, 6.0, 3.0, 7.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.9765625, -11.66839599609375, -11.3602294921875, -11.05206298828125, -10.743896484375, -10.43572998046875, -10.1275634765625, -9.81939697265625, -9.51123046875, -9.20306396484375, -8.8948974609375, -8.58673095703125, -8.278564453125, -7.97039794921875, -7.6622314453125, -7.35406494140625, -7.0458984375, -6.73773193359375, -6.4295654296875, -6.12139892578125, -5.813232421875, -5.50506591796875, -5.1968994140625, -4.88873291015625, -4.58056640625, -4.27239990234375, -3.9642333984375, -3.65606689453125, -3.347900390625, -3.03973388671875, -2.7315673828125, -2.42340087890625, -2.115234375, -1.80706787109375, -1.4989013671875, -1.19073486328125, -0.882568359375, -0.57440185546875, -0.2662353515625, 0.04193115234375, 0.35009765625, 0.65826416015625, 0.9664306640625, 1.27459716796875, 1.582763671875, 1.89093017578125, 2.1990966796875, 2.50726318359375, 2.8154296875, 3.12359619140625, 3.4317626953125, 3.73992919921875, 4.048095703125, 4.35626220703125, 4.6644287109375, 4.97259521484375, 5.28076171875, 5.58892822265625, 5.8970947265625, 6.20526123046875, 6.513427734375, 6.82159423828125, 7.1297607421875, 7.43792724609375, 7.74609375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 9.0, 7.0, 17.0, 14.0, 19.0, 35.0, 44.0, 87.0, 134.0, 261.0, 604.0, 1600.0, 5242.0, 24739.0, 253499.0, 714588.0, 37295.0, 6948.0, 2002.0, 728.0, 288.0, 147.0, 84.0, 49.0, 30.0, 17.0, 18.0, 7.0, 9.0, 5.0, 10.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.533203125, -2.464935302734375, -2.39666748046875, -2.328399658203125, -2.2601318359375, -2.191864013671875, -2.12359619140625, -2.055328369140625, -1.987060546875, -1.918792724609375, -1.85052490234375, -1.782257080078125, -1.7139892578125, -1.645721435546875, -1.57745361328125, -1.509185791015625, -1.44091796875, -1.372650146484375, -1.30438232421875, -1.236114501953125, -1.1678466796875, -1.099578857421875, -1.03131103515625, -0.963043212890625, -0.894775390625, -0.826507568359375, -0.75823974609375, -0.689971923828125, -0.6217041015625, -0.553436279296875, -0.48516845703125, -0.416900634765625, -0.3486328125, -0.280364990234375, -0.21209716796875, -0.143829345703125, -0.0755615234375, -0.007293701171875, 0.06097412109375, 0.129241943359375, 0.197509765625, 0.265777587890625, 0.33404541015625, 0.402313232421875, 0.4705810546875, 0.538848876953125, 0.60711669921875, 0.675384521484375, 0.74365234375, 0.811920166015625, 0.88018798828125, 0.948455810546875, 1.0167236328125, 1.084991455078125, 1.15325927734375, 1.221527099609375, 1.289794921875, 1.358062744140625, 1.42633056640625, 1.494598388671875, 1.5628662109375, 1.631134033203125, 1.69940185546875, 1.767669677734375, 1.8359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 7.0, 3.0, 5.0, 7.0, 12.0, 6.0, 13.0, 9.0, 14.0, 11.0, 19.0, 26.0, 38.0, 34.0, 45.0, 65.0, 78.0, 87.0, 105.0, 82.0, 63.0, 35.0, 39.0, 33.0, 25.0, 26.0, 24.0, 21.0, 9.0, 14.0, 10.0, 8.0, 5.0, 7.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0004477500915527344, -0.00043338537216186523, -0.0004190206527709961, -0.00040465593338012695, -0.0003902912139892578, -0.00037592649459838867, -0.00036156177520751953, -0.0003471970558166504, -0.00033283233642578125, -0.0003184676170349121, -0.00030410289764404297, -0.00028973817825317383, -0.0002753734588623047, -0.00026100873947143555, -0.0002466440200805664, -0.00023227930068969727, -0.00021791458129882812, -0.00020354986190795898, -0.00018918514251708984, -0.0001748204231262207, -0.00016045570373535156, -0.00014609098434448242, -0.00013172626495361328, -0.00011736154556274414, -0.000102996826171875, -8.863210678100586e-05, -7.426738739013672e-05, -5.990266799926758e-05, -4.553794860839844e-05, -3.11732292175293e-05, -1.6808509826660156e-05, -2.4437904357910156e-06, 1.1920928955078125e-05, 2.6285648345947266e-05, 4.0650367736816406e-05, 5.501508712768555e-05, 6.937980651855469e-05, 8.374452590942383e-05, 9.810924530029297e-05, 0.00011247396469116211, 0.00012683868408203125, 0.0001412034034729004, 0.00015556812286376953, 0.00016993284225463867, 0.0001842975616455078, 0.00019866228103637695, 0.0002130270004272461, 0.00022739171981811523, 0.00024175643920898438, 0.0002561211585998535, 0.00027048587799072266, 0.0002848505973815918, 0.00029921531677246094, 0.0003135800361633301, 0.0003279447555541992, 0.00034230947494506836, 0.0003566741943359375, 0.00037103891372680664, 0.0003854036331176758, 0.0003997683525085449, 0.00041413307189941406, 0.0004284977912902832, 0.00044286251068115234, 0.0004572272300720215, 0.0004715919494628906]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 8.0, 5.0, 10.0, 20.0, 19.0, 24.0, 61.0, 69.0, 110.0, 240.0, 488.0, 1052.0, 2912.0, 11142.0, 78724.0, 827970.0, 106455.0, 13546.0, 3359.0, 1182.0, 502.0, 279.0, 148.0, 76.0, 56.0, 25.0, 27.0, 14.0, 9.0, 9.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.12109375, -2.057891845703125, -1.99468994140625, -1.931488037109375, -1.8682861328125, -1.805084228515625, -1.74188232421875, -1.678680419921875, -1.615478515625, -1.552276611328125, -1.48907470703125, -1.425872802734375, -1.3626708984375, -1.299468994140625, -1.23626708984375, -1.173065185546875, -1.10986328125, -1.046661376953125, -0.98345947265625, -0.920257568359375, -0.8570556640625, -0.793853759765625, -0.73065185546875, -0.667449951171875, -0.604248046875, -0.541046142578125, -0.47784423828125, -0.414642333984375, -0.3514404296875, -0.288238525390625, -0.22503662109375, -0.161834716796875, -0.0986328125, -0.035430908203125, 0.02777099609375, 0.090972900390625, 0.1541748046875, 0.217376708984375, 0.28057861328125, 0.343780517578125, 0.406982421875, 0.470184326171875, 0.53338623046875, 0.596588134765625, 0.6597900390625, 0.722991943359375, 0.78619384765625, 0.849395751953125, 0.91259765625, 0.975799560546875, 1.03900146484375, 1.102203369140625, 1.1654052734375, 1.228607177734375, 1.29180908203125, 1.355010986328125, 1.418212890625, 1.481414794921875, 1.54461669921875, 1.607818603515625, 1.6710205078125, 1.734222412109375, 1.79742431640625, 1.860626220703125, 1.923828125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 8.0, 9.0, 2.0, 5.0, 7.0, 15.0, 14.0, 19.0, 18.0, 23.0, 25.0, 36.0, 32.0, 48.0, 62.0, 60.0, 65.0, 71.0, 81.0, 59.0, 67.0, 44.0, 37.0, 30.0, 30.0, 21.0, 17.0, 19.0, 12.0, 15.0, 6.0, 7.0, 5.0, 8.0, 4.0, 8.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97705078125, -0.9403915405273438, -0.9037322998046875, -0.8670730590820312, -0.830413818359375, -0.7937545776367188, -0.7570953369140625, -0.7204360961914062, -0.68377685546875, -0.6471176147460938, -0.6104583740234375, -0.5737991333007812, -0.537139892578125, -0.5004806518554688, -0.4638214111328125, -0.42716217041015625, -0.3905029296875, -0.35384368896484375, -0.3171844482421875, -0.28052520751953125, -0.243865966796875, -0.20720672607421875, -0.1705474853515625, -0.13388824462890625, -0.09722900390625, -0.06056976318359375, -0.0239105224609375, 0.01274871826171875, 0.049407958984375, 0.08606719970703125, 0.1227264404296875, 0.15938568115234375, 0.196044921875, 0.23270416259765625, 0.2693634033203125, 0.30602264404296875, 0.342681884765625, 0.37934112548828125, 0.4160003662109375, 0.45265960693359375, 0.48931884765625, 0.5259780883789062, 0.5626373291015625, 0.5992965698242188, 0.635955810546875, 0.6726150512695312, 0.7092742919921875, 0.7459335327148438, 0.7825927734375, 0.8192520141601562, 0.8559112548828125, 0.8925704956054688, 0.929229736328125, 0.9658889770507812, 1.0025482177734375, 1.0392074584960938, 1.07586669921875, 1.1125259399414062, 1.1491851806640625, 1.1858444213867188, 1.222503662109375, 1.2591629028320312, 1.2958221435546875, 1.3324813842773438, 1.369140625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 20.0, 18.0, 25.0, 70.0, 104.0, 272.0, 232.0, 104.0, 52.0, 35.0, 21.0, 17.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.20669937133789, -49.92448425292969, -48.642269134521484, -47.36005401611328, -46.07783889770508, -44.795623779296875, -43.51340866088867, -42.23119354248047, -40.948978424072266, -39.66676330566406, -38.38454818725586, -37.102333068847656, -35.82011795043945, -34.53790283203125, -33.25568771362305, -31.973472595214844, -30.691259384155273, -29.40904426574707, -28.126829147338867, -26.844614028930664, -25.56239891052246, -24.280183792114258, -22.997970581054688, -21.715755462646484, -20.43354034423828, -19.151325225830078, -17.869110107421875, -16.586894989013672, -15.304679870605469, -14.022464752197266, -12.740250587463379, -11.458035469055176, -10.175817489624023, -8.89360237121582, -7.611387252807617, -6.329172611236572, -5.046957492828369, -3.764742374420166, -2.482527732849121, -1.200312614440918, 0.08190250396728516, 1.3641175031661987, 2.6463325023651123, 3.9285473823547363, 5.2107625007629395, 6.492977619171143, 7.7751922607421875, 9.05740737915039, 10.339622497558594, 11.621837615966797, 12.904052734375, 14.186267852783203, 15.468482971191406, 16.75069808959961, 18.032913208007812, 19.315128326416016, 20.59734344482422, 21.879558563232422, 23.161773681640625, 24.443988800048828, 25.72620391845703, 27.008419036865234, 28.290634155273438, 29.57284927368164, 30.85506248474121]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 1.0, 2.0, 4.0, 6.0, 8.0, 7.0, 9.0, 11.0, 8.0, 13.0, 14.0, 23.0, 24.0, 24.0, 28.0, 28.0, 37.0, 49.0, 76.0, 126.0, 132.0, 65.0, 43.0, 28.0, 36.0, 23.0, 30.0, 22.0, 19.0, 17.0, 13.0, 21.0, 9.0, 9.0, 9.0, 10.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.73331642150879, -24.840646743774414, -23.947975158691406, -23.05530548095703, -22.162633895874023, -21.26996421813965, -20.37729263305664, -19.484622955322266, -18.59195327758789, -17.699283599853516, -16.806612014770508, -15.913942337036133, -15.021270751953125, -14.12860107421875, -13.235930442810059, -12.343259811401367, -11.45058822631836, -10.557917594909668, -9.665246963500977, -8.772577285766602, -7.879906177520752, -6.9872355461120605, -6.094565391540527, -5.201894760131836, -4.3092241287231445, -3.416553497314453, -2.523883104324341, -1.6312127113342285, -0.7385420799255371, 0.1541285514831543, 1.0467987060546875, 1.939469337463379, 2.8321380615234375, 3.724808692932129, 4.61747932434082, 5.5101494789123535, 6.402820110321045, 7.295490741729736, 8.18816089630127, 9.080831527709961, 9.973502159118652, 10.866172790527344, 11.758843421936035, 12.651514053344727, 13.544183731079102, 14.43685531616211, 15.329524993896484, 16.22219467163086, 17.114866256713867, 18.007535934448242, 18.90020751953125, 19.792877197265625, 20.685548782348633, 21.578218460083008, 22.470890045166016, 23.36355972290039, 24.256229400634766, 25.14889907836914, 26.04157066345215, 26.934240341186523, 27.82691192626953, 28.719581604003906, 29.61225128173828, 30.50492286682129, 31.397594451904297]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 6.0, 9.0, 11.0, 9.0, 14.0, 27.0, 32.0, 43.0, 66.0, 75.0, 109.0, 182.0, 261.0, 469.0, 759.0, 1295.0, 2523.0, 4895.0, 10547.0, 26719.0, 93146.0, 445703.0, 1781671.0, 1390467.0, 317576.0, 73327.0, 25343.0, 9511.0, 4332.0, 2131.0, 1175.0, 731.0, 432.0, 255.0, 151.0, 116.0, 56.0, 41.0, 28.0, 15.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.765625, -3.6688232421875, -3.572021484375, -3.4752197265625, -3.37841796875, -3.2816162109375, -3.184814453125, -3.0880126953125, -2.9912109375, -2.8944091796875, -2.797607421875, -2.7008056640625, -2.60400390625, -2.5072021484375, -2.410400390625, -2.3135986328125, -2.216796875, -2.1199951171875, -2.023193359375, -1.9263916015625, -1.82958984375, -1.7327880859375, -1.635986328125, -1.5391845703125, -1.4423828125, -1.3455810546875, -1.248779296875, -1.1519775390625, -1.05517578125, -0.9583740234375, -0.861572265625, -0.7647705078125, -0.66796875, -0.5711669921875, -0.474365234375, -0.3775634765625, -0.28076171875, -0.1839599609375, -0.087158203125, 0.0096435546875, 0.1064453125, 0.2032470703125, 0.300048828125, 0.3968505859375, 0.49365234375, 0.5904541015625, 0.687255859375, 0.7840576171875, 0.880859375, 0.9776611328125, 1.074462890625, 1.1712646484375, 1.26806640625, 1.3648681640625, 1.461669921875, 1.5584716796875, 1.6552734375, 1.7520751953125, 1.848876953125, 1.9456787109375, 2.04248046875, 2.1392822265625, 2.236083984375, 2.3328857421875, 2.4296875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 4.0, 1.0, 7.0, 9.0, 11.0, 13.0, 12.0, 29.0, 31.0, 36.0, 36.0, 31.0, 41.0, 34.0, 70.0, 52.0, 46.0, 64.0, 57.0, 70.0, 55.0, 47.0, 53.0, 35.0, 44.0, 27.0, 12.0, 12.0, 17.0, 14.0, 8.0, 9.0, 5.0, 6.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.958984375, -2.88543701171875, -2.8118896484375, -2.73834228515625, -2.664794921875, -2.59124755859375, -2.5177001953125, -2.44415283203125, -2.37060546875, -2.29705810546875, -2.2235107421875, -2.14996337890625, -2.076416015625, -2.00286865234375, -1.9293212890625, -1.85577392578125, -1.7822265625, -1.70867919921875, -1.6351318359375, -1.56158447265625, -1.488037109375, -1.41448974609375, -1.3409423828125, -1.26739501953125, -1.19384765625, -1.12030029296875, -1.0467529296875, -0.97320556640625, -0.899658203125, -0.82611083984375, -0.7525634765625, -0.67901611328125, -0.60546875, -0.53192138671875, -0.4583740234375, -0.38482666015625, -0.311279296875, -0.23773193359375, -0.1641845703125, -0.09063720703125, -0.01708984375, 0.05645751953125, 0.1300048828125, 0.20355224609375, 0.277099609375, 0.35064697265625, 0.4241943359375, 0.49774169921875, 0.5712890625, 0.64483642578125, 0.7183837890625, 0.79193115234375, 0.865478515625, 0.93902587890625, 1.0125732421875, 1.08612060546875, 1.15966796875, 1.23321533203125, 1.3067626953125, 1.38031005859375, 1.453857421875, 1.52740478515625, 1.6009521484375, 1.67449951171875, 1.748046875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 8.0, 12.0, 13.0, 38.0, 85.0, 212.0, 560.0, 2919.0, 2737201.0, 1450188.0, 2287.0, 462.0, 167.0, 62.0, 32.0, 16.0, 9.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.171875, -30.016845703125, -28.86181640625, -27.706787109375, -26.5517578125, -25.396728515625, -24.24169921875, -23.086669921875, -21.931640625, -20.776611328125, -19.62158203125, -18.466552734375, -17.3115234375, -16.156494140625, -15.00146484375, -13.846435546875, -12.69140625, -11.536376953125, -10.38134765625, -9.226318359375, -8.0712890625, -6.916259765625, -5.76123046875, -4.606201171875, -3.451171875, -2.296142578125, -1.14111328125, 0.013916015625, 1.1689453125, 2.323974609375, 3.47900390625, 4.634033203125, 5.7890625, 6.944091796875, 8.09912109375, 9.254150390625, 10.4091796875, 11.564208984375, 12.71923828125, 13.874267578125, 15.029296875, 16.184326171875, 17.33935546875, 18.494384765625, 19.6494140625, 20.804443359375, 21.95947265625, 23.114501953125, 24.26953125, 25.424560546875, 26.57958984375, 27.734619140625, 28.8896484375, 30.044677734375, 31.19970703125, 32.354736328125, 33.509765625, 34.664794921875, 35.81982421875, 36.974853515625, 38.1298828125, 39.284912109375, 40.43994140625, 41.594970703125, 42.75]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 11.0, 6.0, 18.0, 18.0, 41.0, 59.0, 106.0, 210.0, 419.0, 1060.0, 1225.0, 490.0, 221.0, 98.0, 44.0, 32.0, 10.0, 8.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-23.875, -23.40771484375, -22.9404296875, -22.47314453125, -22.005859375, -21.53857421875, -21.0712890625, -20.60400390625, -20.13671875, -19.66943359375, -19.2021484375, -18.73486328125, -18.267578125, -17.80029296875, -17.3330078125, -16.86572265625, -16.3984375, -15.93115234375, -15.4638671875, -14.99658203125, -14.529296875, -14.06201171875, -13.5947265625, -13.12744140625, -12.66015625, -12.19287109375, -11.7255859375, -11.25830078125, -10.791015625, -10.32373046875, -9.8564453125, -9.38916015625, -8.921875, -8.45458984375, -7.9873046875, -7.52001953125, -7.052734375, -6.58544921875, -6.1181640625, -5.65087890625, -5.18359375, -4.71630859375, -4.2490234375, -3.78173828125, -3.314453125, -2.84716796875, -2.3798828125, -1.91259765625, -1.4453125, -0.97802734375, -0.5107421875, -0.04345703125, 0.423828125, 0.89111328125, 1.3583984375, 1.82568359375, 2.29296875, 2.76025390625, 3.2275390625, 3.69482421875, 4.162109375, 4.62939453125, 5.0966796875, 5.56396484375, 6.03125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 0.0, 4.0, 8.0, 9.0, 20.0, 35.0, 110.0, 415.0, 319.0, 64.0, 13.0, 9.0, 3.0, 2.0, 2.0], "bins": [-436.5189208984375, -428.8507080078125, -421.1825256347656, -413.5143127441406, -405.84613037109375, -398.17791748046875, -390.5097351074219, -382.8415222167969, -375.17333984375, -367.505126953125, -359.8369445800781, -352.1687316894531, -344.50054931640625, -336.83233642578125, -329.1641540527344, -321.4959411621094, -313.8277282714844, -306.1595153808594, -298.4913330078125, -290.8231201171875, -283.1549377441406, -275.4867248535156, -267.81854248046875, -260.15032958984375, -252.4821319580078, -244.81393432617188, -237.14573669433594, -229.4775390625, -221.809326171875, -214.14114379882812, -206.47293090820312, -198.8047332763672, -191.13653564453125, -183.4683380126953, -175.80014038085938, -168.13194274902344, -160.4637451171875, -152.7955322265625, -145.12733459472656, -137.45913696289062, -129.7909393310547, -122.12274169921875, -114.45454406738281, -106.78633880615234, -99.1181411743164, -91.44994354248047, -83.78173828125, -76.11354064941406, -68.44534301757812, -60.77714538574219, -53.108943939208984, -45.44074249267578, -37.772544860839844, -30.104347229003906, -22.436145782470703, -14.7679443359375, -7.099750518798828, 0.5684490203857422, 8.236648559570312, 15.904848098754883, 23.573047637939453, 31.24124526977539, 38.909446716308594, 46.5776481628418, 54.245845794677734]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 10.0, 5.0, 15.0, 21.0, 28.0, 38.0, 50.0, 61.0, 91.0, 112.0, 102.0, 78.0, 92.0, 78.0, 69.0, 41.0, 30.0, 22.0, 15.0, 11.0, 5.0, 4.0, 5.0, 2.0, 4.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.37156677246094, -95.3665542602539, -92.36154174804688, -89.35652160644531, -86.35150909423828, -83.34649658203125, -80.34148406982422, -77.33647155761719, -74.33145141601562, -71.3264389038086, -68.32142639160156, -65.31640625, -62.31139373779297, -59.30638122558594, -56.301368713378906, -53.296356201171875, -50.291343688964844, -47.28633117675781, -44.281314849853516, -41.276302337646484, -38.27128601074219, -35.266273498535156, -32.261260986328125, -29.25624656677246, -26.251232147216797, -23.246217727661133, -20.24120330810547, -17.236190795898438, -14.231176376342773, -11.22616195678711, -8.221149444580078, -5.216135025024414, -2.21112060546875, 0.7938933372497559, 3.7989072799682617, 6.803920745849609, 9.808935165405273, 12.813949584960938, 15.818962097167969, 18.823976516723633, 21.828990936279297, 24.83400535583496, 27.839019775390625, 30.844032287597656, 33.84904479980469, 36.854061126708984, 39.859073638916016, 42.86408996582031, 45.869102478027344, 48.874114990234375, 51.87913131713867, 54.8841438293457, 57.88916015625, 60.89417266845703, 63.89918518066406, 66.9041976928711, 69.90921020507812, 72.91422271728516, 75.91923522949219, 78.92425537109375, 81.92926788330078, 84.93428039550781, 87.93929290771484, 90.94430541992188, 93.94932556152344]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 8.0, 9.0, 6.0, 16.0, 18.0, 32.0, 30.0, 50.0, 62.0, 74.0, 138.0, 228.0, 348.0, 539.0, 1108.0, 1879.0, 3695.0, 8358.0, 21610.0, 75463.0, 561141.0, 290655.0, 52467.0, 16995.0, 6764.0, 3003.0, 1586.0, 894.0, 517.0, 278.0, 182.0, 96.0, 76.0, 73.0, 39.0, 33.0, 26.0, 15.0, 15.0, 7.0, 8.0, 4.0, 3.0, 3.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0], "bins": [-5.8828125, -5.714111328125, -5.54541015625, -5.376708984375, -5.2080078125, -5.039306640625, -4.87060546875, -4.701904296875, -4.533203125, -4.364501953125, -4.19580078125, -4.027099609375, -3.8583984375, -3.689697265625, -3.52099609375, -3.352294921875, -3.18359375, -3.014892578125, -2.84619140625, -2.677490234375, -2.5087890625, -2.340087890625, -2.17138671875, -2.002685546875, -1.833984375, -1.665283203125, -1.49658203125, -1.327880859375, -1.1591796875, -0.990478515625, -0.82177734375, -0.653076171875, -0.484375, -0.315673828125, -0.14697265625, 0.021728515625, 0.1904296875, 0.359130859375, 0.52783203125, 0.696533203125, 0.865234375, 1.033935546875, 1.20263671875, 1.371337890625, 1.5400390625, 1.708740234375, 1.87744140625, 2.046142578125, 2.21484375, 2.383544921875, 2.55224609375, 2.720947265625, 2.8896484375, 3.058349609375, 3.22705078125, 3.395751953125, 3.564453125, 3.733154296875, 3.90185546875, 4.070556640625, 4.2392578125, 4.407958984375, 4.57666015625, 4.745361328125, 4.9140625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 11.0, 4.0, 25.0, 31.0, 25.0, 44.0, 51.0, 47.0, 63.0, 59.0, 89.0, 80.0, 76.0, 70.0, 63.0, 55.0, 40.0, 27.0, 34.0, 22.0, 23.0, 16.0, 10.0, 6.0, 3.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.69140625, -4.562591552734375, -4.43377685546875, -4.304962158203125, -4.1761474609375, -4.047332763671875, -3.91851806640625, -3.789703369140625, -3.660888671875, -3.532073974609375, -3.40325927734375, -3.274444580078125, -3.1456298828125, -3.016815185546875, -2.88800048828125, -2.759185791015625, -2.63037109375, -2.501556396484375, -2.37274169921875, -2.243927001953125, -2.1151123046875, -1.986297607421875, -1.85748291015625, -1.728668212890625, -1.599853515625, -1.471038818359375, -1.34222412109375, -1.213409423828125, -1.0845947265625, -0.955780029296875, -0.82696533203125, -0.698150634765625, -0.5693359375, -0.440521240234375, -0.31170654296875, -0.182891845703125, -0.0540771484375, 0.074737548828125, 0.20355224609375, 0.332366943359375, 0.461181640625, 0.589996337890625, 0.71881103515625, 0.847625732421875, 0.9764404296875, 1.105255126953125, 1.23406982421875, 1.362884521484375, 1.49169921875, 1.620513916015625, 1.74932861328125, 1.878143310546875, 2.0069580078125, 2.135772705078125, 2.26458740234375, 2.393402099609375, 2.522216796875, 2.651031494140625, 2.77984619140625, 2.908660888671875, 3.0374755859375, 3.166290283203125, 3.29510498046875, 3.423919677734375, 3.552734375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 6.0, 15.0, 12.0, 11.0, 16.0, 23.0, 35.0, 41.0, 70.0, 76.0, 152.0, 220.0, 370.0, 735.0, 1715.0, 4887.0, 20328.0, 214109.0, 770958.0, 25208.0, 5747.0, 1923.0, 805.0, 352.0, 250.0, 157.0, 95.0, 62.0, 37.0, 30.0, 21.0, 16.0, 12.0, 6.0, 10.0, 5.0, 7.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.9453125, -6.71429443359375, -6.4832763671875, -6.25225830078125, -6.021240234375, -5.79022216796875, -5.5592041015625, -5.32818603515625, -5.09716796875, -4.86614990234375, -4.6351318359375, -4.40411376953125, -4.173095703125, -3.94207763671875, -3.7110595703125, -3.48004150390625, -3.2490234375, -3.01800537109375, -2.7869873046875, -2.55596923828125, -2.324951171875, -2.09393310546875, -1.8629150390625, -1.63189697265625, -1.40087890625, -1.16986083984375, -0.9388427734375, -0.70782470703125, -0.476806640625, -0.24578857421875, -0.0147705078125, 0.21624755859375, 0.447265625, 0.67828369140625, 0.9093017578125, 1.14031982421875, 1.371337890625, 1.60235595703125, 1.8333740234375, 2.06439208984375, 2.29541015625, 2.52642822265625, 2.7574462890625, 2.98846435546875, 3.219482421875, 3.45050048828125, 3.6815185546875, 3.91253662109375, 4.1435546875, 4.37457275390625, 4.6055908203125, 4.83660888671875, 5.067626953125, 5.29864501953125, 5.5296630859375, 5.76068115234375, 5.99169921875, 6.22271728515625, 6.4537353515625, 6.68475341796875, 6.915771484375, 7.14678955078125, 7.3778076171875, 7.60882568359375, 7.83984375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 8.0, 6.0, 6.0, 6.0, 11.0, 14.0, 11.0, 13.0, 17.0, 28.0, 26.0, 39.0, 27.0, 38.0, 51.0, 63.0, 74.0, 74.0, 79.0, 68.0, 65.0, 50.0, 39.0, 34.0, 28.0, 19.0, 15.0, 13.0, 15.0, 12.0, 9.0, 9.0, 9.0, 7.0, 9.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-15.59375, -15.19287109375, -14.7919921875, -14.39111328125, -13.990234375, -13.58935546875, -13.1884765625, -12.78759765625, -12.38671875, -11.98583984375, -11.5849609375, -11.18408203125, -10.783203125, -10.38232421875, -9.9814453125, -9.58056640625, -9.1796875, -8.77880859375, -8.3779296875, -7.97705078125, -7.576171875, -7.17529296875, -6.7744140625, -6.37353515625, -5.97265625, -5.57177734375, -5.1708984375, -4.77001953125, -4.369140625, -3.96826171875, -3.5673828125, -3.16650390625, -2.765625, -2.36474609375, -1.9638671875, -1.56298828125, -1.162109375, -0.76123046875, -0.3603515625, 0.04052734375, 0.44140625, 0.84228515625, 1.2431640625, 1.64404296875, 2.044921875, 2.44580078125, 2.8466796875, 3.24755859375, 3.6484375, 4.04931640625, 4.4501953125, 4.85107421875, 5.251953125, 5.65283203125, 6.0537109375, 6.45458984375, 6.85546875, 7.25634765625, 7.6572265625, 8.05810546875, 8.458984375, 8.85986328125, 9.2607421875, 9.66162109375, 10.0625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 5.0, 7.0, 2.0, 2.0, 6.0, 6.0, 12.0, 14.0, 20.0, 27.0, 27.0, 36.0, 109.0, 198.0, 419.0, 1041.0, 3484.0, 17329.0, 928194.0, 86503.0, 7755.0, 1998.0, 714.0, 276.0, 148.0, 88.0, 35.0, 23.0, 28.0, 11.0, 10.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.68359375, -2.599151611328125, -2.51470947265625, -2.430267333984375, -2.3458251953125, -2.261383056640625, -2.17694091796875, -2.092498779296875, -2.008056640625, -1.923614501953125, -1.83917236328125, -1.754730224609375, -1.6702880859375, -1.585845947265625, -1.50140380859375, -1.416961669921875, -1.33251953125, -1.248077392578125, -1.16363525390625, -1.079193115234375, -0.9947509765625, -0.910308837890625, -0.82586669921875, -0.741424560546875, -0.656982421875, -0.572540283203125, -0.48809814453125, -0.403656005859375, -0.3192138671875, -0.234771728515625, -0.15032958984375, -0.065887451171875, 0.0185546875, 0.102996826171875, 0.18743896484375, 0.271881103515625, 0.3563232421875, 0.440765380859375, 0.52520751953125, 0.609649658203125, 0.694091796875, 0.778533935546875, 0.86297607421875, 0.947418212890625, 1.0318603515625, 1.116302490234375, 1.20074462890625, 1.285186767578125, 1.36962890625, 1.454071044921875, 1.53851318359375, 1.622955322265625, 1.7073974609375, 1.791839599609375, 1.87628173828125, 1.960723876953125, 2.045166015625, 2.129608154296875, 2.21405029296875, 2.298492431640625, 2.3829345703125, 2.467376708984375, 2.55181884765625, 2.636260986328125, 2.720703125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 5.0, 16.0, 16.0, 12.0, 21.0, 35.0, 25.0, 56.0, 62.0, 112.0, 176.0, 125.0, 79.0, 61.0, 45.0, 25.0, 24.0, 19.0, 9.0, 6.0, 8.0, 8.0, 3.0, 6.0, 7.0, 3.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0005207061767578125, -0.000505201518535614, -0.0004896968603134155, -0.00047419220209121704, -0.00045868754386901855, -0.00044318288564682007, -0.0004276782274246216, -0.0004121735692024231, -0.0003966689109802246, -0.0003811642527580261, -0.00036565959453582764, -0.00035015493631362915, -0.00033465027809143066, -0.0003191456198692322, -0.0003036409616470337, -0.0002881363034248352, -0.0002726316452026367, -0.00025712698698043823, -0.00024162232875823975, -0.00022611767053604126, -0.00021061301231384277, -0.0001951083540916443, -0.0001796036958694458, -0.00016409903764724731, -0.00014859437942504883, -0.00013308972120285034, -0.00011758506298065186, -0.00010208040475845337, -8.657574653625488e-05, -7.10710883140564e-05, -5.556643009185791e-05, -4.0061771869659424e-05, -2.4557113647460938e-05, -9.052455425262451e-06, 6.452202796936035e-06, 2.195686101913452e-05, 3.746151924133301e-05, 5.2966177463531494e-05, 6.847083568572998e-05, 8.397549390792847e-05, 9.948015213012695e-05, 0.00011498481035232544, 0.00013048946857452393, 0.0001459941267967224, 0.0001614987850189209, 0.00017700344324111938, 0.00019250810146331787, 0.00020801275968551636, 0.00022351741790771484, 0.00023902207612991333, 0.0002545267343521118, 0.0002700313925743103, 0.0002855360507965088, 0.0003010407090187073, 0.00031654536724090576, 0.00033205002546310425, 0.00034755468368530273, 0.0003630593419075012, 0.0003785640001296997, 0.0003940686583518982, 0.0004095733165740967, 0.00042507797479629517, 0.00044058263301849365, 0.00045608729124069214, 0.0004715919494628906]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 5.0, 3.0, 13.0, 12.0, 14.0, 24.0, 37.0, 51.0, 109.0, 182.0, 358.0, 699.0, 1771.0, 5024.0, 20381.0, 161342.0, 809149.0, 36967.0, 7862.0, 2488.0, 962.0, 480.0, 256.0, 124.0, 65.0, 55.0, 25.0, 14.0, 17.0, 9.0, 13.0, 7.0, 10.0, 6.0, 2.0, 4.0, 4.0, 0.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.099609375, -1.060577392578125, -1.02154541015625, -0.982513427734375, -0.9434814453125, -0.904449462890625, -0.86541748046875, -0.826385498046875, -0.787353515625, -0.748321533203125, -0.70928955078125, -0.670257568359375, -0.6312255859375, -0.592193603515625, -0.55316162109375, -0.514129638671875, -0.47509765625, -0.436065673828125, -0.39703369140625, -0.358001708984375, -0.3189697265625, -0.279937744140625, -0.24090576171875, -0.201873779296875, -0.162841796875, -0.123809814453125, -0.08477783203125, -0.045745849609375, -0.0067138671875, 0.032318115234375, 0.07135009765625, 0.110382080078125, 0.1494140625, 0.188446044921875, 0.22747802734375, 0.266510009765625, 0.3055419921875, 0.344573974609375, 0.38360595703125, 0.422637939453125, 0.461669921875, 0.500701904296875, 0.53973388671875, 0.578765869140625, 0.6177978515625, 0.656829833984375, 0.69586181640625, 0.734893798828125, 0.77392578125, 0.812957763671875, 0.85198974609375, 0.891021728515625, 0.9300537109375, 0.969085693359375, 1.00811767578125, 1.047149658203125, 1.086181640625, 1.125213623046875, 1.16424560546875, 1.203277587890625, 1.2423095703125, 1.281341552734375, 1.32037353515625, 1.359405517578125, 1.3984375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 5.0, 7.0, 8.0, 3.0, 4.0, 7.0, 21.0, 21.0, 39.0, 53.0, 83.0, 122.0, 190.0, 163.0, 84.0, 63.0, 40.0, 10.0, 19.0, 10.0, 10.0, 6.0, 5.0, 5.0, 6.0, 7.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16796875, -2.103302001953125, -2.03863525390625, -1.973968505859375, -1.9093017578125, -1.844635009765625, -1.77996826171875, -1.715301513671875, -1.650634765625, -1.585968017578125, -1.52130126953125, -1.456634521484375, -1.3919677734375, -1.327301025390625, -1.26263427734375, -1.197967529296875, -1.13330078125, -1.068634033203125, -1.00396728515625, -0.939300537109375, -0.8746337890625, -0.809967041015625, -0.74530029296875, -0.680633544921875, -0.615966796875, -0.551300048828125, -0.48663330078125, -0.421966552734375, -0.3572998046875, -0.292633056640625, -0.22796630859375, -0.163299560546875, -0.0986328125, -0.033966064453125, 0.03070068359375, 0.095367431640625, 0.1600341796875, 0.224700927734375, 0.28936767578125, 0.354034423828125, 0.418701171875, 0.483367919921875, 0.54803466796875, 0.612701416015625, 0.6773681640625, 0.742034912109375, 0.80670166015625, 0.871368408203125, 0.93603515625, 1.000701904296875, 1.06536865234375, 1.130035400390625, 1.1947021484375, 1.259368896484375, 1.32403564453125, 1.388702392578125, 1.453369140625, 1.518035888671875, 1.58270263671875, 1.647369384765625, 1.7120361328125, 1.776702880859375, 1.84136962890625, 1.906036376953125, 1.970703125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 13.0, 31.0, 94.0, 591.0, 178.0, 63.0, 17.0, 15.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.619384765625, -111.98573303222656, -108.35208892822266, -104.71843719482422, -101.08479309082031, -97.45114135742188, -93.81749725341797, -90.18384552001953, -86.55020141601562, -82.91654968261719, -79.28290557861328, -75.64925384521484, -72.01560974121094, -68.3819580078125, -64.7483139038086, -61.114662170410156, -57.481014251708984, -53.84736633300781, -50.21371841430664, -46.58007049560547, -42.9464225769043, -39.312774658203125, -35.67912292480469, -32.04547882080078, -28.411828994750977, -24.778181076049805, -21.144533157348633, -17.510883331298828, -13.877236366271973, -10.243587493896484, -6.6099395751953125, -2.9762916564941406, 0.6573562622070312, 4.291004180908203, 7.924652576446533, 11.558300971984863, 15.191948890686035, 18.825597763061523, 22.459245681762695, 26.092893600463867, 29.72654151916504, 33.360191345214844, 36.993839263916016, 40.62748718261719, 44.26113510131836, 47.89478302001953, 51.5284309387207, 55.162078857421875, 58.79572677612305, 62.42937469482422, 66.06302642822266, 69.69667053222656, 73.330322265625, 76.9639663696289, 80.59761810302734, 84.23126220703125, 87.86491394042969, 91.49856567382812, 95.13220977783203, 98.76586151123047, 102.39950561523438, 106.03315734863281, 109.66680145263672, 113.30045318603516, 116.93409729003906]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 10.0, 5.0, 9.0, 9.0, 9.0, 18.0, 17.0, 24.0, 20.0, 23.0, 40.0, 50.0, 234.0, 239.0, 40.0, 36.0, 30.0, 32.0, 23.0, 21.0, 24.0, 15.0, 12.0, 12.0, 10.0, 9.0, 9.0, 5.0, 2.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0], "bins": [-61.98535919189453, -60.50719451904297, -59.029029846191406, -57.550865173339844, -56.07270050048828, -54.59453582763672, -53.116371154785156, -51.638206481933594, -50.16004180908203, -48.68187713623047, -47.203712463378906, -45.725547790527344, -44.24738311767578, -42.76921844482422, -41.291053771972656, -39.812889099121094, -38.33472442626953, -36.85655975341797, -35.378395080566406, -33.900230407714844, -32.42206573486328, -30.94390106201172, -29.465736389160156, -27.987571716308594, -26.50940704345703, -25.03124237060547, -23.553077697753906, -22.074913024902344, -20.59674835205078, -19.11858367919922, -17.640419006347656, -16.162254333496094, -14.684089660644531, -13.205924987792969, -11.727760314941406, -10.249595642089844, -8.771430969238281, -7.293266296386719, -5.815101623535156, -4.336936950683594, -2.8587722778320312, -1.3806076049804688, 0.09755706787109375, 1.5757217407226562, 3.0538864135742188, 4.532051086425781, 6.010215759277344, 7.488380432128906, 8.966545104980469, 10.444709777832031, 11.922874450683594, 13.401039123535156, 14.879203796386719, 16.35736846923828, 17.835533142089844, 19.313697814941406, 20.79186248779297, 22.27002716064453, 23.748191833496094, 25.226356506347656, 26.70452117919922, 28.18268585205078, 29.660850524902344, 31.139015197753906, 32.61717987060547]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 13.0, 12.0, 11.0, 17.0, 22.0, 31.0, 23.0, 34.0, 29.0, 77.0, 264.0, 142.0, 59.0, 48.0, 38.0, 29.0, 25.0, 24.0, 16.0, 18.0, 11.0, 9.0, 8.0, 8.0, 4.0, 8.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.685546875, -3.582550048828125, -3.47955322265625, -3.376556396484375, -3.2735595703125, -3.170562744140625, -3.06756591796875, -2.964569091796875, -2.861572265625, -2.758575439453125, -2.65557861328125, -2.552581787109375, -2.4495849609375, -2.346588134765625, -2.24359130859375, -2.140594482421875, -2.03759765625, -1.934600830078125, -1.83160400390625, -1.728607177734375, -1.6256103515625, -1.522613525390625, -1.41961669921875, -1.316619873046875, -1.213623046875, -1.110626220703125, -1.00762939453125, -0.904632568359375, -0.8016357421875, -0.698638916015625, -0.59564208984375, -0.492645263671875, -0.3896484375, -0.286651611328125, -0.18365478515625, -0.080657958984375, 0.0223388671875, 0.125335693359375, 0.22833251953125, 0.331329345703125, 0.434326171875, 0.537322998046875, 0.64031982421875, 0.743316650390625, 0.8463134765625, 0.949310302734375, 1.05230712890625, 1.155303955078125, 1.25830078125, 1.361297607421875, 1.46429443359375, 1.567291259765625, 1.6702880859375, 1.773284912109375, 1.87628173828125, 1.979278564453125, 2.082275390625, 2.185272216796875, 2.28826904296875, 2.391265869140625, 2.4942626953125, 2.597259521484375, 2.70025634765625, 2.803253173828125, 2.90625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 5.0, 0.0, 2.0, 14.0, 8.0, 18.0, 25.0, 31.0, 59.0, 167.0, 675.0, 6428.0, 8370906.0, 8975.0, 843.0, 189.0, 75.0, 61.0, 15.0, 23.0, 16.0, 7.0, 7.0, 11.0, 1.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0], "bins": [-49.537994384765625, -47.8031005859375, -46.068206787109375, -44.33331298828125, -42.598419189453125, -40.863525390625, -39.128631591796875, -37.39373779296875, -35.658843994140625, -33.9239501953125, -32.189056396484375, -30.45416259765625, -28.719268798828125, -26.984375, -25.249479293823242, -23.514585494995117, -21.77968978881836, -20.044795989990234, -18.30990219116211, -16.575008392333984, -14.840113639831543, -13.105219841003418, -11.370325088500977, -9.635431289672852, -7.900537490844727, -6.165643692016602, -4.430749416351318, -2.695855140686035, -0.9609613418579102, 0.7739324569702148, 2.5088272094726562, 4.243721008300781, 5.978614807128906, 7.713508605957031, 9.448402404785156, 11.183297157287598, 12.918190956115723, 14.653084754943848, 16.38797950744629, 18.122873306274414, 19.85776710510254, 21.592660903930664, 23.32755470275879, 25.062450408935547, 26.797344207763672, 28.532238006591797, 30.267131805419922, 32.00202560424805, 33.73691940307617, 35.4718132019043, 37.20670700073242, 38.94160079956055, 40.67649459838867, 42.4113883972168, 44.14628601074219, 45.88117980957031, 47.61607360839844, 49.35096740722656, 51.08586120605469, 52.82075500488281, 54.55564880371094, 56.29054260253906, 58.02543640136719, 59.76033020019531, 61.49522399902344]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 3.0, 4.0, 5.0, 2.0, 5.0, 3.0, 7.0, 4.0, 7.0, 8.0, 4.0, 4.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.089269638061523, -18.179800033569336, -17.27033233642578, -16.360862731933594, -15.451395034790039, -14.541925430297852, -13.63245677947998, -12.72298812866211, -11.813519477844238, -10.904050827026367, -9.994582176208496, -9.085113525390625, -8.175643920898438, -7.266175746917725, -6.356706619262695, -5.447237968444824, -4.537769317626953, -3.628300666809082, -2.718831777572632, -1.8093628883361816, -0.8998942375183105, 0.009574413299560547, 0.9190435409545898, 1.828512191772461, 2.737980842590332, 3.647449493408203, 4.556918144226074, 5.4663872718811035, 6.375855922698975, 7.285324573516846, 8.194793701171875, 9.104262351989746, 10.013729095458984, 10.923197746276855, 11.832666397094727, 12.742136001586914, 13.651603698730469, 14.561073303222656, 15.470541954040527, 16.3800106048584, 17.289478302001953, 18.19894790649414, 19.108415603637695, 20.017885208129883, 20.927352905273438, 21.836822509765625, 22.746292114257812, 23.655759811401367, 24.565229415893555, 25.474699020385742, 26.384166717529297, 27.293636322021484, 28.20310401916504, 29.112573623657227, 30.02204132080078, 30.93151092529297, 31.840980529785156, 32.750450134277344, 33.65991973876953, 34.56938552856445, 35.47885513305664, 36.38832473754883, 37.297794342041016, 38.20726013183594, 39.116729736328125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 15.0, 15.0, 34.0, 39.0, 104.0, 177.0, 384.0, 995.0, 3634.0, 21365.0, 203011.0, 262535.0, 25760.0, 4131.0, 1122.0, 452.0, 201.0, 116.0, 59.0, 41.0, 25.0, 10.0, 11.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.125, -36.7666015625, -35.408203125, -34.0498046875, -32.69140625, -31.3330078125, -29.974609375, -28.6162109375, -27.2578125, -25.8994140625, -24.541015625, -23.1826171875, -21.82421875, -20.4658203125, -19.107421875, -17.7490234375, -16.390625, -15.0322265625, -13.673828125, -12.3154296875, -10.95703125, -9.5986328125, -8.240234375, -6.8818359375, -5.5234375, -4.1650390625, -2.806640625, -1.4482421875, -0.08984375, 1.2685546875, 2.626953125, 3.9853515625, 5.34375, 6.7021484375, 8.060546875, 9.4189453125, 10.77734375, 12.1357421875, 13.494140625, 14.8525390625, 16.2109375, 17.5693359375, 18.927734375, 20.2861328125, 21.64453125, 23.0029296875, 24.361328125, 25.7197265625, 27.078125, 28.4365234375, 29.794921875, 31.1533203125, 32.51171875, 33.8701171875, 35.228515625, 36.5869140625, 37.9453125, 39.3037109375, 40.662109375, 42.0205078125, 43.37890625, 44.7373046875, 46.095703125, 47.4541015625, 48.8125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 0.0, 3.0, 3.0, 9.0, 10.0, 18.0, 18.0, 25.0, 42.0, 43.0, 55.0, 69.0, 81.0, 109.0, 100.0, 80.0, 85.0, 64.0, 54.0, 32.0, 30.0, 21.0, 13.0, 8.0, 3.0, 9.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-5.05859375, -4.91949462890625, -4.7803955078125, -4.64129638671875, -4.502197265625, -4.36309814453125, -4.2239990234375, -4.08489990234375, -3.94580078125, -3.80670166015625, -3.6676025390625, -3.52850341796875, -3.389404296875, -3.25030517578125, -3.1112060546875, -2.97210693359375, -2.8330078125, -2.69390869140625, -2.5548095703125, -2.41571044921875, -2.276611328125, -2.13751220703125, -1.9984130859375, -1.85931396484375, -1.72021484375, -1.58111572265625, -1.4420166015625, -1.30291748046875, -1.163818359375, -1.02471923828125, -0.8856201171875, -0.74652099609375, -0.607421875, -0.46832275390625, -0.3292236328125, -0.19012451171875, -0.051025390625, 0.08807373046875, 0.2271728515625, 0.36627197265625, 0.50537109375, 0.64447021484375, 0.7835693359375, 0.92266845703125, 1.061767578125, 1.20086669921875, 1.3399658203125, 1.47906494140625, 1.6181640625, 1.75726318359375, 1.8963623046875, 2.03546142578125, 2.174560546875, 2.31365966796875, 2.4527587890625, 2.59185791015625, 2.73095703125, 2.87005615234375, 3.0091552734375, 3.14825439453125, 3.287353515625, 3.42645263671875, 3.5655517578125, 3.70465087890625, 3.84375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 2.0, 9.0, 11.0, 26.0, 52.0, 132.0, 125.0, 63.0, 34.0, 5.0, 10.0, 3.0, 5.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.15226745605469, -43.020484924316406, -41.88870620727539, -40.756927490234375, -39.625144958496094, -38.49336242675781, -37.3615837097168, -36.22980499267578, -35.0980224609375, -33.96623992919922, -32.8344612121582, -31.702680587768555, -30.570899963378906, -29.439119338989258, -28.30733871459961, -27.17555809020996, -26.043777465820312, -24.911996841430664, -23.780216217041016, -22.648435592651367, -21.51665496826172, -20.38487434387207, -19.253093719482422, -18.121313095092773, -16.989532470703125, -15.857751846313477, -14.725971221923828, -13.59419059753418, -12.462409973144531, -11.330629348754883, -10.198848724365234, -9.067068099975586, -7.935285568237305, -6.803504943847656, -5.671724319458008, -4.539943695068359, -3.408163070678711, -2.2763824462890625, -1.144601821899414, -0.012821197509765625, 1.1189594268798828, 2.2507400512695312, 3.3825206756591797, 4.514301300048828, 5.646081924438477, 6.777862548828125, 7.909643173217773, 9.041423797607422, 10.17320442199707, 11.304985046386719, 12.436765670776367, 13.568546295166016, 14.700326919555664, 15.832107543945312, 16.96388816833496, 18.09566879272461, 19.227449417114258, 20.359230041503906, 21.491010665893555, 22.622791290283203, 23.75457191467285, 24.8863525390625, 26.01813316345215, 27.149913787841797, 28.281694412231445]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 6.0, 4.0, 7.0, 22.0, 35.0, 75.0, 137.0, 88.0, 40.0, 16.0, 11.0, 7.0, 3.0, 5.0, 7.0, 2.0, 7.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.07525634765625, -25.367338180541992, -24.659420013427734, -23.951501846313477, -23.24358367919922, -22.535667419433594, -21.827749252319336, -21.119831085205078, -20.41191291809082, -19.703994750976562, -18.996076583862305, -18.288158416748047, -17.580242156982422, -16.872323989868164, -16.164405822753906, -15.456487655639648, -14.74856948852539, -14.040651321411133, -13.332733154296875, -12.624815940856934, -11.916897773742676, -11.208979606628418, -10.501062393188477, -9.793144226074219, -9.085226058959961, -8.377307891845703, -7.6693902015686035, -6.961472511291504, -6.253554344177246, -5.545636177062988, -4.837718486785889, -4.129800796508789, -3.421884536743164, -2.7139666080474854, -2.0060486793518066, -1.298130750656128, -0.5902128219604492, 0.11770510673522949, 0.8256230354309082, 1.5335407257080078, 2.2414588928222656, 2.9493768215179443, 3.657294750213623, 4.365212440490723, 5.0731306076049805, 5.781048774719238, 6.488966464996338, 7.1968841552734375, 7.904802322387695, 8.612720489501953, 9.320638656616211, 10.028555870056152, 10.73647403717041, 11.444392204284668, 12.15230941772461, 12.860227584838867, 13.568145751953125, 14.276063919067383, 14.98398208618164, 15.691899299621582, 16.399818420410156, 17.10773468017578, 17.81565284729004, 18.523571014404297, 19.231489181518555]}, "eval/loss": 4.305517673492432, "eval/wer": 1.9549980166600556, "eval/runtime": 784.9234, "eval/samples_per_second": 3.366, "eval/steps_per_second": 0.282} \ No newline at end of file +{"train/loss": 4.7853, "train/learning_rate": 5.805515239477504e-07, "train/epoch": 1.0, "train/global_step": 1189, "_runtime": 6633, "_timestamp": 1646186014, "_step": 1191, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 7.0, 21.0, 31.0, 147.0, 519.0, 207.0, 32.0, 21.0, 12.0, 6.0, 4.0, 4.0], "bins": [-485.33099365234375, -476.75994873046875, -468.1888732910156, -459.6178283691406, -451.0467834472656, -442.4757385253906, -433.9046630859375, -425.3336181640625, -416.7625732421875, -408.1915283203125, -399.6204528808594, -391.0494079589844, -382.4783630371094, -373.9073181152344, -365.33624267578125, -356.76519775390625, -348.19415283203125, -339.62310791015625, -331.0520324707031, -322.4809875488281, -313.9099426269531, -305.3388977050781, -296.767822265625, -288.19677734375, -279.6257019042969, -271.0546569824219, -262.48358154296875, -253.91253662109375, -245.34149169921875, -236.7704315185547, -228.19937133789062, -219.62832641601562, -211.0572967529297, -202.48623657226562, -193.91519165039062, -185.34413146972656, -176.77308654785156, -168.2020263671875, -159.6309814453125, -151.05992126464844, -142.48887634277344, -133.91781616210938, -125.34677124023438, -116.77571105957031, -108.20466613769531, -99.63360595703125, -91.06255340576172, -82.49150085449219, -73.92044067382812, -65.3493881225586, -56.77833557128906, -48.207279205322266, -39.636226654052734, -31.065174102783203, -22.494117736816406, -13.923065185546875, -5.352016448974609, 3.2190370559692383, 11.790090560913086, 20.36114501953125, 28.93219757080078, 37.50325012207031, 46.07430648803711, 54.64535903930664, 63.21641159057617]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 6.0, 5.0, 0.0, 6.0, 4.0, 3.0, 4.0, 8.0, 10.0, 8.0, 15.0, 15.0, 23.0, 15.0, 22.0, 28.0, 21.0, 33.0, 43.0, 50.0, 59.0, 73.0, 74.0, 62.0, 69.0, 55.0, 48.0, 32.0, 32.0, 32.0, 22.0, 16.0, 22.0, 18.0, 14.0, 16.0, 7.0, 13.0, 6.0, 2.0, 5.0, 2.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-121.59696960449219, -117.4406509399414, -113.28433227539062, -109.12801361083984, -104.97169494628906, -100.81536865234375, -96.65904998779297, -92.50273132324219, -88.3464126586914, -84.19009399414062, -80.03377532958984, -75.87745666503906, -71.72113037109375, -67.5648193359375, -63.40849304199219, -59.252174377441406, -55.095855712890625, -50.939537048339844, -46.78321838378906, -42.626895904541016, -38.470577239990234, -34.31425857543945, -30.15793800354004, -26.001617431640625, -21.845298767089844, -17.688980102539062, -13.532659530639648, -9.37633991241455, -5.220020294189453, -1.0637016296386719, 3.092618942260742, 7.248939514160156, 11.405258178710938, 15.561577796936035, 19.717897415161133, 23.874217987060547, 28.030536651611328, 32.18685531616211, 36.343177795410156, 40.49949645996094, 44.65581512451172, 48.8121337890625, 52.96845245361328, 57.12477493286133, 61.28109359741211, 65.43740844726562, 69.59373474121094, 73.75005340576172, 77.9063720703125, 82.06269073486328, 86.21900939941406, 90.37532806396484, 94.53164672851562, 98.68797302246094, 102.84429168701172, 107.0006103515625, 111.15692901611328, 115.31324768066406, 119.46956634521484, 123.62588500976562, 127.78221130371094, 131.9385223388672, 136.0948486328125, 140.25115966796875, 144.40748596191406]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 4.0, 6.0, 7.0, 11.0, 13.0, 8.0, 11.0, 23.0, 19.0, 16.0, 17.0, 40.0, 45.0, 60.0, 86.0, 108.0, 101.0, 73.0, 57.0, 41.0, 43.0, 29.0, 21.0, 22.0, 17.0, 14.0, 19.0, 10.0, 10.0, 14.0, 9.0, 6.0, 9.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.4140625, -9.10400390625, -8.7939453125, -8.48388671875, -8.173828125, -7.86376953125, -7.5537109375, -7.24365234375, -6.93359375, -6.62353515625, -6.3134765625, -6.00341796875, -5.693359375, -5.38330078125, -5.0732421875, -4.76318359375, -4.453125, -4.14306640625, -3.8330078125, -3.52294921875, -3.212890625, -2.90283203125, -2.5927734375, -2.28271484375, -1.97265625, -1.66259765625, -1.3525390625, -1.04248046875, -0.732421875, -0.42236328125, -0.1123046875, 0.19775390625, 0.5078125, 0.81787109375, 1.1279296875, 1.43798828125, 1.748046875, 2.05810546875, 2.3681640625, 2.67822265625, 2.98828125, 3.29833984375, 3.6083984375, 3.91845703125, 4.228515625, 4.53857421875, 4.8486328125, 5.15869140625, 5.46875, 5.77880859375, 6.0888671875, 6.39892578125, 6.708984375, 7.01904296875, 7.3291015625, 7.63916015625, 7.94921875, 8.25927734375, 8.5693359375, 8.87939453125, 9.189453125, 9.49951171875, 9.8095703125, 10.11962890625, 10.4296875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 4.0, 7.0, 9.0, 11.0, 15.0, 29.0, 44.0, 54.0, 80.0, 105.0, 128.0, 156.0, 270.0, 398.0, 602.0, 878.0, 1353.0, 2231.0, 3736.0, 6684.0, 13309.0, 37672.0, 481680.0, 3393357.0, 195460.0, 27874.0, 11931.0, 6384.0, 3601.0, 2235.0, 1322.0, 900.0, 554.0, 390.0, 257.0, 175.0, 112.0, 85.0, 44.0, 43.0, 22.0, 26.0, 14.0, 14.0, 10.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-29.3125, -28.34716796875, -27.3818359375, -26.41650390625, -25.451171875, -24.48583984375, -23.5205078125, -22.55517578125, -21.58984375, -20.62451171875, -19.6591796875, -18.69384765625, -17.728515625, -16.76318359375, -15.7978515625, -14.83251953125, -13.8671875, -12.90185546875, -11.9365234375, -10.97119140625, -10.005859375, -9.04052734375, -8.0751953125, -7.10986328125, -6.14453125, -5.17919921875, -4.2138671875, -3.24853515625, -2.283203125, -1.31787109375, -0.3525390625, 0.61279296875, 1.578125, 2.54345703125, 3.5087890625, 4.47412109375, 5.439453125, 6.40478515625, 7.3701171875, 8.33544921875, 9.30078125, 10.26611328125, 11.2314453125, 12.19677734375, 13.162109375, 14.12744140625, 15.0927734375, 16.05810546875, 17.0234375, 17.98876953125, 18.9541015625, 19.91943359375, 20.884765625, 21.85009765625, 22.8154296875, 23.78076171875, 24.74609375, 25.71142578125, 26.6767578125, 27.64208984375, 28.607421875, 29.57275390625, 30.5380859375, 31.50341796875, 32.46875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 6.0, 4.0, 5.0, 10.0, 9.0, 6.0, 20.0, 12.0, 18.0, 25.0, 31.0, 49.0, 52.0, 46.0, 88.0, 109.0, 236.0, 401.0, 660.0, 783.0, 593.0, 324.0, 186.0, 89.0, 63.0, 40.0, 42.0, 26.0, 26.0, 15.0, 23.0, 15.0, 18.0, 11.0, 6.0, 6.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-28.46875, -27.5576171875, -26.646484375, -25.7353515625, -24.82421875, -23.9130859375, -23.001953125, -22.0908203125, -21.1796875, -20.2685546875, -19.357421875, -18.4462890625, -17.53515625, -16.6240234375, -15.712890625, -14.8017578125, -13.890625, -12.9794921875, -12.068359375, -11.1572265625, -10.24609375, -9.3349609375, -8.423828125, -7.5126953125, -6.6015625, -5.6904296875, -4.779296875, -3.8681640625, -2.95703125, -2.0458984375, -1.134765625, -0.2236328125, 0.6875, 1.5986328125, 2.509765625, 3.4208984375, 4.33203125, 5.2431640625, 6.154296875, 7.0654296875, 7.9765625, 8.8876953125, 9.798828125, 10.7099609375, 11.62109375, 12.5322265625, 13.443359375, 14.3544921875, 15.265625, 16.1767578125, 17.087890625, 17.9990234375, 18.91015625, 19.8212890625, 20.732421875, 21.6435546875, 22.5546875, 23.4658203125, 24.376953125, 25.2880859375, 26.19921875, 27.1103515625, 28.021484375, 28.9326171875, 29.84375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 8.0, 11.0, 17.0, 8.0, 20.0, 26.0, 20.0, 25.0, 53.0, 40.0, 71.0, 119.0, 124.0, 227.0, 391.0, 848.0, 2284.0, 6817.0, 26358.0, 165688.0, 3781773.0, 171036.0, 27069.0, 6961.0, 2279.0, 863.0, 371.0, 221.0, 138.0, 76.0, 59.0, 55.0, 51.0, 41.0, 28.0, 17.0, 22.0, 8.0, 6.0, 6.0, 6.0, 9.0, 5.0, 5.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-81.625, -79.0341796875, -76.443359375, -73.8525390625, -71.26171875, -68.6708984375, -66.080078125, -63.4892578125, -60.8984375, -58.3076171875, -55.716796875, -53.1259765625, -50.53515625, -47.9443359375, -45.353515625, -42.7626953125, -40.171875, -37.5810546875, -34.990234375, -32.3994140625, -29.80859375, -27.2177734375, -24.626953125, -22.0361328125, -19.4453125, -16.8544921875, -14.263671875, -11.6728515625, -9.08203125, -6.4912109375, -3.900390625, -1.3095703125, 1.28125, 3.8720703125, 6.462890625, 9.0537109375, 11.64453125, 14.2353515625, 16.826171875, 19.4169921875, 22.0078125, 24.5986328125, 27.189453125, 29.7802734375, 32.37109375, 34.9619140625, 37.552734375, 40.1435546875, 42.734375, 45.3251953125, 47.916015625, 50.5068359375, 53.09765625, 55.6884765625, 58.279296875, 60.8701171875, 63.4609375, 66.0517578125, 68.642578125, 71.2333984375, 73.82421875, 76.4150390625, 79.005859375, 81.5966796875, 84.1875]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 5.0, 9.0, 26.0, 22.0, 56.0, 85.0, 184.0, 248.0, 152.0, 102.0, 46.0, 31.0, 23.0, 6.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.32012939453125, -82.11811065673828, -77.91609191894531, -73.71407318115234, -69.51205444335938, -65.31004333496094, -61.10802459716797, -56.906005859375, -52.70398712158203, -48.50196838378906, -44.299949645996094, -40.09793472290039, -35.89591598510742, -31.693897247314453, -27.491880416870117, -23.28986358642578, -19.087844848632812, -14.88582706451416, -10.683809280395508, -6.4817914962768555, -2.279773712158203, 1.9222450256347656, 6.124261856079102, 10.326278686523438, 14.528297424316406, 18.730316162109375, 22.93233299255371, 27.134349822998047, 31.336368560791016, 35.538387298583984, 39.74040222167969, 43.942420959472656, 48.144439697265625, 52.346458435058594, 56.54847717285156, 60.750492095947266, 64.9525146484375, 69.15452575683594, 73.3565444946289, 77.55856323242188, 81.76058197021484, 85.96260070800781, 90.16461944580078, 94.36663818359375, 98.56864929199219, 102.77067565917969, 106.97268676757812, 111.1747055053711, 115.37672424316406, 119.57874298095703, 123.78076171875, 127.98278045654297, 132.18479919433594, 136.38681030273438, 140.58883666992188, 144.7908477783203, 148.99285888671875, 153.1948699951172, 157.3968963623047, 161.59890747070312, 165.80093383789062, 170.00294494628906, 174.20497131347656, 178.406982421875, 182.6090087890625]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 11.0, 9.0, 14.0, 6.0, 13.0, 22.0, 14.0, 21.0, 31.0, 25.0, 24.0, 29.0, 31.0, 31.0, 52.0, 38.0, 40.0, 49.0, 51.0, 47.0, 34.0, 36.0, 34.0, 39.0, 44.0, 37.0, 29.0, 24.0, 26.0, 23.0, 20.0, 18.0, 17.0, 13.0, 17.0, 5.0, 8.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-98.53227233886719, -95.51553344726562, -92.49879455566406, -89.4820556640625, -86.46531677246094, -83.4485855102539, -80.43184661865234, -77.41510772705078, -74.39836883544922, -71.38162994384766, -68.3648910522461, -65.34815216064453, -62.331417083740234, -59.31467819213867, -56.297943115234375, -53.28120422363281, -50.26446533203125, -47.24772644042969, -44.230987548828125, -41.21425247192383, -38.197513580322266, -35.1807746887207, -32.164039611816406, -29.147300720214844, -26.13056182861328, -23.11382293701172, -20.09708595275879, -17.08034896850586, -14.063610076904297, -11.04687213897705, -8.030134201049805, -5.013397216796875, -1.9966583251953125, 1.0200796127319336, 4.03681755065918, 7.053555488586426, 10.070293426513672, 13.087031364440918, 16.103769302368164, 19.120506286621094, 22.137245178222656, 25.15398406982422, 28.17072105407715, 31.187458038330078, 34.20419692993164, 37.2209358215332, 40.2376708984375, 43.25440979003906, 46.271148681640625, 49.28788757324219, 52.30462646484375, 55.32136154174805, 58.33810043334961, 61.35483932495117, 64.37157440185547, 67.38831329345703, 70.4050521850586, 73.42179107666016, 76.43852996826172, 79.45526885986328, 82.47200012207031, 85.48873901367188, 88.50547790527344, 91.522216796875, 94.53895568847656]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 6.0, 9.0, 9.0, 8.0, 14.0, 13.0, 13.0, 31.0, 28.0, 34.0, 30.0, 57.0, 62.0, 60.0, 75.0, 74.0, 66.0, 60.0, 61.0, 55.0, 27.0, 33.0, 35.0, 20.0, 20.0, 19.0, 13.0, 20.0, 9.0, 8.0, 4.0, 4.0, 7.0, 6.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6328125, -10.287841796875, -9.94287109375, -9.597900390625, -9.2529296875, -8.907958984375, -8.56298828125, -8.218017578125, -7.873046875, -7.528076171875, -7.18310546875, -6.838134765625, -6.4931640625, -6.148193359375, -5.80322265625, -5.458251953125, -5.11328125, -4.768310546875, -4.42333984375, -4.078369140625, -3.7333984375, -3.388427734375, -3.04345703125, -2.698486328125, -2.353515625, -2.008544921875, -1.66357421875, -1.318603515625, -0.9736328125, -0.628662109375, -0.28369140625, 0.061279296875, 0.40625, 0.751220703125, 1.09619140625, 1.441162109375, 1.7861328125, 2.131103515625, 2.47607421875, 2.821044921875, 3.166015625, 3.510986328125, 3.85595703125, 4.200927734375, 4.5458984375, 4.890869140625, 5.23583984375, 5.580810546875, 5.92578125, 6.270751953125, 6.61572265625, 6.960693359375, 7.3056640625, 7.650634765625, 7.99560546875, 8.340576171875, 8.685546875, 9.030517578125, 9.37548828125, 9.720458984375, 10.0654296875, 10.410400390625, 10.75537109375, 11.100341796875, 11.4453125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 12.0, 14.0, 17.0, 42.0, 39.0, 57.0, 94.0, 121.0, 171.0, 277.0, 344.0, 493.0, 667.0, 920.0, 1331.0, 1903.0, 2991.0, 4489.0, 6866.0, 10835.0, 18452.0, 32866.0, 64598.0, 148587.0, 325822.0, 225996.0, 93543.0, 44193.0, 23773.0, 13738.0, 8494.0, 5386.0, 3556.0, 2406.0, 1620.0, 1072.0, 831.0, 534.0, 422.0, 279.0, 183.0, 164.0, 107.0, 76.0, 53.0, 46.0, 20.0, 16.0, 12.0, 13.0, 2.0, 4.0, 2.0, 0.0, 1.0, 4.0, 1.0], "bins": [-1.0390625, -1.006317138671875, -0.97357177734375, -0.940826416015625, -0.9080810546875, -0.875335693359375, -0.84259033203125, -0.809844970703125, -0.777099609375, -0.744354248046875, -0.71160888671875, -0.678863525390625, -0.6461181640625, -0.613372802734375, -0.58062744140625, -0.547882080078125, -0.51513671875, -0.482391357421875, -0.44964599609375, -0.416900634765625, -0.3841552734375, -0.351409912109375, -0.31866455078125, -0.285919189453125, -0.253173828125, -0.220428466796875, -0.18768310546875, -0.154937744140625, -0.1221923828125, -0.089447021484375, -0.05670166015625, -0.023956298828125, 0.0087890625, 0.041534423828125, 0.07427978515625, 0.107025146484375, 0.1397705078125, 0.172515869140625, 0.20526123046875, 0.238006591796875, 0.270751953125, 0.303497314453125, 0.33624267578125, 0.368988037109375, 0.4017333984375, 0.434478759765625, 0.46722412109375, 0.499969482421875, 0.53271484375, 0.565460205078125, 0.59820556640625, 0.630950927734375, 0.6636962890625, 0.696441650390625, 0.72918701171875, 0.761932373046875, 0.794677734375, 0.827423095703125, 0.86016845703125, 0.892913818359375, 0.9256591796875, 0.958404541015625, 0.99114990234375, 1.023895263671875, 1.056640625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 10.0, 8.0, 6.0, 10.0, 6.0, 12.0, 8.0, 23.0, 21.0, 16.0, 22.0, 23.0, 20.0, 19.0, 33.0, 26.0, 37.0, 27.0, 40.0, 36.0, 39.0, 39.0, 1056.0, 35.0, 45.0, 40.0, 42.0, 41.0, 32.0, 21.0, 19.0, 20.0, 25.0, 21.0, 15.0, 21.0, 19.0, 18.0, 12.0, 11.0, 10.0, 5.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-5.01171875, -4.8643798828125, -4.717041015625, -4.5697021484375, -4.42236328125, -4.2750244140625, -4.127685546875, -3.9803466796875, -3.8330078125, -3.6856689453125, -3.538330078125, -3.3909912109375, -3.24365234375, -3.0963134765625, -2.948974609375, -2.8016357421875, -2.654296875, -2.5069580078125, -2.359619140625, -2.2122802734375, -2.06494140625, -1.9176025390625, -1.770263671875, -1.6229248046875, -1.4755859375, -1.3282470703125, -1.180908203125, -1.0335693359375, -0.88623046875, -0.7388916015625, -0.591552734375, -0.4442138671875, -0.296875, -0.1495361328125, -0.002197265625, 0.1451416015625, 0.29248046875, 0.4398193359375, 0.587158203125, 0.7344970703125, 0.8818359375, 1.0291748046875, 1.176513671875, 1.3238525390625, 1.47119140625, 1.6185302734375, 1.765869140625, 1.9132080078125, 2.060546875, 2.2078857421875, 2.355224609375, 2.5025634765625, 2.64990234375, 2.7972412109375, 2.944580078125, 3.0919189453125, 3.2392578125, 3.3865966796875, 3.533935546875, 3.6812744140625, 3.82861328125, 3.9759521484375, 4.123291015625, 4.2706298828125, 4.41796875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 5.0, 6.0, 12.0, 12.0, 31.0, 55.0, 76.0, 116.0, 174.0, 259.0, 400.0, 579.0, 855.0, 1238.0, 1783.0, 2665.0, 3875.0, 5694.0, 8397.0, 12192.0, 18147.0, 26811.0, 40711.0, 64764.0, 106952.0, 202669.0, 1231618.0, 136620.0, 80462.0, 49767.0, 32694.0, 21568.0, 14531.0, 9897.0, 6739.0, 4687.0, 3225.0, 2187.0, 1521.0, 1016.0, 714.0, 464.0, 328.0, 204.0, 143.0, 93.0, 60.0, 43.0, 23.0, 17.0, 11.0, 7.0, 5.0, 8.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.416015625, -0.402252197265625, -0.38848876953125, -0.374725341796875, -0.3609619140625, -0.347198486328125, -0.33343505859375, -0.319671630859375, -0.305908203125, -0.292144775390625, -0.27838134765625, -0.264617919921875, -0.2508544921875, -0.237091064453125, -0.22332763671875, -0.209564208984375, -0.19580078125, -0.182037353515625, -0.16827392578125, -0.154510498046875, -0.1407470703125, -0.126983642578125, -0.11322021484375, -0.099456787109375, -0.085693359375, -0.071929931640625, -0.05816650390625, -0.044403076171875, -0.0306396484375, -0.016876220703125, -0.00311279296875, 0.010650634765625, 0.0244140625, 0.038177490234375, 0.05194091796875, 0.065704345703125, 0.0794677734375, 0.093231201171875, 0.10699462890625, 0.120758056640625, 0.134521484375, 0.148284912109375, 0.16204833984375, 0.175811767578125, 0.1895751953125, 0.203338623046875, 0.21710205078125, 0.230865478515625, 0.24462890625, 0.258392333984375, 0.27215576171875, 0.285919189453125, 0.2996826171875, 0.313446044921875, 0.32720947265625, 0.340972900390625, 0.354736328125, 0.368499755859375, 0.38226318359375, 0.396026611328125, 0.4097900390625, 0.423553466796875, 0.43731689453125, 0.451080322265625, 0.46484375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 5.0, 6.0, 7.0, 10.0, 12.0, 15.0, 16.0, 19.0, 20.0, 18.0, 24.0, 32.0, 31.0, 34.0, 40.0, 37.0, 33.0, 36.0, 38.0, 44.0, 46.0, 41.0, 48.0, 37.0, 46.0, 33.0, 37.0, 31.0, 36.0, 28.0, 29.0, 14.0, 17.0, 13.0, 16.0, 5.0, 12.0, 6.0, 6.0, 7.0, 3.0, 3.0, 1.0, 4.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0209808349609375, -0.020348072052001953, -0.019715309143066406, -0.01908254623413086, -0.018449783325195312, -0.017817020416259766, -0.01718425750732422, -0.016551494598388672, -0.015918731689453125, -0.015285968780517578, -0.014653205871582031, -0.014020442962646484, -0.013387680053710938, -0.01275491714477539, -0.012122154235839844, -0.011489391326904297, -0.01085662841796875, -0.010223865509033203, -0.009591102600097656, -0.00895833969116211, -0.008325576782226562, -0.007692813873291016, -0.007060050964355469, -0.006427288055419922, -0.005794525146484375, -0.005161762237548828, -0.004528999328613281, -0.0038962364196777344, -0.0032634735107421875, -0.0026307106018066406, -0.0019979476928710938, -0.0013651847839355469, -0.000732421875, -9.965896606445312e-05, 0.0005331039428710938, 0.0011658668518066406, 0.0017986297607421875, 0.0024313926696777344, 0.0030641555786132812, 0.003696918487548828, 0.004329681396484375, 0.004962444305419922, 0.005595207214355469, 0.006227970123291016, 0.0068607330322265625, 0.007493495941162109, 0.008126258850097656, 0.008759021759033203, 0.00939178466796875, 0.010024547576904297, 0.010657310485839844, 0.01129007339477539, 0.011922836303710938, 0.012555599212646484, 0.013188362121582031, 0.013821125030517578, 0.014453887939453125, 0.015086650848388672, 0.01571941375732422, 0.016352176666259766, 0.016984939575195312, 0.01761770248413086, 0.018250465393066406, 0.018883228302001953, 0.0195159912109375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 3.0, 5.0, 4.0, 12.0, 13.0, 6.0, 13.0, 20.0, 21.0, 27.0, 42.0, 54.0, 65.0, 111.0, 159.0, 211.0, 314.0, 496.0, 988.0, 1004028.0, 39967.0, 627.0, 393.0, 287.0, 190.0, 128.0, 92.0, 51.0, 40.0, 48.0, 22.0, 24.0, 16.0, 17.0, 13.0, 10.0, 6.0, 10.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5166015625, -0.4998321533203125, -0.483062744140625, -0.4662933349609375, -0.44952392578125, -0.4327545166015625, -0.415985107421875, -0.3992156982421875, -0.3824462890625, -0.3656768798828125, -0.348907470703125, -0.3321380615234375, -0.31536865234375, -0.2985992431640625, -0.281829833984375, -0.2650604248046875, -0.248291015625, -0.2315216064453125, -0.214752197265625, -0.1979827880859375, -0.18121337890625, -0.1644439697265625, -0.147674560546875, -0.1309051513671875, -0.1141357421875, -0.0973663330078125, -0.080596923828125, -0.0638275146484375, -0.04705810546875, -0.0302886962890625, -0.013519287109375, 0.0032501220703125, 0.02001953125, 0.0367889404296875, 0.053558349609375, 0.0703277587890625, 0.08709716796875, 0.1038665771484375, 0.120635986328125, 0.1374053955078125, 0.1541748046875, 0.1709442138671875, 0.187713623046875, 0.2044830322265625, 0.22125244140625, 0.2380218505859375, 0.254791259765625, 0.2715606689453125, 0.288330078125, 0.3050994873046875, 0.321868896484375, 0.3386383056640625, 0.35540771484375, 0.3721771240234375, 0.388946533203125, 0.4057159423828125, 0.4224853515625, 0.4392547607421875, 0.456024169921875, 0.4727935791015625, 0.48956298828125, 0.5063323974609375, 0.523101806640625, 0.5398712158203125, 0.556640625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 929.0, 84.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5500984191894531, -0.527895450592041, -0.5056924819946289, -0.4834895431995392, -0.4612865746021271, -0.43908363580703735, -0.41688066720962524, -0.39467769861221313, -0.372474730014801, -0.3502717614173889, -0.3280688226222992, -0.3058658540248871, -0.283662885427475, -0.26145994663238525, -0.23925697803497314, -0.21705400943756104, -0.1948510706424713, -0.1726481169462204, -0.1504451483488083, -0.12824219465255737, -0.10603923350572586, -0.08383627235889435, -0.06163331866264343, -0.03943035006523132, -0.017227396368980408, 0.0049755629152059555, 0.02717852219939232, 0.04938147962093353, 0.07158444076776505, 0.09378740191459656, 0.11599035561084747, 0.13819332420825958, 0.1603962779045105, 0.1825992316007614, 0.20480220019817352, 0.22700515389442444, 0.24920812249183655, 0.27141106128692627, 0.2936140298843384, 0.3158169984817505, 0.3380199670791626, 0.3602229356765747, 0.38242587447166443, 0.40462884306907654, 0.42683181166648865, 0.44903475046157837, 0.4712377190589905, 0.4934406876564026, 0.5156435966491699, 0.537846565246582, 0.5600495338439941, 0.5822525024414062, 0.6044554114341736, 0.6266583800315857, 0.6488613486289978, 0.6710643172264099, 0.693267285823822, 0.7154702544212341, 0.7376732230186462, 0.7598761320114136, 0.7820791006088257, 0.8042820692062378, 0.8264850378036499, 0.848688006401062, 0.8708909749984741]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 9.0, 7.0, 11.0, 7.0, 17.0, 22.0, 25.0, 39.0, 64.0, 46.0, 39.0, 70.0, 71.0, 54.0, 59.0, 66.0, 57.0, 63.0, 61.0, 56.0, 44.0, 32.0, 26.0, 22.0, 12.0, 5.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1001366376876831, -0.09781963378190994, -0.09550262987613678, -0.09318562597036362, -0.09086862206459045, -0.08855162560939789, -0.08623462170362473, -0.08391761779785156, -0.0816006138920784, -0.07928360998630524, -0.07696660608053207, -0.07464960217475891, -0.07233260571956635, -0.07001560181379318, -0.06769859790802002, -0.06538159400224686, -0.0630645900964737, -0.06074758619070053, -0.05843058228492737, -0.056113582104444504, -0.05379657819867134, -0.05147957429289818, -0.049162574112415314, -0.04684557020664215, -0.04452856630086899, -0.042211562395095825, -0.03989455848932266, -0.0375775583088398, -0.035260554403066635, -0.03294355049729347, -0.03062654845416546, -0.028309546411037445, -0.025992542505264282, -0.02367553859949112, -0.021358536556363106, -0.019041534513235092, -0.01672453060746193, -0.014407527633011341, -0.012090524658560753, -0.00977352261543274, -0.007456518709659576, -0.005139515735208988, -0.0028225127607584, -0.0005055097863078117, 0.0018114931881427765, 0.004128496162593365, 0.006445499137043953, 0.008762501180171967, 0.01107950508594513, 0.013396508060395718, 0.015713511034846306, 0.01803051307797432, 0.020347516983747482, 0.022664520889520645, 0.02498152293264866, 0.027298524975776672, 0.029615528881549835, 0.031932532787323, 0.03424953669309616, 0.036566536873579025, 0.03888354077935219, 0.04120054468512535, 0.043517544865608215, 0.04583454877138138, 0.04815155267715454]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 6.0, 9.0, 9.0, 8.0, 14.0, 13.0, 12.0, 32.0, 28.0, 34.0, 30.0, 57.0, 62.0, 60.0, 75.0, 74.0, 66.0, 60.0, 61.0, 55.0, 27.0, 33.0, 35.0, 20.0, 20.0, 19.0, 13.0, 20.0, 9.0, 8.0, 4.0, 4.0, 7.0, 6.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6328125, -10.287841796875, -9.94287109375, -9.597900390625, -9.2529296875, -8.907958984375, -8.56298828125, -8.218017578125, -7.873046875, -7.528076171875, -7.18310546875, -6.838134765625, -6.4931640625, -6.148193359375, -5.80322265625, -5.458251953125, -5.11328125, -4.768310546875, -4.42333984375, -4.078369140625, -3.7333984375, -3.388427734375, -3.04345703125, -2.698486328125, -2.353515625, -2.008544921875, -1.66357421875, -1.318603515625, -0.9736328125, -0.628662109375, -0.28369140625, 0.061279296875, 0.40625, 0.751220703125, 1.09619140625, 1.441162109375, 1.7861328125, 2.131103515625, 2.47607421875, 2.821044921875, 3.166015625, 3.510986328125, 3.85595703125, 4.200927734375, 4.5458984375, 4.890869140625, 5.23583984375, 5.580810546875, 5.92578125, 6.270751953125, 6.61572265625, 6.960693359375, 7.3056640625, 7.650634765625, 7.99560546875, 8.340576171875, 8.685546875, 9.030517578125, 9.37548828125, 9.720458984375, 10.0654296875, 10.410400390625, 10.75537109375, 11.100341796875, 11.4453125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 6.0, 6.0, 9.0, 21.0, 26.0, 27.0, 47.0, 77.0, 84.0, 109.0, 186.0, 245.0, 370.0, 503.0, 849.0, 1229.0, 2019.0, 3340.0, 6277.0, 13250.0, 39339.0, 327918.0, 570727.0, 49799.0, 15466.0, 6798.0, 3676.0, 2077.0, 1313.0, 893.0, 564.0, 398.0, 258.0, 171.0, 150.0, 90.0, 59.0, 55.0, 48.0, 21.0, 17.0, 12.0, 13.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.453125, -30.407470703125, -29.36181640625, -28.316162109375, -27.2705078125, -26.224853515625, -25.17919921875, -24.133544921875, -23.087890625, -22.042236328125, -20.99658203125, -19.950927734375, -18.9052734375, -17.859619140625, -16.81396484375, -15.768310546875, -14.72265625, -13.677001953125, -12.63134765625, -11.585693359375, -10.5400390625, -9.494384765625, -8.44873046875, -7.403076171875, -6.357421875, -5.311767578125, -4.26611328125, -3.220458984375, -2.1748046875, -1.129150390625, -0.08349609375, 0.962158203125, 2.0078125, 3.053466796875, 4.09912109375, 5.144775390625, 6.1904296875, 7.236083984375, 8.28173828125, 9.327392578125, 10.373046875, 11.418701171875, 12.46435546875, 13.510009765625, 14.5556640625, 15.601318359375, 16.64697265625, 17.692626953125, 18.73828125, 19.783935546875, 20.82958984375, 21.875244140625, 22.9208984375, 23.966552734375, 25.01220703125, 26.057861328125, 27.103515625, 28.149169921875, 29.19482421875, 30.240478515625, 31.2861328125, 32.331787109375, 33.37744140625, 34.423095703125, 35.46875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 6.0, 8.0, 6.0, 7.0, 11.0, 9.0, 21.0, 15.0, 19.0, 26.0, 23.0, 28.0, 29.0, 37.0, 33.0, 37.0, 52.0, 66.0, 84.0, 136.0, 1698.0, 172.0, 80.0, 61.0, 54.0, 42.0, 24.0, 27.0, 42.0, 20.0, 31.0, 25.0, 21.0, 19.0, 11.0, 6.0, 15.0, 10.0, 6.0, 6.0, 5.0, 7.0, 1.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-29.6875, -28.804443359375, -27.92138671875, -27.038330078125, -26.1552734375, -25.272216796875, -24.38916015625, -23.506103515625, -22.623046875, -21.739990234375, -20.85693359375, -19.973876953125, -19.0908203125, -18.207763671875, -17.32470703125, -16.441650390625, -15.55859375, -14.675537109375, -13.79248046875, -12.909423828125, -12.0263671875, -11.143310546875, -10.26025390625, -9.377197265625, -8.494140625, -7.611083984375, -6.72802734375, -5.844970703125, -4.9619140625, -4.078857421875, -3.19580078125, -2.312744140625, -1.4296875, -0.546630859375, 0.33642578125, 1.219482421875, 2.1025390625, 2.985595703125, 3.86865234375, 4.751708984375, 5.634765625, 6.517822265625, 7.40087890625, 8.283935546875, 9.1669921875, 10.050048828125, 10.93310546875, 11.816162109375, 12.69921875, 13.582275390625, 14.46533203125, 15.348388671875, 16.2314453125, 17.114501953125, 17.99755859375, 18.880615234375, 19.763671875, 20.646728515625, 21.52978515625, 22.412841796875, 23.2958984375, 24.178955078125, 25.06201171875, 25.945068359375, 26.828125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 2.0, 7.0, 5.0, 9.0, 15.0, 5.0, 17.0, 20.0, 21.0, 20.0, 16.0, 34.0, 32.0, 36.0, 59.0, 118.0, 175.0, 519.0, 4826.0, 3073946.0, 63939.0, 1080.0, 300.0, 122.0, 76.0, 55.0, 38.0, 33.0, 25.0, 19.0, 22.0, 20.0, 15.0, 8.0, 12.0, 8.0, 7.0, 5.0, 8.0, 8.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.5, -123.3515625, -119.203125, -115.0546875, -110.90625, -106.7578125, -102.609375, -98.4609375, -94.3125, -90.1640625, -86.015625, -81.8671875, -77.71875, -73.5703125, -69.421875, -65.2734375, -61.125, -56.9765625, -52.828125, -48.6796875, -44.53125, -40.3828125, -36.234375, -32.0859375, -27.9375, -23.7890625, -19.640625, -15.4921875, -11.34375, -7.1953125, -3.046875, 1.1015625, 5.25, 9.3984375, 13.546875, 17.6953125, 21.84375, 25.9921875, 30.140625, 34.2890625, 38.4375, 42.5859375, 46.734375, 50.8828125, 55.03125, 59.1796875, 63.328125, 67.4765625, 71.625, 75.7734375, 79.921875, 84.0703125, 88.21875, 92.3671875, 96.515625, 100.6640625, 104.8125, 108.9609375, 113.109375, 117.2578125, 121.40625, 125.5546875, 129.703125, 133.8515625, 138.0]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 971.0, 42.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-937.2486572265625, -917.9788818359375, -898.7090454101562, -879.4392700195312, -860.16943359375, -840.899658203125, -821.6298217773438, -802.3600463867188, -783.0902099609375, -763.8204345703125, -744.5505981445312, -725.2808227539062, -706.010986328125, -686.7412109375, -667.4713745117188, -648.2015991210938, -628.9318237304688, -609.6620483398438, -590.3922119140625, -571.1224365234375, -551.8526000976562, -532.5828247070312, -513.31298828125, -494.043212890625, -474.7734069824219, -455.50360107421875, -436.2337951660156, -416.9639892578125, -397.6942138671875, -378.42437744140625, -359.15460205078125, -339.8847961425781, -320.6149597167969, -301.34515380859375, -282.0753479003906, -262.8055419921875, -243.53575134277344, -224.2659454345703, -204.99615478515625, -185.72634887695312, -166.45654296875, -147.18673706054688, -127.91693878173828, -108.64714050292969, -89.37733459472656, -70.10752868652344, -50.837730407714844, -31.56793212890625, -12.298126220703125, 6.971675872802734, 26.241477966308594, 45.51128005981445, 64.78108215332031, 84.05088806152344, 103.32068634033203, 122.59048461914062, 141.86029052734375, 161.13009643554688, 180.39990234375, 199.66969299316406, 218.9394989013672, 238.2093048095703, 257.4790954589844, 276.7489013671875, 296.0187072753906]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 6.0, 4.0, 9.0, 7.0, 11.0, 13.0, 17.0, 14.0, 14.0, 22.0, 24.0, 35.0, 25.0, 29.0, 21.0, 31.0, 36.0, 43.0, 38.0, 35.0, 47.0, 31.0, 41.0, 47.0, 41.0, 27.0, 37.0, 32.0, 24.0, 40.0, 38.0, 24.0, 25.0, 13.0, 11.0, 10.0, 13.0, 15.0, 12.0, 6.0, 8.0, 8.0, 5.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.83245086669922, -90.99108123779297, -88.14971923828125, -85.308349609375, -82.46697998046875, -79.62561798095703, -76.78424835205078, -73.94288635253906, -71.10151672363281, -68.26014709472656, -65.41878509521484, -62.577415466308594, -59.73604965209961, -56.894683837890625, -54.053314208984375, -51.21194839477539, -48.370582580566406, -45.52921676635742, -42.68785095214844, -39.84648132324219, -37.0051155090332, -34.16374969482422, -31.3223819732666, -28.481014251708984, -25.6396484375, -22.798282623291016, -19.9569149017334, -17.11554718017578, -14.274181365966797, -11.432814598083496, -8.591447830200195, -5.750080108642578, -2.908721923828125, -0.06735515594482422, 2.7740116119384766, 5.615378379821777, 8.456745147705078, 11.298111915588379, 14.13947868347168, 16.980846405029297, 19.82221221923828, 22.663578033447266, 25.504945755004883, 28.3463134765625, 31.187679290771484, 34.02904510498047, 36.87041473388672, 39.7117805480957, 42.55314636230469, 45.39451217651367, 48.235877990722656, 51.077247619628906, 53.91861343383789, 56.759979248046875, 59.601348876953125, 62.44271469116211, 65.2840805053711, 68.12545013427734, 70.96681213378906, 73.80818176269531, 76.64955139160156, 79.49091339111328, 82.33228302001953, 85.17364501953125, 88.0150146484375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 8.0, 7.0, 5.0, 6.0, 14.0, 14.0, 12.0, 21.0, 33.0, 36.0, 31.0, 40.0, 53.0, 65.0, 66.0, 76.0, 84.0, 69.0, 61.0, 46.0, 34.0, 38.0, 32.0, 24.0, 21.0, 19.0, 15.0, 21.0, 12.0, 9.0, 1.0, 7.0, 8.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1953125, -10.8250732421875, -10.454833984375, -10.0845947265625, -9.71435546875, -9.3441162109375, -8.973876953125, -8.6036376953125, -8.2333984375, -7.8631591796875, -7.492919921875, -7.1226806640625, -6.75244140625, -6.3822021484375, -6.011962890625, -5.6417236328125, -5.271484375, -4.9012451171875, -4.531005859375, -4.1607666015625, -3.79052734375, -3.4202880859375, -3.050048828125, -2.6798095703125, -2.3095703125, -1.9393310546875, -1.569091796875, -1.1988525390625, -0.82861328125, -0.4583740234375, -0.088134765625, 0.2821044921875, 0.65234375, 1.0225830078125, 1.392822265625, 1.7630615234375, 2.13330078125, 2.5035400390625, 2.873779296875, 3.2440185546875, 3.6142578125, 3.9844970703125, 4.354736328125, 4.7249755859375, 5.09521484375, 5.4654541015625, 5.835693359375, 6.2059326171875, 6.576171875, 6.9464111328125, 7.316650390625, 7.6868896484375, 8.05712890625, 8.4273681640625, 8.797607421875, 9.1678466796875, 9.5380859375, 9.9083251953125, 10.278564453125, 10.6488037109375, 11.01904296875, 11.3892822265625, 11.759521484375, 12.1297607421875, 12.5]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 3.0, 10.0, 15.0, 22.0, 23.0, 41.0, 45.0, 74.0, 99.0, 186.0, 251.0, 462.0, 722.0, 1303.0, 2501.0, 5252.0, 12910.0, 54356.0, 2474029.0, 1576471.0, 41683.0, 12439.0, 5330.0, 2612.0, 1367.0, 757.0, 499.0, 264.0, 178.0, 121.0, 71.0, 46.0, 37.0, 25.0, 18.0, 19.0, 8.0, 13.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.125, -38.78515625, -37.4453125, -36.10546875, -34.765625, -33.42578125, -32.0859375, -30.74609375, -29.40625, -28.06640625, -26.7265625, -25.38671875, -24.046875, -22.70703125, -21.3671875, -20.02734375, -18.6875, -17.34765625, -16.0078125, -14.66796875, -13.328125, -11.98828125, -10.6484375, -9.30859375, -7.96875, -6.62890625, -5.2890625, -3.94921875, -2.609375, -1.26953125, 0.0703125, 1.41015625, 2.75, 4.08984375, 5.4296875, 6.76953125, 8.109375, 9.44921875, 10.7890625, 12.12890625, 13.46875, 14.80859375, 16.1484375, 17.48828125, 18.828125, 20.16796875, 21.5078125, 22.84765625, 24.1875, 25.52734375, 26.8671875, 28.20703125, 29.546875, 30.88671875, 32.2265625, 33.56640625, 34.90625, 36.24609375, 37.5859375, 38.92578125, 40.265625, 41.60546875, 42.9453125, 44.28515625, 45.625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 11.0, 5.0, 8.0, 12.0, 12.0, 12.0, 19.0, 17.0, 22.0, 23.0, 27.0, 55.0, 59.0, 88.0, 151.0, 313.0, 528.0, 756.0, 758.0, 417.0, 287.0, 155.0, 65.0, 59.0, 35.0, 30.0, 30.0, 20.0, 14.0, 10.0, 10.0, 8.0, 9.0, 8.0, 9.0, 3.0, 3.0, 5.0, 1.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-28.828125, -27.924072265625, -27.02001953125, -26.115966796875, -25.2119140625, -24.307861328125, -23.40380859375, -22.499755859375, -21.595703125, -20.691650390625, -19.78759765625, -18.883544921875, -17.9794921875, -17.075439453125, -16.17138671875, -15.267333984375, -14.36328125, -13.459228515625, -12.55517578125, -11.651123046875, -10.7470703125, -9.843017578125, -8.93896484375, -8.034912109375, -7.130859375, -6.226806640625, -5.32275390625, -4.418701171875, -3.5146484375, -2.610595703125, -1.70654296875, -0.802490234375, 0.1015625, 1.005615234375, 1.90966796875, 2.813720703125, 3.7177734375, 4.621826171875, 5.52587890625, 6.429931640625, 7.333984375, 8.238037109375, 9.14208984375, 10.046142578125, 10.9501953125, 11.854248046875, 12.75830078125, 13.662353515625, 14.56640625, 15.470458984375, 16.37451171875, 17.278564453125, 18.1826171875, 19.086669921875, 19.99072265625, 20.894775390625, 21.798828125, 22.702880859375, 23.60693359375, 24.510986328125, 25.4150390625, 26.319091796875, 27.22314453125, 28.127197265625, 29.03125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 7.0, 9.0, 4.0, 6.0, 10.0, 10.0, 21.0, 34.0, 39.0, 45.0, 67.0, 105.0, 171.0, 263.0, 410.0, 730.0, 1127.0, 1890.0, 3069.0, 5297.0, 9380.0, 17635.0, 36546.0, 97020.0, 940385.0, 2811242.0, 169229.0, 49047.0, 22540.0, 11639.0, 6560.0, 3831.0, 2250.0, 1274.0, 816.0, 539.0, 388.0, 236.0, 146.0, 106.0, 71.0, 45.0, 23.0, 14.0, 4.0, 11.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.25, -33.953125, -32.65625, -31.359375, -30.0625, -28.765625, -27.46875, -26.171875, -24.875, -23.578125, -22.28125, -20.984375, -19.6875, -18.390625, -17.09375, -15.796875, -14.5, -13.203125, -11.90625, -10.609375, -9.3125, -8.015625, -6.71875, -5.421875, -4.125, -2.828125, -1.53125, -0.234375, 1.0625, 2.359375, 3.65625, 4.953125, 6.25, 7.546875, 8.84375, 10.140625, 11.4375, 12.734375, 14.03125, 15.328125, 16.625, 17.921875, 19.21875, 20.515625, 21.8125, 23.109375, 24.40625, 25.703125, 27.0, 28.296875, 29.59375, 30.890625, 32.1875, 33.484375, 34.78125, 36.078125, 37.375, 38.671875, 39.96875, 41.265625, 42.5625, 43.859375, 45.15625, 46.453125, 47.75]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 12.0, 16.0, 25.0, 55.0, 83.0, 221.0, 277.0, 155.0, 69.0, 39.0, 21.0, 12.0, 6.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-302.0759582519531, -296.0727233886719, -290.0694580078125, -284.06622314453125, -278.0629577636719, -272.0597229003906, -266.05645751953125, -260.05322265625, -254.0499725341797, -248.04672241210938, -242.04347229003906, -236.04022216796875, -230.0369873046875, -224.0337371826172, -218.03048706054688, -212.02723693847656, -206.02398681640625, -200.02073669433594, -194.01748657226562, -188.0142364501953, -182.010986328125, -176.00775146484375, -170.00450134277344, -164.00125122070312, -157.9980010986328, -151.9947509765625, -145.9915008544922, -139.98825073242188, -133.98501586914062, -127.98175811767578, -121.978515625, -115.97526550292969, -109.97200775146484, -103.96875762939453, -97.96551513671875, -91.96226501464844, -85.95901489257812, -79.95576477050781, -73.9525146484375, -67.94927215576172, -61.946022033691406, -55.942771911621094, -49.93952560424805, -43.936279296875, -37.93302917480469, -31.929780960083008, -25.926532745361328, -19.92328643798828, -13.920036315917969, -7.916788101196289, -1.9135398864746094, 4.08970832824707, 10.09295654296875, 16.09620475769043, 22.09945297241211, 28.102699279785156, 34.10594940185547, 40.10919952392578, 46.11244583129883, 52.115692138671875, 58.11894226074219, 64.1221923828125, 70.12544250488281, 76.1286849975586, 82.1319351196289]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 12.0, 6.0, 12.0, 12.0, 18.0, 18.0, 25.0, 27.0, 29.0, 21.0, 34.0, 34.0, 38.0, 39.0, 43.0, 37.0, 42.0, 39.0, 34.0, 58.0, 50.0, 51.0, 37.0, 23.0, 19.0, 28.0, 28.0, 24.0, 32.0, 19.0, 16.0, 18.0, 12.0, 10.0, 11.0, 6.0, 13.0, 11.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-99.378662109375, -96.53338623046875, -93.68810272216797, -90.84281921386719, -87.99754333496094, -85.15226745605469, -82.3069839477539, -79.46170043945312, -76.61642456054688, -73.77114868164062, -70.92586517333984, -68.08058166503906, -65.23530578613281, -62.3900260925293, -59.54474639892578, -56.699466705322266, -53.85418701171875, -51.008907318115234, -48.16362762451172, -45.3183479309082, -42.47306823730469, -39.62778854370117, -36.782508850097656, -33.93722915649414, -31.091949462890625, -28.24666976928711, -25.401390075683594, -22.556110382080078, -19.710830688476562, -16.865550994873047, -14.020271301269531, -11.174991607666016, -8.3297119140625, -5.484432220458984, -2.6391525268554688, 0.20612716674804688, 3.0514068603515625, 5.896686553955078, 8.741966247558594, 11.58724594116211, 14.432525634765625, 17.27780532836914, 20.123085021972656, 22.968364715576172, 25.813644409179688, 28.658924102783203, 31.50420379638672, 34.349483489990234, 37.19476318359375, 40.040042877197266, 42.88532257080078, 45.7306022644043, 48.57588195800781, 51.42116165161133, 54.266441345214844, 57.11172103881836, 59.957000732421875, 62.80228042602539, 65.6475601196289, 68.49284362792969, 71.33811950683594, 74.18339538574219, 77.02867889404297, 79.87396240234375, 82.71923828125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 2.0, 5.0, 11.0, 10.0, 12.0, 9.0, 19.0, 16.0, 26.0, 38.0, 34.0, 39.0, 45.0, 58.0, 58.0, 63.0, 55.0, 43.0, 60.0, 63.0, 47.0, 48.0, 35.0, 41.0, 38.0, 17.0, 15.0, 16.0, 15.0, 16.0, 8.0, 4.0, 10.0, 3.0, 4.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.625, -11.25048828125, -10.8759765625, -10.50146484375, -10.126953125, -9.75244140625, -9.3779296875, -9.00341796875, -8.62890625, -8.25439453125, -7.8798828125, -7.50537109375, -7.130859375, -6.75634765625, -6.3818359375, -6.00732421875, -5.6328125, -5.25830078125, -4.8837890625, -4.50927734375, -4.134765625, -3.76025390625, -3.3857421875, -3.01123046875, -2.63671875, -2.26220703125, -1.8876953125, -1.51318359375, -1.138671875, -0.76416015625, -0.3896484375, -0.01513671875, 0.359375, 0.73388671875, 1.1083984375, 1.48291015625, 1.857421875, 2.23193359375, 2.6064453125, 2.98095703125, 3.35546875, 3.72998046875, 4.1044921875, 4.47900390625, 4.853515625, 5.22802734375, 5.6025390625, 5.97705078125, 6.3515625, 6.72607421875, 7.1005859375, 7.47509765625, 7.849609375, 8.22412109375, 8.5986328125, 8.97314453125, 9.34765625, 9.72216796875, 10.0966796875, 10.47119140625, 10.845703125, 11.22021484375, 11.5947265625, 11.96923828125, 12.34375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 9.0, 13.0, 20.0, 26.0, 30.0, 65.0, 67.0, 98.0, 175.0, 270.0, 421.0, 657.0, 1032.0, 1558.0, 2585.0, 4188.0, 7074.0, 12257.0, 22600.0, 42976.0, 90700.0, 223307.0, 348733.0, 150069.0, 65281.0, 32348.0, 17409.0, 9684.0, 5719.0, 3433.0, 2083.0, 1246.0, 911.0, 525.0, 331.0, 238.0, 134.0, 89.0, 55.0, 39.0, 45.0, 17.0, 24.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2451171875, -1.2065582275390625, -1.167999267578125, -1.1294403076171875, -1.09088134765625, -1.0523223876953125, -1.013763427734375, -0.9752044677734375, -0.9366455078125, -0.8980865478515625, -0.859527587890625, -0.8209686279296875, -0.78240966796875, -0.7438507080078125, -0.705291748046875, -0.6667327880859375, -0.628173828125, -0.5896148681640625, -0.551055908203125, -0.5124969482421875, -0.47393798828125, -0.4353790283203125, -0.396820068359375, -0.3582611083984375, -0.3197021484375, -0.2811431884765625, -0.242584228515625, -0.2040252685546875, -0.16546630859375, -0.1269073486328125, -0.088348388671875, -0.0497894287109375, -0.01123046875, 0.0273284912109375, 0.065887451171875, 0.1044464111328125, 0.14300537109375, 0.1815643310546875, 0.220123291015625, 0.2586822509765625, 0.2972412109375, 0.3358001708984375, 0.374359130859375, 0.4129180908203125, 0.45147705078125, 0.4900360107421875, 0.528594970703125, 0.5671539306640625, 0.605712890625, 0.6442718505859375, 0.682830810546875, 0.7213897705078125, 0.75994873046875, 0.7985076904296875, 0.837066650390625, 0.8756256103515625, 0.9141845703125, 0.9527435302734375, 0.991302490234375, 1.0298614501953125, 1.06842041015625, 1.1069793701171875, 1.145538330078125, 1.1840972900390625, 1.22265625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 5.0, 6.0, 13.0, 10.0, 13.0, 8.0, 12.0, 20.0, 19.0, 22.0, 29.0, 50.0, 27.0, 35.0, 40.0, 47.0, 51.0, 52.0, 35.0, 1064.0, 37.0, 45.0, 48.0, 42.0, 43.0, 39.0, 28.0, 26.0, 23.0, 21.0, 22.0, 15.0, 15.0, 11.0, 14.0, 18.0, 7.0, 5.0, 6.0, 0.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.078125, -7.86114501953125, -7.6441650390625, -7.42718505859375, -7.210205078125, -6.99322509765625, -6.7762451171875, -6.55926513671875, -6.34228515625, -6.12530517578125, -5.9083251953125, -5.69134521484375, -5.474365234375, -5.25738525390625, -5.0404052734375, -4.82342529296875, -4.6064453125, -4.38946533203125, -4.1724853515625, -3.95550537109375, -3.738525390625, -3.52154541015625, -3.3045654296875, -3.08758544921875, -2.87060546875, -2.65362548828125, -2.4366455078125, -2.21966552734375, -2.002685546875, -1.78570556640625, -1.5687255859375, -1.35174560546875, -1.134765625, -0.91778564453125, -0.7008056640625, -0.48382568359375, -0.266845703125, -0.04986572265625, 0.1671142578125, 0.38409423828125, 0.60107421875, 0.81805419921875, 1.0350341796875, 1.25201416015625, 1.468994140625, 1.68597412109375, 1.9029541015625, 2.11993408203125, 2.3369140625, 2.55389404296875, 2.7708740234375, 2.98785400390625, 3.204833984375, 3.42181396484375, 3.6387939453125, 3.85577392578125, 4.07275390625, 4.28973388671875, 4.5067138671875, 4.72369384765625, 4.940673828125, 5.15765380859375, 5.3746337890625, 5.59161376953125, 5.80859375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 4.0, 5.0, 8.0, 17.0, 19.0, 16.0, 37.0, 37.0, 37.0, 97.0, 159.0, 256.0, 347.0, 649.0, 956.0, 1532.0, 2323.0, 3495.0, 5331.0, 8102.0, 12556.0, 19505.0, 32014.0, 54838.0, 98969.0, 188949.0, 1299646.0, 158256.0, 83730.0, 47685.0, 28437.0, 17474.0, 10990.0, 7183.0, 4692.0, 3165.0, 1980.0, 1358.0, 820.0, 495.0, 347.0, 245.0, 142.0, 75.0, 61.0, 30.0, 28.0, 16.0, 15.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.53515625, -0.5156021118164062, -0.4960479736328125, -0.47649383544921875, -0.456939697265625, -0.43738555908203125, -0.4178314208984375, -0.39827728271484375, -0.37872314453125, -0.35916900634765625, -0.3396148681640625, -0.32006072998046875, -0.300506591796875, -0.28095245361328125, -0.2613983154296875, -0.24184417724609375, -0.2222900390625, -0.20273590087890625, -0.1831817626953125, -0.16362762451171875, -0.144073486328125, -0.12451934814453125, -0.1049652099609375, -0.08541107177734375, -0.06585693359375, -0.04630279541015625, -0.0267486572265625, -0.00719451904296875, 0.012359619140625, 0.03191375732421875, 0.0514678955078125, 0.07102203369140625, 0.090576171875, 0.11013031005859375, 0.1296844482421875, 0.14923858642578125, 0.168792724609375, 0.18834686279296875, 0.2079010009765625, 0.22745513916015625, 0.24700927734375, 0.26656341552734375, 0.2861175537109375, 0.30567169189453125, 0.325225830078125, 0.34477996826171875, 0.3643341064453125, 0.38388824462890625, 0.4034423828125, 0.42299652099609375, 0.4425506591796875, 0.46210479736328125, 0.481658935546875, 0.5012130737304688, 0.5207672119140625, 0.5403213500976562, 0.55987548828125, 0.5794296264648438, 0.5989837646484375, 0.6185379028320312, 0.638092041015625, 0.6576461791992188, 0.6772003173828125, 0.6967544555664062, 0.71630859375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 7.0, 9.0, 11.0, 9.0, 12.0, 15.0, 16.0, 26.0, 37.0, 35.0, 40.0, 37.0, 38.0, 35.0, 53.0, 49.0, 50.0, 49.0, 70.0, 53.0, 51.0, 42.0, 46.0, 25.0, 31.0, 26.0, 13.0, 15.0, 14.0, 16.0, 10.0, 12.0, 7.0, 8.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.016937255859375, -0.016445398330688477, -0.015953540802001953, -0.01546168327331543, -0.014969825744628906, -0.014477968215942383, -0.01398611068725586, -0.013494253158569336, -0.013002395629882812, -0.012510538101196289, -0.012018680572509766, -0.011526823043823242, -0.011034965515136719, -0.010543107986450195, -0.010051250457763672, -0.009559392929077148, -0.009067535400390625, -0.008575677871704102, -0.008083820343017578, -0.007591962814331055, -0.007100105285644531, -0.006608247756958008, -0.006116390228271484, -0.005624532699584961, -0.0051326751708984375, -0.004640817642211914, -0.004148960113525391, -0.003657102584838867, -0.0031652450561523438, -0.0026733875274658203, -0.002181529998779297, -0.0016896724700927734, -0.00119781494140625, -0.0007059574127197266, -0.00021409988403320312, 0.0002777576446533203, 0.0007696151733398438, 0.0012614727020263672, 0.0017533302307128906, 0.002245187759399414, 0.0027370452880859375, 0.003228902816772461, 0.0037207603454589844, 0.004212617874145508, 0.004704475402832031, 0.005196332931518555, 0.005688190460205078, 0.0061800479888916016, 0.006671905517578125, 0.0071637630462646484, 0.007655620574951172, 0.008147478103637695, 0.008639335632324219, 0.009131193161010742, 0.009623050689697266, 0.010114908218383789, 0.010606765747070312, 0.011098623275756836, 0.01159048080444336, 0.012082338333129883, 0.012574195861816406, 0.01306605339050293, 0.013557910919189453, 0.014049768447875977, 0.0145416259765625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 0.0, 6.0, 3.0, 12.0, 13.0, 8.0, 25.0, 17.0, 10.0, 26.0, 33.0, 37.0, 29.0, 47.0, 77.0, 82.0, 121.0, 224.0, 502.0, 117316.0, 928720.0, 516.0, 215.0, 112.0, 73.0, 53.0, 38.0, 50.0, 37.0, 36.0, 17.0, 14.0, 15.0, 13.0, 12.0, 13.0, 8.0, 3.0, 5.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.513671875, -0.49658203125, -0.4794921875, -0.46240234375, -0.4453125, -0.42822265625, -0.4111328125, -0.39404296875, -0.376953125, -0.35986328125, -0.3427734375, -0.32568359375, -0.30859375, -0.29150390625, -0.2744140625, -0.25732421875, -0.240234375, -0.22314453125, -0.2060546875, -0.18896484375, -0.171875, -0.15478515625, -0.1376953125, -0.12060546875, -0.103515625, -0.08642578125, -0.0693359375, -0.05224609375, -0.03515625, -0.01806640625, -0.0009765625, 0.01611328125, 0.033203125, 0.05029296875, 0.0673828125, 0.08447265625, 0.1015625, 0.11865234375, 0.1357421875, 0.15283203125, 0.169921875, 0.18701171875, 0.2041015625, 0.22119140625, 0.23828125, 0.25537109375, 0.2724609375, 0.28955078125, 0.306640625, 0.32373046875, 0.3408203125, 0.35791015625, 0.375, 0.39208984375, 0.4091796875, 0.42626953125, 0.443359375, 0.46044921875, 0.4775390625, 0.49462890625, 0.51171875, 0.52880859375, 0.5458984375, 0.56298828125, 0.580078125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1012.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007155167404562235, 0.007726811338216066, 0.022608790546655655, 0.03749076649546623, 0.05237274616956711, 0.06725472956895828, 0.08213670551776886, 0.09701868891716003, 0.11190066486597061, 0.1267826408147812, 0.14166462421417236, 0.15654659271240234, 0.17142857611179352, 0.1863105595111847, 0.20119252800941467, 0.21607452630996704, 0.23095649480819702, 0.2458384782075882, 0.26072046160697937, 0.27560243010520935, 0.29048439860343933, 0.3053663969039917, 0.3202483654022217, 0.33513033390045166, 0.35001233220100403, 0.364894300699234, 0.3797762989997864, 0.39465826749801636, 0.40954023599624634, 0.4244222342967987, 0.4393042027950287, 0.45418620109558105, 0.46906813979148865, 0.48395010828971863, 0.498832106590271, 0.513714075088501, 0.528596043586731, 0.5434780120849609, 0.5583599805831909, 0.5732420086860657, 0.5881239771842957, 0.6030059456825256, 0.6178879141807556, 0.6327699422836304, 0.6476519107818604, 0.6625338792800903, 0.6774158477783203, 0.6922978162765503, 0.7071797847747803, 0.7220617532730103, 0.7369437217712402, 0.7518256902694702, 0.766707718372345, 0.781589686870575, 0.7964716553688049, 0.8113536238670349, 0.8262356519699097, 0.8411176204681396, 0.8559995889663696, 0.8708815574645996, 0.8857635855674744, 0.9006455540657043, 0.9155275225639343, 0.9304094910621643, 0.9452914595603943]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 8.0, 18.0, 19.0, 15.0, 16.0, 28.0, 26.0, 33.0, 30.0, 40.0, 33.0, 46.0, 45.0, 53.0, 47.0, 49.0, 61.0, 47.0, 43.0, 44.0, 58.0, 38.0, 38.0, 29.0, 32.0, 24.0, 10.0, 23.0, 8.0, 12.0, 7.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.05142170190811157, -0.0501592755317688, -0.048896849155426025, -0.04763442650437355, -0.04637200012803078, -0.045109573751688004, -0.04384715110063553, -0.042584724724292755, -0.04132229834794998, -0.04005987197160721, -0.038797445595264435, -0.03753502294421196, -0.036272596567869186, -0.03501017019152641, -0.03374774754047394, -0.032485321164131165, -0.03122289478778839, -0.029960468411445618, -0.028698043897747993, -0.02743561938405037, -0.026173193007707596, -0.024910766631364822, -0.023648342117667198, -0.022385917603969574, -0.0211234912276268, -0.019861064851284027, -0.018598640337586403, -0.01733621582388878, -0.016073789447546005, -0.014811364002525806, -0.013548938557505608, -0.012286513112485409, -0.01102408766746521, -0.009761662222445011, -0.008499236777424812, -0.0072368113324046135, -0.005974385887384415, -0.004711960442364216, -0.003449534997344017, -0.002187109552323818, -0.0009246841073036194, 0.00033774133771657944, 0.0016001667827367783, 0.002862592227756977, 0.004125017672777176, 0.005387443117797375, 0.0066498685628175735, 0.007912294007837772, 0.009174719452857971, 0.01043714489787817, 0.011699570342898369, 0.012961995787918568, 0.014224421232938766, 0.015486846677958965, 0.016749272122979164, 0.01801169663667679, 0.019274123013019562, 0.020536549389362335, 0.02179897390305996, 0.023061398416757584, 0.024323824793100357, 0.02558625116944313, 0.026848675683140755, 0.02811110019683838, 0.029373526573181152]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 2.0, 5.0, 11.0, 10.0, 12.0, 9.0, 19.0, 16.0, 26.0, 38.0, 34.0, 39.0, 45.0, 58.0, 58.0, 63.0, 55.0, 43.0, 60.0, 63.0, 48.0, 47.0, 35.0, 41.0, 38.0, 17.0, 15.0, 16.0, 15.0, 16.0, 8.0, 4.0, 10.0, 3.0, 4.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.625, -11.25048828125, -10.8759765625, -10.50146484375, -10.126953125, -9.75244140625, -9.3779296875, -9.00341796875, -8.62890625, -8.25439453125, -7.8798828125, -7.50537109375, -7.130859375, -6.75634765625, -6.3818359375, -6.00732421875, -5.6328125, -5.25830078125, -4.8837890625, -4.50927734375, -4.134765625, -3.76025390625, -3.3857421875, -3.01123046875, -2.63671875, -2.26220703125, -1.8876953125, -1.51318359375, -1.138671875, -0.76416015625, -0.3896484375, -0.01513671875, 0.359375, 0.73388671875, 1.1083984375, 1.48291015625, 1.857421875, 2.23193359375, 2.6064453125, 2.98095703125, 3.35546875, 3.72998046875, 4.1044921875, 4.47900390625, 4.853515625, 5.22802734375, 5.6025390625, 5.97705078125, 6.3515625, 6.72607421875, 7.1005859375, 7.47509765625, 7.849609375, 8.22412109375, 8.5986328125, 8.97314453125, 9.34765625, 9.72216796875, 10.0966796875, 10.47119140625, 10.845703125, 11.22021484375, 11.5947265625, 11.96923828125, 12.34375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 6.0, 5.0, 5.0, 15.0, 20.0, 29.0, 39.0, 44.0, 65.0, 94.0, 165.0, 197.0, 318.0, 553.0, 1065.0, 1991.0, 4532.0, 12482.0, 44583.0, 266744.0, 596431.0, 85712.0, 20666.0, 6867.0, 2719.0, 1299.0, 712.0, 371.0, 260.0, 153.0, 125.0, 83.0, 51.0, 45.0, 30.0, 19.0, 21.0, 11.0, 10.0, 4.0, 4.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.640625, -10.2996826171875, -9.958740234375, -9.6177978515625, -9.27685546875, -8.9359130859375, -8.594970703125, -8.2540283203125, -7.9130859375, -7.5721435546875, -7.231201171875, -6.8902587890625, -6.54931640625, -6.2083740234375, -5.867431640625, -5.5264892578125, -5.185546875, -4.8446044921875, -4.503662109375, -4.1627197265625, -3.82177734375, -3.4808349609375, -3.139892578125, -2.7989501953125, -2.4580078125, -2.1170654296875, -1.776123046875, -1.4351806640625, -1.09423828125, -0.7532958984375, -0.412353515625, -0.0714111328125, 0.26953125, 0.6104736328125, 0.951416015625, 1.2923583984375, 1.63330078125, 1.9742431640625, 2.315185546875, 2.6561279296875, 2.9970703125, 3.3380126953125, 3.678955078125, 4.0198974609375, 4.36083984375, 4.7017822265625, 5.042724609375, 5.3836669921875, 5.724609375, 6.0655517578125, 6.406494140625, 6.7474365234375, 7.08837890625, 7.4293212890625, 7.770263671875, 8.1112060546875, 8.4521484375, 8.7930908203125, 9.134033203125, 9.4749755859375, 9.81591796875, 10.1568603515625, 10.497802734375, 10.8387451171875, 11.1796875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 6.0, 2.0, 5.0, 8.0, 9.0, 9.0, 8.0, 14.0, 13.0, 14.0, 24.0, 15.0, 39.0, 25.0, 41.0, 31.0, 34.0, 47.0, 49.0, 55.0, 64.0, 1865.0, 188.0, 66.0, 53.0, 35.0, 45.0, 29.0, 32.0, 23.0, 36.0, 25.0, 20.0, 18.0, 18.0, 19.0, 13.0, 8.0, 9.0, 8.0, 9.0, 5.0, 4.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-41.0, -39.8544921875, -38.708984375, -37.5634765625, -36.41796875, -35.2724609375, -34.126953125, -32.9814453125, -31.8359375, -30.6904296875, -29.544921875, -28.3994140625, -27.25390625, -26.1083984375, -24.962890625, -23.8173828125, -22.671875, -21.5263671875, -20.380859375, -19.2353515625, -18.08984375, -16.9443359375, -15.798828125, -14.6533203125, -13.5078125, -12.3623046875, -11.216796875, -10.0712890625, -8.92578125, -7.7802734375, -6.634765625, -5.4892578125, -4.34375, -3.1982421875, -2.052734375, -0.9072265625, 0.23828125, 1.3837890625, 2.529296875, 3.6748046875, 4.8203125, 5.9658203125, 7.111328125, 8.2568359375, 9.40234375, 10.5478515625, 11.693359375, 12.8388671875, 13.984375, 15.1298828125, 16.275390625, 17.4208984375, 18.56640625, 19.7119140625, 20.857421875, 22.0029296875, 23.1484375, 24.2939453125, 25.439453125, 26.5849609375, 27.73046875, 28.8759765625, 30.021484375, 31.1669921875, 32.3125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 6.0, 5.0, 7.0, 8.0, 11.0, 7.0, 13.0, 16.0, 21.0, 19.0, 20.0, 28.0, 47.0, 38.0, 55.0, 64.0, 104.0, 199.0, 450.0, 1436.0, 28177.0, 3106234.0, 6901.0, 904.0, 335.0, 174.0, 80.0, 63.0, 59.0, 36.0, 46.0, 18.0, 29.0, 15.0, 10.0, 19.0, 9.0, 9.0, 8.0, 5.0, 7.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.3125, -70.7255859375, -68.138671875, -65.5517578125, -62.96484375, -60.3779296875, -57.791015625, -55.2041015625, -52.6171875, -50.0302734375, -47.443359375, -44.8564453125, -42.26953125, -39.6826171875, -37.095703125, -34.5087890625, -31.921875, -29.3349609375, -26.748046875, -24.1611328125, -21.57421875, -18.9873046875, -16.400390625, -13.8134765625, -11.2265625, -8.6396484375, -6.052734375, -3.4658203125, -0.87890625, 1.7080078125, 4.294921875, 6.8818359375, 9.46875, 12.0556640625, 14.642578125, 17.2294921875, 19.81640625, 22.4033203125, 24.990234375, 27.5771484375, 30.1640625, 32.7509765625, 35.337890625, 37.9248046875, 40.51171875, 43.0986328125, 45.685546875, 48.2724609375, 50.859375, 53.4462890625, 56.033203125, 58.6201171875, 61.20703125, 63.7939453125, 66.380859375, 68.9677734375, 71.5546875, 74.1416015625, 76.728515625, 79.3154296875, 81.90234375, 84.4892578125, 87.076171875, 89.6630859375, 92.25]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 164.0, 857.0], "bins": [-921.3816528320312, -906.7872924804688, -892.1929321289062, -877.5985717773438, -863.004150390625, -848.4097900390625, -833.8154296875, -819.2210693359375, -804.626708984375, -790.0323486328125, -775.43798828125, -760.8436279296875, -746.249267578125, -731.6548461914062, -717.0604858398438, -702.4661254882812, -687.8717651367188, -673.2774047851562, -658.6830444335938, -644.0886840820312, -629.4942626953125, -614.89990234375, -600.3055419921875, -585.711181640625, -571.1168212890625, -556.5224609375, -541.9281005859375, -527.333740234375, -512.7393798828125, -498.1449890136719, -483.55059814453125, -468.95623779296875, -454.36187744140625, -439.76751708984375, -425.17315673828125, -410.5787658691406, -395.9844055175781, -381.3900451660156, -366.795654296875, -352.2012939453125, -337.60693359375, -323.0125732421875, -308.418212890625, -293.8238220214844, -279.2294616699219, -264.6351013183594, -250.0407257080078, -235.44635009765625, -220.85198974609375, -206.25762939453125, -191.6632537841797, -177.06887817382812, -162.47451782226562, -147.88015747070312, -133.28578186035156, -118.69141387939453, -104.0970458984375, -89.50267791748047, -74.90830993652344, -60.313941955566406, -45.719573974609375, -31.125205993652344, -16.530838012695312, -1.9364700317382812, 12.657898902893066]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 7.0, 5.0, 5.0, 14.0, 9.0, 18.0, 11.0, 20.0, 21.0, 20.0, 18.0, 33.0, 33.0, 32.0, 31.0, 44.0, 35.0, 34.0, 33.0, 45.0, 58.0, 41.0, 37.0, 35.0, 37.0, 32.0, 23.0, 33.0, 33.0, 39.0, 21.0, 26.0, 23.0, 22.0, 15.0, 6.0, 7.0, 12.0, 7.0, 5.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-106.93266296386719, -103.48381042480469, -100.03496551513672, -96.58611297607422, -93.13726806640625, -89.68841552734375, -86.23956298828125, -82.79071807861328, -79.34187316894531, -75.89302062988281, -72.44417572021484, -68.99532318115234, -65.54647827148438, -62.097625732421875, -58.64877700805664, -55.199928283691406, -51.751075744628906, -48.30222702026367, -44.85337829589844, -41.40452575683594, -37.95568084716797, -34.50682830810547, -31.057979583740234, -27.609130859375, -24.160282135009766, -20.71143341064453, -17.262584686279297, -13.81373405456543, -10.364885330200195, -6.916036605834961, -3.4671859741210938, -0.018337249755859375, 3.4305038452148438, 6.879353046417236, 10.328202247619629, 13.77705192565918, 17.225900650024414, 20.67474937438965, 24.123600006103516, 27.57244873046875, 31.021297454833984, 34.47014617919922, 37.91899490356445, 41.36784362792969, 44.81669616699219, 48.265541076660156, 51.714393615722656, 55.16324234008789, 58.612091064453125, 62.06093978881836, 65.5097885131836, 68.9586410522461, 72.40748596191406, 75.85633850097656, 79.30519104003906, 82.75403594970703, 86.202880859375, 89.6517333984375, 93.10057830810547, 96.54943084716797, 99.99827575683594, 103.44712829589844, 106.89598083496094, 110.3448257446289, 113.7936782836914]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 5.0, 3.0, 4.0, 10.0, 11.0, 10.0, 9.0, 16.0, 22.0, 24.0, 32.0, 39.0, 39.0, 40.0, 49.0, 65.0, 63.0, 57.0, 52.0, 61.0, 63.0, 44.0, 41.0, 46.0, 38.0, 33.0, 22.0, 20.0, 10.0, 18.0, 16.0, 7.0, 8.0, 6.0, 1.0, 5.0, 3.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0390625, -11.6522216796875, -11.265380859375, -10.8785400390625, -10.49169921875, -10.1048583984375, -9.718017578125, -9.3311767578125, -8.9443359375, -8.5574951171875, -8.170654296875, -7.7838134765625, -7.39697265625, -7.0101318359375, -6.623291015625, -6.2364501953125, -5.849609375, -5.4627685546875, -5.075927734375, -4.6890869140625, -4.30224609375, -3.9154052734375, -3.528564453125, -3.1417236328125, -2.7548828125, -2.3680419921875, -1.981201171875, -1.5943603515625, -1.20751953125, -0.8206787109375, -0.433837890625, -0.0469970703125, 0.33984375, 0.7266845703125, 1.113525390625, 1.5003662109375, 1.88720703125, 2.2740478515625, 2.660888671875, 3.0477294921875, 3.4345703125, 3.8214111328125, 4.208251953125, 4.5950927734375, 4.98193359375, 5.3687744140625, 5.755615234375, 6.1424560546875, 6.529296875, 6.9161376953125, 7.302978515625, 7.6898193359375, 8.07666015625, 8.4635009765625, 8.850341796875, 9.2371826171875, 9.6240234375, 10.0108642578125, 10.397705078125, 10.7845458984375, 11.17138671875, 11.5582275390625, 11.945068359375, 12.3319091796875, 12.71875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 1.0, 6.0, 9.0, 11.0, 16.0, 24.0, 32.0, 44.0, 65.0, 131.0, 226.0, 335.0, 572.0, 1241.0, 2543.0, 5728.0, 16076.0, 187857.0, 3871790.0, 84485.0, 13119.0, 5010.0, 2276.0, 1161.0, 621.0, 373.0, 198.0, 111.0, 68.0, 46.0, 34.0, 15.0, 19.0, 8.0, 6.0, 6.0, 8.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.5, -51.796875, -50.09375, -48.390625, -46.6875, -44.984375, -43.28125, -41.578125, -39.875, -38.171875, -36.46875, -34.765625, -33.0625, -31.359375, -29.65625, -27.953125, -26.25, -24.546875, -22.84375, -21.140625, -19.4375, -17.734375, -16.03125, -14.328125, -12.625, -10.921875, -9.21875, -7.515625, -5.8125, -4.109375, -2.40625, -0.703125, 1.0, 2.703125, 4.40625, 6.109375, 7.8125, 9.515625, 11.21875, 12.921875, 14.625, 16.328125, 18.03125, 19.734375, 21.4375, 23.140625, 24.84375, 26.546875, 28.25, 29.953125, 31.65625, 33.359375, 35.0625, 36.765625, 38.46875, 40.171875, 41.875, 43.578125, 45.28125, 46.984375, 48.6875, 50.390625, 52.09375, 53.796875, 55.5]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 5.0, 5.0, 6.0, 8.0, 9.0, 10.0, 15.0, 14.0, 23.0, 21.0, 21.0, 34.0, 29.0, 59.0, 107.0, 222.0, 385.0, 733.0, 882.0, 668.0, 310.0, 170.0, 93.0, 59.0, 33.0, 32.0, 23.0, 14.0, 8.0, 9.0, 8.0, 11.0, 6.0, 8.0, 4.0, 8.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.84375, -27.86083984375, -26.8779296875, -25.89501953125, -24.912109375, -23.92919921875, -22.9462890625, -21.96337890625, -20.98046875, -19.99755859375, -19.0146484375, -18.03173828125, -17.048828125, -16.06591796875, -15.0830078125, -14.10009765625, -13.1171875, -12.13427734375, -11.1513671875, -10.16845703125, -9.185546875, -8.20263671875, -7.2197265625, -6.23681640625, -5.25390625, -4.27099609375, -3.2880859375, -2.30517578125, -1.322265625, -0.33935546875, 0.6435546875, 1.62646484375, 2.609375, 3.59228515625, 4.5751953125, 5.55810546875, 6.541015625, 7.52392578125, 8.5068359375, 9.48974609375, 10.47265625, 11.45556640625, 12.4384765625, 13.42138671875, 14.404296875, 15.38720703125, 16.3701171875, 17.35302734375, 18.3359375, 19.31884765625, 20.3017578125, 21.28466796875, 22.267578125, 23.25048828125, 24.2333984375, 25.21630859375, 26.19921875, 27.18212890625, 28.1650390625, 29.14794921875, 30.130859375, 31.11376953125, 32.0966796875, 33.07958984375, 34.0625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 0.0, 3.0, 7.0, 11.0, 3.0, 7.0, 9.0, 16.0, 29.0, 37.0, 50.0, 60.0, 102.0, 115.0, 172.0, 226.0, 340.0, 487.0, 666.0, 1002.0, 1420.0, 2092.0, 3205.0, 4710.0, 7480.0, 12036.0, 20583.0, 40210.0, 113751.0, 1051310.0, 2608134.0, 206224.0, 53991.0, 25447.0, 14428.0, 8786.0, 5526.0, 3690.0, 2435.0, 1655.0, 1115.0, 793.0, 551.0, 369.0, 295.0, 185.0, 166.0, 113.0, 61.0, 47.0, 34.0, 22.0, 21.0, 21.0, 18.0, 10.0, 7.0, 5.0, 3.0, 3.0, 1.0], "bins": [-35.25, -34.1875, -33.125, -32.0625, -31.0, -29.9375, -28.875, -27.8125, -26.75, -25.6875, -24.625, -23.5625, -22.5, -21.4375, -20.375, -19.3125, -18.25, -17.1875, -16.125, -15.0625, -14.0, -12.9375, -11.875, -10.8125, -9.75, -8.6875, -7.625, -6.5625, -5.5, -4.4375, -3.375, -2.3125, -1.25, -0.1875, 0.875, 1.9375, 3.0, 4.0625, 5.125, 6.1875, 7.25, 8.3125, 9.375, 10.4375, 11.5, 12.5625, 13.625, 14.6875, 15.75, 16.8125, 17.875, 18.9375, 20.0, 21.0625, 22.125, 23.1875, 24.25, 25.3125, 26.375, 27.4375, 28.5, 29.5625, 30.625, 31.6875, 32.75]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 6.0, 23.0, 45.0, 60.0, 144.0, 306.0, 215.0, 103.0, 51.0, 24.0, 11.0, 4.0, 7.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-384.76837158203125, -377.0287170410156, -369.2890625, -361.54937744140625, -353.8097229003906, -346.070068359375, -338.3304138183594, -330.59075927734375, -322.85107421875, -315.1114196777344, -307.37176513671875, -299.632080078125, -291.8924255371094, -284.15277099609375, -276.4131164550781, -268.6734619140625, -260.9338073730469, -253.19415283203125, -245.45448303222656, -237.71482849121094, -229.97515869140625, -222.23550415039062, -214.495849609375, -206.75619506835938, -199.0165252685547, -191.27687072753906, -183.53720092773438, -175.79754638671875, -168.05789184570312, -160.31822204589844, -152.5785675048828, -144.83889770507812, -137.09925842285156, -129.35960388183594, -121.61993408203125, -113.88027954101562, -106.14061737060547, -98.40095520019531, -90.66130065917969, -82.92163848876953, -75.18197631835938, -67.44231414794922, -59.70265579223633, -51.96299743652344, -44.22333526611328, -36.483673095703125, -28.744014739990234, -21.004356384277344, -13.264694213867188, -5.525033950805664, 2.2146263122558594, 9.954286575317383, 17.693946838378906, 25.433609008789062, 33.17326736450195, 40.912925720214844, 48.652587890625, 56.392250061035156, 64.13191223144531, 71.87156677246094, 79.6112289428711, 87.35089111328125, 95.09054565429688, 102.83020782470703, 110.56986999511719]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 4.0, 6.0, 5.0, 10.0, 10.0, 15.0, 15.0, 19.0, 17.0, 25.0, 27.0, 20.0, 15.0, 32.0, 41.0, 39.0, 32.0, 32.0, 31.0, 44.0, 33.0, 33.0, 39.0, 41.0, 52.0, 39.0, 43.0, 30.0, 28.0, 30.0, 24.0, 28.0, 22.0, 16.0, 19.0, 14.0, 17.0, 8.0, 8.0, 8.0, 11.0, 2.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-87.39977264404297, -84.71659851074219, -82.03343200683594, -79.35026550292969, -76.6670913696289, -73.98391723632812, -71.30075073242188, -68.61758422851562, -65.93441009521484, -63.25123977661133, -60.56806945800781, -57.8848991394043, -55.20172882080078, -52.518558502197266, -49.83538818359375, -47.152217864990234, -44.46904754638672, -41.7858772277832, -39.10270690917969, -36.41953659057617, -33.736366271972656, -31.05319595336914, -28.370025634765625, -25.68685531616211, -23.003684997558594, -20.320514678955078, -17.637344360351562, -14.954174041748047, -12.271003723144531, -9.587833404541016, -6.9046630859375, -4.221492767333984, -1.5383148193359375, 1.1448554992675781, 3.8280258178710938, 6.511196136474609, 9.194366455078125, 11.87753677368164, 14.560707092285156, 17.243877410888672, 19.927047729492188, 22.610218048095703, 25.29338836669922, 27.976558685302734, 30.65972900390625, 33.342899322509766, 36.02606964111328, 38.7092399597168, 41.39241027832031, 44.07558059692383, 46.758750915527344, 49.44192123413086, 52.125091552734375, 54.80826187133789, 57.491432189941406, 60.17460250854492, 62.85777282714844, 65.54093933105469, 68.22411346435547, 70.90728759765625, 73.5904541015625, 76.27362060546875, 78.95679473876953, 81.63996887207031, 84.32313537597656]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 2.0, 4.0, 8.0, 6.0, 6.0, 6.0, 18.0, 17.0, 17.0, 15.0, 32.0, 20.0, 36.0, 39.0, 31.0, 50.0, 55.0, 58.0, 65.0, 56.0, 58.0, 40.0, 52.0, 47.0, 36.0, 26.0, 27.0, 34.0, 31.0, 18.0, 12.0, 15.0, 18.0, 7.0, 5.0, 6.0, 5.0, 7.0, 5.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.4609375, -11.0955810546875, -10.730224609375, -10.3648681640625, -9.99951171875, -9.6341552734375, -9.268798828125, -8.9034423828125, -8.5380859375, -8.1727294921875, -7.807373046875, -7.4420166015625, -7.07666015625, -6.7113037109375, -6.345947265625, -5.9805908203125, -5.615234375, -5.2498779296875, -4.884521484375, -4.5191650390625, -4.15380859375, -3.7884521484375, -3.423095703125, -3.0577392578125, -2.6923828125, -2.3270263671875, -1.961669921875, -1.5963134765625, -1.23095703125, -0.8656005859375, -0.500244140625, -0.1348876953125, 0.23046875, 0.5958251953125, 0.961181640625, 1.3265380859375, 1.69189453125, 2.0572509765625, 2.422607421875, 2.7879638671875, 3.1533203125, 3.5186767578125, 3.884033203125, 4.2493896484375, 4.61474609375, 4.9801025390625, 5.345458984375, 5.7108154296875, 6.076171875, 6.4415283203125, 6.806884765625, 7.1722412109375, 7.53759765625, 7.9029541015625, 8.268310546875, 8.6336669921875, 8.9990234375, 9.3643798828125, 9.729736328125, 10.0950927734375, 10.46044921875, 10.8258056640625, 11.191162109375, 11.5565185546875, 11.921875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 9.0, 13.0, 11.0, 9.0, 33.0, 37.0, 47.0, 82.0, 123.0, 185.0, 237.0, 370.0, 495.0, 727.0, 1025.0, 1598.0, 2362.0, 3592.0, 5670.0, 9006.0, 14921.0, 24869.0, 43867.0, 84457.0, 178833.0, 304704.0, 178403.0, 84017.0, 43960.0, 24737.0, 14612.0, 8967.0, 5615.0, 3610.0, 2351.0, 1591.0, 1080.0, 753.0, 503.0, 303.0, 248.0, 176.0, 103.0, 76.0, 56.0, 40.0, 28.0, 25.0, 16.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.119140625, -1.0847015380859375, -1.050262451171875, -1.0158233642578125, -0.98138427734375, -0.9469451904296875, -0.912506103515625, -0.8780670166015625, -0.8436279296875, -0.8091888427734375, -0.774749755859375, -0.7403106689453125, -0.70587158203125, -0.6714324951171875, -0.636993408203125, -0.6025543212890625, -0.568115234375, -0.5336761474609375, -0.499237060546875, -0.4647979736328125, -0.43035888671875, -0.3959197998046875, -0.361480712890625, -0.3270416259765625, -0.2926025390625, -0.2581634521484375, -0.223724365234375, -0.1892852783203125, -0.15484619140625, -0.1204071044921875, -0.085968017578125, -0.0515289306640625, -0.01708984375, 0.0173492431640625, 0.051788330078125, 0.0862274169921875, 0.12066650390625, 0.1551055908203125, 0.189544677734375, 0.2239837646484375, 0.2584228515625, 0.2928619384765625, 0.327301025390625, 0.3617401123046875, 0.39617919921875, 0.4306182861328125, 0.465057373046875, 0.4994964599609375, 0.533935546875, 0.5683746337890625, 0.602813720703125, 0.6372528076171875, 0.67169189453125, 0.7061309814453125, 0.740570068359375, 0.7750091552734375, 0.8094482421875, 0.8438873291015625, 0.878326416015625, 0.9127655029296875, 0.94720458984375, 0.9816436767578125, 1.016082763671875, 1.0505218505859375, 1.0849609375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 6.0, 6.0, 4.0, 1.0, 4.0, 5.0, 5.0, 7.0, 9.0, 8.0, 12.0, 11.0, 16.0, 21.0, 21.0, 12.0, 27.0, 25.0, 42.0, 28.0, 35.0, 41.0, 32.0, 36.0, 39.0, 47.0, 1079.0, 36.0, 33.0, 36.0, 29.0, 35.0, 33.0, 25.0, 28.0, 26.0, 29.0, 27.0, 19.0, 16.0, 16.0, 10.0, 10.0, 16.0, 6.0, 5.0, 9.0, 6.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.06640625, -5.86688232421875, -5.6673583984375, -5.46783447265625, -5.268310546875, -5.06878662109375, -4.8692626953125, -4.66973876953125, -4.47021484375, -4.27069091796875, -4.0711669921875, -3.87164306640625, -3.672119140625, -3.47259521484375, -3.2730712890625, -3.07354736328125, -2.8740234375, -2.67449951171875, -2.4749755859375, -2.27545166015625, -2.075927734375, -1.87640380859375, -1.6768798828125, -1.47735595703125, -1.27783203125, -1.07830810546875, -0.8787841796875, -0.67926025390625, -0.479736328125, -0.28021240234375, -0.0806884765625, 0.11883544921875, 0.318359375, 0.51788330078125, 0.7174072265625, 0.91693115234375, 1.116455078125, 1.31597900390625, 1.5155029296875, 1.71502685546875, 1.91455078125, 2.11407470703125, 2.3135986328125, 2.51312255859375, 2.712646484375, 2.91217041015625, 3.1116943359375, 3.31121826171875, 3.5107421875, 3.71026611328125, 3.9097900390625, 4.10931396484375, 4.308837890625, 4.50836181640625, 4.7078857421875, 4.90740966796875, 5.10693359375, 5.30645751953125, 5.5059814453125, 5.70550537109375, 5.905029296875, 6.10455322265625, 6.3040771484375, 6.50360107421875, 6.703125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 14.0, 16.0, 30.0, 67.0, 94.0, 143.0, 201.0, 283.0, 424.0, 605.0, 939.0, 1322.0, 2057.0, 3098.0, 4697.0, 6991.0, 10652.0, 16160.0, 24753.0, 39659.0, 67568.0, 119524.0, 317240.0, 1155977.0, 130534.0, 73189.0, 43345.0, 26832.0, 17116.0, 11157.0, 7344.0, 4958.0, 3259.0, 2366.0, 1444.0, 1045.0, 679.0, 435.0, 298.0, 203.0, 135.0, 93.0, 57.0, 35.0, 27.0, 16.0, 13.0, 13.0, 3.0, 5.0, 4.0, 4.0], "bins": [-0.673828125, -0.6546173095703125, -0.635406494140625, -0.6161956787109375, -0.59698486328125, -0.5777740478515625, -0.558563232421875, -0.5393524169921875, -0.5201416015625, -0.5009307861328125, -0.481719970703125, -0.4625091552734375, -0.44329833984375, -0.4240875244140625, -0.404876708984375, -0.3856658935546875, -0.366455078125, -0.3472442626953125, -0.328033447265625, -0.3088226318359375, -0.28961181640625, -0.2704010009765625, -0.251190185546875, -0.2319793701171875, -0.2127685546875, -0.1935577392578125, -0.174346923828125, -0.1551361083984375, -0.13592529296875, -0.1167144775390625, -0.097503662109375, -0.0782928466796875, -0.05908203125, -0.0398712158203125, -0.020660400390625, -0.0014495849609375, 0.01776123046875, 0.0369720458984375, 0.056182861328125, 0.0753936767578125, 0.0946044921875, 0.1138153076171875, 0.133026123046875, 0.1522369384765625, 0.17144775390625, 0.1906585693359375, 0.209869384765625, 0.2290802001953125, 0.248291015625, 0.2675018310546875, 0.286712646484375, 0.3059234619140625, 0.32513427734375, 0.3443450927734375, 0.363555908203125, 0.3827667236328125, 0.4019775390625, 0.4211883544921875, 0.440399169921875, 0.4596099853515625, 0.47882080078125, 0.4980316162109375, 0.517242431640625, 0.5364532470703125, 0.5556640625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 6.0, 6.0, 13.0, 8.0, 7.0, 16.0, 15.0, 18.0, 20.0, 19.0, 31.0, 32.0, 41.0, 60.0, 62.0, 95.0, 76.0, 85.0, 59.0, 64.0, 51.0, 35.0, 29.0, 20.0, 31.0, 13.0, 5.0, 16.0, 9.0, 11.0, 11.0, 7.0, 6.0, 4.0, 7.0, 6.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020294189453125, -0.019631385803222656, -0.018968582153320312, -0.01830577850341797, -0.017642974853515625, -0.01698017120361328, -0.016317367553710938, -0.015654563903808594, -0.01499176025390625, -0.014328956604003906, -0.013666152954101562, -0.013003349304199219, -0.012340545654296875, -0.011677742004394531, -0.011014938354492188, -0.010352134704589844, -0.0096893310546875, -0.009026527404785156, -0.008363723754882812, -0.007700920104980469, -0.007038116455078125, -0.006375312805175781, -0.0057125091552734375, -0.005049705505371094, -0.00438690185546875, -0.0037240982055664062, -0.0030612945556640625, -0.0023984909057617188, -0.001735687255859375, -0.0010728836059570312, -0.0004100799560546875, 0.00025272369384765625, 0.00091552734375, 0.0015783309936523438, 0.0022411346435546875, 0.0029039382934570312, 0.003566741943359375, 0.004229545593261719, 0.0048923492431640625, 0.005555152893066406, 0.00621795654296875, 0.006880760192871094, 0.0075435638427734375, 0.008206367492675781, 0.008869171142578125, 0.009531974792480469, 0.010194778442382812, 0.010857582092285156, 0.0115203857421875, 0.012183189392089844, 0.012845993041992188, 0.013508796691894531, 0.014171600341796875, 0.014834403991699219, 0.015497207641601562, 0.016160011291503906, 0.01682281494140625, 0.017485618591308594, 0.018148422241210938, 0.01881122589111328, 0.019474029541015625, 0.02013683319091797, 0.020799636840820312, 0.021462440490722656, 0.022125244140625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 6.0, 8.0, 10.0, 10.0, 13.0, 14.0, 6.0, 16.0, 28.0, 26.0, 25.0, 37.0, 69.0, 104.0, 163.0, 594.0, 32613.0, 1012452.0, 1635.0, 275.0, 132.0, 65.0, 46.0, 22.0, 26.0, 29.0, 19.0, 18.0, 20.0, 12.0, 8.0, 9.0, 14.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63818359375, -0.6183624267578125, -0.598541259765625, -0.5787200927734375, -0.55889892578125, -0.5390777587890625, -0.519256591796875, -0.4994354248046875, -0.4796142578125, -0.4597930908203125, -0.439971923828125, -0.4201507568359375, -0.40032958984375, -0.3805084228515625, -0.360687255859375, -0.3408660888671875, -0.321044921875, -0.3012237548828125, -0.281402587890625, -0.2615814208984375, -0.24176025390625, -0.2219390869140625, -0.202117919921875, -0.1822967529296875, -0.1624755859375, -0.1426544189453125, -0.122833251953125, -0.1030120849609375, -0.08319091796875, -0.0633697509765625, -0.043548583984375, -0.0237274169921875, -0.00390625, 0.0159149169921875, 0.035736083984375, 0.0555572509765625, 0.07537841796875, 0.0951995849609375, 0.115020751953125, 0.1348419189453125, 0.1546630859375, 0.1744842529296875, 0.194305419921875, 0.2141265869140625, 0.23394775390625, 0.2537689208984375, 0.273590087890625, 0.2934112548828125, 0.313232421875, 0.3330535888671875, 0.352874755859375, 0.3726959228515625, 0.39251708984375, 0.4123382568359375, 0.432159423828125, 0.4519805908203125, 0.4718017578125, 0.4916229248046875, 0.511444091796875, 0.5312652587890625, 0.55108642578125, 0.5709075927734375, 0.590728759765625, 0.6105499267578125, 0.63037109375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [34.0, 851.0, 127.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018961401656270027, -0.007432793267071247, 0.004095815122127533, 0.015624424442648888, 0.027153031900525093, 0.03868164122104645, 0.05021025240421295, 0.06173885613679886, 0.07326746731996536, 0.08479607850313187, 0.09632468223571777, 0.10785329341888428, 0.11938190460205078, 0.13091051578521729, 0.1424391269683838, 0.1539677232503891, 0.1654963344335556, 0.1770249456167221, 0.1885535567998886, 0.20008215308189392, 0.21161076426506042, 0.22313937544822693, 0.23466798663139343, 0.24619659781455994, 0.25772520899772644, 0.26925382018089294, 0.28078243136405945, 0.29231104254722595, 0.30383965373039246, 0.3153682351112366, 0.3268968462944031, 0.3384254574775696, 0.3499540388584137, 0.3614826500415802, 0.3730112612247467, 0.3845398724079132, 0.3960684835910797, 0.40759706497192383, 0.41912567615509033, 0.43065428733825684, 0.44218289852142334, 0.45371150970458984, 0.46524012088775635, 0.47676873207092285, 0.48829734325408936, 0.49982595443725586, 0.5113545656204224, 0.5228831768035889, 0.5344117879867554, 0.5459403991699219, 0.5574690103530884, 0.5689976215362549, 0.5805262327194214, 0.5920548439025879, 0.6035834550857544, 0.6151120662689209, 0.6266406178474426, 0.6381692290306091, 0.6496978402137756, 0.6612264513969421, 0.6727550625801086, 0.6842836737632751, 0.6958122849464417, 0.7073408961296082, 0.7188695073127747]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 8.0, 7.0, 12.0, 10.0, 6.0, 23.0, 18.0, 12.0, 19.0, 15.0, 24.0, 20.0, 28.0, 40.0, 31.0, 42.0, 41.0, 39.0, 42.0, 35.0, 46.0, 43.0, 36.0, 43.0, 41.0, 42.0, 32.0, 29.0, 25.0, 41.0, 23.0, 19.0, 16.0, 14.0, 20.0, 16.0, 12.0, 8.0, 7.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.04014807939529419, -0.03895947337150574, -0.037770871073007584, -0.03658226877450943, -0.03539366275072098, -0.034205056726932526, -0.03301645442843437, -0.03182785212993622, -0.030639246106147766, -0.029450641945004463, -0.02826203778386116, -0.027073433622717857, -0.025884829461574554, -0.02469622530043125, -0.02350762113928795, -0.022319016978144646, -0.021130412817001343, -0.01994180865585804, -0.018753204494714737, -0.017564600333571434, -0.01637599617242813, -0.015187392011284828, -0.013998787850141525, -0.012810183688998222, -0.01162157952785492, -0.010432975366711617, -0.009244371205568314, -0.00805576704442501, -0.006867162883281708, -0.005678558722138405, -0.004489954560995102, -0.003301350399851799, -0.002112746238708496, -0.0009241420775651932, 0.00026446208357810974, 0.0014530662447214127, 0.0026416704058647156, 0.0038302745670080185, 0.005018878728151321, 0.006207482889294624, 0.007396087050437927, 0.00858469121158123, 0.009773295372724533, 0.010961899533867836, 0.012150503695011139, 0.013339107856154442, 0.014527712017297745, 0.015716316178441048, 0.01690492033958435, 0.018093524500727654, 0.019282128661870956, 0.02047073282301426, 0.021659336984157562, 0.022847941145300865, 0.024036545306444168, 0.02522514946758747, 0.026413753628730774, 0.027602357789874077, 0.02879096195101738, 0.029979566112160683, 0.031168170273303986, 0.03235677629709244, 0.03354537859559059, 0.034733980894088745, 0.0359225869178772]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 2.0, 4.0, 8.0, 6.0, 6.0, 6.0, 19.0, 16.0, 17.0, 15.0, 32.0, 20.0, 36.0, 39.0, 31.0, 50.0, 55.0, 58.0, 65.0, 56.0, 58.0, 40.0, 52.0, 47.0, 36.0, 26.0, 27.0, 34.0, 31.0, 18.0, 12.0, 15.0, 18.0, 7.0, 5.0, 6.0, 5.0, 7.0, 5.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.4609375, -11.0955810546875, -10.730224609375, -10.3648681640625, -9.99951171875, -9.6341552734375, -9.268798828125, -8.9034423828125, -8.5380859375, -8.1727294921875, -7.807373046875, -7.4420166015625, -7.07666015625, -6.7113037109375, -6.345947265625, -5.9805908203125, -5.615234375, -5.2498779296875, -4.884521484375, -4.5191650390625, -4.15380859375, -3.7884521484375, -3.423095703125, -3.0577392578125, -2.6923828125, -2.3270263671875, -1.961669921875, -1.5963134765625, -1.23095703125, -0.8656005859375, -0.500244140625, -0.1348876953125, 0.23046875, 0.5958251953125, 0.961181640625, 1.3265380859375, 1.69189453125, 2.0572509765625, 2.422607421875, 2.7879638671875, 3.1533203125, 3.5186767578125, 3.884033203125, 4.2493896484375, 4.61474609375, 4.9801025390625, 5.345458984375, 5.7108154296875, 6.076171875, 6.4415283203125, 6.806884765625, 7.1722412109375, 7.53759765625, 7.9029541015625, 8.268310546875, 8.6336669921875, 8.9990234375, 9.3643798828125, 9.729736328125, 10.0950927734375, 10.46044921875, 10.8258056640625, 11.191162109375, 11.5565185546875, 11.921875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 12.0, 7.0, 15.0, 20.0, 25.0, 38.0, 43.0, 73.0, 83.0, 123.0, 188.0, 267.0, 372.0, 512.0, 882.0, 1433.0, 2624.0, 5438.0, 13326.0, 42394.0, 190395.0, 606277.0, 130529.0, 32001.0, 10921.0, 4587.0, 2258.0, 1252.0, 783.0, 469.0, 321.0, 231.0, 162.0, 134.0, 78.0, 76.0, 53.0, 34.0, 20.0, 26.0, 17.0, 14.0, 9.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.4453125, -8.1845703125, -7.923828125, -7.6630859375, -7.40234375, -7.1416015625, -6.880859375, -6.6201171875, -6.359375, -6.0986328125, -5.837890625, -5.5771484375, -5.31640625, -5.0556640625, -4.794921875, -4.5341796875, -4.2734375, -4.0126953125, -3.751953125, -3.4912109375, -3.23046875, -2.9697265625, -2.708984375, -2.4482421875, -2.1875, -1.9267578125, -1.666015625, -1.4052734375, -1.14453125, -0.8837890625, -0.623046875, -0.3623046875, -0.1015625, 0.1591796875, 0.419921875, 0.6806640625, 0.94140625, 1.2021484375, 1.462890625, 1.7236328125, 1.984375, 2.2451171875, 2.505859375, 2.7666015625, 3.02734375, 3.2880859375, 3.548828125, 3.8095703125, 4.0703125, 4.3310546875, 4.591796875, 4.8525390625, 5.11328125, 5.3740234375, 5.634765625, 5.8955078125, 6.15625, 6.4169921875, 6.677734375, 6.9384765625, 7.19921875, 7.4599609375, 7.720703125, 7.9814453125, 8.2421875]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 7.0, 5.0, 11.0, 8.0, 15.0, 16.0, 19.0, 31.0, 33.0, 22.0, 30.0, 25.0, 38.0, 30.0, 47.0, 34.0, 42.0, 77.0, 266.0, 1730.0, 94.0, 51.0, 37.0, 44.0, 32.0, 34.0, 37.0, 29.0, 24.0, 28.0, 16.0, 22.0, 15.0, 14.0, 11.0, 15.0, 11.0, 9.0, 6.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-35.15625, -34.02734375, -32.8984375, -31.76953125, -30.640625, -29.51171875, -28.3828125, -27.25390625, -26.125, -24.99609375, -23.8671875, -22.73828125, -21.609375, -20.48046875, -19.3515625, -18.22265625, -17.09375, -15.96484375, -14.8359375, -13.70703125, -12.578125, -11.44921875, -10.3203125, -9.19140625, -8.0625, -6.93359375, -5.8046875, -4.67578125, -3.546875, -2.41796875, -1.2890625, -0.16015625, 0.96875, 2.09765625, 3.2265625, 4.35546875, 5.484375, 6.61328125, 7.7421875, 8.87109375, 10.0, 11.12890625, 12.2578125, 13.38671875, 14.515625, 15.64453125, 16.7734375, 17.90234375, 19.03125, 20.16015625, 21.2890625, 22.41796875, 23.546875, 24.67578125, 25.8046875, 26.93359375, 28.0625, 29.19140625, 30.3203125, 31.44921875, 32.578125, 33.70703125, 34.8359375, 35.96484375, 37.09375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 4.0, 10.0, 13.0, 19.0, 11.0, 10.0, 22.0, 16.0, 30.0, 41.0, 38.0, 58.0, 70.0, 114.0, 174.0, 331.0, 833.0, 5113.0, 1908376.0, 1223594.0, 5021.0, 756.0, 382.0, 193.0, 94.0, 80.0, 50.0, 40.0, 28.0, 34.0, 33.0, 20.0, 18.0, 7.0, 15.0, 12.0, 5.0, 8.0, 5.0, 4.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-62.84375, -60.93896484375, -59.0341796875, -57.12939453125, -55.224609375, -53.31982421875, -51.4150390625, -49.51025390625, -47.60546875, -45.70068359375, -43.7958984375, -41.89111328125, -39.986328125, -38.08154296875, -36.1767578125, -34.27197265625, -32.3671875, -30.46240234375, -28.5576171875, -26.65283203125, -24.748046875, -22.84326171875, -20.9384765625, -19.03369140625, -17.12890625, -15.22412109375, -13.3193359375, -11.41455078125, -9.509765625, -7.60498046875, -5.7001953125, -3.79541015625, -1.890625, 0.01416015625, 1.9189453125, 3.82373046875, 5.728515625, 7.63330078125, 9.5380859375, 11.44287109375, 13.34765625, 15.25244140625, 17.1572265625, 19.06201171875, 20.966796875, 22.87158203125, 24.7763671875, 26.68115234375, 28.5859375, 30.49072265625, 32.3955078125, 34.30029296875, 36.205078125, 38.10986328125, 40.0146484375, 41.91943359375, 43.82421875, 45.72900390625, 47.6337890625, 49.53857421875, 51.443359375, 53.34814453125, 55.2529296875, 57.15771484375, 59.0625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 20.0, 840.0, 160.0], "bins": [-659.6683959960938, -649.1531982421875, -638.637939453125, -628.1227416992188, -617.6075439453125, -607.09228515625, -596.5770874023438, -586.0618896484375, -575.5466918945312, -565.031494140625, -554.5162353515625, -544.0010375976562, -533.48583984375, -522.9705810546875, -512.4553833007812, -501.940185546875, -491.4249267578125, -480.9096984863281, -470.3945007324219, -459.8792724609375, -449.36407470703125, -438.8488464355469, -428.3336181640625, -417.81842041015625, -407.30322265625, -396.7879943847656, -386.2727966308594, -375.757568359375, -365.24237060546875, -354.7271423339844, -344.2119140625, -333.69671630859375, -323.1814880371094, -312.666259765625, -302.15106201171875, -291.6358337402344, -281.1206359863281, -270.60540771484375, -260.0902099609375, -249.57498168945312, -239.0597686767578, -228.5445556640625, -218.0293426513672, -207.51412963867188, -196.9989013671875, -186.4836883544922, -175.96847534179688, -165.4532470703125, -154.93804931640625, -144.42283630371094, -133.90762329101562, -123.39240264892578, -112.87718200683594, -102.36196899414062, -91.84675598144531, -81.33153533935547, -70.81632232666016, -60.30110549926758, -49.785888671875, -39.27067565917969, -28.75545883178711, -18.24024200439453, -7.725028991699219, 2.790191650390625, 13.305407524108887]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 8.0, 6.0, 11.0, 15.0, 16.0, 16.0, 20.0, 19.0, 17.0, 25.0, 24.0, 30.0, 39.0, 38.0, 34.0, 41.0, 33.0, 39.0, 33.0, 48.0, 49.0, 49.0, 49.0, 46.0, 36.0, 29.0, 28.0, 34.0, 19.0, 27.0, 19.0, 22.0, 11.0, 13.0, 12.0, 9.0, 8.0, 3.0, 6.0, 3.0, 2.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-133.70159912109375, -129.6881866455078, -125.67477416992188, -121.66136169433594, -117.64794921875, -113.63453674316406, -109.62113189697266, -105.60771942138672, -101.59430694580078, -97.58089447021484, -93.5674819946289, -89.55406951904297, -85.54066467285156, -81.52725219726562, -77.51383972167969, -73.50042724609375, -69.48701477050781, -65.47360229492188, -61.46018981933594, -57.446781158447266, -53.43336868286133, -49.41995620727539, -45.40654754638672, -41.39313507080078, -37.379722595214844, -33.366310119628906, -29.3528995513916, -25.339488983154297, -21.32607650756836, -17.312664031982422, -13.299253463745117, -9.285842895507812, -5.2724456787109375, -1.2590341567993164, 2.7543773651123047, 6.767788887023926, 10.781200408935547, 14.794612884521484, 18.80802345275879, 22.821434020996094, 26.83484649658203, 30.84825897216797, 34.861671447753906, 38.87508010864258, 42.888492584228516, 46.90190505981445, 50.915313720703125, 54.92872619628906, 58.942138671875, 62.95555114746094, 66.96896362304688, 70.98237609863281, 74.99578857421875, 79.00920104980469, 83.0226058959961, 87.03601837158203, 91.04943084716797, 95.0628433227539, 99.07625579833984, 103.08966827392578, 107.10307312011719, 111.11648559570312, 115.12989807128906, 119.143310546875, 123.15672302246094]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 6.0, 4.0, 6.0, 7.0, 10.0, 19.0, 13.0, 17.0, 22.0, 23.0, 42.0, 34.0, 28.0, 34.0, 54.0, 49.0, 69.0, 67.0, 53.0, 51.0, 61.0, 44.0, 43.0, 37.0, 18.0, 38.0, 23.0, 31.0, 13.0, 15.0, 17.0, 9.0, 7.0, 4.0, 9.0, 3.0, 6.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.96875, -11.582275390625, -11.19580078125, -10.809326171875, -10.4228515625, -10.036376953125, -9.64990234375, -9.263427734375, -8.876953125, -8.490478515625, -8.10400390625, -7.717529296875, -7.3310546875, -6.944580078125, -6.55810546875, -6.171630859375, -5.78515625, -5.398681640625, -5.01220703125, -4.625732421875, -4.2392578125, -3.852783203125, -3.46630859375, -3.079833984375, -2.693359375, -2.306884765625, -1.92041015625, -1.533935546875, -1.1474609375, -0.760986328125, -0.37451171875, 0.011962890625, 0.3984375, 0.784912109375, 1.17138671875, 1.557861328125, 1.9443359375, 2.330810546875, 2.71728515625, 3.103759765625, 3.490234375, 3.876708984375, 4.26318359375, 4.649658203125, 5.0361328125, 5.422607421875, 5.80908203125, 6.195556640625, 6.58203125, 6.968505859375, 7.35498046875, 7.741455078125, 8.1279296875, 8.514404296875, 8.90087890625, 9.287353515625, 9.673828125, 10.060302734375, 10.44677734375, 10.833251953125, 11.2197265625, 11.606201171875, 11.99267578125, 12.379150390625, 12.765625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 7.0, 5.0, 3.0, 4.0, 11.0, 12.0, 18.0, 27.0, 24.0, 38.0, 61.0, 111.0, 192.0, 351.0, 771.0, 2086.0, 6530.0, 36187.0, 4021071.0, 112608.0, 9279.0, 2844.0, 1045.0, 425.0, 230.0, 91.0, 72.0, 47.0, 35.0, 22.0, 11.0, 24.0, 5.0, 9.0, 5.0, 7.0, 3.0, 4.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-71.0, -68.681640625, -66.36328125, -64.044921875, -61.7265625, -59.408203125, -57.08984375, -54.771484375, -52.453125, -50.134765625, -47.81640625, -45.498046875, -43.1796875, -40.861328125, -38.54296875, -36.224609375, -33.90625, -31.587890625, -29.26953125, -26.951171875, -24.6328125, -22.314453125, -19.99609375, -17.677734375, -15.359375, -13.041015625, -10.72265625, -8.404296875, -6.0859375, -3.767578125, -1.44921875, 0.869140625, 3.1875, 5.505859375, 7.82421875, 10.142578125, 12.4609375, 14.779296875, 17.09765625, 19.416015625, 21.734375, 24.052734375, 26.37109375, 28.689453125, 31.0078125, 33.326171875, 35.64453125, 37.962890625, 40.28125, 42.599609375, 44.91796875, 47.236328125, 49.5546875, 51.873046875, 54.19140625, 56.509765625, 58.828125, 61.146484375, 63.46484375, 65.783203125, 68.1015625, 70.419921875, 72.73828125, 75.056640625, 77.375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 6.0, 7.0, 4.0, 3.0, 3.0, 9.0, 8.0, 5.0, 13.0, 15.0, 20.0, 36.0, 37.0, 56.0, 117.0, 217.0, 446.0, 811.0, 926.0, 611.0, 296.0, 171.0, 71.0, 45.0, 25.0, 19.0, 12.0, 12.0, 10.0, 12.0, 7.0, 7.0, 8.0, 4.0, 5.0, 9.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.9375, -27.98095703125, -27.0244140625, -26.06787109375, -25.111328125, -24.15478515625, -23.1982421875, -22.24169921875, -21.28515625, -20.32861328125, -19.3720703125, -18.41552734375, -17.458984375, -16.50244140625, -15.5458984375, -14.58935546875, -13.6328125, -12.67626953125, -11.7197265625, -10.76318359375, -9.806640625, -8.85009765625, -7.8935546875, -6.93701171875, -5.98046875, -5.02392578125, -4.0673828125, -3.11083984375, -2.154296875, -1.19775390625, -0.2412109375, 0.71533203125, 1.671875, 2.62841796875, 3.5849609375, 4.54150390625, 5.498046875, 6.45458984375, 7.4111328125, 8.36767578125, 9.32421875, 10.28076171875, 11.2373046875, 12.19384765625, 13.150390625, 14.10693359375, 15.0634765625, 16.02001953125, 16.9765625, 17.93310546875, 18.8896484375, 19.84619140625, 20.802734375, 21.75927734375, 22.7158203125, 23.67236328125, 24.62890625, 25.58544921875, 26.5419921875, 27.49853515625, 28.455078125, 29.41162109375, 30.3681640625, 31.32470703125, 32.28125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 5.0, 11.0, 13.0, 22.0, 33.0, 57.0, 86.0, 155.0, 249.0, 430.0, 736.0, 1313.0, 2326.0, 4302.0, 8370.0, 18175.0, 52113.0, 638659.0, 3298913.0, 115672.0, 27938.0, 11777.0, 5725.0, 3145.0, 1718.0, 969.0, 581.0, 306.0, 177.0, 102.0, 77.0, 47.0, 27.0, 17.0, 13.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-56.5, -54.7998046875, -53.099609375, -51.3994140625, -49.69921875, -47.9990234375, -46.298828125, -44.5986328125, -42.8984375, -41.1982421875, -39.498046875, -37.7978515625, -36.09765625, -34.3974609375, -32.697265625, -30.9970703125, -29.296875, -27.5966796875, -25.896484375, -24.1962890625, -22.49609375, -20.7958984375, -19.095703125, -17.3955078125, -15.6953125, -13.9951171875, -12.294921875, -10.5947265625, -8.89453125, -7.1943359375, -5.494140625, -3.7939453125, -2.09375, -0.3935546875, 1.306640625, 3.0068359375, 4.70703125, 6.4072265625, 8.107421875, 9.8076171875, 11.5078125, 13.2080078125, 14.908203125, 16.6083984375, 18.30859375, 20.0087890625, 21.708984375, 23.4091796875, 25.109375, 26.8095703125, 28.509765625, 30.2099609375, 31.91015625, 33.6103515625, 35.310546875, 37.0107421875, 38.7109375, 40.4111328125, 42.111328125, 43.8115234375, 45.51171875, 47.2119140625, 48.912109375, 50.6123046875, 52.3125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 12.0, 17.0, 24.0, 41.0, 63.0, 99.0, 176.0, 204.0, 142.0, 90.0, 51.0, 26.0, 24.0, 11.0, 9.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-244.9332733154297, -239.7628936767578, -234.59251403808594, -229.42213439941406, -224.2517547607422, -219.0813751220703, -213.91099548339844, -208.74063110351562, -203.57025146484375, -198.39987182617188, -193.2294921875, -188.05911254882812, -182.88873291015625, -177.71835327148438, -172.5479736328125, -167.37759399414062, -162.20721435546875, -157.03683471679688, -151.866455078125, -146.69607543945312, -141.52569580078125, -136.35531616210938, -131.1849365234375, -126.01456451416016, -120.84418487548828, -115.6738052368164, -110.50342559814453, -105.33304595947266, -100.16267395019531, -94.99229431152344, -89.82191467285156, -84.65153503417969, -79.48117065429688, -74.310791015625, -69.14041137695312, -63.970035552978516, -58.79965591430664, -53.629276275634766, -48.458900451660156, -43.28852081298828, -38.118141174316406, -32.94776153564453, -27.77738380432129, -22.607006072998047, -17.436626434326172, -12.266246795654297, -7.095869064331055, -1.9254913330078125, 3.2448883056640625, 8.415266990661621, 13.58564567565918, 18.756023406982422, 23.926403045654297, 29.096782684326172, 34.26715850830078, 39.437538146972656, 44.60791778564453, 49.778297424316406, 54.94867706298828, 60.11905288696289, 65.2894287109375, 70.45980834960938, 75.63018798828125, 80.80056762695312, 85.970947265625]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 3.0, 1.0, 8.0, 7.0, 5.0, 6.0, 20.0, 13.0, 24.0, 18.0, 15.0, 25.0, 23.0, 23.0, 26.0, 32.0, 33.0, 30.0, 41.0, 40.0, 38.0, 43.0, 41.0, 31.0, 39.0, 45.0, 39.0, 44.0, 31.0, 37.0, 27.0, 31.0, 14.0, 21.0, 18.0, 16.0, 19.0, 10.0, 13.0, 8.0, 9.0, 7.0, 6.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.24476623535156, -66.90499877929688, -64.56523132324219, -62.225460052490234, -59.88569259643555, -57.545921325683594, -55.206153869628906, -52.86638641357422, -50.52661895751953, -48.186851501464844, -45.84708023071289, -43.5073127746582, -41.167545318603516, -38.82777404785156, -36.488006591796875, -34.14823913574219, -31.808467864990234, -29.468698501586914, -27.128931045532227, -24.789161682128906, -22.44939422607422, -20.1096248626709, -17.769855499267578, -15.43008804321289, -13.09031867980957, -10.750550270080566, -8.410781860351562, -6.071012496948242, -3.7312440872192383, -1.3914756774902344, 0.9482936859130859, 3.2880611419677734, 5.627830505371094, 7.967598915100098, 10.307367324829102, 12.647136688232422, 14.986905097961426, 17.32667350769043, 19.66644287109375, 22.006210327148438, 24.345979690551758, 26.685749053955078, 29.025516510009766, 31.365285873413086, 33.705055236816406, 36.044822692871094, 38.38459014892578, 40.72435760498047, 43.06412887573242, 45.40389633178711, 47.74366760253906, 50.08343505859375, 52.42320251464844, 54.762969970703125, 57.10274124145508, 59.442508697509766, 61.78227996826172, 64.1220474243164, 66.4618148803711, 68.80158996582031, 71.141357421875, 73.48112487792969, 75.82089233398438, 78.16065979003906, 80.50042724609375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 4.0, 4.0, 9.0, 8.0, 6.0, 14.0, 12.0, 12.0, 21.0, 19.0, 25.0, 37.0, 31.0, 35.0, 30.0, 31.0, 49.0, 55.0, 54.0, 46.0, 57.0, 39.0, 48.0, 36.0, 39.0, 35.0, 33.0, 35.0, 32.0, 18.0, 25.0, 18.0, 19.0, 18.0, 13.0, 7.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.265625, -10.899658203125, -10.53369140625, -10.167724609375, -9.8017578125, -9.435791015625, -9.06982421875, -8.703857421875, -8.337890625, -7.971923828125, -7.60595703125, -7.239990234375, -6.8740234375, -6.508056640625, -6.14208984375, -5.776123046875, -5.41015625, -5.044189453125, -4.67822265625, -4.312255859375, -3.9462890625, -3.580322265625, -3.21435546875, -2.848388671875, -2.482421875, -2.116455078125, -1.75048828125, -1.384521484375, -1.0185546875, -0.652587890625, -0.28662109375, 0.079345703125, 0.4453125, 0.811279296875, 1.17724609375, 1.543212890625, 1.9091796875, 2.275146484375, 2.64111328125, 3.007080078125, 3.373046875, 3.739013671875, 4.10498046875, 4.470947265625, 4.8369140625, 5.202880859375, 5.56884765625, 5.934814453125, 6.30078125, 6.666748046875, 7.03271484375, 7.398681640625, 7.7646484375, 8.130615234375, 8.49658203125, 8.862548828125, 9.228515625, 9.594482421875, 9.96044921875, 10.326416015625, 10.6923828125, 11.058349609375, 11.42431640625, 11.790283203125, 12.15625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 5.0, 7.0, 15.0, 18.0, 13.0, 29.0, 48.0, 68.0, 104.0, 129.0, 196.0, 268.0, 329.0, 546.0, 796.0, 1149.0, 1507.0, 2400.0, 3448.0, 5343.0, 8116.0, 12790.0, 20371.0, 33655.0, 58089.0, 108637.0, 222712.0, 262609.0, 132377.0, 68256.0, 39022.0, 23346.0, 14478.0, 9293.0, 6023.0, 3916.0, 2655.0, 1831.0, 1149.0, 808.0, 607.0, 405.0, 315.0, 213.0, 136.0, 97.0, 73.0, 51.0, 30.0, 33.0, 24.0, 16.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1142578125, -1.0784759521484375, -1.042694091796875, -1.0069122314453125, -0.97113037109375, -0.9353485107421875, -0.899566650390625, -0.8637847900390625, -0.8280029296875, -0.7922210693359375, -0.756439208984375, -0.7206573486328125, -0.68487548828125, -0.6490936279296875, -0.613311767578125, -0.5775299072265625, -0.541748046875, -0.5059661865234375, -0.470184326171875, -0.4344024658203125, -0.39862060546875, -0.3628387451171875, -0.327056884765625, -0.2912750244140625, -0.2554931640625, -0.2197113037109375, -0.183929443359375, -0.1481475830078125, -0.11236572265625, -0.0765838623046875, -0.040802001953125, -0.0050201416015625, 0.03076171875, 0.0665435791015625, 0.102325439453125, 0.1381072998046875, 0.17388916015625, 0.2096710205078125, 0.245452880859375, 0.2812347412109375, 0.3170166015625, 0.3527984619140625, 0.388580322265625, 0.4243621826171875, 0.46014404296875, 0.4959259033203125, 0.531707763671875, 0.5674896240234375, 0.603271484375, 0.6390533447265625, 0.674835205078125, 0.7106170654296875, 0.74639892578125, 0.7821807861328125, 0.817962646484375, 0.8537445068359375, 0.8895263671875, 0.9253082275390625, 0.961090087890625, 0.9968719482421875, 1.03265380859375, 1.0684356689453125, 1.104217529296875, 1.1399993896484375, 1.17578125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 9.0, 5.0, 4.0, 11.0, 16.0, 16.0, 16.0, 18.0, 31.0, 27.0, 26.0, 22.0, 31.0, 39.0, 24.0, 25.0, 36.0, 31.0, 40.0, 51.0, 1054.0, 42.0, 44.0, 33.0, 38.0, 30.0, 29.0, 33.0, 38.0, 30.0, 30.0, 23.0, 17.0, 17.0, 17.0, 14.0, 11.0, 10.0, 8.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.0234375, -5.8134765625, -5.603515625, -5.3935546875, -5.18359375, -4.9736328125, -4.763671875, -4.5537109375, -4.34375, -4.1337890625, -3.923828125, -3.7138671875, -3.50390625, -3.2939453125, -3.083984375, -2.8740234375, -2.6640625, -2.4541015625, -2.244140625, -2.0341796875, -1.82421875, -1.6142578125, -1.404296875, -1.1943359375, -0.984375, -0.7744140625, -0.564453125, -0.3544921875, -0.14453125, 0.0654296875, 0.275390625, 0.4853515625, 0.6953125, 0.9052734375, 1.115234375, 1.3251953125, 1.53515625, 1.7451171875, 1.955078125, 2.1650390625, 2.375, 2.5849609375, 2.794921875, 3.0048828125, 3.21484375, 3.4248046875, 3.634765625, 3.8447265625, 4.0546875, 4.2646484375, 4.474609375, 4.6845703125, 4.89453125, 5.1044921875, 5.314453125, 5.5244140625, 5.734375, 5.9443359375, 6.154296875, 6.3642578125, 6.57421875, 6.7841796875, 6.994140625, 7.2041015625, 7.4140625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 17.0, 16.0, 37.0, 49.0, 87.0, 116.0, 160.0, 279.0, 413.0, 685.0, 995.0, 1577.0, 2530.0, 3840.0, 6088.0, 9694.0, 15455.0, 24680.0, 40913.0, 69615.0, 124625.0, 683999.0, 806968.0, 126088.0, 69611.0, 40639.0, 25077.0, 15711.0, 9997.0, 6267.0, 3951.0, 2468.0, 1559.0, 1033.0, 643.0, 453.0, 270.0, 150.0, 125.0, 89.0, 56.0, 33.0, 20.0, 14.0, 8.0, 9.0, 4.0, 1.0, 5.0, 0.0, 2.0], "bins": [-0.767578125, -0.7456512451171875, -0.723724365234375, -0.7017974853515625, -0.67987060546875, -0.6579437255859375, -0.636016845703125, -0.6140899658203125, -0.5921630859375, -0.5702362060546875, -0.548309326171875, -0.5263824462890625, -0.50445556640625, -0.4825286865234375, -0.460601806640625, -0.4386749267578125, -0.416748046875, -0.3948211669921875, -0.372894287109375, -0.3509674072265625, -0.32904052734375, -0.3071136474609375, -0.285186767578125, -0.2632598876953125, -0.2413330078125, -0.2194061279296875, -0.197479248046875, -0.1755523681640625, -0.15362548828125, -0.1316986083984375, -0.109771728515625, -0.0878448486328125, -0.06591796875, -0.0439910888671875, -0.022064208984375, -0.0001373291015625, 0.02178955078125, 0.0437164306640625, 0.065643310546875, 0.0875701904296875, 0.1094970703125, 0.1314239501953125, 0.153350830078125, 0.1752777099609375, 0.19720458984375, 0.2191314697265625, 0.241058349609375, 0.2629852294921875, 0.284912109375, 0.3068389892578125, 0.328765869140625, 0.3506927490234375, 0.37261962890625, 0.3945465087890625, 0.416473388671875, 0.4384002685546875, 0.4603271484375, 0.4822540283203125, 0.504180908203125, 0.5261077880859375, 0.54803466796875, 0.5699615478515625, 0.591888427734375, 0.6138153076171875, 0.6357421875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 3.0, 7.0, 2.0, 5.0, 10.0, 8.0, 13.0, 10.0, 9.0, 11.0, 18.0, 16.0, 18.0, 25.0, 28.0, 35.0, 39.0, 49.0, 62.0, 67.0, 72.0, 68.0, 72.0, 54.0, 47.0, 31.0, 38.0, 22.0, 25.0, 16.0, 19.0, 19.0, 12.0, 10.0, 13.0, 2.0, 4.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 5.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01110076904296875, -0.010750174522399902, -0.010399580001831055, -0.010048985481262207, -0.00969839096069336, -0.009347796440124512, -0.008997201919555664, -0.008646607398986816, -0.008296012878417969, -0.007945418357849121, -0.0075948238372802734, -0.007244229316711426, -0.006893634796142578, -0.0065430402755737305, -0.006192445755004883, -0.005841851234436035, -0.0054912567138671875, -0.00514066219329834, -0.004790067672729492, -0.0044394731521606445, -0.004088878631591797, -0.0037382841110229492, -0.0033876895904541016, -0.003037095069885254, -0.0026865005493164062, -0.0023359060287475586, -0.001985311508178711, -0.0016347169876098633, -0.0012841224670410156, -0.000933527946472168, -0.0005829334259033203, -0.00023233890533447266, 0.000118255615234375, 0.00046885013580322266, 0.0008194446563720703, 0.001170039176940918, 0.0015206336975097656, 0.0018712282180786133, 0.002221822738647461, 0.0025724172592163086, 0.0029230117797851562, 0.003273606300354004, 0.0036242008209228516, 0.003974795341491699, 0.004325389862060547, 0.0046759843826293945, 0.005026578903198242, 0.00537717342376709, 0.0057277679443359375, 0.006078362464904785, 0.006428956985473633, 0.0067795515060424805, 0.007130146026611328, 0.007480740547180176, 0.007831335067749023, 0.008181929588317871, 0.008532524108886719, 0.008883118629455566, 0.009233713150024414, 0.009584307670593262, 0.00993490219116211, 0.010285496711730957, 0.010636091232299805, 0.010986685752868652, 0.0113372802734375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 6.0, 8.0, 8.0, 10.0, 10.0, 10.0, 23.0, 27.0, 29.0, 28.0, 52.0, 79.0, 114.0, 154.0, 272.0, 743.0, 6406.0, 884851.0, 151469.0, 2998.0, 514.0, 235.0, 105.0, 101.0, 64.0, 44.0, 39.0, 30.0, 32.0, 23.0, 17.0, 9.0, 7.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.5537109375, -0.5373573303222656, -0.5210037231445312, -0.5046501159667969, -0.4882965087890625, -0.4719429016113281, -0.45558929443359375, -0.4392356872558594, -0.422882080078125, -0.4065284729003906, -0.39017486572265625, -0.3738212585449219, -0.3574676513671875, -0.3411140441894531, -0.32476043701171875, -0.3084068298339844, -0.29205322265625, -0.2756996154785156, -0.25934600830078125, -0.24299240112304688, -0.2266387939453125, -0.21028518676757812, -0.19393157958984375, -0.17757797241210938, -0.161224365234375, -0.14487075805664062, -0.12851715087890625, -0.11216354370117188, -0.0958099365234375, -0.07945632934570312, -0.06310272216796875, -0.046749114990234375, -0.0303955078125, -0.014041900634765625, 0.00231170654296875, 0.018665313720703125, 0.0350189208984375, 0.051372528076171875, 0.06772613525390625, 0.08407974243164062, 0.100433349609375, 0.11678695678710938, 0.13314056396484375, 0.14949417114257812, 0.1658477783203125, 0.18220138549804688, 0.19855499267578125, 0.21490859985351562, 0.23126220703125, 0.24761581420898438, 0.26396942138671875, 0.2803230285644531, 0.2966766357421875, 0.3130302429199219, 0.32938385009765625, 0.3457374572753906, 0.362091064453125, 0.3784446716308594, 0.39479827880859375, 0.4111518859863281, 0.4275054931640625, 0.4438591003417969, 0.46021270751953125, 0.4765663146972656, 0.492919921875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 14.0, 46.0, 226.0, 550.0, 136.0, 29.0, 10.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033143263310194016, -0.025342797860503197, -0.017542332410812378, -0.009741868823766708, -0.0019414033740758896, 0.005859062075614929, 0.013659525662660599, 0.021459992974996567, 0.029260456562042236, 0.037060920149087906, 0.044861387461423874, 0.05266185104846954, 0.06046231836080551, 0.06826278567314148, 0.07606324553489685, 0.08386371284723282, 0.09166418015956879, 0.09946464747190475, 0.10726510733366013, 0.1150655746459961, 0.12286604195833206, 0.13066650927066803, 0.1384669691324234, 0.14626744389533997, 0.15406790375709534, 0.1618683636188507, 0.16966883838176727, 0.17746929824352264, 0.18526975810527802, 0.19307023286819458, 0.20087069272994995, 0.20867115259170532, 0.2164716273546219, 0.22427208721637726, 0.23207256197929382, 0.2398730218410492, 0.24767348170280457, 0.25547394156455994, 0.2632744312286377, 0.27107489109039307, 0.27887535095214844, 0.2866758108139038, 0.2944762706756592, 0.30227673053741455, 0.3100772202014923, 0.3178776800632477, 0.32567813992500305, 0.3334785997867584, 0.3412790596485138, 0.34907951951026917, 0.35687997937202454, 0.3646804690361023, 0.37248092889785767, 0.38028138875961304, 0.3880818486213684, 0.3958823084831238, 0.40368279814720154, 0.4114832580089569, 0.4192837178707123, 0.42708420753479004, 0.4348846673965454, 0.4426851272583008, 0.45048558712005615, 0.4582860469818115, 0.4660865068435669]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 7.0, 5.0, 8.0, 7.0, 13.0, 11.0, 14.0, 14.0, 17.0, 20.0, 15.0, 11.0, 22.0, 29.0, 25.0, 41.0, 35.0, 35.0, 36.0, 37.0, 45.0, 40.0, 43.0, 39.0, 42.0, 38.0, 34.0, 29.0, 37.0, 30.0, 23.0, 27.0, 32.0, 22.0, 22.0, 15.0, 15.0, 22.0, 11.0, 11.0, 9.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.013226926326751709, -0.01282772421836853, -0.012428522109985352, -0.012029320001602173, -0.011630117893218994, -0.011230915784835815, -0.010831713676452637, -0.010432511568069458, -0.01003330945968628, -0.0096341073513031, -0.009234905242919922, -0.008835703134536743, -0.008436501026153564, -0.008037298917770386, -0.007638096809387207, -0.007238894701004028, -0.00683969259262085, -0.006440490484237671, -0.006041288375854492, -0.0056420862674713135, -0.005242884159088135, -0.004843682050704956, -0.004444479942321777, -0.004045277833938599, -0.00364607572555542, -0.003246873617172241, -0.0028476715087890625, -0.002448469400405884, -0.002049267292022705, -0.0016500651836395264, -0.0012508630752563477, -0.0008516609668731689, -0.00045245885848999023, -5.3256750106811523e-05, 0.0003459453582763672, 0.0007451474666595459, 0.0011443495750427246, 0.0015435516834259033, 0.001942753791809082, 0.0023419559001922607, 0.0027411580085754395, 0.003140360116958618, 0.003539562225341797, 0.003938764333724976, 0.004337966442108154, 0.004737168550491333, 0.005136370658874512, 0.00553557276725769, 0.005934774875640869, 0.006333976984024048, 0.0067331790924072266, 0.007132381200790405, 0.007531583309173584, 0.007930785417556763, 0.008329987525939941, 0.00872918963432312, 0.009128391742706299, 0.009527593851089478, 0.009926795959472656, 0.010325998067855835, 0.010725200176239014, 0.011124402284622192, 0.011523604393005371, 0.01192280650138855, 0.012322008609771729]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 4.0, 4.0, 9.0, 8.0, 6.0, 15.0, 11.0, 12.0, 21.0, 19.0, 25.0, 37.0, 31.0, 35.0, 30.0, 31.0, 49.0, 55.0, 54.0, 46.0, 57.0, 39.0, 48.0, 36.0, 39.0, 35.0, 33.0, 35.0, 32.0, 18.0, 25.0, 18.0, 19.0, 18.0, 13.0, 7.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.265625, -10.899658203125, -10.53369140625, -10.167724609375, -9.8017578125, -9.435791015625, -9.06982421875, -8.703857421875, -8.337890625, -7.971923828125, -7.60595703125, -7.239990234375, -6.8740234375, -6.508056640625, -6.14208984375, -5.776123046875, -5.41015625, -5.044189453125, -4.67822265625, -4.312255859375, -3.9462890625, -3.580322265625, -3.21435546875, -2.848388671875, -2.482421875, -2.116455078125, -1.75048828125, -1.384521484375, -1.0185546875, -0.652587890625, -0.28662109375, 0.079345703125, 0.4453125, 0.811279296875, 1.17724609375, 1.543212890625, 1.9091796875, 2.275146484375, 2.64111328125, 3.007080078125, 3.373046875, 3.739013671875, 4.10498046875, 4.470947265625, 4.8369140625, 5.202880859375, 5.56884765625, 5.934814453125, 6.30078125, 6.666748046875, 7.03271484375, 7.398681640625, 7.7646484375, 8.130615234375, 8.49658203125, 8.862548828125, 9.228515625, 9.594482421875, 9.96044921875, 10.326416015625, 10.6923828125, 11.058349609375, 11.42431640625, 11.790283203125, 12.15625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 3.0, 3.0, 6.0, 5.0, 8.0, 13.0, 12.0, 12.0, 23.0, 30.0, 43.0, 59.0, 95.0, 108.0, 187.0, 237.0, 402.0, 593.0, 1053.0, 1863.0, 3594.0, 7412.0, 17179.0, 47684.0, 163485.0, 533642.0, 183643.0, 52206.0, 18566.0, 7611.0, 3629.0, 2009.0, 1122.0, 688.0, 410.0, 290.0, 182.0, 141.0, 95.0, 58.0, 46.0, 29.0, 20.0, 16.0, 18.0, 7.0, 7.0, 4.0, 6.0, 2.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.06640625, -4.8948974609375, -4.723388671875, -4.5518798828125, -4.38037109375, -4.2088623046875, -4.037353515625, -3.8658447265625, -3.6943359375, -3.5228271484375, -3.351318359375, -3.1798095703125, -3.00830078125, -2.8367919921875, -2.665283203125, -2.4937744140625, -2.322265625, -2.1507568359375, -1.979248046875, -1.8077392578125, -1.63623046875, -1.4647216796875, -1.293212890625, -1.1217041015625, -0.9501953125, -0.7786865234375, -0.607177734375, -0.4356689453125, -0.26416015625, -0.0926513671875, 0.078857421875, 0.2503662109375, 0.421875, 0.5933837890625, 0.764892578125, 0.9364013671875, 1.10791015625, 1.2794189453125, 1.450927734375, 1.6224365234375, 1.7939453125, 1.9654541015625, 2.136962890625, 2.3084716796875, 2.47998046875, 2.6514892578125, 2.822998046875, 2.9945068359375, 3.166015625, 3.3375244140625, 3.509033203125, 3.6805419921875, 3.85205078125, 4.0235595703125, 4.195068359375, 4.3665771484375, 4.5380859375, 4.7095947265625, 4.881103515625, 5.0526123046875, 5.22412109375, 5.3956298828125, 5.567138671875, 5.7386474609375, 5.91015625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 1.0, 7.0, 5.0, 5.0, 12.0, 8.0, 7.0, 15.0, 15.0, 19.0, 29.0, 19.0, 25.0, 25.0, 25.0, 34.0, 32.0, 34.0, 32.0, 44.0, 55.0, 206.0, 1890.0, 70.0, 40.0, 24.0, 44.0, 26.0, 33.0, 33.0, 28.0, 28.0, 16.0, 27.0, 22.0, 16.0, 16.0, 19.0, 10.0, 10.0, 11.0, 11.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-39.46875, -38.27880859375, -37.0888671875, -35.89892578125, -34.708984375, -33.51904296875, -32.3291015625, -31.13916015625, -29.94921875, -28.75927734375, -27.5693359375, -26.37939453125, -25.189453125, -23.99951171875, -22.8095703125, -21.61962890625, -20.4296875, -19.23974609375, -18.0498046875, -16.85986328125, -15.669921875, -14.47998046875, -13.2900390625, -12.10009765625, -10.91015625, -9.72021484375, -8.5302734375, -7.34033203125, -6.150390625, -4.96044921875, -3.7705078125, -2.58056640625, -1.390625, -0.20068359375, 0.9892578125, 2.17919921875, 3.369140625, 4.55908203125, 5.7490234375, 6.93896484375, 8.12890625, 9.31884765625, 10.5087890625, 11.69873046875, 12.888671875, 14.07861328125, 15.2685546875, 16.45849609375, 17.6484375, 18.83837890625, 20.0283203125, 21.21826171875, 22.408203125, 23.59814453125, 24.7880859375, 25.97802734375, 27.16796875, 28.35791015625, 29.5478515625, 30.73779296875, 31.927734375, 33.11767578125, 34.3076171875, 35.49755859375, 36.6875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 10.0, 10.0, 6.0, 15.0, 19.0, 14.0, 19.0, 21.0, 29.0, 25.0, 44.0, 55.0, 64.0, 117.0, 132.0, 213.0, 352.0, 664.0, 2958.0, 3031486.0, 106462.0, 1466.0, 528.0, 312.0, 199.0, 110.0, 79.0, 51.0, 40.0, 36.0, 23.0, 28.0, 22.0, 18.0, 15.0, 8.0, 8.0, 7.0, 6.0, 6.0, 7.0, 1.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-60.1875, -58.2353515625, -56.283203125, -54.3310546875, -52.37890625, -50.4267578125, -48.474609375, -46.5224609375, -44.5703125, -42.6181640625, -40.666015625, -38.7138671875, -36.76171875, -34.8095703125, -32.857421875, -30.9052734375, -28.953125, -27.0009765625, -25.048828125, -23.0966796875, -21.14453125, -19.1923828125, -17.240234375, -15.2880859375, -13.3359375, -11.3837890625, -9.431640625, -7.4794921875, -5.52734375, -3.5751953125, -1.623046875, 0.3291015625, 2.28125, 4.2333984375, 6.185546875, 8.1376953125, 10.08984375, 12.0419921875, 13.994140625, 15.9462890625, 17.8984375, 19.8505859375, 21.802734375, 23.7548828125, 25.70703125, 27.6591796875, 29.611328125, 31.5634765625, 33.515625, 35.4677734375, 37.419921875, 39.3720703125, 41.32421875, 43.2763671875, 45.228515625, 47.1806640625, 49.1328125, 51.0849609375, 53.037109375, 54.9892578125, 56.94140625, 58.8935546875, 60.845703125, 62.7978515625, 64.75]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 412.0, 606.0, 1.0, 1.0, 2.0], "bins": [-669.5501708984375, -658.401123046875, -647.2520751953125, -636.10302734375, -624.9539794921875, -613.8049926757812, -602.6559448242188, -591.5068969726562, -580.3578491210938, -569.2088012695312, -558.0597534179688, -546.9107055664062, -535.7616577148438, -524.6126708984375, -513.463623046875, -502.3145751953125, -491.16552734375, -480.0164794921875, -468.867431640625, -457.7184143066406, -446.5693664550781, -435.4203186035156, -424.2712707519531, -413.12225341796875, -401.9731750488281, -390.8241271972656, -379.6750793457031, -368.52606201171875, -357.37701416015625, -346.22796630859375, -335.07891845703125, -323.92987060546875, -312.78082275390625, -301.63177490234375, -290.48272705078125, -279.3337097167969, -268.1846618652344, -257.0356140136719, -245.88656616210938, -234.73753356933594, -223.5885009765625, -212.439453125, -201.29042053222656, -190.14137268066406, -178.99234008789062, -167.84329223632812, -156.69424438476562, -145.5452117919922, -134.39617919921875, -123.24713897705078, -112.09809875488281, -100.94905090332031, -89.80001831054688, -78.65097045898438, -67.5019302368164, -56.35289001464844, -45.20384216308594, -34.05480194091797, -22.905759811401367, -11.756717681884766, -0.6076774597167969, 10.541362762451172, 21.690406799316406, 32.839447021484375, 43.988487243652344]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 2.0, 5.0, 10.0, 6.0, 6.0, 10.0, 14.0, 11.0, 12.0, 24.0, 26.0, 21.0, 26.0, 20.0, 28.0, 31.0, 42.0, 32.0, 34.0, 40.0, 30.0, 36.0, 46.0, 40.0, 35.0, 29.0, 25.0, 32.0, 33.0, 41.0, 32.0, 23.0, 22.0, 21.0, 16.0, 23.0, 12.0, 17.0, 9.0, 17.0, 11.0, 6.0, 10.0, 9.0, 8.0, 7.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-127.93402099609375, -124.18264770507812, -120.43128204345703, -116.67991638183594, -112.92854309082031, -109.17716979980469, -105.4258041381836, -101.6744384765625, -97.92306518554688, -94.17169189453125, -90.42032623291016, -86.66896057128906, -82.91758728027344, -79.16621398925781, -75.41484832763672, -71.66348266601562, -67.912109375, -64.16073608398438, -60.40937042236328, -56.65800094604492, -52.90663146972656, -49.1552619934082, -45.403892517089844, -41.652523040771484, -37.901153564453125, -34.149784088134766, -30.398414611816406, -26.647045135498047, -22.895675659179688, -19.144306182861328, -15.392936706542969, -11.64156723022461, -7.89019775390625, -4.138828277587891, -0.38745880126953125, 3.363910675048828, 7.1152801513671875, 10.866649627685547, 14.618019104003906, 18.369388580322266, 22.120758056640625, 25.872127532958984, 29.623497009277344, 33.3748664855957, 37.12623596191406, 40.87760543823242, 44.62897491455078, 48.38034439086914, 52.1317138671875, 55.88308334350586, 59.63445281982422, 63.38582229614258, 67.13719177246094, 70.88856506347656, 74.63993072509766, 78.39129638671875, 82.14266967773438, 85.89404296875, 89.6454086303711, 93.39677429199219, 97.14814758300781, 100.89952087402344, 104.65088653564453, 108.40225219726562, 112.15362548828125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 4.0, 6.0, 6.0, 10.0, 14.0, 9.0, 13.0, 20.0, 11.0, 27.0, 34.0, 35.0, 28.0, 29.0, 37.0, 38.0, 54.0, 54.0, 47.0, 55.0, 42.0, 47.0, 39.0, 41.0, 32.0, 40.0, 30.0, 36.0, 23.0, 18.0, 24.0, 18.0, 14.0, 21.0, 8.0, 6.0, 4.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.3828125, -11.017822265625, -10.65283203125, -10.287841796875, -9.9228515625, -9.557861328125, -9.19287109375, -8.827880859375, -8.462890625, -8.097900390625, -7.73291015625, -7.367919921875, -7.0029296875, -6.637939453125, -6.27294921875, -5.907958984375, -5.54296875, -5.177978515625, -4.81298828125, -4.447998046875, -4.0830078125, -3.718017578125, -3.35302734375, -2.988037109375, -2.623046875, -2.258056640625, -1.89306640625, -1.528076171875, -1.1630859375, -0.798095703125, -0.43310546875, -0.068115234375, 0.296875, 0.661865234375, 1.02685546875, 1.391845703125, 1.7568359375, 2.121826171875, 2.48681640625, 2.851806640625, 3.216796875, 3.581787109375, 3.94677734375, 4.311767578125, 4.6767578125, 5.041748046875, 5.40673828125, 5.771728515625, 6.13671875, 6.501708984375, 6.86669921875, 7.231689453125, 7.5966796875, 7.961669921875, 8.32666015625, 8.691650390625, 9.056640625, 9.421630859375, 9.78662109375, 10.151611328125, 10.5166015625, 10.881591796875, 11.24658203125, 11.611572265625, 11.9765625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 5.0, 6.0, 9.0, 13.0, 9.0, 21.0, 31.0, 38.0, 44.0, 75.0, 85.0, 130.0, 147.0, 213.0, 336.0, 425.0, 713.0, 936.0, 1508.0, 2239.0, 3688.0, 6241.0, 11755.0, 47183.0, 1004766.0, 2944907.0, 131017.0, 17568.0, 7864.0, 4526.0, 2674.0, 1695.0, 1070.0, 743.0, 475.0, 330.0, 233.0, 158.0, 120.0, 79.0, 63.0, 38.0, 33.0, 23.0, 14.0, 7.0, 16.0, 5.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-32.84375, -31.85400390625, -30.8642578125, -29.87451171875, -28.884765625, -27.89501953125, -26.9052734375, -25.91552734375, -24.92578125, -23.93603515625, -22.9462890625, -21.95654296875, -20.966796875, -19.97705078125, -18.9873046875, -17.99755859375, -17.0078125, -16.01806640625, -15.0283203125, -14.03857421875, -13.048828125, -12.05908203125, -11.0693359375, -10.07958984375, -9.08984375, -8.10009765625, -7.1103515625, -6.12060546875, -5.130859375, -4.14111328125, -3.1513671875, -2.16162109375, -1.171875, -0.18212890625, 0.8076171875, 1.79736328125, 2.787109375, 3.77685546875, 4.7666015625, 5.75634765625, 6.74609375, 7.73583984375, 8.7255859375, 9.71533203125, 10.705078125, 11.69482421875, 12.6845703125, 13.67431640625, 14.6640625, 15.65380859375, 16.6435546875, 17.63330078125, 18.623046875, 19.61279296875, 20.6025390625, 21.59228515625, 22.58203125, 23.57177734375, 24.5615234375, 25.55126953125, 26.541015625, 27.53076171875, 28.5205078125, 29.51025390625, 30.5]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 2.0, 6.0, 7.0, 6.0, 10.0, 11.0, 12.0, 10.0, 12.0, 19.0, 32.0, 30.0, 72.0, 126.0, 274.0, 530.0, 929.0, 877.0, 507.0, 245.0, 118.0, 61.0, 36.0, 29.0, 13.0, 16.0, 9.0, 13.0, 10.0, 4.0, 9.0, 6.0, 4.0, 9.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-34.375, -33.361572265625, -32.34814453125, -31.334716796875, -30.3212890625, -29.307861328125, -28.29443359375, -27.281005859375, -26.267578125, -25.254150390625, -24.24072265625, -23.227294921875, -22.2138671875, -21.200439453125, -20.18701171875, -19.173583984375, -18.16015625, -17.146728515625, -16.13330078125, -15.119873046875, -14.1064453125, -13.093017578125, -12.07958984375, -11.066162109375, -10.052734375, -9.039306640625, -8.02587890625, -7.012451171875, -5.9990234375, -4.985595703125, -3.97216796875, -2.958740234375, -1.9453125, -0.931884765625, 0.08154296875, 1.094970703125, 2.1083984375, 3.121826171875, 4.13525390625, 5.148681640625, 6.162109375, 7.175537109375, 8.18896484375, 9.202392578125, 10.2158203125, 11.229248046875, 12.24267578125, 13.256103515625, 14.26953125, 15.282958984375, 16.29638671875, 17.309814453125, 18.3232421875, 19.336669921875, 20.35009765625, 21.363525390625, 22.376953125, 23.390380859375, 24.40380859375, 25.417236328125, 26.4306640625, 27.444091796875, 28.45751953125, 29.470947265625, 30.484375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 10.0, 15.0, 26.0, 21.0, 42.0, 67.0, 95.0, 143.0, 231.0, 316.0, 466.0, 726.0, 1139.0, 1694.0, 2780.0, 4390.0, 7326.0, 12642.0, 24948.0, 69090.0, 735850.0, 3090272.0, 162153.0, 37933.0, 17192.0, 9504.0, 5550.0, 3464.0, 2169.0, 1379.0, 915.0, 597.0, 370.0, 260.0, 160.0, 110.0, 65.0, 55.0, 45.0, 19.0, 15.0, 12.0, 12.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.03125, -36.6845703125, -35.337890625, -33.9912109375, -32.64453125, -31.2978515625, -29.951171875, -28.6044921875, -27.2578125, -25.9111328125, -24.564453125, -23.2177734375, -21.87109375, -20.5244140625, -19.177734375, -17.8310546875, -16.484375, -15.1376953125, -13.791015625, -12.4443359375, -11.09765625, -9.7509765625, -8.404296875, -7.0576171875, -5.7109375, -4.3642578125, -3.017578125, -1.6708984375, -0.32421875, 1.0224609375, 2.369140625, 3.7158203125, 5.0625, 6.4091796875, 7.755859375, 9.1025390625, 10.44921875, 11.7958984375, 13.142578125, 14.4892578125, 15.8359375, 17.1826171875, 18.529296875, 19.8759765625, 21.22265625, 22.5693359375, 23.916015625, 25.2626953125, 26.609375, 27.9560546875, 29.302734375, 30.6494140625, 31.99609375, 33.3427734375, 34.689453125, 36.0361328125, 37.3828125, 38.7294921875, 40.076171875, 41.4228515625, 42.76953125, 44.1162109375, 45.462890625, 46.8095703125, 48.15625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 21.0, 48.0, 92.0, 255.0, 344.0, 132.0, 51.0, 23.0, 17.0, 7.0, 11.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.1599578857422, -126.76881408691406, -116.37767028808594, -105.98652648925781, -95.59538269042969, -85.20423889160156, -74.81310272216797, -64.42195892333984, -54.03081512451172, -43.639671325683594, -33.24852752685547, -22.85738754272461, -12.466243743896484, -2.0750999450683594, 8.3160400390625, 18.707183837890625, 29.09832763671875, 39.489471435546875, 49.880615234375, 60.27175521850586, 70.66290283203125, 81.05404663085938, 91.44518280029297, 101.8363265991211, 112.22747039794922, 122.61861419677734, 133.00975036621094, 143.40089416503906, 153.7920379638672, 164.1831817626953, 174.57432556152344, 184.96546936035156, 195.35659790039062, 205.74774169921875, 216.13888549804688, 226.530029296875, 236.92117309570312, 247.31231689453125, 257.7034606933594, 268.0946044921875, 278.4857482910156, 288.87689208984375, 299.2680358886719, 309.6591796875, 320.0503234863281, 330.44146728515625, 340.8326110839844, 351.2237548828125, 361.6148681640625, 372.0060119628906, 382.39715576171875, 392.7882995605469, 403.179443359375, 413.5705871582031, 423.96173095703125, 434.3528747558594, 444.7440185546875, 455.1351623535156, 465.52630615234375, 475.9174499511719, 486.30859375, 496.6997375488281, 507.09088134765625, 517.4819946289062, 527.8731689453125]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 5.0, 10.0, 14.0, 13.0, 20.0, 27.0, 16.0, 27.0, 23.0, 23.0, 25.0, 31.0, 34.0, 37.0, 35.0, 51.0, 42.0, 44.0, 49.0, 43.0, 55.0, 38.0, 41.0, 28.0, 32.0, 31.0, 24.0, 26.0, 31.0, 20.0, 17.0, 17.0, 11.0, 17.0, 6.0, 7.0, 12.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.45968627929688, -81.68390655517578, -78.90812683105469, -76.13233947753906, -73.35655975341797, -70.58078002929688, -67.80500030517578, -65.02922058105469, -62.25343704223633, -59.477657318115234, -56.701873779296875, -53.92609405517578, -51.15031433105469, -48.37453079223633, -45.598751068115234, -42.822967529296875, -40.04718780517578, -37.27140808105469, -34.49562454223633, -31.719844818115234, -28.944063186645508, -26.16828155517578, -23.392501831054688, -20.61672019958496, -17.840938568115234, -15.065156936645508, -12.289376258850098, -9.513595581054688, -6.737813949584961, -3.9620323181152344, -1.1862525939941406, 1.589529037475586, 4.365318298339844, 7.141099452972412, 9.91688060760498, 12.69266128540039, 15.468442916870117, 18.244224548339844, 21.020004272460938, 23.795785903930664, 26.57156753540039, 29.347349166870117, 32.123130798339844, 34.89891052246094, 37.67469024658203, 40.45047378540039, 43.226253509521484, 46.002037048339844, 48.77781677246094, 51.55359649658203, 54.32938003540039, 57.105159759521484, 59.880943298339844, 62.65672302246094, 65.43250274658203, 68.20828247070312, 70.98406982421875, 73.75984954833984, 76.53562927246094, 79.31141662597656, 82.08719635009766, 84.86297607421875, 87.63875579833984, 90.41453552246094, 93.19031524658203]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 8.0, 3.0, 9.0, 10.0, 6.0, 11.0, 10.0, 16.0, 14.0, 16.0, 32.0, 28.0, 31.0, 45.0, 34.0, 40.0, 36.0, 31.0, 55.0, 41.0, 60.0, 47.0, 52.0, 45.0, 31.0, 36.0, 27.0, 39.0, 34.0, 24.0, 24.0, 21.0, 19.0, 16.0, 12.0, 6.0, 7.0, 6.0, 8.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.9453125, -11.5615234375, -11.177734375, -10.7939453125, -10.41015625, -10.0263671875, -9.642578125, -9.2587890625, -8.875, -8.4912109375, -8.107421875, -7.7236328125, -7.33984375, -6.9560546875, -6.572265625, -6.1884765625, -5.8046875, -5.4208984375, -5.037109375, -4.6533203125, -4.26953125, -3.8857421875, -3.501953125, -3.1181640625, -2.734375, -2.3505859375, -1.966796875, -1.5830078125, -1.19921875, -0.8154296875, -0.431640625, -0.0478515625, 0.3359375, 0.7197265625, 1.103515625, 1.4873046875, 1.87109375, 2.2548828125, 2.638671875, 3.0224609375, 3.40625, 3.7900390625, 4.173828125, 4.5576171875, 4.94140625, 5.3251953125, 5.708984375, 6.0927734375, 6.4765625, 6.8603515625, 7.244140625, 7.6279296875, 8.01171875, 8.3955078125, 8.779296875, 9.1630859375, 9.546875, 9.9306640625, 10.314453125, 10.6982421875, 11.08203125, 11.4658203125, 11.849609375, 12.2333984375, 12.6171875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 9.0, 4.0, 8.0, 9.0, 15.0, 34.0, 45.0, 64.0, 87.0, 138.0, 217.0, 265.0, 417.0, 672.0, 955.0, 1425.0, 2226.0, 3324.0, 5263.0, 9029.0, 14632.0, 25552.0, 45476.0, 87416.0, 182913.0, 296389.0, 178301.0, 85298.0, 44912.0, 25034.0, 14708.0, 8532.0, 5386.0, 3397.0, 2124.0, 1389.0, 921.0, 626.0, 422.0, 290.0, 201.0, 134.0, 90.0, 82.0, 40.0, 29.0, 21.0, 14.0, 12.0, 6.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.2529296875, -1.213134765625, -1.17333984375, -1.133544921875, -1.09375, -1.053955078125, -1.01416015625, -0.974365234375, -0.9345703125, -0.894775390625, -0.85498046875, -0.815185546875, -0.775390625, -0.735595703125, -0.69580078125, -0.656005859375, -0.6162109375, -0.576416015625, -0.53662109375, -0.496826171875, -0.45703125, -0.417236328125, -0.37744140625, -0.337646484375, -0.2978515625, -0.258056640625, -0.21826171875, -0.178466796875, -0.138671875, -0.098876953125, -0.05908203125, -0.019287109375, 0.0205078125, 0.060302734375, 0.10009765625, 0.139892578125, 0.1796875, 0.219482421875, 0.25927734375, 0.299072265625, 0.3388671875, 0.378662109375, 0.41845703125, 0.458251953125, 0.498046875, 0.537841796875, 0.57763671875, 0.617431640625, 0.6572265625, 0.697021484375, 0.73681640625, 0.776611328125, 0.81640625, 0.856201171875, 0.89599609375, 0.935791015625, 0.9755859375, 1.015380859375, 1.05517578125, 1.094970703125, 1.134765625, 1.174560546875, 1.21435546875, 1.254150390625, 1.2939453125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 7.0, 11.0, 6.0, 16.0, 14.0, 21.0, 25.0, 18.0, 25.0, 36.0, 30.0, 33.0, 41.0, 35.0, 48.0, 42.0, 34.0, 49.0, 1063.0, 43.0, 35.0, 50.0, 31.0, 34.0, 25.0, 35.0, 20.0, 33.0, 31.0, 31.0, 19.0, 15.0, 5.0, 11.0, 7.0, 9.0, 11.0, 4.0, 7.0, 9.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-8.7265625, -8.49481201171875, -8.2630615234375, -8.03131103515625, -7.799560546875, -7.56781005859375, -7.3360595703125, -7.10430908203125, -6.87255859375, -6.64080810546875, -6.4090576171875, -6.17730712890625, -5.945556640625, -5.71380615234375, -5.4820556640625, -5.25030517578125, -5.0185546875, -4.78680419921875, -4.5550537109375, -4.32330322265625, -4.091552734375, -3.85980224609375, -3.6280517578125, -3.39630126953125, -3.16455078125, -2.93280029296875, -2.7010498046875, -2.46929931640625, -2.237548828125, -2.00579833984375, -1.7740478515625, -1.54229736328125, -1.310546875, -1.07879638671875, -0.8470458984375, -0.61529541015625, -0.383544921875, -0.15179443359375, 0.0799560546875, 0.31170654296875, 0.54345703125, 0.77520751953125, 1.0069580078125, 1.23870849609375, 1.470458984375, 1.70220947265625, 1.9339599609375, 2.16571044921875, 2.3974609375, 2.62921142578125, 2.8609619140625, 3.09271240234375, 3.324462890625, 3.55621337890625, 3.7879638671875, 4.01971435546875, 4.25146484375, 4.48321533203125, 4.7149658203125, 4.94671630859375, 5.178466796875, 5.41021728515625, 5.6419677734375, 5.87371826171875, 6.10546875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 11.0, 17.0, 16.0, 21.0, 54.0, 64.0, 132.0, 198.0, 297.0, 435.0, 696.0, 1140.0, 1791.0, 2708.0, 4280.0, 6849.0, 10664.0, 17273.0, 28949.0, 48769.0, 87465.0, 169389.0, 1312293.0, 179893.0, 92804.0, 51473.0, 30167.0, 18515.0, 11451.0, 7153.0, 4303.0, 2769.0, 1811.0, 1175.0, 760.0, 502.0, 298.0, 206.0, 146.0, 71.0, 32.0, 27.0, 18.0, 10.0, 17.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.666015625, -0.6426849365234375, -0.619354248046875, -0.5960235595703125, -0.57269287109375, -0.5493621826171875, -0.526031494140625, -0.5027008056640625, -0.4793701171875, -0.4560394287109375, -0.432708740234375, -0.4093780517578125, -0.38604736328125, -0.3627166748046875, -0.339385986328125, -0.3160552978515625, -0.292724609375, -0.2693939208984375, -0.246063232421875, -0.2227325439453125, -0.19940185546875, -0.1760711669921875, -0.152740478515625, -0.1294097900390625, -0.1060791015625, -0.0827484130859375, -0.059417724609375, -0.0360870361328125, -0.01275634765625, 0.0105743408203125, 0.033905029296875, 0.0572357177734375, 0.08056640625, 0.1038970947265625, 0.127227783203125, 0.1505584716796875, 0.17388916015625, 0.1972198486328125, 0.220550537109375, 0.2438812255859375, 0.2672119140625, 0.2905426025390625, 0.313873291015625, 0.3372039794921875, 0.36053466796875, 0.3838653564453125, 0.407196044921875, 0.4305267333984375, 0.453857421875, 0.4771881103515625, 0.500518798828125, 0.5238494873046875, 0.54718017578125, 0.5705108642578125, 0.593841552734375, 0.6171722412109375, 0.6405029296875, 0.6638336181640625, 0.687164306640625, 0.7104949951171875, 0.73382568359375, 0.7571563720703125, 0.780487060546875, 0.8038177490234375, 0.8271484375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 2.0, 10.0, 6.0, 8.0, 9.0, 16.0, 13.0, 12.0, 20.0, 21.0, 19.0, 33.0, 35.0, 43.0, 44.0, 49.0, 50.0, 84.0, 78.0, 72.0, 71.0, 50.0, 48.0, 28.0, 29.0, 31.0, 20.0, 18.0, 14.0, 12.0, 9.0, 11.0, 8.0, 8.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0106048583984375, -0.010184049606323242, -0.009763240814208984, -0.009342432022094727, -0.008921623229980469, -0.008500814437866211, -0.008080005645751953, -0.007659196853637695, -0.0072383880615234375, -0.00681757926940918, -0.006396770477294922, -0.005975961685180664, -0.005555152893066406, -0.0051343441009521484, -0.004713535308837891, -0.004292726516723633, -0.003871917724609375, -0.003451108932495117, -0.0030303001403808594, -0.0026094913482666016, -0.0021886825561523438, -0.001767873764038086, -0.0013470649719238281, -0.0009262561798095703, -0.0005054473876953125, -8.463859558105469e-05, 0.0003361701965332031, 0.0007569789886474609, 0.0011777877807617188, 0.0015985965728759766, 0.0020194053649902344, 0.002440214157104492, 0.00286102294921875, 0.003281831741333008, 0.0037026405334472656, 0.0041234493255615234, 0.004544258117675781, 0.004965066909790039, 0.005385875701904297, 0.005806684494018555, 0.0062274932861328125, 0.00664830207824707, 0.007069110870361328, 0.007489919662475586, 0.007910728454589844, 0.008331537246704102, 0.00875234603881836, 0.009173154830932617, 0.009593963623046875, 0.010014772415161133, 0.01043558120727539, 0.010856389999389648, 0.011277198791503906, 0.011698007583618164, 0.012118816375732422, 0.01253962516784668, 0.012960433959960938, 0.013381242752075195, 0.013802051544189453, 0.014222860336303711, 0.014643669128417969, 0.015064477920532227, 0.015485286712646484, 0.015906095504760742, 0.016326904296875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 11.0, 6.0, 12.0, 8.0, 16.0, 22.0, 21.0, 19.0, 28.0, 30.0, 40.0, 55.0, 76.0, 125.0, 298.0, 1491.0, 25166.0, 1006211.0, 13133.0, 1069.0, 229.0, 119.0, 76.0, 50.0, 38.0, 28.0, 33.0, 21.0, 20.0, 13.0, 18.0, 12.0, 11.0, 13.0, 12.0, 4.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4375, -0.4247894287109375, -0.412078857421875, -0.3993682861328125, -0.38665771484375, -0.3739471435546875, -0.361236572265625, -0.3485260009765625, -0.3358154296875, -0.3231048583984375, -0.310394287109375, -0.2976837158203125, -0.28497314453125, -0.2722625732421875, -0.259552001953125, -0.2468414306640625, -0.234130859375, -0.2214202880859375, -0.208709716796875, -0.1959991455078125, -0.18328857421875, -0.1705780029296875, -0.157867431640625, -0.1451568603515625, -0.1324462890625, -0.1197357177734375, -0.107025146484375, -0.0943145751953125, -0.08160400390625, -0.0688934326171875, -0.056182861328125, -0.0434722900390625, -0.03076171875, -0.0180511474609375, -0.005340576171875, 0.0073699951171875, 0.02008056640625, 0.0327911376953125, 0.045501708984375, 0.0582122802734375, 0.0709228515625, 0.0836334228515625, 0.096343994140625, 0.1090545654296875, 0.12176513671875, 0.1344757080078125, 0.147186279296875, 0.1598968505859375, 0.172607421875, 0.1853179931640625, 0.198028564453125, 0.2107391357421875, 0.22344970703125, 0.2361602783203125, 0.248870849609375, 0.2615814208984375, 0.2742919921875, 0.2870025634765625, 0.299713134765625, 0.3124237060546875, 0.32513427734375, 0.3378448486328125, 0.350555419921875, 0.3632659912109375, 0.3759765625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 16.0, 38.0, 94.0, 330.0, 350.0, 103.0, 36.0, 20.0, 11.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035230644047260284, -0.03170756995677948, -0.028184499591588974, -0.02466142736375332, -0.021138355135917664, -0.01761528290808201, -0.014092210680246353, -0.010569138452410698, -0.007046066224575043, -0.0035229939967393875, 7.82310962677002e-08, 0.003523150458931923, 0.007046222686767578, 0.010569294914603233, 0.014092367142438889, 0.017615439370274544, 0.0211385115981102, 0.024661583825945854, 0.02818465605378151, 0.031707726418972015, 0.03523080050945282, 0.038753874599933624, 0.04227694496512413, 0.045800015330314636, 0.04932308942079544, 0.052846163511276245, 0.05636923387646675, 0.05989230424165726, 0.06341537833213806, 0.06693845242261887, 0.07046152651309967, 0.07398459315299988, 0.07750765979290009, 0.08103073388338089, 0.0845538079738617, 0.0880768746137619, 0.0915999487042427, 0.09512302279472351, 0.09864608943462372, 0.10216916352510452, 0.10569223761558533, 0.10921531170606613, 0.11273838579654694, 0.11626145243644714, 0.11978452652692795, 0.12330760061740875, 0.12683066725730896, 0.13035374879837036, 0.13387681543827057, 0.13739988207817078, 0.14092296361923218, 0.14444603025913239, 0.1479690968990326, 0.151492178440094, 0.1550152450799942, 0.1585383266210556, 0.1620613932609558, 0.16558445990085602, 0.16910754144191742, 0.17263060808181763, 0.17615368962287903, 0.17967675626277924, 0.18319982290267944, 0.18672290444374084, 0.19024597108364105]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 4.0, 7.0, 14.0, 10.0, 9.0, 20.0, 15.0, 24.0, 18.0, 18.0, 20.0, 20.0, 23.0, 34.0, 23.0, 20.0, 41.0, 38.0, 41.0, 44.0, 45.0, 37.0, 29.0, 38.0, 36.0, 43.0, 40.0, 53.0, 31.0, 34.0, 20.0, 27.0, 19.0, 16.0, 15.0, 15.0, 15.0, 13.0, 7.0, 5.0, 4.0, 5.0, 0.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.020763278007507324, -0.020069709047675133, -0.01937614008784294, -0.01868257112801075, -0.01798900216817856, -0.017295433208346367, -0.016601864248514175, -0.015908295288681984, -0.015214726328849792, -0.014521157369017601, -0.01382758840918541, -0.013134019449353218, -0.012440450489521027, -0.011746881529688835, -0.011053312569856644, -0.010359743610024452, -0.00966617465019226, -0.00897260569036007, -0.008279036730527878, -0.007585467770695686, -0.006891898810863495, -0.006198329851031303, -0.005504760891199112, -0.0048111919313669205, -0.004117622971534729, -0.0034240540117025375, -0.002730485051870346, -0.0020369160920381546, -0.0013433471322059631, -0.0006497781723737717, 4.37907874584198e-05, 0.0007373597472906113, 0.0014309287071228027, 0.002124497666954994, 0.0028180666267871857, 0.003511635586619377, 0.004205204546451569, 0.00489877350628376, 0.0055923424661159515, 0.006285911425948143, 0.0069794803857803345, 0.007673049345612526, 0.008366618305444717, 0.009060187265276909, 0.0097537562251091, 0.010447325184941292, 0.011140894144773483, 0.011834463104605675, 0.012528032064437866, 0.013221601024270058, 0.01391516998410225, 0.01460873894393444, 0.015302307903766632, 0.015995876863598824, 0.016689445823431015, 0.017383014783263206, 0.018076583743095398, 0.01877015270292759, 0.01946372166275978, 0.020157290622591972, 0.020850859582424164, 0.021544428542256355, 0.022237997502088547, 0.022931566461920738, 0.02362513542175293]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 8.0, 3.0, 9.0, 10.0, 6.0, 11.0, 10.0, 16.0, 14.0, 16.0, 32.0, 28.0, 31.0, 45.0, 34.0, 39.0, 37.0, 31.0, 55.0, 41.0, 60.0, 47.0, 52.0, 45.0, 31.0, 36.0, 27.0, 39.0, 34.0, 24.0, 25.0, 20.0, 19.0, 16.0, 12.0, 6.0, 7.0, 6.0, 8.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.9453125, -11.5615234375, -11.177734375, -10.7939453125, -10.41015625, -10.0263671875, -9.642578125, -9.2587890625, -8.875, -8.4912109375, -8.107421875, -7.7236328125, -7.33984375, -6.9560546875, -6.572265625, -6.1884765625, -5.8046875, -5.4208984375, -5.037109375, -4.6533203125, -4.26953125, -3.8857421875, -3.501953125, -3.1181640625, -2.734375, -2.3505859375, -1.966796875, -1.5830078125, -1.19921875, -0.8154296875, -0.431640625, -0.0478515625, 0.3359375, 0.7197265625, 1.103515625, 1.4873046875, 1.87109375, 2.2548828125, 2.638671875, 3.0224609375, 3.40625, 3.7900390625, 4.173828125, 4.5576171875, 4.94140625, 5.3251953125, 5.708984375, 6.0927734375, 6.4765625, 6.8603515625, 7.244140625, 7.6279296875, 8.01171875, 8.3955078125, 8.779296875, 9.1630859375, 9.546875, 9.9306640625, 10.314453125, 10.6982421875, 11.08203125, 11.4658203125, 11.849609375, 12.2333984375, 12.6171875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 3.0, 8.0, 16.0, 6.0, 12.0, 18.0, 23.0, 38.0, 52.0, 108.0, 150.0, 276.0, 537.0, 1150.0, 2762.0, 7288.0, 21371.0, 71480.0, 297407.0, 480472.0, 115230.0, 32470.0, 10693.0, 3811.0, 1578.0, 719.0, 342.0, 197.0, 89.0, 60.0, 64.0, 32.0, 24.0, 19.0, 7.0, 10.0, 7.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.38671875, -6.181884765625, -5.97705078125, -5.772216796875, -5.5673828125, -5.362548828125, -5.15771484375, -4.952880859375, -4.748046875, -4.543212890625, -4.33837890625, -4.133544921875, -3.9287109375, -3.723876953125, -3.51904296875, -3.314208984375, -3.109375, -2.904541015625, -2.69970703125, -2.494873046875, -2.2900390625, -2.085205078125, -1.88037109375, -1.675537109375, -1.470703125, -1.265869140625, -1.06103515625, -0.856201171875, -0.6513671875, -0.446533203125, -0.24169921875, -0.036865234375, 0.16796875, 0.372802734375, 0.57763671875, 0.782470703125, 0.9873046875, 1.192138671875, 1.39697265625, 1.601806640625, 1.806640625, 2.011474609375, 2.21630859375, 2.421142578125, 2.6259765625, 2.830810546875, 3.03564453125, 3.240478515625, 3.4453125, 3.650146484375, 3.85498046875, 4.059814453125, 4.2646484375, 4.469482421875, 4.67431640625, 4.879150390625, 5.083984375, 5.288818359375, 5.49365234375, 5.698486328125, 5.9033203125, 6.108154296875, 6.31298828125, 6.517822265625, 6.72265625]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 4.0, 4.0, 6.0, 5.0, 12.0, 13.0, 13.0, 11.0, 19.0, 18.0, 20.0, 20.0, 31.0, 24.0, 36.0, 35.0, 32.0, 36.0, 40.0, 41.0, 68.0, 1762.0, 315.0, 62.0, 40.0, 23.0, 41.0, 31.0, 33.0, 43.0, 26.0, 34.0, 26.0, 26.0, 18.0, 15.0, 10.0, 9.0, 7.0, 13.0, 9.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.21875, -39.92626953125, -38.6337890625, -37.34130859375, -36.048828125, -34.75634765625, -33.4638671875, -32.17138671875, -30.87890625, -29.58642578125, -28.2939453125, -27.00146484375, -25.708984375, -24.41650390625, -23.1240234375, -21.83154296875, -20.5390625, -19.24658203125, -17.9541015625, -16.66162109375, -15.369140625, -14.07666015625, -12.7841796875, -11.49169921875, -10.19921875, -8.90673828125, -7.6142578125, -6.32177734375, -5.029296875, -3.73681640625, -2.4443359375, -1.15185546875, 0.140625, 1.43310546875, 2.7255859375, 4.01806640625, 5.310546875, 6.60302734375, 7.8955078125, 9.18798828125, 10.48046875, 11.77294921875, 13.0654296875, 14.35791015625, 15.650390625, 16.94287109375, 18.2353515625, 19.52783203125, 20.8203125, 22.11279296875, 23.4052734375, 24.69775390625, 25.990234375, 27.28271484375, 28.5751953125, 29.86767578125, 31.16015625, 32.45263671875, 33.7451171875, 35.03759765625, 36.330078125, 37.62255859375, 38.9150390625, 40.20751953125, 41.5]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 10.0, 10.0, 7.0, 10.0, 11.0, 15.0, 19.0, 32.0, 36.0, 45.0, 45.0, 66.0, 91.0, 100.0, 205.0, 274.0, 536.0, 1568.0, 224126.0, 2914490.0, 2316.0, 629.0, 313.0, 189.0, 135.0, 102.0, 74.0, 40.0, 45.0, 21.0, 20.0, 22.0, 18.0, 15.0, 10.0, 15.0, 10.0, 5.0, 6.0, 4.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-67.5625, -65.4580078125, -63.353515625, -61.2490234375, -59.14453125, -57.0400390625, -54.935546875, -52.8310546875, -50.7265625, -48.6220703125, -46.517578125, -44.4130859375, -42.30859375, -40.2041015625, -38.099609375, -35.9951171875, -33.890625, -31.7861328125, -29.681640625, -27.5771484375, -25.47265625, -23.3681640625, -21.263671875, -19.1591796875, -17.0546875, -14.9501953125, -12.845703125, -10.7412109375, -8.63671875, -6.5322265625, -4.427734375, -2.3232421875, -0.21875, 1.8857421875, 3.990234375, 6.0947265625, 8.19921875, 10.3037109375, 12.408203125, 14.5126953125, 16.6171875, 18.7216796875, 20.826171875, 22.9306640625, 25.03515625, 27.1396484375, 29.244140625, 31.3486328125, 33.453125, 35.5576171875, 37.662109375, 39.7666015625, 41.87109375, 43.9755859375, 46.080078125, 48.1845703125, 50.2890625, 52.3935546875, 54.498046875, 56.6025390625, 58.70703125, 60.8115234375, 62.916015625, 65.0205078125, 67.125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [47.0, 850.0, 116.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.709879875183105, -4.412458419799805, 2.884963035583496, 10.182385444641113, 17.47980499267578, 24.777225494384766, 32.074649810791016, 39.3720703125, 46.669490814208984, 53.96691131591797, 61.26433563232422, 68.56175231933594, 75.85917663574219, 83.15660095214844, 90.45402526855469, 97.7514419555664, 105.04886627197266, 112.3462905883789, 119.64370727539062, 126.94113159179688, 134.23855590820312, 141.53598022460938, 148.83340454101562, 156.1308135986328, 163.42823791503906, 170.7256622314453, 178.02308654785156, 185.32049560546875, 192.617919921875, 199.91534423828125, 207.2127685546875, 214.51019287109375, 221.8076171875, 229.10504150390625, 236.4024658203125, 243.69989013671875, 250.99729919433594, 258.29473876953125, 265.5921630859375, 272.8895568847656, 280.1869812011719, 287.4844055175781, 294.7818298339844, 302.0792541503906, 309.3766784667969, 316.674072265625, 323.97149658203125, 331.2689208984375, 338.56634521484375, 345.86376953125, 353.16119384765625, 360.4586181640625, 367.75604248046875, 375.053466796875, 382.35089111328125, 389.6482849121094, 396.94573974609375, 404.2431640625, 411.54058837890625, 418.8380126953125, 426.13543701171875, 433.432861328125, 440.73028564453125, 448.0276794433594, 455.3251037597656]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 6.0, 2.0, 6.0, 7.0, 8.0, 3.0, 15.0, 13.0, 17.0, 19.0, 17.0, 21.0, 33.0, 21.0, 21.0, 48.0, 38.0, 28.0, 40.0, 34.0, 47.0, 42.0, 46.0, 47.0, 38.0, 43.0, 41.0, 34.0, 38.0, 31.0, 34.0, 27.0, 22.0, 14.0, 13.0, 14.0, 19.0, 4.0, 13.0, 11.0, 8.0, 3.0, 4.0, 6.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-133.54962158203125, -129.2626953125, -124.97576904296875, -120.6888427734375, -116.40191650390625, -112.114990234375, -107.82806396484375, -103.5411376953125, -99.25421142578125, -94.96728515625, -90.68035888671875, -86.3934326171875, -82.10650634765625, -77.819580078125, -73.53265380859375, -69.2457275390625, -64.95879364013672, -60.67186737060547, -56.38494110107422, -52.09801483154297, -47.81108856201172, -43.52416229248047, -39.23723220825195, -34.9503059387207, -30.663379669189453, -26.376453399658203, -22.089527130126953, -17.80259895324707, -13.51567268371582, -9.22874641418457, -4.9418182373046875, -0.6548919677734375, 3.6320343017578125, 7.918961048126221, 12.205887794494629, 16.492815017700195, 20.779741287231445, 25.066667556762695, 29.353595733642578, 33.64052200317383, 37.92744827270508, 42.21437454223633, 46.50130081176758, 50.788230895996094, 55.075157165527344, 59.362083435058594, 63.649009704589844, 67.9359359741211, 72.22286224365234, 76.5097885131836, 80.79671478271484, 85.0836410522461, 89.37056732177734, 93.6574935913086, 97.94442749023438, 102.23135375976562, 106.51828002929688, 110.80520629882812, 115.09213256835938, 119.37905883789062, 123.66598510742188, 127.95291137695312, 132.23983764648438, 136.52676391601562, 140.81369018554688]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 5.0, 10.0, 5.0, 10.0, 10.0, 12.0, 15.0, 17.0, 16.0, 36.0, 25.0, 45.0, 34.0, 29.0, 48.0, 35.0, 47.0, 39.0, 52.0, 64.0, 47.0, 51.0, 33.0, 33.0, 37.0, 31.0, 37.0, 27.0, 25.0, 23.0, 23.0, 15.0, 13.0, 9.0, 6.0, 7.0, 7.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.692138671875, -11.29833984375, -10.904541015625, -10.5107421875, -10.116943359375, -9.72314453125, -9.329345703125, -8.935546875, -8.541748046875, -8.14794921875, -7.754150390625, -7.3603515625, -6.966552734375, -6.57275390625, -6.178955078125, -5.78515625, -5.391357421875, -4.99755859375, -4.603759765625, -4.2099609375, -3.816162109375, -3.42236328125, -3.028564453125, -2.634765625, -2.240966796875, -1.84716796875, -1.453369140625, -1.0595703125, -0.665771484375, -0.27197265625, 0.121826171875, 0.515625, 0.909423828125, 1.30322265625, 1.697021484375, 2.0908203125, 2.484619140625, 2.87841796875, 3.272216796875, 3.666015625, 4.059814453125, 4.45361328125, 4.847412109375, 5.2412109375, 5.635009765625, 6.02880859375, 6.422607421875, 6.81640625, 7.210205078125, 7.60400390625, 7.997802734375, 8.3916015625, 8.785400390625, 9.17919921875, 9.572998046875, 9.966796875, 10.360595703125, 10.75439453125, 11.148193359375, 11.5419921875, 11.935791015625, 12.32958984375, 12.723388671875, 13.1171875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 3.0, 9.0, 13.0, 14.0, 18.0, 20.0, 40.0, 58.0, 63.0, 121.0, 176.0, 245.0, 408.0, 645.0, 1020.0, 1872.0, 3459.0, 7205.0, 18453.0, 302157.0, 3660086.0, 169411.0, 15287.0, 6334.0, 3016.0, 1641.0, 921.0, 552.0, 353.0, 221.0, 143.0, 86.0, 75.0, 35.0, 45.0, 20.0, 15.0, 7.0, 16.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.75, -39.41064453125, -38.0712890625, -36.73193359375, -35.392578125, -34.05322265625, -32.7138671875, -31.37451171875, -30.03515625, -28.69580078125, -27.3564453125, -26.01708984375, -24.677734375, -23.33837890625, -21.9990234375, -20.65966796875, -19.3203125, -17.98095703125, -16.6416015625, -15.30224609375, -13.962890625, -12.62353515625, -11.2841796875, -9.94482421875, -8.60546875, -7.26611328125, -5.9267578125, -4.58740234375, -3.248046875, -1.90869140625, -0.5693359375, 0.77001953125, 2.109375, 3.44873046875, 4.7880859375, 6.12744140625, 7.466796875, 8.80615234375, 10.1455078125, 11.48486328125, 12.82421875, 14.16357421875, 15.5029296875, 16.84228515625, 18.181640625, 19.52099609375, 20.8603515625, 22.19970703125, 23.5390625, 24.87841796875, 26.2177734375, 27.55712890625, 28.896484375, 30.23583984375, 31.5751953125, 32.91455078125, 34.25390625, 35.59326171875, 36.9326171875, 38.27197265625, 39.611328125, 40.95068359375, 42.2900390625, 43.62939453125, 44.96875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 3.0, 8.0, 6.0, 6.0, 3.0, 6.0, 5.0, 11.0, 9.0, 17.0, 17.0, 18.0, 38.0, 39.0, 69.0, 136.0, 350.0, 689.0, 1022.0, 805.0, 366.0, 186.0, 91.0, 49.0, 29.0, 25.0, 13.0, 14.0, 4.0, 5.0, 3.0, 8.0, 7.0, 9.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.875, -32.7685546875, -31.662109375, -30.5556640625, -29.44921875, -28.3427734375, -27.236328125, -26.1298828125, -25.0234375, -23.9169921875, -22.810546875, -21.7041015625, -20.59765625, -19.4912109375, -18.384765625, -17.2783203125, -16.171875, -15.0654296875, -13.958984375, -12.8525390625, -11.74609375, -10.6396484375, -9.533203125, -8.4267578125, -7.3203125, -6.2138671875, -5.107421875, -4.0009765625, -2.89453125, -1.7880859375, -0.681640625, 0.4248046875, 1.53125, 2.6376953125, 3.744140625, 4.8505859375, 5.95703125, 7.0634765625, 8.169921875, 9.2763671875, 10.3828125, 11.4892578125, 12.595703125, 13.7021484375, 14.80859375, 15.9150390625, 17.021484375, 18.1279296875, 19.234375, 20.3408203125, 21.447265625, 22.5537109375, 23.66015625, 24.7666015625, 25.873046875, 26.9794921875, 28.0859375, 29.1923828125, 30.298828125, 31.4052734375, 32.51171875, 33.6181640625, 34.724609375, 35.8310546875, 36.9375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 3.0, 10.0, 13.0, 17.0, 21.0, 28.0, 42.0, 62.0, 76.0, 121.0, 196.0, 249.0, 370.0, 554.0, 797.0, 1192.0, 1786.0, 2772.0, 4311.0, 7119.0, 12531.0, 24062.0, 59384.0, 374635.0, 3268337.0, 325281.0, 56228.0, 22948.0, 11877.0, 6889.0, 4175.0, 2691.0, 1798.0, 1104.0, 840.0, 519.0, 371.0, 255.0, 184.0, 134.0, 77.0, 63.0, 46.0, 27.0, 24.0, 18.0, 5.0, 14.0, 8.0, 4.0, 3.0, 5.0, 2.0, 0.0, 4.0], "bins": [-40.78125, -39.56298828125, -38.3447265625, -37.12646484375, -35.908203125, -34.68994140625, -33.4716796875, -32.25341796875, -31.03515625, -29.81689453125, -28.5986328125, -27.38037109375, -26.162109375, -24.94384765625, -23.7255859375, -22.50732421875, -21.2890625, -20.07080078125, -18.8525390625, -17.63427734375, -16.416015625, -15.19775390625, -13.9794921875, -12.76123046875, -11.54296875, -10.32470703125, -9.1064453125, -7.88818359375, -6.669921875, -5.45166015625, -4.2333984375, -3.01513671875, -1.796875, -0.57861328125, 0.6396484375, 1.85791015625, 3.076171875, 4.29443359375, 5.5126953125, 6.73095703125, 7.94921875, 9.16748046875, 10.3857421875, 11.60400390625, 12.822265625, 14.04052734375, 15.2587890625, 16.47705078125, 17.6953125, 18.91357421875, 20.1318359375, 21.35009765625, 22.568359375, 23.78662109375, 25.0048828125, 26.22314453125, 27.44140625, 28.65966796875, 29.8779296875, 31.09619140625, 32.314453125, 33.53271484375, 34.7509765625, 35.96923828125, 37.1875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 13.0, 13.0, 15.0, 21.0, 26.0, 54.0, 76.0, 108.0, 168.0, 184.0, 109.0, 78.0, 38.0, 32.0, 22.0, 8.0, 9.0, 6.0, 6.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.85140228271484, -115.04425048828125, -110.23709869384766, -105.42994689941406, -100.62278747558594, -95.81563568115234, -91.00848388671875, -86.20132446289062, -81.39418029785156, -76.58702850341797, -71.77987670898438, -66.97271728515625, -62.165565490722656, -57.35841369628906, -52.55126190185547, -47.74410629272461, -42.93695068359375, -38.129798889160156, -33.3226432800293, -28.515491485595703, -23.708337783813477, -18.90118408203125, -14.094032287597656, -9.286876678466797, -4.479724884033203, 0.32742834091186523, 5.134581565856934, 9.941734313964844, 14.74888801574707, 19.556041717529297, 24.36319351196289, 29.17034912109375, 33.977508544921875, 38.78466033935547, 43.59181594848633, 48.39896774291992, 53.20612335205078, 58.013275146484375, 62.82042694091797, 67.62757873535156, 72.43473815917969, 77.24188995361328, 82.04904174804688, 86.856201171875, 91.6633529663086, 96.47050476074219, 101.27765655517578, 106.08480834960938, 110.89196014404297, 115.69911193847656, 120.50626373291016, 125.31341552734375, 130.12057495117188, 134.927734375, 139.73487854003906, 144.5420379638672, 149.34918212890625, 154.15634155273438, 158.96348571777344, 163.77064514160156, 168.57778930664062, 173.38494873046875, 178.19210815429688, 182.99925231933594, 187.80641174316406]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 5.0, 8.0, 7.0, 12.0, 15.0, 12.0, 17.0, 23.0, 30.0, 30.0, 26.0, 25.0, 30.0, 32.0, 45.0, 41.0, 44.0, 43.0, 38.0, 41.0, 45.0, 36.0, 48.0, 38.0, 39.0, 37.0, 35.0, 27.0, 26.0, 21.0, 28.0, 11.0, 14.0, 14.0, 12.0, 11.0, 5.0, 7.0, 2.0, 6.0, 7.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.74385070800781, -74.01144409179688, -71.2790298461914, -68.54662322998047, -65.814208984375, -63.0817985534668, -60.349388122558594, -57.616981506347656, -54.88456726074219, -52.152156829833984, -49.41974639892578, -46.68733596801758, -43.954925537109375, -41.22251510620117, -38.49010467529297, -35.75769805908203, -33.02528762817383, -30.292877197265625, -27.560466766357422, -24.82805633544922, -22.095645904541016, -19.363235473632812, -16.630826950073242, -13.898416519165039, -11.166006088256836, -8.433595657348633, -5.701185703277588, -2.968775749206543, -0.23636531829833984, 2.4960451126098633, 5.22845458984375, 7.960865020751953, 10.693275451660156, 13.42568588256836, 16.158096313476562, 18.890506744384766, 21.62291717529297, 24.355327606201172, 27.087736129760742, 29.820146560668945, 32.55255889892578, 35.284969329833984, 38.01737976074219, 40.74979019165039, 43.482200622558594, 46.2146110534668, 48.947021484375, 51.67942810058594, 54.41183853149414, 57.144248962402344, 59.87665939331055, 62.60906982421875, 65.34147644042969, 68.07389068603516, 70.8062973022461, 73.53871154785156, 76.2711181640625, 79.00352478027344, 81.7359390258789, 84.46834564208984, 87.20075988769531, 89.93316650390625, 92.66558074951172, 95.39798736572266, 98.13040161132812]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 3.0, 10.0, 7.0, 11.0, 8.0, 17.0, 16.0, 24.0, 19.0, 24.0, 27.0, 29.0, 35.0, 43.0, 42.0, 38.0, 45.0, 42.0, 51.0, 40.0, 35.0, 40.0, 32.0, 40.0, 40.0, 39.0, 40.0, 40.0, 25.0, 24.0, 13.0, 12.0, 25.0, 8.0, 13.0, 9.0, 7.0, 4.0, 5.0, 6.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.28125, -11.888671875, -11.49609375, -11.103515625, -10.7109375, -10.318359375, -9.92578125, -9.533203125, -9.140625, -8.748046875, -8.35546875, -7.962890625, -7.5703125, -7.177734375, -6.78515625, -6.392578125, -6.0, -5.607421875, -5.21484375, -4.822265625, -4.4296875, -4.037109375, -3.64453125, -3.251953125, -2.859375, -2.466796875, -2.07421875, -1.681640625, -1.2890625, -0.896484375, -0.50390625, -0.111328125, 0.28125, 0.673828125, 1.06640625, 1.458984375, 1.8515625, 2.244140625, 2.63671875, 3.029296875, 3.421875, 3.814453125, 4.20703125, 4.599609375, 4.9921875, 5.384765625, 5.77734375, 6.169921875, 6.5625, 6.955078125, 7.34765625, 7.740234375, 8.1328125, 8.525390625, 8.91796875, 9.310546875, 9.703125, 10.095703125, 10.48828125, 10.880859375, 11.2734375, 11.666015625, 12.05859375, 12.451171875, 12.84375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 3.0, 11.0, 12.0, 26.0, 21.0, 35.0, 46.0, 89.0, 117.0, 184.0, 260.0, 417.0, 611.0, 960.0, 1489.0, 2291.0, 3483.0, 5391.0, 8445.0, 13249.0, 21438.0, 35901.0, 62797.0, 120206.0, 238125.0, 244648.0, 125714.0, 65248.0, 36803.0, 22330.0, 13668.0, 8680.0, 5492.0, 3627.0, 2383.0, 1434.0, 986.0, 660.0, 425.0, 263.0, 183.0, 121.0, 102.0, 56.0, 46.0, 35.0, 9.0, 15.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.52734375, -1.4796600341796875, -1.431976318359375, -1.3842926025390625, -1.33660888671875, -1.2889251708984375, -1.241241455078125, -1.1935577392578125, -1.1458740234375, -1.0981903076171875, -1.050506591796875, -1.0028228759765625, -0.95513916015625, -0.9074554443359375, -0.859771728515625, -0.8120880126953125, -0.764404296875, -0.7167205810546875, -0.669036865234375, -0.6213531494140625, -0.57366943359375, -0.5259857177734375, -0.478302001953125, -0.4306182861328125, -0.3829345703125, -0.3352508544921875, -0.287567138671875, -0.2398834228515625, -0.19219970703125, -0.1445159912109375, -0.096832275390625, -0.0491485595703125, -0.00146484375, 0.0462188720703125, 0.093902587890625, 0.1415863037109375, 0.18927001953125, 0.2369537353515625, 0.284637451171875, 0.3323211669921875, 0.3800048828125, 0.4276885986328125, 0.475372314453125, 0.5230560302734375, 0.57073974609375, 0.6184234619140625, 0.666107177734375, 0.7137908935546875, 0.761474609375, 0.8091583251953125, 0.856842041015625, 0.9045257568359375, 0.95220947265625, 0.9998931884765625, 1.047576904296875, 1.0952606201171875, 1.1429443359375, 1.1906280517578125, 1.238311767578125, 1.2859954833984375, 1.33367919921875, 1.3813629150390625, 1.429046630859375, 1.4767303466796875, 1.5244140625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 7.0, 10.0, 6.0, 7.0, 15.0, 11.0, 12.0, 8.0, 18.0, 29.0, 27.0, 27.0, 26.0, 38.0, 31.0, 27.0, 38.0, 40.0, 36.0, 40.0, 45.0, 1063.0, 36.0, 43.0, 40.0, 31.0, 37.0, 21.0, 25.0, 38.0, 32.0, 24.0, 19.0, 17.0, 11.0, 15.0, 19.0, 14.0, 6.0, 9.0, 2.0, 8.0, 7.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.8125, -7.5848388671875, -7.357177734375, -7.1295166015625, -6.90185546875, -6.6741943359375, -6.446533203125, -6.2188720703125, -5.9912109375, -5.7635498046875, -5.535888671875, -5.3082275390625, -5.08056640625, -4.8529052734375, -4.625244140625, -4.3975830078125, -4.169921875, -3.9422607421875, -3.714599609375, -3.4869384765625, -3.25927734375, -3.0316162109375, -2.803955078125, -2.5762939453125, -2.3486328125, -2.1209716796875, -1.893310546875, -1.6656494140625, -1.43798828125, -1.2103271484375, -0.982666015625, -0.7550048828125, -0.52734375, -0.2996826171875, -0.072021484375, 0.1556396484375, 0.38330078125, 0.6109619140625, 0.838623046875, 1.0662841796875, 1.2939453125, 1.5216064453125, 1.749267578125, 1.9769287109375, 2.20458984375, 2.4322509765625, 2.659912109375, 2.8875732421875, 3.115234375, 3.3428955078125, 3.570556640625, 3.7982177734375, 4.02587890625, 4.2535400390625, 4.481201171875, 4.7088623046875, 4.9365234375, 5.1641845703125, 5.391845703125, 5.6195068359375, 5.84716796875, 6.0748291015625, 6.302490234375, 6.5301513671875, 6.7578125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 12.0, 13.0, 20.0, 24.0, 44.0, 73.0, 115.0, 155.0, 196.0, 358.0, 600.0, 903.0, 1483.0, 2206.0, 3641.0, 5753.0, 9301.0, 14710.0, 24215.0, 40801.0, 71404.0, 130713.0, 1146535.0, 356218.0, 121711.0, 66563.0, 38656.0, 23115.0, 14109.0, 8651.0, 5437.0, 3438.0, 2082.0, 1375.0, 915.0, 568.0, 347.0, 211.0, 163.0, 111.0, 64.0, 54.0, 23.0, 13.0, 10.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.716796875, -0.6920318603515625, -0.667266845703125, -0.6425018310546875, -0.61773681640625, -0.5929718017578125, -0.568206787109375, -0.5434417724609375, -0.5186767578125, -0.4939117431640625, -0.469146728515625, -0.4443817138671875, -0.41961669921875, -0.3948516845703125, -0.370086669921875, -0.3453216552734375, -0.320556640625, -0.2957916259765625, -0.271026611328125, -0.2462615966796875, -0.22149658203125, -0.1967315673828125, -0.171966552734375, -0.1472015380859375, -0.1224365234375, -0.0976715087890625, -0.072906494140625, -0.0481414794921875, -0.02337646484375, 0.0013885498046875, 0.026153564453125, 0.0509185791015625, 0.07568359375, 0.1004486083984375, 0.125213623046875, 0.1499786376953125, 0.17474365234375, 0.1995086669921875, 0.224273681640625, 0.2490386962890625, 0.2738037109375, 0.2985687255859375, 0.323333740234375, 0.3480987548828125, 0.37286376953125, 0.3976287841796875, 0.422393798828125, 0.4471588134765625, 0.471923828125, 0.4966888427734375, 0.521453857421875, 0.5462188720703125, 0.57098388671875, 0.5957489013671875, 0.620513916015625, 0.6452789306640625, 0.6700439453125, 0.6948089599609375, 0.719573974609375, 0.7443389892578125, 0.76910400390625, 0.7938690185546875, 0.818634033203125, 0.8433990478515625, 0.8681640625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 6.0, 1.0, 8.0, 4.0, 6.0, 3.0, 5.0, 12.0, 14.0, 20.0, 32.0, 28.0, 90.0, 145.0, 159.0, 158.0, 92.0, 52.0, 32.0, 34.0, 13.0, 17.0, 2.0, 7.0, 10.0, 6.0, 8.0, 5.0, 3.0, 5.0, 4.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04541015625, -0.0439763069152832, -0.042542457580566406, -0.04110860824584961, -0.03967475891113281, -0.038240909576416016, -0.03680706024169922, -0.03537321090698242, -0.033939361572265625, -0.03250551223754883, -0.03107166290283203, -0.029637813568115234, -0.028203964233398438, -0.02677011489868164, -0.025336265563964844, -0.023902416229248047, -0.02246856689453125, -0.021034717559814453, -0.019600868225097656, -0.01816701889038086, -0.016733169555664062, -0.015299320220947266, -0.013865470886230469, -0.012431621551513672, -0.010997772216796875, -0.009563922882080078, -0.008130073547363281, -0.006696224212646484, -0.0052623748779296875, -0.0038285255432128906, -0.0023946762084960938, -0.0009608268737792969, 0.0004730224609375, 0.0019068717956542969, 0.0033407211303710938, 0.004774570465087891, 0.0062084197998046875, 0.007642269134521484, 0.009076118469238281, 0.010509967803955078, 0.011943817138671875, 0.013377666473388672, 0.014811515808105469, 0.016245365142822266, 0.017679214477539062, 0.01911306381225586, 0.020546913146972656, 0.021980762481689453, 0.02341461181640625, 0.024848461151123047, 0.026282310485839844, 0.02771615982055664, 0.029150009155273438, 0.030583858489990234, 0.03201770782470703, 0.03345155715942383, 0.034885406494140625, 0.03631925582885742, 0.03775310516357422, 0.039186954498291016, 0.04062080383300781, 0.04205465316772461, 0.043488502502441406, 0.0449223518371582, 0.046356201171875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 8.0, 7.0, 9.0, 11.0, 31.0, 30.0, 54.0, 70.0, 106.0, 173.0, 1188.0, 45064.0, 993602.0, 7277.0, 472.0, 146.0, 100.0, 58.0, 34.0, 34.0, 22.0, 15.0, 9.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1376953125, -1.1024627685546875, -1.067230224609375, -1.0319976806640625, -0.99676513671875, -0.9615325927734375, -0.926300048828125, -0.8910675048828125, -0.8558349609375, -0.8206024169921875, -0.785369873046875, -0.7501373291015625, -0.71490478515625, -0.6796722412109375, -0.644439697265625, -0.6092071533203125, -0.573974609375, -0.5387420654296875, -0.503509521484375, -0.4682769775390625, -0.43304443359375, -0.3978118896484375, -0.362579345703125, -0.3273468017578125, -0.2921142578125, -0.2568817138671875, -0.221649169921875, -0.1864166259765625, -0.15118408203125, -0.1159515380859375, -0.080718994140625, -0.0454864501953125, -0.01025390625, 0.0249786376953125, 0.060211181640625, 0.0954437255859375, 0.13067626953125, 0.1659088134765625, 0.201141357421875, 0.2363739013671875, 0.2716064453125, 0.3068389892578125, 0.342071533203125, 0.3773040771484375, 0.41253662109375, 0.4477691650390625, 0.483001708984375, 0.5182342529296875, 0.553466796875, 0.5886993408203125, 0.623931884765625, 0.6591644287109375, 0.69439697265625, 0.7296295166015625, 0.764862060546875, 0.8000946044921875, 0.8353271484375, 0.8705596923828125, 0.905792236328125, 0.9410247802734375, 0.97625732421875, 1.0114898681640625, 1.046722412109375, 1.0819549560546875, 1.1171875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 15.0, 17.0, 34.0, 69.0, 121.0, 264.0, 240.0, 95.0, 64.0, 26.0, 21.0, 11.0, 8.0, 3.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11927410215139389, -0.11261456459760666, -0.10595502704381943, -0.09929549694061279, -0.09263595938682556, -0.08597642183303833, -0.0793168842792511, -0.07265734672546387, -0.06599780917167664, -0.059338271617889404, -0.05267873778939247, -0.04601920023560524, -0.03935966640710831, -0.032700128853321075, -0.026040591299533844, -0.01938105747103691, -0.012721523642539978, -0.0060619874857366085, 0.000597548671066761, 0.007257085293531418, 0.0139166209846735, 0.020576156675815582, 0.027235694229602814, 0.03389522805809975, 0.04055476561188698, 0.04721430316567421, 0.05387383699417114, 0.060533374547958374, 0.0671929121017456, 0.07385244965553284, 0.08051198720932007, 0.0871715173125267, 0.09383104741573334, 0.10049058496952057, 0.1071501225233078, 0.11380966007709503, 0.12046919018030167, 0.1271287202835083, 0.13378825783729553, 0.14044779539108276, 0.14710733294487, 0.15376687049865723, 0.16042640805244446, 0.1670859456062317, 0.17374548316001892, 0.18040502071380615, 0.18706455826759338, 0.19372408092021942, 0.20038363337516785, 0.20704317092895508, 0.2137027084827423, 0.22036224603652954, 0.22702178359031677, 0.233681321144104, 0.24034085869789124, 0.24700038135051727, 0.2536599040031433, 0.26031944155693054, 0.2669789791107178, 0.273638516664505, 0.28029805421829224, 0.28695759177207947, 0.2936171293258667, 0.30027666687965393, 0.30693620443344116]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 3.0, 3.0, 5.0, 8.0, 10.0, 11.0, 16.0, 13.0, 14.0, 21.0, 19.0, 26.0, 21.0, 19.0, 35.0, 41.0, 21.0, 31.0, 47.0, 31.0, 39.0, 35.0, 36.0, 39.0, 38.0, 38.0, 33.0, 46.0, 42.0, 29.0, 29.0, 21.0, 26.0, 31.0, 21.0, 17.0, 17.0, 15.0, 10.0, 6.0, 12.0, 8.0, 4.0, 3.0, 1.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.020572364330291748, -0.019920574501156807, -0.019268784672021866, -0.018616994842886925, -0.017965205013751984, -0.017313415184617043, -0.0166616253554821, -0.01600983552634716, -0.01535804569721222, -0.014706255868077278, -0.014054466038942337, -0.013402676209807396, -0.012750886380672455, -0.012099096551537514, -0.011447306722402573, -0.010795516893267632, -0.01014372706413269, -0.00949193723499775, -0.008840147405862808, -0.008188357576727867, -0.007536567747592926, -0.006884777918457985, -0.006232988089323044, -0.005581198260188103, -0.004929408431053162, -0.0042776186019182205, -0.0036258287727832794, -0.0029740389436483383, -0.002322249114513397, -0.0016704592853784561, -0.001018669456243515, -0.0003668796271085739, 0.0002849102020263672, 0.0009367000311613083, 0.0015884898602962494, 0.0022402796894311905, 0.0028920695185661316, 0.0035438593477010727, 0.004195649176836014, 0.004847439005970955, 0.005499228835105896, 0.006151018664240837, 0.006802808493375778, 0.007454598322510719, 0.00810638815164566, 0.008758177980780602, 0.009409967809915543, 0.010061757639050484, 0.010713547468185425, 0.011365337297320366, 0.012017127126455307, 0.012668916955590248, 0.01332070678472519, 0.01397249661386013, 0.014624286442995071, 0.015276076272130013, 0.015927866101264954, 0.016579655930399895, 0.017231445759534836, 0.017883235588669777, 0.018535025417804718, 0.01918681524693966, 0.0198386050760746, 0.02049039490520954, 0.021142184734344482]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 3.0, 10.0, 7.0, 11.0, 8.0, 17.0, 16.0, 24.0, 19.0, 24.0, 27.0, 29.0, 36.0, 42.0, 42.0, 38.0, 45.0, 42.0, 51.0, 40.0, 35.0, 40.0, 33.0, 39.0, 39.0, 40.0, 40.0, 40.0, 25.0, 24.0, 13.0, 12.0, 25.0, 8.0, 13.0, 9.0, 7.0, 4.0, 5.0, 6.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.28125, -11.888671875, -11.49609375, -11.103515625, -10.7109375, -10.318359375, -9.92578125, -9.533203125, -9.140625, -8.748046875, -8.35546875, -7.962890625, -7.5703125, -7.177734375, -6.78515625, -6.392578125, -6.0, -5.607421875, -5.21484375, -4.822265625, -4.4296875, -4.037109375, -3.64453125, -3.251953125, -2.859375, -2.466796875, -2.07421875, -1.681640625, -1.2890625, -0.896484375, -0.50390625, -0.111328125, 0.28125, 0.673828125, 1.06640625, 1.458984375, 1.8515625, 2.244140625, 2.63671875, 3.029296875, 3.421875, 3.814453125, 4.20703125, 4.599609375, 4.9921875, 5.384765625, 5.77734375, 6.169921875, 6.5625, 6.955078125, 7.34765625, 7.740234375, 8.1328125, 8.525390625, 8.91796875, 9.310546875, 9.703125, 10.095703125, 10.48828125, 10.880859375, 11.2734375, 11.666015625, 12.05859375, 12.451171875, 12.84375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 6.0, 4.0, 9.0, 13.0, 16.0, 20.0, 33.0, 53.0, 61.0, 72.0, 121.0, 158.0, 219.0, 341.0, 473.0, 695.0, 946.0, 1585.0, 2795.0, 5517.0, 18934.0, 177877.0, 761669.0, 56649.0, 10249.0, 3818.0, 2135.0, 1269.0, 877.0, 563.0, 415.0, 275.0, 185.0, 154.0, 108.0, 66.0, 52.0, 43.0, 17.0, 23.0, 12.0, 15.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.828125, -17.27587890625, -16.7236328125, -16.17138671875, -15.619140625, -15.06689453125, -14.5146484375, -13.96240234375, -13.41015625, -12.85791015625, -12.3056640625, -11.75341796875, -11.201171875, -10.64892578125, -10.0966796875, -9.54443359375, -8.9921875, -8.43994140625, -7.8876953125, -7.33544921875, -6.783203125, -6.23095703125, -5.6787109375, -5.12646484375, -4.57421875, -4.02197265625, -3.4697265625, -2.91748046875, -2.365234375, -1.81298828125, -1.2607421875, -0.70849609375, -0.15625, 0.39599609375, 0.9482421875, 1.50048828125, 2.052734375, 2.60498046875, 3.1572265625, 3.70947265625, 4.26171875, 4.81396484375, 5.3662109375, 5.91845703125, 6.470703125, 7.02294921875, 7.5751953125, 8.12744140625, 8.6796875, 9.23193359375, 9.7841796875, 10.33642578125, 10.888671875, 11.44091796875, 11.9931640625, 12.54541015625, 13.09765625, 13.64990234375, 14.2021484375, 14.75439453125, 15.306640625, 15.85888671875, 16.4111328125, 16.96337890625, 17.515625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 6.0, 5.0, 6.0, 6.0, 8.0, 17.0, 15.0, 13.0, 12.0, 23.0, 24.0, 27.0, 31.0, 28.0, 33.0, 33.0, 34.0, 41.0, 35.0, 43.0, 103.0, 1950.0, 101.0, 40.0, 46.0, 33.0, 39.0, 40.0, 33.0, 20.0, 25.0, 25.0, 30.0, 18.0, 17.0, 14.0, 9.0, 15.0, 10.0, 6.0, 4.0, 6.0, 5.0, 5.0, 8.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-38.375, -37.19482421875, -36.0146484375, -34.83447265625, -33.654296875, -32.47412109375, -31.2939453125, -30.11376953125, -28.93359375, -27.75341796875, -26.5732421875, -25.39306640625, -24.212890625, -23.03271484375, -21.8525390625, -20.67236328125, -19.4921875, -18.31201171875, -17.1318359375, -15.95166015625, -14.771484375, -13.59130859375, -12.4111328125, -11.23095703125, -10.05078125, -8.87060546875, -7.6904296875, -6.51025390625, -5.330078125, -4.14990234375, -2.9697265625, -1.78955078125, -0.609375, 0.57080078125, 1.7509765625, 2.93115234375, 4.111328125, 5.29150390625, 6.4716796875, 7.65185546875, 8.83203125, 10.01220703125, 11.1923828125, 12.37255859375, 13.552734375, 14.73291015625, 15.9130859375, 17.09326171875, 18.2734375, 19.45361328125, 20.6337890625, 21.81396484375, 22.994140625, 24.17431640625, 25.3544921875, 26.53466796875, 27.71484375, 28.89501953125, 30.0751953125, 31.25537109375, 32.435546875, 33.61572265625, 34.7958984375, 35.97607421875, 37.15625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 13.0, 8.0, 7.0, 6.0, 7.0, 13.0, 16.0, 16.0, 25.0, 26.0, 48.0, 56.0, 62.0, 109.0, 162.0, 317.0, 711.0, 2232.0, 11178.0, 3103699.0, 22132.0, 2988.0, 851.0, 384.0, 203.0, 124.0, 78.0, 55.0, 39.0, 31.0, 19.0, 18.0, 24.0, 9.0, 6.0, 12.0, 5.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.875, -69.3623046875, -66.849609375, -64.3369140625, -61.82421875, -59.3115234375, -56.798828125, -54.2861328125, -51.7734375, -49.2607421875, -46.748046875, -44.2353515625, -41.72265625, -39.2099609375, -36.697265625, -34.1845703125, -31.671875, -29.1591796875, -26.646484375, -24.1337890625, -21.62109375, -19.1083984375, -16.595703125, -14.0830078125, -11.5703125, -9.0576171875, -6.544921875, -4.0322265625, -1.51953125, 0.9931640625, 3.505859375, 6.0185546875, 8.53125, 11.0439453125, 13.556640625, 16.0693359375, 18.58203125, 21.0947265625, 23.607421875, 26.1201171875, 28.6328125, 31.1455078125, 33.658203125, 36.1708984375, 38.68359375, 41.1962890625, 43.708984375, 46.2216796875, 48.734375, 51.2470703125, 53.759765625, 56.2724609375, 58.78515625, 61.2978515625, 63.810546875, 66.3232421875, 68.8359375, 71.3486328125, 73.861328125, 76.3740234375, 78.88671875, 81.3994140625, 83.912109375, 86.4248046875, 88.9375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 11.0, 26.0, 44.0, 92.0, 108.0, 154.0, 206.0, 161.0, 89.0, 64.0, 23.0, 11.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.517452239990234, -53.011497497558594, -51.50553894042969, -49.99958419799805, -48.493629455566406, -46.9876708984375, -45.48171615600586, -43.97576141357422, -42.46980285644531, -40.96384811401367, -39.457889556884766, -37.951934814453125, -36.44597625732422, -34.94002151489258, -33.43406677246094, -31.928110122680664, -30.42215347290039, -28.916196823120117, -27.410240173339844, -25.904285430908203, -24.39832878112793, -22.892372131347656, -21.386417388916016, -19.880460739135742, -18.37450408935547, -16.868547439575195, -15.362591743469238, -13.856636047363281, -12.350679397583008, -10.844722747802734, -9.338767051696777, -7.83281135559082, -6.326854705810547, -4.820898532867432, -3.3149423599243164, -1.8089861869812012, -0.30303001403808594, 1.2029261589050293, 2.7088823318481445, 4.214838027954102, 5.720794677734375, 7.22675085067749, 8.732707023620605, 10.238662719726562, 11.744619369506836, 13.25057601928711, 14.756531715393066, 16.262487411499023, 17.768444061279297, 19.27440071105957, 20.780357360839844, 22.286312103271484, 23.792268753051758, 25.29822540283203, 26.804180145263672, 28.310136795043945, 29.81609344482422, 31.322050094604492, 32.828006744384766, 34.333961486816406, 35.83992004394531, 37.34587478637695, 38.851829528808594, 40.3577880859375, 41.86374282836914]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 2.0, 4.0, 4.0, 1.0, 4.0, 9.0, 9.0, 14.0, 19.0, 19.0, 10.0, 33.0, 22.0, 32.0, 32.0, 35.0, 38.0, 38.0, 39.0, 41.0, 31.0, 49.0, 62.0, 37.0, 37.0, 41.0, 44.0, 38.0, 31.0, 32.0, 33.0, 29.0, 26.0, 14.0, 28.0, 18.0, 12.0, 11.0, 6.0, 3.0, 5.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-128.0409698486328, -124.08228302001953, -120.12360382080078, -116.1649169921875, -112.20623779296875, -108.24755096435547, -104.28886413574219, -100.33018493652344, -96.37149810791016, -92.41281127929688, -88.45413208007812, -84.49544525146484, -80.53675842285156, -76.57807922363281, -72.61939239501953, -68.66070556640625, -64.7020263671875, -60.743343353271484, -56.78466033935547, -52.82597351074219, -48.86729049682617, -44.908607482910156, -40.949920654296875, -36.99123764038086, -33.032554626464844, -29.073871612548828, -25.11518669128418, -21.15650177001953, -17.197818756103516, -13.2391357421875, -9.280450820922852, -5.321765899658203, -1.3630828857421875, 2.5956010818481445, 6.554285049438477, 10.512969017028809, 14.47165298461914, 18.430335998535156, 22.389020919799805, 26.347705841064453, 30.30638885498047, 34.265071868896484, 38.2237548828125, 42.18244171142578, 46.1411247253418, 50.09980773925781, 54.058494567871094, 58.01717758178711, 61.975860595703125, 65.9345474243164, 69.89322662353516, 73.85191345214844, 77.81059265136719, 81.76927947998047, 85.72796630859375, 89.6866455078125, 93.64533233642578, 97.60401916503906, 101.56269836425781, 105.5213851928711, 109.48007202148438, 113.43875122070312, 117.3974380493164, 121.35612487792969, 125.31480407714844]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 10.0, 12.0, 9.0, 5.0, 17.0, 21.0, 19.0, 13.0, 28.0, 29.0, 28.0, 32.0, 51.0, 44.0, 33.0, 43.0, 50.0, 46.0, 41.0, 42.0, 31.0, 42.0, 37.0, 34.0, 46.0, 40.0, 35.0, 32.0, 15.0, 14.0, 14.0, 19.0, 11.0, 15.0, 8.0, 6.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.609375, -12.2059326171875, -11.802490234375, -11.3990478515625, -10.99560546875, -10.5921630859375, -10.188720703125, -9.7852783203125, -9.3818359375, -8.9783935546875, -8.574951171875, -8.1715087890625, -7.76806640625, -7.3646240234375, -6.961181640625, -6.5577392578125, -6.154296875, -5.7508544921875, -5.347412109375, -4.9439697265625, -4.54052734375, -4.1370849609375, -3.733642578125, -3.3302001953125, -2.9267578125, -2.5233154296875, -2.119873046875, -1.7164306640625, -1.31298828125, -0.9095458984375, -0.506103515625, -0.1026611328125, 0.30078125, 0.7042236328125, 1.107666015625, 1.5111083984375, 1.91455078125, 2.3179931640625, 2.721435546875, 3.1248779296875, 3.5283203125, 3.9317626953125, 4.335205078125, 4.7386474609375, 5.14208984375, 5.5455322265625, 5.948974609375, 6.3524169921875, 6.755859375, 7.1593017578125, 7.562744140625, 7.9661865234375, 8.36962890625, 8.7730712890625, 9.176513671875, 9.5799560546875, 9.9833984375, 10.3868408203125, 10.790283203125, 11.1937255859375, 11.59716796875, 12.0006103515625, 12.404052734375, 12.8074951171875, 13.2109375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 4.0, 10.0, 2.0, 6.0, 7.0, 13.0, 21.0, 26.0, 28.0, 56.0, 74.0, 152.0, 240.0, 413.0, 655.0, 1126.0, 2000.0, 3791.0, 7390.0, 17567.0, 266943.0, 3569451.0, 290294.0, 18004.0, 7270.0, 3684.0, 2085.0, 1209.0, 698.0, 403.0, 237.0, 154.0, 80.0, 68.0, 34.0, 21.0, 20.0, 17.0, 10.0, 8.0, 8.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.625, -41.31396484375, -40.0029296875, -38.69189453125, -37.380859375, -36.06982421875, -34.7587890625, -33.44775390625, -32.13671875, -30.82568359375, -29.5146484375, -28.20361328125, -26.892578125, -25.58154296875, -24.2705078125, -22.95947265625, -21.6484375, -20.33740234375, -19.0263671875, -17.71533203125, -16.404296875, -15.09326171875, -13.7822265625, -12.47119140625, -11.16015625, -9.84912109375, -8.5380859375, -7.22705078125, -5.916015625, -4.60498046875, -3.2939453125, -1.98291015625, -0.671875, 0.63916015625, 1.9501953125, 3.26123046875, 4.572265625, 5.88330078125, 7.1943359375, 8.50537109375, 9.81640625, 11.12744140625, 12.4384765625, 13.74951171875, 15.060546875, 16.37158203125, 17.6826171875, 18.99365234375, 20.3046875, 21.61572265625, 22.9267578125, 24.23779296875, 25.548828125, 26.85986328125, 28.1708984375, 29.48193359375, 30.79296875, 32.10400390625, 33.4150390625, 34.72607421875, 36.037109375, 37.34814453125, 38.6591796875, 39.97021484375, 41.28125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 2.0, 9.0, 5.0, 6.0, 6.0, 10.0, 8.0, 11.0, 18.0, 33.0, 51.0, 87.0, 177.0, 480.0, 931.0, 1041.0, 581.0, 283.0, 121.0, 61.0, 36.0, 28.0, 12.0, 21.0, 15.0, 3.0, 7.0, 6.0, 3.0, 1.0, 3.0, 1.0, 6.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.0, -37.75048828125, -36.5009765625, -35.25146484375, -34.001953125, -32.75244140625, -31.5029296875, -30.25341796875, -29.00390625, -27.75439453125, -26.5048828125, -25.25537109375, -24.005859375, -22.75634765625, -21.5068359375, -20.25732421875, -19.0078125, -17.75830078125, -16.5087890625, -15.25927734375, -14.009765625, -12.76025390625, -11.5107421875, -10.26123046875, -9.01171875, -7.76220703125, -6.5126953125, -5.26318359375, -4.013671875, -2.76416015625, -1.5146484375, -0.26513671875, 0.984375, 2.23388671875, 3.4833984375, 4.73291015625, 5.982421875, 7.23193359375, 8.4814453125, 9.73095703125, 10.98046875, 12.22998046875, 13.4794921875, 14.72900390625, 15.978515625, 17.22802734375, 18.4775390625, 19.72705078125, 20.9765625, 22.22607421875, 23.4755859375, 24.72509765625, 25.974609375, 27.22412109375, 28.4736328125, 29.72314453125, 30.97265625, 32.22216796875, 33.4716796875, 34.72119140625, 35.970703125, 37.22021484375, 38.4697265625, 39.71923828125, 40.96875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 4.0, 11.0, 12.0, 21.0, 35.0, 40.0, 79.0, 111.0, 129.0, 212.0, 322.0, 509.0, 800.0, 1142.0, 1812.0, 2926.0, 4846.0, 8742.0, 17545.0, 45119.0, 307881.0, 3448619.0, 271582.0, 43565.0, 16886.0, 8460.0, 4815.0, 2853.0, 1811.0, 1183.0, 715.0, 455.0, 350.0, 223.0, 174.0, 113.0, 50.0, 30.0, 23.0, 25.0, 18.0, 13.0, 7.0, 7.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.71875, -41.21875, -39.71875, -38.21875, -36.71875, -35.21875, -33.71875, -32.21875, -30.71875, -29.21875, -27.71875, -26.21875, -24.71875, -23.21875, -21.71875, -20.21875, -18.71875, -17.21875, -15.71875, -14.21875, -12.71875, -11.21875, -9.71875, -8.21875, -6.71875, -5.21875, -3.71875, -2.21875, -0.71875, 0.78125, 2.28125, 3.78125, 5.28125, 6.78125, 8.28125, 9.78125, 11.28125, 12.78125, 14.28125, 15.78125, 17.28125, 18.78125, 20.28125, 21.78125, 23.28125, 24.78125, 26.28125, 27.78125, 29.28125, 30.78125, 32.28125, 33.78125, 35.28125, 36.78125, 38.28125, 39.78125, 41.28125, 42.78125, 44.28125, 45.78125, 47.28125, 48.78125, 50.28125, 51.78125, 53.28125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 8.0, 8.0, 6.0, 7.0, 6.0, 14.0, 17.0, 18.0, 39.0, 44.0, 61.0, 96.0, 119.0, 125.0, 115.0, 85.0, 56.0, 43.0, 30.0, 13.0, 17.0, 18.0, 12.0, 7.0, 8.0, 11.0, 1.0, 5.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-121.70426177978516, -117.93956756591797, -114.17488098144531, -110.41018676757812, -106.64549255371094, -102.88079833984375, -99.11610412597656, -95.3514175415039, -91.58672332763672, -87.82202911376953, -84.05734252929688, -80.29264831542969, -76.5279541015625, -72.76325988769531, -68.99856567382812, -65.23387908935547, -61.46918487548828, -57.704490661621094, -53.93980026245117, -50.17510986328125, -46.41041564941406, -42.645721435546875, -38.88103103637695, -35.11634063720703, -31.351646423339844, -27.58695411682129, -23.822261810302734, -20.05756950378418, -16.292877197265625, -12.52818489074707, -8.763492584228516, -4.998800277709961, -1.2341079711914062, 2.5305843353271484, 6.295276641845703, 10.059968948364258, 13.824661254882812, 17.589353561401367, 21.354045867919922, 25.118738174438477, 28.88343048095703, 32.64812469482422, 36.41281509399414, 40.17750549316406, 43.94219970703125, 47.70689392089844, 51.47158432006836, 55.23627471923828, 59.00096893310547, 62.765663146972656, 66.53034973144531, 70.2950439453125, 74.05973815917969, 77.82443237304688, 81.58912658691406, 85.35381317138672, 89.1185073852539, 92.8832015991211, 96.64788818359375, 100.41258239746094, 104.17727661132812, 107.94197082519531, 111.7066650390625, 115.47135162353516, 119.23604583740234]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 10.0, 10.0, 7.0, 11.0, 13.0, 15.0, 22.0, 20.0, 23.0, 21.0, 30.0, 28.0, 31.0, 29.0, 28.0, 41.0, 50.0, 44.0, 52.0, 35.0, 54.0, 50.0, 46.0, 37.0, 34.0, 31.0, 32.0, 26.0, 34.0, 24.0, 16.0, 18.0, 14.0, 10.0, 10.0, 12.0, 8.0, 9.0, 5.0, 2.0, 0.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.22354125976562, -81.3347396850586, -78.44593048095703, -75.55712890625, -72.66832733154297, -69.77952575683594, -66.89071655273438, -64.00191497802734, -61.11310958862305, -58.22430419921875, -55.33550262451172, -52.44669723510742, -49.557891845703125, -46.669090270996094, -43.7802848815918, -40.8914794921875, -38.00267791748047, -35.11387252807617, -32.22507095336914, -29.336265563964844, -26.44746208190918, -23.558658599853516, -20.66985321044922, -17.781049728393555, -14.89224624633789, -12.003442764282227, -9.114638328552246, -6.225833892822266, -3.3370304107666016, -0.4482269287109375, 2.4405784606933594, 5.329381942749023, 8.218185424804688, 11.106988906860352, 13.995793342590332, 16.884597778320312, 19.773401260375977, 22.66220474243164, 25.551010131835938, 28.4398136138916, 31.328617095947266, 34.21742248535156, 37.106224060058594, 39.99502944946289, 42.88383483886719, 45.77263641357422, 48.661441802978516, 51.55024719238281, 54.439048767089844, 57.32785415649414, 60.21665573120117, 63.10546112060547, 65.9942626953125, 68.88307189941406, 71.7718734741211, 74.66067504882812, 77.54948425292969, 80.43828582763672, 83.32709503173828, 86.21589660644531, 89.10469818115234, 91.99349975585938, 94.88230895996094, 97.77111053466797, 100.659912109375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 9.0, 9.0, 9.0, 13.0, 10.0, 16.0, 19.0, 22.0, 24.0, 40.0, 29.0, 35.0, 30.0, 35.0, 36.0, 54.0, 54.0, 44.0, 44.0, 39.0, 42.0, 43.0, 43.0, 36.0, 40.0, 28.0, 30.0, 31.0, 20.0, 14.0, 21.0, 9.0, 12.0, 12.0, 12.0, 12.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.5078125, -14.083984375, -13.66015625, -13.236328125, -12.8125, -12.388671875, -11.96484375, -11.541015625, -11.1171875, -10.693359375, -10.26953125, -9.845703125, -9.421875, -8.998046875, -8.57421875, -8.150390625, -7.7265625, -7.302734375, -6.87890625, -6.455078125, -6.03125, -5.607421875, -5.18359375, -4.759765625, -4.3359375, -3.912109375, -3.48828125, -3.064453125, -2.640625, -2.216796875, -1.79296875, -1.369140625, -0.9453125, -0.521484375, -0.09765625, 0.326171875, 0.75, 1.173828125, 1.59765625, 2.021484375, 2.4453125, 2.869140625, 3.29296875, 3.716796875, 4.140625, 4.564453125, 4.98828125, 5.412109375, 5.8359375, 6.259765625, 6.68359375, 7.107421875, 7.53125, 7.955078125, 8.37890625, 8.802734375, 9.2265625, 9.650390625, 10.07421875, 10.498046875, 10.921875, 11.345703125, 11.76953125, 12.193359375, 12.6171875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 16.0, 20.0, 21.0, 40.0, 46.0, 75.0, 109.0, 204.0, 306.0, 501.0, 783.0, 1315.0, 2224.0, 3715.0, 6279.0, 10634.0, 18509.0, 32781.0, 62056.0, 130434.0, 288271.0, 254085.0, 111762.0, 54668.0, 29391.0, 16475.0, 9680.0, 5749.0, 3242.0, 2017.0, 1195.0, 746.0, 419.0, 296.0, 152.0, 126.0, 78.0, 36.0, 33.0, 20.0, 15.0, 12.0, 7.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7900390625, -1.73211669921875, -1.6741943359375, -1.61627197265625, -1.558349609375, -1.50042724609375, -1.4425048828125, -1.38458251953125, -1.32666015625, -1.26873779296875, -1.2108154296875, -1.15289306640625, -1.094970703125, -1.03704833984375, -0.9791259765625, -0.92120361328125, -0.86328125, -0.80535888671875, -0.7474365234375, -0.68951416015625, -0.631591796875, -0.57366943359375, -0.5157470703125, -0.45782470703125, -0.39990234375, -0.34197998046875, -0.2840576171875, -0.22613525390625, -0.168212890625, -0.11029052734375, -0.0523681640625, 0.00555419921875, 0.0634765625, 0.12139892578125, 0.1793212890625, 0.23724365234375, 0.295166015625, 0.35308837890625, 0.4110107421875, 0.46893310546875, 0.52685546875, 0.58477783203125, 0.6427001953125, 0.70062255859375, 0.758544921875, 0.81646728515625, 0.8743896484375, 0.93231201171875, 0.990234375, 1.04815673828125, 1.1060791015625, 1.16400146484375, 1.221923828125, 1.27984619140625, 1.3377685546875, 1.39569091796875, 1.45361328125, 1.51153564453125, 1.5694580078125, 1.62738037109375, 1.685302734375, 1.74322509765625, 1.8011474609375, 1.85906982421875, 1.9169921875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 3.0, 5.0, 8.0, 6.0, 8.0, 10.0, 9.0, 11.0, 17.0, 22.0, 26.0, 22.0, 28.0, 26.0, 25.0, 34.0, 30.0, 32.0, 26.0, 44.0, 43.0, 36.0, 1065.0, 35.0, 50.0, 45.0, 34.0, 43.0, 24.0, 30.0, 24.0, 26.0, 40.0, 21.0, 14.0, 19.0, 20.0, 12.0, 7.0, 15.0, 9.0, 7.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.0390625, -7.792236328125, -7.54541015625, -7.298583984375, -7.0517578125, -6.804931640625, -6.55810546875, -6.311279296875, -6.064453125, -5.817626953125, -5.57080078125, -5.323974609375, -5.0771484375, -4.830322265625, -4.58349609375, -4.336669921875, -4.08984375, -3.843017578125, -3.59619140625, -3.349365234375, -3.1025390625, -2.855712890625, -2.60888671875, -2.362060546875, -2.115234375, -1.868408203125, -1.62158203125, -1.374755859375, -1.1279296875, -0.881103515625, -0.63427734375, -0.387451171875, -0.140625, 0.106201171875, 0.35302734375, 0.599853515625, 0.8466796875, 1.093505859375, 1.34033203125, 1.587158203125, 1.833984375, 2.080810546875, 2.32763671875, 2.574462890625, 2.8212890625, 3.068115234375, 3.31494140625, 3.561767578125, 3.80859375, 4.055419921875, 4.30224609375, 4.549072265625, 4.7958984375, 5.042724609375, 5.28955078125, 5.536376953125, 5.783203125, 6.030029296875, 6.27685546875, 6.523681640625, 6.7705078125, 7.017333984375, 7.26416015625, 7.510986328125, 7.7578125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 8.0, 18.0, 16.0, 37.0, 66.0, 96.0, 152.0, 210.0, 326.0, 446.0, 727.0, 1000.0, 1507.0, 2221.0, 3435.0, 5141.0, 7787.0, 11880.0, 17991.0, 28046.0, 45058.0, 75261.0, 132252.0, 1183360.0, 276062.0, 119283.0, 68693.0, 41181.0, 25713.0, 16424.0, 10920.0, 7192.0, 4871.0, 3214.0, 2218.0, 1410.0, 996.0, 612.0, 429.0, 320.0, 174.0, 117.0, 89.0, 60.0, 41.0, 23.0, 12.0, 13.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.76708984375, -0.7437820434570312, -0.7204742431640625, -0.6971664428710938, -0.673858642578125, -0.6505508422851562, -0.6272430419921875, -0.6039352416992188, -0.58062744140625, -0.5573196411132812, -0.5340118408203125, -0.5107040405273438, -0.487396240234375, -0.46408843994140625, -0.4407806396484375, -0.41747283935546875, -0.3941650390625, -0.37085723876953125, -0.3475494384765625, -0.32424163818359375, -0.300933837890625, -0.27762603759765625, -0.2543182373046875, -0.23101043701171875, -0.20770263671875, -0.18439483642578125, -0.1610870361328125, -0.13777923583984375, -0.114471435546875, -0.09116363525390625, -0.0678558349609375, -0.04454803466796875, -0.021240234375, 0.00206756591796875, 0.0253753662109375, 0.04868316650390625, 0.071990966796875, 0.09529876708984375, 0.1186065673828125, 0.14191436767578125, 0.16522216796875, 0.18852996826171875, 0.2118377685546875, 0.23514556884765625, 0.258453369140625, 0.28176116943359375, 0.3050689697265625, 0.32837677001953125, 0.3516845703125, 0.37499237060546875, 0.3983001708984375, 0.42160797119140625, 0.444915771484375, 0.46822357177734375, 0.4915313720703125, 0.5148391723632812, 0.53814697265625, 0.5614547729492188, 0.5847625732421875, 0.6080703735351562, 0.631378173828125, 0.6546859741210938, 0.6779937744140625, 0.7013015747070312, 0.724609375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 2.0, 10.0, 11.0, 18.0, 20.0, 25.0, 43.0, 59.0, 72.0, 131.0, 190.0, 122.0, 77.0, 68.0, 41.0, 36.0, 24.0, 12.0, 9.0, 4.0, 1.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.032501220703125, -0.031502723693847656, -0.030504226684570312, -0.02950572967529297, -0.028507232666015625, -0.02750873565673828, -0.026510238647460938, -0.025511741638183594, -0.02451324462890625, -0.023514747619628906, -0.022516250610351562, -0.02151775360107422, -0.020519256591796875, -0.01952075958251953, -0.018522262573242188, -0.017523765563964844, -0.0165252685546875, -0.015526771545410156, -0.014528274536132812, -0.013529777526855469, -0.012531280517578125, -0.011532783508300781, -0.010534286499023438, -0.009535789489746094, -0.00853729248046875, -0.007538795471191406, -0.0065402984619140625, -0.005541801452636719, -0.004543304443359375, -0.0035448074340820312, -0.0025463104248046875, -0.0015478134155273438, -0.00054931640625, 0.00044918060302734375, 0.0014476776123046875, 0.0024461746215820312, 0.003444671630859375, 0.004443168640136719, 0.0054416656494140625, 0.006440162658691406, 0.00743865966796875, 0.008437156677246094, 0.009435653686523438, 0.010434150695800781, 0.011432647705078125, 0.012431144714355469, 0.013429641723632812, 0.014428138732910156, 0.0154266357421875, 0.016425132751464844, 0.017423629760742188, 0.01842212677001953, 0.019420623779296875, 0.02041912078857422, 0.021417617797851562, 0.022416114807128906, 0.02341461181640625, 0.024413108825683594, 0.025411605834960938, 0.02641010284423828, 0.027408599853515625, 0.02840709686279297, 0.029405593872070312, 0.030404090881347656, 0.031402587890625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 8.0, 9.0, 5.0, 14.0, 18.0, 21.0, 32.0, 33.0, 46.0, 67.0, 106.0, 123.0, 199.0, 347.0, 800.0, 3335.0, 25974.0, 921342.0, 87163.0, 6444.0, 1329.0, 438.0, 206.0, 123.0, 95.0, 62.0, 53.0, 29.0, 23.0, 25.0, 18.0, 13.0, 9.0, 5.0, 11.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50927734375, -0.49320220947265625, -0.4771270751953125, -0.46105194091796875, -0.444976806640625, -0.42890167236328125, -0.4128265380859375, -0.39675140380859375, -0.38067626953125, -0.36460113525390625, -0.3485260009765625, -0.33245086669921875, -0.316375732421875, -0.30030059814453125, -0.2842254638671875, -0.26815032958984375, -0.2520751953125, -0.23600006103515625, -0.2199249267578125, -0.20384979248046875, -0.187774658203125, -0.17169952392578125, -0.1556243896484375, -0.13954925537109375, -0.12347412109375, -0.10739898681640625, -0.0913238525390625, -0.07524871826171875, -0.059173583984375, -0.04309844970703125, -0.0270233154296875, -0.01094818115234375, 0.005126953125, 0.02120208740234375, 0.0372772216796875, 0.05335235595703125, 0.069427490234375, 0.08550262451171875, 0.1015777587890625, 0.11765289306640625, 0.13372802734375, 0.14980316162109375, 0.1658782958984375, 0.18195343017578125, 0.198028564453125, 0.21410369873046875, 0.2301788330078125, 0.24625396728515625, 0.2623291015625, 0.27840423583984375, 0.2944793701171875, 0.31055450439453125, 0.326629638671875, 0.34270477294921875, 0.3587799072265625, 0.37485504150390625, 0.39093017578125, 0.40700531005859375, 0.4230804443359375, 0.43915557861328125, 0.455230712890625, 0.47130584716796875, 0.4873809814453125, 0.5034561157226562, 0.51953125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 16.0, 66.0, 250.0, 454.0, 128.0, 52.0, 16.0, 12.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2257242053747177, -0.21600471436977386, -0.20628522336483002, -0.19656573235988617, -0.18684624135494232, -0.17712675034999847, -0.16740724444389343, -0.15768775343894958, -0.14796826243400574, -0.1382487714290619, -0.12852928042411804, -0.1188097894191742, -0.10909029841423035, -0.0993708074092865, -0.08965130895376205, -0.0799318179488182, -0.07021233439445496, -0.06049284338951111, -0.05077335238456726, -0.041053857654333115, -0.03133436664938927, -0.02161487564444542, -0.011895380914211273, -0.0021758899092674255, 0.007543601095676422, 0.01726309210062027, 0.026982584968209267, 0.036702077835798264, 0.04642156884074211, 0.05614105984568596, 0.0658605545759201, 0.07558004558086395, 0.0852995216846466, 0.09501901268959045, 0.1047385036945343, 0.11445799469947815, 0.124177485704422, 0.13389697670936584, 0.1436164677143097, 0.15333595871925354, 0.1630554497241974, 0.17277494072914124, 0.18249443173408508, 0.19221392273902893, 0.20193341374397278, 0.21165290474891663, 0.22137239575386047, 0.23109188675880432, 0.24081139266490936, 0.2505308985710144, 0.26025038957595825, 0.2699698805809021, 0.27968937158584595, 0.2894088625907898, 0.29912835359573364, 0.3088478446006775, 0.31856733560562134, 0.3282868266105652, 0.33800631761550903, 0.3477258086204529, 0.35744529962539673, 0.3671647906303406, 0.3768842816352844, 0.38660377264022827, 0.3963232636451721]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 5.0, 7.0, 7.0, 14.0, 21.0, 13.0, 20.0, 18.0, 16.0, 21.0, 34.0, 33.0, 26.0, 31.0, 31.0, 39.0, 48.0, 46.0, 39.0, 32.0, 43.0, 32.0, 36.0, 37.0, 41.0, 30.0, 26.0, 20.0, 37.0, 29.0, 28.0, 23.0, 21.0, 16.0, 13.0, 11.0, 10.0, 12.0, 7.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01572597026824951, -0.015226421877741814, -0.014726873487234116, -0.014227325096726418, -0.01372777670621872, -0.013228228315711021, -0.012728679925203323, -0.012229131534695625, -0.011729583144187927, -0.01123003475368023, -0.010730486363172531, -0.010230937972664833, -0.009731389582157135, -0.009231841191649437, -0.008732292801141739, -0.00823274441063404, -0.007733196020126343, -0.007233647629618645, -0.006734099239110947, -0.006234550848603249, -0.0057350024580955505, -0.0052354540675878525, -0.004735905677080154, -0.004236357286572456, -0.0037368088960647583, -0.0032372605055570602, -0.002737712115049362, -0.002238163724541664, -0.001738615334033966, -0.001239066943526268, -0.00073951855301857, -0.0002399701625108719, 0.00025957822799682617, 0.0007591266185045242, 0.0012586750090122223, 0.0017582233995199203, 0.0022577717900276184, 0.0027573201805353165, 0.0032568685710430145, 0.0037564169615507126, 0.004255965352058411, 0.004755513742566109, 0.005255062133073807, 0.005754610523581505, 0.006254158914089203, 0.006753707304596901, 0.007253255695104599, 0.007752804085612297, 0.008252352476119995, 0.008751900866627693, 0.009251449257135391, 0.00975099764764309, 0.010250546038150787, 0.010750094428658485, 0.011249642819166183, 0.011749191209673882, 0.01224873960018158, 0.012748287990689278, 0.013247836381196976, 0.013747384771704674, 0.014246933162212372, 0.01474648155272007, 0.015246029943227768, 0.015745578333735466, 0.016245126724243164]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 9.0, 9.0, 9.0, 13.0, 11.0, 15.0, 20.0, 21.0, 25.0, 40.0, 31.0, 34.0, 28.0, 35.0, 36.0, 54.0, 55.0, 44.0, 44.0, 38.0, 44.0, 42.0, 43.0, 35.0, 40.0, 30.0, 28.0, 32.0, 19.0, 15.0, 20.0, 9.0, 13.0, 12.0, 11.0, 12.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.5, -14.076171875, -13.65234375, -13.228515625, -12.8046875, -12.380859375, -11.95703125, -11.533203125, -11.109375, -10.685546875, -10.26171875, -9.837890625, -9.4140625, -8.990234375, -8.56640625, -8.142578125, -7.71875, -7.294921875, -6.87109375, -6.447265625, -6.0234375, -5.599609375, -5.17578125, -4.751953125, -4.328125, -3.904296875, -3.48046875, -3.056640625, -2.6328125, -2.208984375, -1.78515625, -1.361328125, -0.9375, -0.513671875, -0.08984375, 0.333984375, 0.7578125, 1.181640625, 1.60546875, 2.029296875, 2.453125, 2.876953125, 3.30078125, 3.724609375, 4.1484375, 4.572265625, 4.99609375, 5.419921875, 5.84375, 6.267578125, 6.69140625, 7.115234375, 7.5390625, 7.962890625, 8.38671875, 8.810546875, 9.234375, 9.658203125, 10.08203125, 10.505859375, 10.9296875, 11.353515625, 11.77734375, 12.201171875, 12.625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 1.0, 8.0, 12.0, 11.0, 15.0, 16.0, 28.0, 41.0, 54.0, 70.0, 106.0, 209.0, 316.0, 566.0, 1085.0, 2319.0, 5073.0, 12701.0, 36259.0, 129081.0, 522457.0, 246274.0, 58576.0, 19358.0, 7454.0, 3147.0, 1481.0, 746.0, 416.0, 219.0, 145.0, 78.0, 50.0, 37.0, 37.0, 35.0, 15.0, 17.0, 13.0, 7.0, 8.0, 3.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.5625, -8.3157958984375, -8.069091796875, -7.8223876953125, -7.57568359375, -7.3289794921875, -7.082275390625, -6.8355712890625, -6.5888671875, -6.3421630859375, -6.095458984375, -5.8487548828125, -5.60205078125, -5.3553466796875, -5.108642578125, -4.8619384765625, -4.615234375, -4.3685302734375, -4.121826171875, -3.8751220703125, -3.62841796875, -3.3817138671875, -3.135009765625, -2.8883056640625, -2.6416015625, -2.3948974609375, -2.148193359375, -1.9014892578125, -1.65478515625, -1.4080810546875, -1.161376953125, -0.9146728515625, -0.66796875, -0.4212646484375, -0.174560546875, 0.0721435546875, 0.31884765625, 0.5655517578125, 0.812255859375, 1.0589599609375, 1.3056640625, 1.5523681640625, 1.799072265625, 2.0457763671875, 2.29248046875, 2.5391845703125, 2.785888671875, 3.0325927734375, 3.279296875, 3.5260009765625, 3.772705078125, 4.0194091796875, 4.26611328125, 4.5128173828125, 4.759521484375, 5.0062255859375, 5.2529296875, 5.4996337890625, 5.746337890625, 5.9930419921875, 6.23974609375, 6.4864501953125, 6.733154296875, 6.9798583984375, 7.2265625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 4.0, 6.0, 8.0, 13.0, 10.0, 10.0, 11.0, 18.0, 25.0, 27.0, 27.0, 33.0, 25.0, 44.0, 37.0, 48.0, 32.0, 37.0, 53.0, 150.0, 1888.0, 108.0, 40.0, 38.0, 31.0, 33.0, 43.0, 31.0, 28.0, 31.0, 29.0, 22.0, 16.0, 16.0, 13.0, 10.0, 9.0, 7.0, 10.0, 9.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.4375, -41.08642578125, -39.7353515625, -38.38427734375, -37.033203125, -35.68212890625, -34.3310546875, -32.97998046875, -31.62890625, -30.27783203125, -28.9267578125, -27.57568359375, -26.224609375, -24.87353515625, -23.5224609375, -22.17138671875, -20.8203125, -19.46923828125, -18.1181640625, -16.76708984375, -15.416015625, -14.06494140625, -12.7138671875, -11.36279296875, -10.01171875, -8.66064453125, -7.3095703125, -5.95849609375, -4.607421875, -3.25634765625, -1.9052734375, -0.55419921875, 0.796875, 2.14794921875, 3.4990234375, 4.85009765625, 6.201171875, 7.55224609375, 8.9033203125, 10.25439453125, 11.60546875, 12.95654296875, 14.3076171875, 15.65869140625, 17.009765625, 18.36083984375, 19.7119140625, 21.06298828125, 22.4140625, 23.76513671875, 25.1162109375, 26.46728515625, 27.818359375, 29.16943359375, 30.5205078125, 31.87158203125, 33.22265625, 34.57373046875, 35.9248046875, 37.27587890625, 38.626953125, 39.97802734375, 41.3291015625, 42.68017578125, 44.03125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 6.0, 10.0, 6.0, 10.0, 16.0, 18.0, 11.0, 25.0, 28.0, 37.0, 56.0, 58.0, 93.0, 111.0, 125.0, 186.0, 355.0, 794.0, 5153.0, 3109949.0, 25971.0, 1271.0, 417.0, 217.0, 199.0, 114.0, 98.0, 72.0, 61.0, 50.0, 37.0, 29.0, 29.0, 11.0, 10.0, 14.0, 10.0, 7.0, 8.0, 6.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-89.5, -86.841796875, -84.18359375, -81.525390625, -78.8671875, -76.208984375, -73.55078125, -70.892578125, -68.234375, -65.576171875, -62.91796875, -60.259765625, -57.6015625, -54.943359375, -52.28515625, -49.626953125, -46.96875, -44.310546875, -41.65234375, -38.994140625, -36.3359375, -33.677734375, -31.01953125, -28.361328125, -25.703125, -23.044921875, -20.38671875, -17.728515625, -15.0703125, -12.412109375, -9.75390625, -7.095703125, -4.4375, -1.779296875, 0.87890625, 3.537109375, 6.1953125, 8.853515625, 11.51171875, 14.169921875, 16.828125, 19.486328125, 22.14453125, 24.802734375, 27.4609375, 30.119140625, 32.77734375, 35.435546875, 38.09375, 40.751953125, 43.41015625, 46.068359375, 48.7265625, 51.384765625, 54.04296875, 56.701171875, 59.359375, 62.017578125, 64.67578125, 67.333984375, 69.9921875, 72.650390625, 75.30859375, 77.966796875, 80.625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 535.0, 480.0], "bins": [-804.3517456054688, -791.5792236328125, -778.806640625, -766.0341186523438, -753.2615966796875, -740.489013671875, -727.7164916992188, -714.9439697265625, -702.1714477539062, -689.39892578125, -676.6263427734375, -663.8538208007812, -651.081298828125, -638.3087158203125, -625.5361938476562, -612.763671875, -599.9910888671875, -587.2185668945312, -574.4459838867188, -561.6734619140625, -548.9009399414062, -536.12841796875, -523.3558349609375, -510.58331298828125, -497.810791015625, -485.0382385253906, -472.2657165527344, -459.4931640625, -446.72064208984375, -433.9480895996094, -421.175537109375, -408.40301513671875, -395.6304626464844, -382.85791015625, -370.08538818359375, -357.3128356933594, -344.5403137207031, -331.76776123046875, -318.9952392578125, -306.2226867675781, -293.45013427734375, -280.6775817871094, -267.9050598144531, -255.13250732421875, -242.35997009277344, -229.58743286132812, -216.8148956298828, -204.0423583984375, -191.2698211669922, -178.49728393554688, -165.72474670410156, -152.95220947265625, -140.17965698242188, -127.40711975097656, -114.63458251953125, -101.8620376586914, -89.08950805664062, -76.31697082519531, -63.54442596435547, -50.771888732910156, -37.99934768676758, -25.226806640625, -12.454269409179688, 0.31827545166015625, 13.090814590454102]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 3.0, 3.0, 9.0, 7.0, 8.0, 10.0, 8.0, 12.0, 8.0, 19.0, 12.0, 23.0, 13.0, 25.0, 29.0, 31.0, 34.0, 39.0, 38.0, 30.0, 38.0, 37.0, 37.0, 52.0, 49.0, 47.0, 31.0, 45.0, 39.0, 32.0, 27.0, 32.0, 26.0, 23.0, 19.0, 18.0, 12.0, 15.0, 12.0, 11.0, 13.0, 6.0, 5.0, 3.0, 3.0, 0.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-108.20925903320312, -104.6911392211914, -101.17302703857422, -97.6549072265625, -94.13679504394531, -90.6186752319336, -87.10055541992188, -83.58244323730469, -80.0643310546875, -76.54621124267578, -73.0280990600586, -69.50997924804688, -65.99186706542969, -62.47374725341797, -58.955631256103516, -55.43751525878906, -51.919395446777344, -48.40127944946289, -44.88316345214844, -41.36504364013672, -37.84693145751953, -34.32881164550781, -30.81069564819336, -27.292579650878906, -23.774463653564453, -20.25634765625, -16.738231658935547, -13.220113754272461, -9.701997756958008, -6.183881759643555, -2.6657638549804688, 0.8523521423339844, 4.370460510253906, 7.888576984405518, 11.406693458557129, 14.924810409545898, 18.44292640686035, 21.961042404174805, 25.47916030883789, 28.997276306152344, 32.5153923034668, 36.03350830078125, 39.5516242980957, 43.069740295410156, 46.587860107421875, 50.10597229003906, 53.62409210205078, 57.142208099365234, 60.66032409667969, 64.1784439086914, 67.6965560913086, 71.21467590332031, 74.7327880859375, 78.25090789794922, 81.76902770996094, 85.28713989257812, 88.80525207519531, 92.32337188720703, 95.84148406982422, 99.35960388183594, 102.87771606445312, 106.39583587646484, 109.91395568847656, 113.43206787109375, 116.95018768310547]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 10.0, 10.0, 10.0, 15.0, 8.0, 19.0, 22.0, 25.0, 39.0, 27.0, 43.0, 31.0, 30.0, 38.0, 42.0, 54.0, 52.0, 48.0, 36.0, 44.0, 43.0, 37.0, 46.0, 41.0, 28.0, 23.0, 26.0, 25.0, 17.0, 20.0, 9.0, 13.0, 16.0, 8.0, 10.0, 7.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.578125, -14.15380859375, -13.7294921875, -13.30517578125, -12.880859375, -12.45654296875, -12.0322265625, -11.60791015625, -11.18359375, -10.75927734375, -10.3349609375, -9.91064453125, -9.486328125, -9.06201171875, -8.6376953125, -8.21337890625, -7.7890625, -7.36474609375, -6.9404296875, -6.51611328125, -6.091796875, -5.66748046875, -5.2431640625, -4.81884765625, -4.39453125, -3.97021484375, -3.5458984375, -3.12158203125, -2.697265625, -2.27294921875, -1.8486328125, -1.42431640625, -1.0, -0.57568359375, -0.1513671875, 0.27294921875, 0.697265625, 1.12158203125, 1.5458984375, 1.97021484375, 2.39453125, 2.81884765625, 3.2431640625, 3.66748046875, 4.091796875, 4.51611328125, 4.9404296875, 5.36474609375, 5.7890625, 6.21337890625, 6.6376953125, 7.06201171875, 7.486328125, 7.91064453125, 8.3349609375, 8.75927734375, 9.18359375, 9.60791015625, 10.0322265625, 10.45654296875, 10.880859375, 11.30517578125, 11.7294921875, 12.15380859375, 12.578125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 10.0, 12.0, 15.0, 12.0, 16.0, 19.0, 27.0, 48.0, 65.0, 102.0, 134.0, 239.0, 396.0, 758.0, 1507.0, 3345.0, 8351.0, 38971.0, 3227112.0, 881874.0, 19818.0, 6058.0, 2613.0, 1215.0, 631.0, 332.0, 196.0, 115.0, 77.0, 52.0, 41.0, 27.0, 13.0, 11.0, 13.0, 17.0, 8.0, 6.0, 7.0, 2.0, 4.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.375, -58.5908203125, -56.806640625, -55.0224609375, -53.23828125, -51.4541015625, -49.669921875, -47.8857421875, -46.1015625, -44.3173828125, -42.533203125, -40.7490234375, -38.96484375, -37.1806640625, -35.396484375, -33.6123046875, -31.828125, -30.0439453125, -28.259765625, -26.4755859375, -24.69140625, -22.9072265625, -21.123046875, -19.3388671875, -17.5546875, -15.7705078125, -13.986328125, -12.2021484375, -10.41796875, -8.6337890625, -6.849609375, -5.0654296875, -3.28125, -1.4970703125, 0.287109375, 2.0712890625, 3.85546875, 5.6396484375, 7.423828125, 9.2080078125, 10.9921875, 12.7763671875, 14.560546875, 16.3447265625, 18.12890625, 19.9130859375, 21.697265625, 23.4814453125, 25.265625, 27.0498046875, 28.833984375, 30.6181640625, 32.40234375, 34.1865234375, 35.970703125, 37.7548828125, 39.5390625, 41.3232421875, 43.107421875, 44.8916015625, 46.67578125, 48.4599609375, 50.244140625, 52.0283203125, 53.8125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 6.0, 5.0, 4.0, 5.0, 9.0, 7.0, 9.0, 7.0, 12.0, 11.0, 17.0, 17.0, 25.0, 28.0, 49.0, 79.0, 178.0, 327.0, 641.0, 879.0, 764.0, 422.0, 222.0, 129.0, 69.0, 26.0, 21.0, 18.0, 14.0, 14.0, 12.0, 5.0, 5.0, 8.0, 7.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-35.40625, -34.38671875, -33.3671875, -32.34765625, -31.328125, -30.30859375, -29.2890625, -28.26953125, -27.25, -26.23046875, -25.2109375, -24.19140625, -23.171875, -22.15234375, -21.1328125, -20.11328125, -19.09375, -18.07421875, -17.0546875, -16.03515625, -15.015625, -13.99609375, -12.9765625, -11.95703125, -10.9375, -9.91796875, -8.8984375, -7.87890625, -6.859375, -5.83984375, -4.8203125, -3.80078125, -2.78125, -1.76171875, -0.7421875, 0.27734375, 1.296875, 2.31640625, 3.3359375, 4.35546875, 5.375, 6.39453125, 7.4140625, 8.43359375, 9.453125, 10.47265625, 11.4921875, 12.51171875, 13.53125, 14.55078125, 15.5703125, 16.58984375, 17.609375, 18.62890625, 19.6484375, 20.66796875, 21.6875, 22.70703125, 23.7265625, 24.74609375, 25.765625, 26.78515625, 27.8046875, 28.82421875, 29.84375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 0.0, 4.0, 1.0, 9.0, 7.0, 7.0, 23.0, 35.0, 75.0, 149.0, 247.0, 449.0, 839.0, 1760.0, 3441.0, 7470.0, 17801.0, 57515.0, 1956658.0, 2057528.0, 57897.0, 17732.0, 7434.0, 3519.0, 1732.0, 886.0, 478.0, 250.0, 129.0, 66.0, 57.0, 22.0, 19.0, 5.0, 9.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.65625, -59.45458984375, -57.2529296875, -55.05126953125, -52.849609375, -50.64794921875, -48.4462890625, -46.24462890625, -44.04296875, -41.84130859375, -39.6396484375, -37.43798828125, -35.236328125, -33.03466796875, -30.8330078125, -28.63134765625, -26.4296875, -24.22802734375, -22.0263671875, -19.82470703125, -17.623046875, -15.42138671875, -13.2197265625, -11.01806640625, -8.81640625, -6.61474609375, -4.4130859375, -2.21142578125, -0.009765625, 2.19189453125, 4.3935546875, 6.59521484375, 8.796875, 10.99853515625, 13.2001953125, 15.40185546875, 17.603515625, 19.80517578125, 22.0068359375, 24.20849609375, 26.41015625, 28.61181640625, 30.8134765625, 33.01513671875, 35.216796875, 37.41845703125, 39.6201171875, 41.82177734375, 44.0234375, 46.22509765625, 48.4267578125, 50.62841796875, 52.830078125, 55.03173828125, 57.2333984375, 59.43505859375, 61.63671875, 63.83837890625, 66.0400390625, 68.24169921875, 70.443359375, 72.64501953125, 74.8466796875, 77.04833984375, 79.25]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 6.0, 12.0, 17.0, 23.0, 51.0, 63.0, 101.0, 167.0, 157.0, 135.0, 75.0, 51.0, 37.0, 22.0, 14.0, 14.0, 10.0, 11.0, 5.0, 3.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.67414855957031, -104.3000717163086, -98.92598724365234, -93.55191040039062, -88.17782592773438, -82.80374908447266, -77.42967224121094, -72.05558776855469, -66.68151092529297, -61.307430267333984, -55.933349609375, -50.55927276611328, -45.1851921081543, -39.81111145019531, -34.437034606933594, -29.06295394897461, -23.688873291015625, -18.31479263305664, -12.940713882446289, -7.5666351318359375, -2.192554473876953, 3.1815261840820312, 8.55560302734375, 13.929683685302734, 19.30376434326172, 24.677845001220703, 30.051923751831055, 35.426002502441406, 40.80008316040039, 46.174163818359375, 51.548240661621094, 56.92232131958008, 62.296417236328125, 67.67049407958984, 73.0445785522461, 78.41865539550781, 83.79273986816406, 89.16681671142578, 94.5408935546875, 99.91497802734375, 105.28905487060547, 110.66313171386719, 116.03721618652344, 121.41129302978516, 126.78536987304688, 132.15945434570312, 137.53353881835938, 142.90760803222656, 148.2816925048828, 153.65577697753906, 159.02984619140625, 164.4039306640625, 169.77801513671875, 175.152099609375, 180.5261688232422, 185.90025329589844, 191.27432250976562, 196.64840698242188, 202.02247619628906, 207.3965606689453, 212.77064514160156, 218.14471435546875, 223.518798828125, 228.89288330078125, 234.2669677734375]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 7.0, 6.0, 9.0, 7.0, 8.0, 20.0, 21.0, 14.0, 21.0, 17.0, 11.0, 26.0, 28.0, 30.0, 30.0, 30.0, 42.0, 45.0, 39.0, 52.0, 43.0, 41.0, 33.0, 38.0, 35.0, 41.0, 32.0, 33.0, 33.0, 35.0, 24.0, 18.0, 16.0, 17.0, 20.0, 12.0, 13.0, 15.0, 13.0, 4.0, 9.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-88.70303344726562, -85.9404525756836, -83.17787170410156, -80.41529846191406, -77.65271759033203, -74.89013671875, -72.12755584716797, -69.36497497558594, -66.60240173339844, -63.839820861816406, -61.07724380493164, -58.31466293334961, -55.552085876464844, -52.78950500488281, -50.02692413330078, -47.26434326171875, -44.50176239013672, -41.73918151855469, -38.97660446166992, -36.21402359008789, -33.451446533203125, -30.688865661621094, -27.926284790039062, -25.163705825805664, -22.401126861572266, -19.638547897338867, -16.87596893310547, -14.113388061523438, -11.350809097290039, -8.58823013305664, -5.825649261474609, -3.063070297241211, -0.30049896240234375, 2.462080478668213, 5.2246599197387695, 7.987239837646484, 10.749818801879883, 13.512397766113281, 16.274978637695312, 19.03755760192871, 21.80013656616211, 24.562715530395508, 27.325294494628906, 30.087875366210938, 32.85045623779297, 35.613033294677734, 38.375614166259766, 41.13819122314453, 43.90077209472656, 46.663352966308594, 49.42593002319336, 52.18851089477539, 54.951087951660156, 57.71366882324219, 60.47624969482422, 63.23883056640625, 66.00140380859375, 68.76398468017578, 71.52656555175781, 74.28913879394531, 77.05171966552734, 79.81430053710938, 82.5768814086914, 85.33946228027344, 88.10204315185547]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 6.0, 2.0, 4.0, 14.0, 8.0, 18.0, 18.0, 11.0, 23.0, 21.0, 31.0, 37.0, 44.0, 26.0, 40.0, 31.0, 40.0, 58.0, 47.0, 47.0, 40.0, 44.0, 36.0, 31.0, 39.0, 36.0, 28.0, 27.0, 28.0, 27.0, 25.0, 19.0, 13.0, 15.0, 8.0, 12.0, 6.0, 9.0, 7.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.9375, -13.5235595703125, -13.109619140625, -12.6956787109375, -12.28173828125, -11.8677978515625, -11.453857421875, -11.0399169921875, -10.6259765625, -10.2120361328125, -9.798095703125, -9.3841552734375, -8.97021484375, -8.5562744140625, -8.142333984375, -7.7283935546875, -7.314453125, -6.9005126953125, -6.486572265625, -6.0726318359375, -5.65869140625, -5.2447509765625, -4.830810546875, -4.4168701171875, -4.0029296875, -3.5889892578125, -3.175048828125, -2.7611083984375, -2.34716796875, -1.9332275390625, -1.519287109375, -1.1053466796875, -0.69140625, -0.2774658203125, 0.136474609375, 0.5504150390625, 0.96435546875, 1.3782958984375, 1.792236328125, 2.2061767578125, 2.6201171875, 3.0340576171875, 3.447998046875, 3.8619384765625, 4.27587890625, 4.6898193359375, 5.103759765625, 5.5177001953125, 5.931640625, 6.3455810546875, 6.759521484375, 7.1734619140625, 7.58740234375, 8.0013427734375, 8.415283203125, 8.8292236328125, 9.2431640625, 9.6571044921875, 10.071044921875, 10.4849853515625, 10.89892578125, 11.3128662109375, 11.726806640625, 12.1407470703125, 12.5546875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 4.0, 5.0, 6.0, 16.0, 18.0, 27.0, 46.0, 68.0, 106.0, 169.0, 265.0, 363.0, 569.0, 782.0, 1159.0, 1752.0, 2398.0, 3775.0, 5636.0, 8416.0, 13411.0, 20949.0, 33847.0, 56956.0, 101411.0, 190447.0, 249411.0, 150500.0, 80700.0, 46652.0, 27766.0, 17628.0, 11219.0, 7398.0, 4822.0, 3235.0, 2176.0, 1470.0, 953.0, 671.0, 410.0, 270.0, 230.0, 150.0, 93.0, 57.0, 46.0, 48.0, 28.0, 12.0, 7.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1.490234375, -1.44549560546875, -1.4007568359375, -1.35601806640625, -1.311279296875, -1.26654052734375, -1.2218017578125, -1.17706298828125, -1.13232421875, -1.08758544921875, -1.0428466796875, -0.99810791015625, -0.953369140625, -0.90863037109375, -0.8638916015625, -0.81915283203125, -0.7744140625, -0.72967529296875, -0.6849365234375, -0.64019775390625, -0.595458984375, -0.55072021484375, -0.5059814453125, -0.46124267578125, -0.41650390625, -0.37176513671875, -0.3270263671875, -0.28228759765625, -0.237548828125, -0.19281005859375, -0.1480712890625, -0.10333251953125, -0.05859375, -0.01385498046875, 0.0308837890625, 0.07562255859375, 0.120361328125, 0.16510009765625, 0.2098388671875, 0.25457763671875, 0.29931640625, 0.34405517578125, 0.3887939453125, 0.43353271484375, 0.478271484375, 0.52301025390625, 0.5677490234375, 0.61248779296875, 0.6572265625, 0.70196533203125, 0.7467041015625, 0.79144287109375, 0.836181640625, 0.88092041015625, 0.9256591796875, 0.97039794921875, 1.01513671875, 1.05987548828125, 1.1046142578125, 1.14935302734375, 1.194091796875, 1.23883056640625, 1.2835693359375, 1.32830810546875, 1.373046875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 6.0, 15.0, 8.0, 6.0, 11.0, 9.0, 19.0, 16.0, 15.0, 18.0, 37.0, 34.0, 42.0, 40.0, 46.0, 39.0, 46.0, 46.0, 1059.0, 32.0, 55.0, 34.0, 38.0, 36.0, 42.0, 37.0, 30.0, 37.0, 30.0, 24.0, 23.0, 15.0, 21.0, 13.0, 10.0, 12.0, 3.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.28125, -7.994384765625, -7.70751953125, -7.420654296875, -7.1337890625, -6.846923828125, -6.56005859375, -6.273193359375, -5.986328125, -5.699462890625, -5.41259765625, -5.125732421875, -4.8388671875, -4.552001953125, -4.26513671875, -3.978271484375, -3.69140625, -3.404541015625, -3.11767578125, -2.830810546875, -2.5439453125, -2.257080078125, -1.97021484375, -1.683349609375, -1.396484375, -1.109619140625, -0.82275390625, -0.535888671875, -0.2490234375, 0.037841796875, 0.32470703125, 0.611572265625, 0.8984375, 1.185302734375, 1.47216796875, 1.759033203125, 2.0458984375, 2.332763671875, 2.61962890625, 2.906494140625, 3.193359375, 3.480224609375, 3.76708984375, 4.053955078125, 4.3408203125, 4.627685546875, 4.91455078125, 5.201416015625, 5.48828125, 5.775146484375, 6.06201171875, 6.348876953125, 6.6357421875, 6.922607421875, 7.20947265625, 7.496337890625, 7.783203125, 8.070068359375, 8.35693359375, 8.643798828125, 8.9306640625, 9.217529296875, 9.50439453125, 9.791259765625, 10.078125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 10.0, 6.0, 11.0, 26.0, 23.0, 34.0, 51.0, 95.0, 141.0, 208.0, 353.0, 531.0, 779.0, 1158.0, 1703.0, 2637.0, 4079.0, 6391.0, 9630.0, 15220.0, 23818.0, 39471.0, 67695.0, 122264.0, 325804.0, 1158663.0, 131262.0, 72534.0, 42149.0, 25421.0, 15888.0, 10039.0, 6544.0, 4345.0, 2797.0, 1869.0, 1224.0, 773.0, 498.0, 325.0, 210.0, 146.0, 101.0, 66.0, 51.0, 34.0, 23.0, 12.0, 16.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.861328125, -0.8352737426757812, -0.8092193603515625, -0.7831649780273438, -0.757110595703125, -0.7310562133789062, -0.7050018310546875, -0.6789474487304688, -0.65289306640625, -0.6268386840820312, -0.6007843017578125, -0.5747299194335938, -0.548675537109375, -0.5226211547851562, -0.4965667724609375, -0.47051239013671875, -0.4444580078125, -0.41840362548828125, -0.3923492431640625, -0.36629486083984375, -0.340240478515625, -0.31418609619140625, -0.2881317138671875, -0.26207733154296875, -0.23602294921875, -0.20996856689453125, -0.1839141845703125, -0.15785980224609375, -0.131805419921875, -0.10575103759765625, -0.0796966552734375, -0.05364227294921875, -0.027587890625, -0.00153350830078125, 0.0245208740234375, 0.05057525634765625, 0.076629638671875, 0.10268402099609375, 0.1287384033203125, 0.15479278564453125, 0.18084716796875, 0.20690155029296875, 0.2329559326171875, 0.25901031494140625, 0.285064697265625, 0.31111907958984375, 0.3371734619140625, 0.36322784423828125, 0.3892822265625, 0.41533660888671875, 0.4413909912109375, 0.46744537353515625, 0.493499755859375, 0.5195541381835938, 0.5456085205078125, 0.5716629028320312, 0.59771728515625, 0.6237716674804688, 0.6498260498046875, 0.6758804321289062, 0.701934814453125, 0.7279891967773438, 0.7540435791015625, 0.7800979614257812, 0.80615234375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 10.0, 10.0, 9.0, 10.0, 14.0, 15.0, 19.0, 18.0, 21.0, 22.0, 52.0, 74.0, 77.0, 117.0, 121.0, 88.0, 55.0, 52.0, 30.0, 35.0, 22.0, 18.0, 16.0, 7.0, 11.0, 10.0, 2.0, 5.0, 4.0, 8.0, 5.0, 4.0, 4.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0207366943359375, -0.02004241943359375, -0.01934814453125, -0.01865386962890625, -0.0179595947265625, -0.01726531982421875, -0.016571044921875, -0.01587677001953125, -0.0151824951171875, -0.01448822021484375, -0.0137939453125, -0.01309967041015625, -0.0124053955078125, -0.01171112060546875, -0.011016845703125, -0.01032257080078125, -0.0096282958984375, -0.00893402099609375, -0.00823974609375, -0.00754547119140625, -0.0068511962890625, -0.00615692138671875, -0.005462646484375, -0.00476837158203125, -0.0040740966796875, -0.00337982177734375, -0.002685546875, -0.00199127197265625, -0.0012969970703125, -0.00060272216796875, 9.1552734375e-05, 0.00078582763671875, 0.0014801025390625, 0.00217437744140625, 0.00286865234375, 0.00356292724609375, 0.0042572021484375, 0.00495147705078125, 0.005645751953125, 0.00634002685546875, 0.0070343017578125, 0.00772857666015625, 0.0084228515625, 0.00911712646484375, 0.0098114013671875, 0.01050567626953125, 0.011199951171875, 0.01189422607421875, 0.0125885009765625, 0.01328277587890625, 0.01397705078125, 0.01467132568359375, 0.0153656005859375, 0.01605987548828125, 0.016754150390625, 0.01744842529296875, 0.0181427001953125, 0.01883697509765625, 0.01953125, 0.02022552490234375, 0.0209197998046875, 0.02161407470703125, 0.022308349609375, 0.02300262451171875, 0.0236968994140625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 7.0, 4.0, 7.0, 8.0, 10.0, 11.0, 7.0, 19.0, 22.0, 15.0, 21.0, 24.0, 36.0, 45.0, 50.0, 88.0, 142.0, 218.0, 466.0, 1381.0, 7823.0, 170629.0, 842964.0, 20502.0, 2552.0, 650.0, 236.0, 162.0, 84.0, 67.0, 45.0, 45.0, 37.0, 30.0, 33.0, 26.0, 22.0, 12.0, 12.0, 12.0, 8.0, 4.0, 5.0, 6.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.416259765625, -0.4040870666503906, -0.39191436767578125, -0.3797416687011719, -0.3675689697265625, -0.3553962707519531, -0.34322357177734375, -0.3310508728027344, -0.318878173828125, -0.3067054748535156, -0.29453277587890625, -0.2823600769042969, -0.2701873779296875, -0.2580146789550781, -0.24584197998046875, -0.23366928100585938, -0.22149658203125, -0.20932388305664062, -0.19715118408203125, -0.18497848510742188, -0.1728057861328125, -0.16063308715820312, -0.14846038818359375, -0.13628768920898438, -0.124114990234375, -0.11194229125976562, -0.09976959228515625, -0.08759689331054688, -0.0754241943359375, -0.06325149536132812, -0.05107879638671875, -0.038906097412109375, -0.0267333984375, -0.014560699462890625, -0.00238800048828125, 0.009784698486328125, 0.0219573974609375, 0.034130096435546875, 0.04630279541015625, 0.058475494384765625, 0.070648193359375, 0.08282089233398438, 0.09499359130859375, 0.10716629028320312, 0.1193389892578125, 0.13151168823242188, 0.14368438720703125, 0.15585708618164062, 0.16802978515625, 0.18020248413085938, 0.19237518310546875, 0.20454788208007812, 0.2167205810546875, 0.22889328002929688, 0.24106597900390625, 0.2532386779785156, 0.265411376953125, 0.2775840759277344, 0.28975677490234375, 0.3019294738769531, 0.3141021728515625, 0.3262748718261719, 0.33844757080078125, 0.3506202697753906, 0.36279296875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 10.0, 16.0, 56.0, 218.0, 495.0, 120.0, 57.0, 18.0, 12.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10337348282337189, -0.09560608118772507, -0.08783868700265884, -0.08007128536701202, -0.0723038911819458, -0.06453648954629898, -0.05676908791065216, -0.04900169000029564, -0.04123429208993912, -0.033466894179582596, -0.025699494406580925, -0.017932094633579254, -0.010164696723222733, -0.002397298812866211, 0.005370102822780609, 0.01313750073313713, 0.020904898643493652, 0.028672296553850174, 0.036439694464206696, 0.044207096099853516, 0.05197449401021004, 0.05974189192056656, 0.06750929355621338, 0.0752766877412796, 0.08304408937692642, 0.09081149101257324, 0.09857888519763947, 0.10634628683328629, 0.1141136884689331, 0.12188108265399933, 0.12964847683906555, 0.13741588592529297, 0.14518329501152039, 0.1529506891965866, 0.16071809828281403, 0.16848549246788025, 0.17625288665294647, 0.1840202808380127, 0.1917876899242401, 0.19955508410930634, 0.20732247829437256, 0.21508987247943878, 0.2228572815656662, 0.23062467575073242, 0.23839206993579865, 0.24615946412086487, 0.2539268732070923, 0.2616942822933197, 0.2694616913795471, 0.27722910046577454, 0.28499647974967957, 0.292763888835907, 0.3005312979221344, 0.30829867720603943, 0.31606608629226685, 0.32383349537849426, 0.3316008746623993, 0.3393682837486267, 0.34713566303253174, 0.35490307211875916, 0.3626704812049866, 0.3704378604888916, 0.378205269575119, 0.38597267866134644, 0.39374005794525146]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 1.0, 6.0, 4.0, 4.0, 6.0, 16.0, 9.0, 10.0, 12.0, 17.0, 12.0, 22.0, 23.0, 26.0, 20.0, 22.0, 33.0, 35.0, 26.0, 38.0, 30.0, 44.0, 32.0, 30.0, 35.0, 49.0, 26.0, 36.0, 35.0, 43.0, 32.0, 15.0, 31.0, 39.0, 23.0, 20.0, 22.0, 22.0, 16.0, 17.0, 9.0, 10.0, 15.0, 9.0, 3.0, 7.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.02029484510421753, -0.01967526413500309, -0.01905568316578865, -0.01843610219657421, -0.01781652122735977, -0.017196940258145332, -0.016577359288930893, -0.015957778319716454, -0.015338197350502014, -0.014718616381287575, -0.014099035412073135, -0.013479454442858696, -0.012859873473644257, -0.012240292504429817, -0.011620711535215378, -0.011001130566000938, -0.010381549596786499, -0.00976196862757206, -0.00914238765835762, -0.00852280668914318, -0.007903225719928741, -0.007283644750714302, -0.006664063781499863, -0.006044482812285423, -0.005424901843070984, -0.0048053208738565445, -0.004185739904642105, -0.0035661589354276657, -0.0029465779662132263, -0.002326996996998787, -0.0017074160277843475, -0.0010878350585699081, -0.00046825408935546875, 0.00015132687985897064, 0.00077090784907341, 0.0013904888182878494, 0.002010069787502289, 0.002629650756716728, 0.0032492317259311676, 0.003868812695145607, 0.004488393664360046, 0.005107974633574486, 0.005727555602788925, 0.0063471365720033646, 0.006966717541217804, 0.007586298510432243, 0.008205879479646683, 0.008825460448861122, 0.009445041418075562, 0.010064622387290001, 0.01068420335650444, 0.01130378432571888, 0.011923365294933319, 0.012542946264147758, 0.013162527233362198, 0.013782108202576637, 0.014401689171791077, 0.015021270141005516, 0.015640851110219955, 0.016260432079434395, 0.016880013048648834, 0.017499594017863274, 0.018119174987077713, 0.018738755956292152, 0.019358336925506592]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 6.0, 2.0, 4.0, 14.0, 9.0, 17.0, 18.0, 12.0, 22.0, 22.0, 30.0, 37.0, 44.0, 27.0, 39.0, 33.0, 38.0, 59.0, 46.0, 47.0, 41.0, 45.0, 34.0, 32.0, 39.0, 35.0, 28.0, 27.0, 28.0, 27.0, 25.0, 19.0, 13.0, 15.0, 8.0, 12.0, 6.0, 9.0, 7.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.9296875, -13.515869140625, -13.10205078125, -12.688232421875, -12.2744140625, -11.860595703125, -11.44677734375, -11.032958984375, -10.619140625, -10.205322265625, -9.79150390625, -9.377685546875, -8.9638671875, -8.550048828125, -8.13623046875, -7.722412109375, -7.30859375, -6.894775390625, -6.48095703125, -6.067138671875, -5.6533203125, -5.239501953125, -4.82568359375, -4.411865234375, -3.998046875, -3.584228515625, -3.17041015625, -2.756591796875, -2.3427734375, -1.928955078125, -1.51513671875, -1.101318359375, -0.6875, -0.273681640625, 0.14013671875, 0.553955078125, 0.9677734375, 1.381591796875, 1.79541015625, 2.209228515625, 2.623046875, 3.036865234375, 3.45068359375, 3.864501953125, 4.2783203125, 4.692138671875, 5.10595703125, 5.519775390625, 5.93359375, 6.347412109375, 6.76123046875, 7.175048828125, 7.5888671875, 8.002685546875, 8.41650390625, 8.830322265625, 9.244140625, 9.657958984375, 10.07177734375, 10.485595703125, 10.8994140625, 11.313232421875, 11.72705078125, 12.140869140625, 12.5546875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 7.0, 11.0, 11.0, 13.0, 11.0, 25.0, 40.0, 59.0, 77.0, 174.0, 306.0, 432.0, 816.0, 1622.0, 3248.0, 7765.0, 21845.0, 71718.0, 294335.0, 486593.0, 108760.0, 31273.0, 10740.0, 4227.0, 2037.0, 1044.0, 520.0, 346.0, 194.0, 102.0, 67.0, 35.0, 32.0, 20.0, 13.0, 15.0, 7.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.8828125, -6.66192626953125, -6.4410400390625, -6.22015380859375, -5.999267578125, -5.77838134765625, -5.5574951171875, -5.33660888671875, -5.11572265625, -4.89483642578125, -4.6739501953125, -4.45306396484375, -4.232177734375, -4.01129150390625, -3.7904052734375, -3.56951904296875, -3.3486328125, -3.12774658203125, -2.9068603515625, -2.68597412109375, -2.465087890625, -2.24420166015625, -2.0233154296875, -1.80242919921875, -1.58154296875, -1.36065673828125, -1.1397705078125, -0.91888427734375, -0.697998046875, -0.47711181640625, -0.2562255859375, -0.03533935546875, 0.185546875, 0.40643310546875, 0.6273193359375, 0.84820556640625, 1.069091796875, 1.28997802734375, 1.5108642578125, 1.73175048828125, 1.95263671875, 2.17352294921875, 2.3944091796875, 2.61529541015625, 2.836181640625, 3.05706787109375, 3.2779541015625, 3.49884033203125, 3.7197265625, 3.94061279296875, 4.1614990234375, 4.38238525390625, 4.603271484375, 4.82415771484375, 5.0450439453125, 5.26593017578125, 5.48681640625, 5.70770263671875, 5.9285888671875, 6.14947509765625, 6.370361328125, 6.59124755859375, 6.8121337890625, 7.03302001953125, 7.25390625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 13.0, 6.0, 10.0, 12.0, 13.0, 21.0, 20.0, 25.0, 16.0, 25.0, 30.0, 32.0, 36.0, 34.0, 33.0, 41.0, 48.0, 61.0, 1650.0, 431.0, 65.0, 36.0, 33.0, 40.0, 30.0, 35.0, 33.0, 24.0, 34.0, 23.0, 25.0, 12.0, 20.0, 16.0, 14.0, 10.0, 7.0, 8.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.84375, -38.5146484375, -37.185546875, -35.8564453125, -34.52734375, -33.1982421875, -31.869140625, -30.5400390625, -29.2109375, -27.8818359375, -26.552734375, -25.2236328125, -23.89453125, -22.5654296875, -21.236328125, -19.9072265625, -18.578125, -17.2490234375, -15.919921875, -14.5908203125, -13.26171875, -11.9326171875, -10.603515625, -9.2744140625, -7.9453125, -6.6162109375, -5.287109375, -3.9580078125, -2.62890625, -1.2998046875, 0.029296875, 1.3583984375, 2.6875, 4.0166015625, 5.345703125, 6.6748046875, 8.00390625, 9.3330078125, 10.662109375, 11.9912109375, 13.3203125, 14.6494140625, 15.978515625, 17.3076171875, 18.63671875, 19.9658203125, 21.294921875, 22.6240234375, 23.953125, 25.2822265625, 26.611328125, 27.9404296875, 29.26953125, 30.5986328125, 31.927734375, 33.2568359375, 34.5859375, 35.9150390625, 37.244140625, 38.5732421875, 39.90234375, 41.2314453125, 42.560546875, 43.8896484375, 45.21875]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 3.0, 8.0, 10.0, 9.0, 16.0, 14.0, 27.0, 17.0, 30.0, 27.0, 61.0, 70.0, 78.0, 108.0, 136.0, 191.0, 270.0, 492.0, 1531.0, 64718.0, 3071773.0, 4114.0, 759.0, 355.0, 187.0, 143.0, 119.0, 104.0, 70.0, 60.0, 37.0, 29.0, 37.0, 20.0, 15.0, 13.0, 16.0, 7.0, 7.0, 10.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-80.75, -78.390625, -76.03125, -73.671875, -71.3125, -68.953125, -66.59375, -64.234375, -61.875, -59.515625, -57.15625, -54.796875, -52.4375, -50.078125, -47.71875, -45.359375, -43.0, -40.640625, -38.28125, -35.921875, -33.5625, -31.203125, -28.84375, -26.484375, -24.125, -21.765625, -19.40625, -17.046875, -14.6875, -12.328125, -9.96875, -7.609375, -5.25, -2.890625, -0.53125, 1.828125, 4.1875, 6.546875, 8.90625, 11.265625, 13.625, 15.984375, 18.34375, 20.703125, 23.0625, 25.421875, 27.78125, 30.140625, 32.5, 34.859375, 37.21875, 39.578125, 41.9375, 44.296875, 46.65625, 49.015625, 51.375, 53.734375, 56.09375, 58.453125, 60.8125, 63.171875, 65.53125, 67.890625, 70.25]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 12.0, 24.0, 103.0, 255.0, 284.0, 207.0, 88.0, 30.0, 8.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.617923736572266, -20.640039443969727, -18.662155151367188, -16.684268951416016, -14.706384658813477, -12.728500366210938, -10.750615119934082, -8.772729873657227, -6.7948455810546875, -4.81696081161499, -2.839076042175293, -0.8611912727355957, 1.1166934967041016, 3.0945777893066406, 5.072463035583496, 7.050348281860352, 9.02823257446289, 11.00611686706543, 12.984002113342285, 14.96188735961914, 16.93977165222168, 18.91765594482422, 20.89554214477539, 22.87342643737793, 24.85131072998047, 26.829195022583008, 28.807079315185547, 30.78496551513672, 32.762847900390625, 34.7407341003418, 36.71862030029297, 38.696502685546875, 40.67439270019531, 42.652278900146484, 44.63016128540039, 46.60804748535156, 48.58592987060547, 50.56381607055664, 52.54170227050781, 54.51958465576172, 56.49747085571289, 58.47535705566406, 60.45323944091797, 62.43112564086914, 64.40901184082031, 66.38689422607422, 68.36477661132812, 70.34266662597656, 72.32054901123047, 74.29843139648438, 76.27632141113281, 78.25420379638672, 80.23208618164062, 82.20997619628906, 84.18785858154297, 86.16574096679688, 88.14363098144531, 90.12151336669922, 92.09940338134766, 94.07728576660156, 96.05516815185547, 98.03305053710938, 100.01094055175781, 101.98882293701172, 103.96670532226562]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 7.0, 1.0, 10.0, 5.0, 8.0, 6.0, 13.0, 15.0, 10.0, 22.0, 29.0, 16.0, 29.0, 24.0, 27.0, 34.0, 41.0, 44.0, 33.0, 38.0, 45.0, 49.0, 37.0, 43.0, 39.0, 42.0, 25.0, 36.0, 31.0, 28.0, 33.0, 27.0, 21.0, 32.0, 16.0, 18.0, 17.0, 8.0, 11.0, 12.0, 6.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-128.55751037597656, -124.38248443603516, -120.20745086669922, -116.03242492675781, -111.85739135742188, -107.68236541748047, -103.50733947753906, -99.33230590820312, -95.15727996826172, -90.98225402832031, -86.80722045898438, -82.63219451904297, -78.45716857910156, -74.28213500976562, -70.10710906982422, -65.93208312988281, -61.757049560546875, -57.5820198059082, -53.40699005126953, -49.231964111328125, -45.05693435668945, -40.88190460205078, -36.706878662109375, -32.5318489074707, -28.35681915283203, -24.18178939819336, -20.00676155090332, -15.831732749938965, -11.65670394897461, -7.4816741943359375, -3.3066463470458984, 0.8683815002441406, 5.043426513671875, 9.21845531463623, 13.393484115600586, 17.568511962890625, 21.743541717529297, 25.91857147216797, 30.093599319458008, 34.26862716674805, 38.44365692138672, 42.61868667602539, 46.79371643066406, 50.96874237060547, 55.14377212524414, 59.31880187988281, 63.49382781982422, 67.66885375976562, 71.84388732910156, 76.01891326904297, 80.1939468383789, 84.36897277832031, 88.54400634765625, 92.71903228759766, 96.89405822753906, 101.069091796875, 105.2441177368164, 109.41914367675781, 113.59417724609375, 117.76920318603516, 121.94422912597656, 126.1192626953125, 130.29429626464844, 134.4693145751953, 138.64434814453125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 3.0, 5.0, 5.0, 7.0, 9.0, 14.0, 13.0, 20.0, 15.0, 23.0, 28.0, 26.0, 35.0, 47.0, 25.0, 40.0, 33.0, 46.0, 59.0, 51.0, 34.0, 49.0, 35.0, 34.0, 34.0, 39.0, 38.0, 23.0, 32.0, 26.0, 28.0, 23.0, 15.0, 12.0, 11.0, 12.0, 8.0, 10.0, 7.0, 10.0, 3.0, 4.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.0546875, -13.6337890625, -13.212890625, -12.7919921875, -12.37109375, -11.9501953125, -11.529296875, -11.1083984375, -10.6875, -10.2666015625, -9.845703125, -9.4248046875, -9.00390625, -8.5830078125, -8.162109375, -7.7412109375, -7.3203125, -6.8994140625, -6.478515625, -6.0576171875, -5.63671875, -5.2158203125, -4.794921875, -4.3740234375, -3.953125, -3.5322265625, -3.111328125, -2.6904296875, -2.26953125, -1.8486328125, -1.427734375, -1.0068359375, -0.5859375, -0.1650390625, 0.255859375, 0.6767578125, 1.09765625, 1.5185546875, 1.939453125, 2.3603515625, 2.78125, 3.2021484375, 3.623046875, 4.0439453125, 4.46484375, 4.8857421875, 5.306640625, 5.7275390625, 6.1484375, 6.5693359375, 6.990234375, 7.4111328125, 7.83203125, 8.2529296875, 8.673828125, 9.0947265625, 9.515625, 9.9365234375, 10.357421875, 10.7783203125, 11.19921875, 11.6201171875, 12.041015625, 12.4619140625, 12.8828125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 7.0, 7.0, 8.0, 12.0, 15.0, 22.0, 29.0, 34.0, 45.0, 80.0, 118.0, 161.0, 236.0, 417.0, 830.0, 1586.0, 3121.0, 7385.0, 24870.0, 2289261.0, 1828677.0, 23115.0, 7147.0, 3138.0, 1679.0, 930.0, 502.0, 263.0, 156.0, 128.0, 87.0, 66.0, 38.0, 28.0, 19.0, 12.0, 20.0, 12.0, 11.0, 2.0, 8.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.125, -64.234375, -62.34375, -60.453125, -58.5625, -56.671875, -54.78125, -52.890625, -51.0, -49.109375, -47.21875, -45.328125, -43.4375, -41.546875, -39.65625, -37.765625, -35.875, -33.984375, -32.09375, -30.203125, -28.3125, -26.421875, -24.53125, -22.640625, -20.75, -18.859375, -16.96875, -15.078125, -13.1875, -11.296875, -9.40625, -7.515625, -5.625, -3.734375, -1.84375, 0.046875, 1.9375, 3.828125, 5.71875, 7.609375, 9.5, 11.390625, 13.28125, 15.171875, 17.0625, 18.953125, 20.84375, 22.734375, 24.625, 26.515625, 28.40625, 30.296875, 32.1875, 34.078125, 35.96875, 37.859375, 39.75, 41.640625, 43.53125, 45.421875, 47.3125, 49.203125, 51.09375, 52.984375, 54.875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 12.0, 7.0, 13.0, 18.0, 12.0, 33.0, 44.0, 64.0, 118.0, 292.0, 626.0, 1064.0, 865.0, 422.0, 202.0, 90.0, 49.0, 36.0, 21.0, 14.0, 12.0, 7.0, 7.0, 9.0, 3.0, 6.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.125, -36.92578125, -35.7265625, -34.52734375, -33.328125, -32.12890625, -30.9296875, -29.73046875, -28.53125, -27.33203125, -26.1328125, -24.93359375, -23.734375, -22.53515625, -21.3359375, -20.13671875, -18.9375, -17.73828125, -16.5390625, -15.33984375, -14.140625, -12.94140625, -11.7421875, -10.54296875, -9.34375, -8.14453125, -6.9453125, -5.74609375, -4.546875, -3.34765625, -2.1484375, -0.94921875, 0.25, 1.44921875, 2.6484375, 3.84765625, 5.046875, 6.24609375, 7.4453125, 8.64453125, 9.84375, 11.04296875, 12.2421875, 13.44140625, 14.640625, 15.83984375, 17.0390625, 18.23828125, 19.4375, 20.63671875, 21.8359375, 23.03515625, 24.234375, 25.43359375, 26.6328125, 27.83203125, 29.03125, 30.23046875, 31.4296875, 32.62890625, 33.828125, 35.02734375, 36.2265625, 37.42578125, 38.625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 10.0, 7.0, 11.0, 13.0, 35.0, 51.0, 66.0, 113.0, 186.0, 282.0, 480.0, 763.0, 1284.0, 2206.0, 4084.0, 8124.0, 18193.0, 56896.0, 931847.0, 3030367.0, 93566.0, 24080.0, 10158.0, 4860.0, 2772.0, 1513.0, 869.0, 542.0, 336.0, 203.0, 139.0, 72.0, 52.0, 33.0, 25.0, 17.0, 12.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.0625, -53.349609375, -51.63671875, -49.923828125, -48.2109375, -46.498046875, -44.78515625, -43.072265625, -41.359375, -39.646484375, -37.93359375, -36.220703125, -34.5078125, -32.794921875, -31.08203125, -29.369140625, -27.65625, -25.943359375, -24.23046875, -22.517578125, -20.8046875, -19.091796875, -17.37890625, -15.666015625, -13.953125, -12.240234375, -10.52734375, -8.814453125, -7.1015625, -5.388671875, -3.67578125, -1.962890625, -0.25, 1.462890625, 3.17578125, 4.888671875, 6.6015625, 8.314453125, 10.02734375, 11.740234375, 13.453125, 15.166015625, 16.87890625, 18.591796875, 20.3046875, 22.017578125, 23.73046875, 25.443359375, 27.15625, 28.869140625, 30.58203125, 32.294921875, 34.0078125, 35.720703125, 37.43359375, 39.146484375, 40.859375, 42.572265625, 44.28515625, 45.998046875, 47.7109375, 49.423828125, 51.13671875, 52.849609375, 54.5625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 9.0, 13.0, 21.0, 21.0, 36.0, 65.0, 80.0, 130.0, 165.0, 150.0, 97.0, 58.0, 40.0, 24.0, 16.0, 19.0, 8.0, 10.0, 9.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.1263427734375, -152.4529266357422, -147.7794952392578, -143.1060791015625, -138.43264770507812, -133.7592315673828, -129.0858154296875, -124.41238403320312, -119.73896789550781, -115.06554412841797, -110.39212036132812, -105.71870422363281, -101.04528045654297, -96.37185668945312, -91.69843292236328, -87.02500915527344, -82.3515853881836, -77.67816162109375, -73.0047378540039, -68.33131408691406, -63.65789794921875, -58.984474182128906, -54.31105041503906, -49.637630462646484, -44.96420669555664, -40.2907829284668, -35.61736297607422, -30.943939208984375, -26.270517349243164, -21.597095489501953, -16.92367172241211, -12.250251770019531, -7.5768280029296875, -2.9034056663513184, 1.7700166702270508, 6.443439483642578, 11.116861343383789, 15.790283203125, 20.463706970214844, 25.137126922607422, 29.810550689697266, 34.48397445678711, 39.15739440917969, 43.83081817626953, 48.504241943359375, 53.17766189575195, 57.8510856628418, 62.524505615234375, 67.19792938232422, 71.87135314941406, 76.5447769165039, 81.21820068359375, 85.89161682128906, 90.5650405883789, 95.23846435546875, 99.91188049316406, 104.58531188964844, 109.25873565673828, 113.93215942382812, 118.60557556152344, 123.27899932861328, 127.95242309570312, 132.6258544921875, 137.2992706298828, 141.97268676757812]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 12.0, 15.0, 13.0, 16.0, 16.0, 21.0, 17.0, 36.0, 39.0, 35.0, 36.0, 36.0, 60.0, 39.0, 44.0, 49.0, 38.0, 41.0, 42.0, 41.0, 40.0, 56.0, 31.0, 30.0, 28.0, 23.0, 17.0, 23.0, 22.0, 9.0, 17.0, 16.0, 9.0, 10.0, 8.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.65242004394531, -82.71452331542969, -79.77661895751953, -76.8387222290039, -73.90081787109375, -70.96292114257812, -68.0250244140625, -65.08712005615234, -62.14921951293945, -59.21131896972656, -56.27341842651367, -53.33551788330078, -50.397621154785156, -47.459716796875, -44.521820068359375, -41.583919525146484, -38.646018981933594, -35.7081184387207, -32.77021789550781, -29.832319259643555, -26.894418716430664, -23.956518173217773, -21.018619537353516, -18.080718994140625, -15.142818450927734, -12.204917907714844, -9.26701831817627, -6.329118728637695, -3.3912181854248047, -0.45331764221191406, 2.4845809936523438, 5.422481536865234, 8.360374450683594, 11.298274993896484, 14.236174583435059, 17.174074172973633, 20.111974716186523, 23.049875259399414, 25.987773895263672, 28.925674438476562, 31.863574981689453, 34.801475524902344, 37.739376068115234, 40.677276611328125, 43.61517333984375, 46.553077697753906, 49.49097442626953, 52.42887496948242, 55.36677551269531, 58.3046760559082, 61.242576599121094, 64.18047332763672, 67.11837768554688, 70.0562744140625, 72.99417114257812, 75.93207550048828, 78.86997985839844, 81.80787658691406, 84.74578094482422, 87.68367767333984, 90.62158203125, 93.55947875976562, 96.49737548828125, 99.4352798461914, 102.37317657470703]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 7.0, 6.0, 9.0, 7.0, 9.0, 13.0, 24.0, 17.0, 16.0, 20.0, 29.0, 34.0, 30.0, 36.0, 31.0, 44.0, 47.0, 49.0, 44.0, 47.0, 55.0, 32.0, 37.0, 53.0, 50.0, 23.0, 29.0, 29.0, 30.0, 20.0, 20.0, 16.0, 13.0, 15.0, 19.0, 13.0, 7.0, 5.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.5078125, -14.0758056640625, -13.643798828125, -13.2117919921875, -12.77978515625, -12.3477783203125, -11.915771484375, -11.4837646484375, -11.0517578125, -10.6197509765625, -10.187744140625, -9.7557373046875, -9.32373046875, -8.8917236328125, -8.459716796875, -8.0277099609375, -7.595703125, -7.1636962890625, -6.731689453125, -6.2996826171875, -5.86767578125, -5.4356689453125, -5.003662109375, -4.5716552734375, -4.1396484375, -3.7076416015625, -3.275634765625, -2.8436279296875, -2.41162109375, -1.9796142578125, -1.547607421875, -1.1156005859375, -0.68359375, -0.2515869140625, 0.180419921875, 0.6124267578125, 1.04443359375, 1.4764404296875, 1.908447265625, 2.3404541015625, 2.7724609375, 3.2044677734375, 3.636474609375, 4.0684814453125, 4.50048828125, 4.9324951171875, 5.364501953125, 5.7965087890625, 6.228515625, 6.6605224609375, 7.092529296875, 7.5245361328125, 7.95654296875, 8.3885498046875, 8.820556640625, 9.2525634765625, 9.6845703125, 10.1165771484375, 10.548583984375, 10.9805908203125, 11.41259765625, 11.8446044921875, 12.276611328125, 12.7086181640625, 13.140625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 11.0, 15.0, 19.0, 19.0, 47.0, 62.0, 92.0, 160.0, 226.0, 347.0, 516.0, 808.0, 1274.0, 1894.0, 3005.0, 4650.0, 7343.0, 11551.0, 18735.0, 31086.0, 53804.0, 101014.0, 199439.0, 267719.0, 154495.0, 78863.0, 43218.0, 25488.0, 15359.0, 9957.0, 6070.0, 3967.0, 2606.0, 1674.0, 1044.0, 696.0, 417.0, 314.0, 179.0, 123.0, 81.0, 59.0, 37.0, 27.0, 17.0, 13.0, 7.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5966796875, -1.545684814453125, -1.49468994140625, -1.443695068359375, -1.3927001953125, -1.341705322265625, -1.29071044921875, -1.239715576171875, -1.188720703125, -1.137725830078125, -1.08673095703125, -1.035736083984375, -0.9847412109375, -0.933746337890625, -0.88275146484375, -0.831756591796875, -0.78076171875, -0.729766845703125, -0.67877197265625, -0.627777099609375, -0.5767822265625, -0.525787353515625, -0.47479248046875, -0.423797607421875, -0.372802734375, -0.321807861328125, -0.27081298828125, -0.219818115234375, -0.1688232421875, -0.117828369140625, -0.06683349609375, -0.015838623046875, 0.03515625, 0.086151123046875, 0.13714599609375, 0.188140869140625, 0.2391357421875, 0.290130615234375, 0.34112548828125, 0.392120361328125, 0.443115234375, 0.494110107421875, 0.54510498046875, 0.596099853515625, 0.6470947265625, 0.698089599609375, 0.74908447265625, 0.800079345703125, 0.85107421875, 0.902069091796875, 0.95306396484375, 1.004058837890625, 1.0550537109375, 1.106048583984375, 1.15704345703125, 1.208038330078125, 1.259033203125, 1.310028076171875, 1.36102294921875, 1.412017822265625, 1.4630126953125, 1.514007568359375, 1.56500244140625, 1.615997314453125, 1.6669921875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 7.0, 12.0, 1.0, 11.0, 13.0, 9.0, 19.0, 19.0, 14.0, 14.0, 28.0, 25.0, 33.0, 25.0, 35.0, 27.0, 41.0, 28.0, 24.0, 33.0, 41.0, 1070.0, 44.0, 36.0, 37.0, 40.0, 28.0, 35.0, 31.0, 24.0, 32.0, 35.0, 23.0, 21.0, 15.0, 16.0, 9.0, 15.0, 6.0, 6.0, 9.0, 10.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.0703125, -6.8367919921875, -6.603271484375, -6.3697509765625, -6.13623046875, -5.9027099609375, -5.669189453125, -5.4356689453125, -5.2021484375, -4.9686279296875, -4.735107421875, -4.5015869140625, -4.26806640625, -4.0345458984375, -3.801025390625, -3.5675048828125, -3.333984375, -3.1004638671875, -2.866943359375, -2.6334228515625, -2.39990234375, -2.1663818359375, -1.932861328125, -1.6993408203125, -1.4658203125, -1.2322998046875, -0.998779296875, -0.7652587890625, -0.53173828125, -0.2982177734375, -0.064697265625, 0.1688232421875, 0.40234375, 0.6358642578125, 0.869384765625, 1.1029052734375, 1.33642578125, 1.5699462890625, 1.803466796875, 2.0369873046875, 2.2705078125, 2.5040283203125, 2.737548828125, 2.9710693359375, 3.20458984375, 3.4381103515625, 3.671630859375, 3.9051513671875, 4.138671875, 4.3721923828125, 4.605712890625, 4.8392333984375, 5.07275390625, 5.3062744140625, 5.539794921875, 5.7733154296875, 6.0068359375, 6.2403564453125, 6.473876953125, 6.7073974609375, 6.94091796875, 7.1744384765625, 7.407958984375, 7.6414794921875, 7.875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 12.0, 11.0, 19.0, 22.0, 28.0, 53.0, 87.0, 132.0, 235.0, 316.0, 505.0, 750.0, 1246.0, 1986.0, 2771.0, 4439.0, 6654.0, 10150.0, 15848.0, 24633.0, 40037.0, 68162.0, 119303.0, 260851.0, 1204070.0, 135753.0, 76914.0, 44762.0, 27460.0, 17520.0, 11225.0, 7361.0, 4905.0, 3044.0, 2113.0, 1365.0, 848.0, 526.0, 369.0, 230.0, 167.0, 90.0, 67.0, 36.0, 20.0, 18.0, 8.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75927734375, -0.7356338500976562, -0.7119903564453125, -0.6883468627929688, -0.664703369140625, -0.6410598754882812, -0.6174163818359375, -0.5937728881835938, -0.57012939453125, -0.5464859008789062, -0.5228424072265625, -0.49919891357421875, -0.475555419921875, -0.45191192626953125, -0.4282684326171875, -0.40462493896484375, -0.3809814453125, -0.35733795166015625, -0.3336944580078125, -0.31005096435546875, -0.286407470703125, -0.26276397705078125, -0.2391204833984375, -0.21547698974609375, -0.19183349609375, -0.16819000244140625, -0.1445465087890625, -0.12090301513671875, -0.097259521484375, -0.07361602783203125, -0.0499725341796875, -0.02632904052734375, -0.002685546875, 0.02095794677734375, 0.0446014404296875, 0.06824493408203125, 0.091888427734375, 0.11553192138671875, 0.1391754150390625, 0.16281890869140625, 0.18646240234375, 0.21010589599609375, 0.2337493896484375, 0.25739288330078125, 0.281036376953125, 0.30467987060546875, 0.3283233642578125, 0.35196685791015625, 0.3756103515625, 0.39925384521484375, 0.4228973388671875, 0.44654083251953125, 0.470184326171875, 0.49382781982421875, 0.5174713134765625, 0.5411148071289062, 0.56475830078125, 0.5884017944335938, 0.6120452880859375, 0.6356887817382812, 0.659332275390625, 0.6829757690429688, 0.7066192626953125, 0.7302627563476562, 0.75390625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 1.0, 6.0, 6.0, 12.0, 11.0, 14.0, 14.0, 18.0, 48.0, 46.0, 51.0, 59.0, 76.0, 104.0, 76.0, 78.0, 68.0, 66.0, 67.0, 42.0, 33.0, 28.0, 13.0, 12.0, 5.0, 11.0, 8.0, 4.0, 4.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022979736328125, -0.02219676971435547, -0.021413803100585938, -0.020630836486816406, -0.019847869873046875, -0.019064903259277344, -0.018281936645507812, -0.01749897003173828, -0.01671600341796875, -0.01593303680419922, -0.015150070190429688, -0.014367103576660156, -0.013584136962890625, -0.012801170349121094, -0.012018203735351562, -0.011235237121582031, -0.0104522705078125, -0.009669303894042969, -0.008886337280273438, -0.008103370666503906, -0.007320404052734375, -0.006537437438964844, -0.0057544708251953125, -0.004971504211425781, -0.00418853759765625, -0.0034055709838867188, -0.0026226043701171875, -0.0018396377563476562, -0.001056671142578125, -0.00027370452880859375, 0.0005092620849609375, 0.0012922286987304688, 0.0020751953125, 0.0028581619262695312, 0.0036411285400390625, 0.004424095153808594, 0.005207061767578125, 0.005990028381347656, 0.0067729949951171875, 0.007555961608886719, 0.00833892822265625, 0.009121894836425781, 0.009904861450195312, 0.010687828063964844, 0.011470794677734375, 0.012253761291503906, 0.013036727905273438, 0.013819694519042969, 0.0146026611328125, 0.015385627746582031, 0.016168594360351562, 0.016951560974121094, 0.017734527587890625, 0.018517494201660156, 0.019300460815429688, 0.02008342742919922, 0.02086639404296875, 0.02164936065673828, 0.022432327270507812, 0.023215293884277344, 0.023998260498046875, 0.024781227111816406, 0.025564193725585938, 0.02634716033935547, 0.027130126953125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 2.0, 17.0, 20.0, 23.0, 33.0, 36.0, 33.0, 71.0, 90.0, 123.0, 242.0, 436.0, 1011.0, 3184.0, 23254.0, 909347.0, 101162.0, 6413.0, 1591.0, 591.0, 303.0, 160.0, 132.0, 66.0, 48.0, 32.0, 33.0, 18.0, 16.0, 12.0, 8.0, 10.0, 5.0, 3.0, 2.0, 6.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.466552734375, -0.4522895812988281, -0.43802642822265625, -0.4237632751464844, -0.4095001220703125, -0.3952369689941406, -0.38097381591796875, -0.3667106628417969, -0.352447509765625, -0.3381843566894531, -0.32392120361328125, -0.3096580505371094, -0.2953948974609375, -0.2811317443847656, -0.26686859130859375, -0.2526054382324219, -0.23834228515625, -0.22407913208007812, -0.20981597900390625, -0.19555282592773438, -0.1812896728515625, -0.16702651977539062, -0.15276336669921875, -0.13850021362304688, -0.124237060546875, -0.10997390747070312, -0.09571075439453125, -0.08144760131835938, -0.0671844482421875, -0.052921295166015625, -0.03865814208984375, -0.024394989013671875, -0.0101318359375, 0.004131317138671875, 0.01839447021484375, 0.032657623291015625, 0.0469207763671875, 0.061183929443359375, 0.07544708251953125, 0.08971023559570312, 0.103973388671875, 0.11823654174804688, 0.13249969482421875, 0.14676284790039062, 0.1610260009765625, 0.17528915405273438, 0.18955230712890625, 0.20381546020507812, 0.21807861328125, 0.23234176635742188, 0.24660491943359375, 0.2608680725097656, 0.2751312255859375, 0.2893943786621094, 0.30365753173828125, 0.3179206848144531, 0.332183837890625, 0.3464469909667969, 0.36071014404296875, 0.3749732971191406, 0.3892364501953125, 0.4034996032714844, 0.41776275634765625, 0.4320259094238281, 0.4462890625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 10.0, 28.0, 68.0, 203.0, 412.0, 153.0, 63.0, 33.0, 12.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0875474140048027, -0.0810135081410408, -0.0744796097278595, -0.0679457038640976, -0.06141179800033569, -0.05487789586186409, -0.04834399372339249, -0.041810087859630585, -0.03527618572115898, -0.02874228172004223, -0.022208377718925476, -0.015674475580453873, -0.00914057157933712, -0.0026066675782203674, 0.003927234560251236, 0.010461140424013138, 0.01699504256248474, 0.023528946563601494, 0.030062850564718246, 0.03659675270318985, 0.04313065856695175, 0.049664560705423355, 0.05619846284389496, 0.06273236870765686, 0.06926627457141876, 0.07580018043518066, 0.08233407884836197, 0.08886798471212387, 0.09540189057588577, 0.10193578898906708, 0.10846969485282898, 0.11500360071659088, 0.12153749167919159, 0.1280713975429535, 0.1346053034067154, 0.1411392092704773, 0.147673100233078, 0.1542070060968399, 0.1607409119606018, 0.1672748178243637, 0.1738087236881256, 0.1803426295518875, 0.18687653541564941, 0.19341042637825012, 0.19994433224201202, 0.20647823810577393, 0.21301214396953583, 0.21954604983329773, 0.22607994079589844, 0.23261384665966034, 0.23914775252342224, 0.24568164348602295, 0.25221556425094604, 0.25874945521354675, 0.26528334617614746, 0.27181726694107056, 0.27835118770599365, 0.28488507866859436, 0.29141899943351746, 0.29795289039611816, 0.30448681116104126, 0.31102070212364197, 0.3175545930862427, 0.32408851385116577, 0.3306224048137665]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 7.0, 12.0, 13.0, 15.0, 11.0, 14.0, 20.0, 17.0, 17.0, 16.0, 23.0, 26.0, 37.0, 28.0, 39.0, 44.0, 39.0, 31.0, 43.0, 44.0, 42.0, 37.0, 38.0, 34.0, 34.0, 33.0, 34.0, 33.0, 24.0, 18.0, 32.0, 25.0, 18.0, 17.0, 17.0, 17.0, 11.0, 7.0, 7.0, 7.0, 5.0, 5.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.027836382389068604, -0.027014771476387978, -0.02619316056370735, -0.025371549651026726, -0.0245499387383461, -0.023728327825665474, -0.022906716912984848, -0.022085106000304222, -0.021263495087623596, -0.02044188417494297, -0.019620273262262344, -0.01879866234958172, -0.017977051436901093, -0.017155440524220467, -0.01633382961153984, -0.015512218698859215, -0.014690607786178589, -0.013868996873497963, -0.013047385960817337, -0.012225775048136711, -0.011404164135456085, -0.01058255322277546, -0.009760942310094833, -0.008939331397414207, -0.008117720484733582, -0.007296109572052956, -0.00647449865937233, -0.005652887746691704, -0.004831276834011078, -0.004009665921330452, -0.003188055008649826, -0.0023664440959692, -0.0015448331832885742, -0.0007232222706079483, 9.838864207267761e-05, 0.0009199995547533035, 0.0017416104674339294, 0.0025632213801145554, 0.0033848322927951813, 0.004206443205475807, 0.005028054118156433, 0.005849665030837059, 0.006671275943517685, 0.007492886856198311, 0.008314497768878937, 0.009136108681559563, 0.009957719594240189, 0.010779330506920815, 0.01160094141960144, 0.012422552332282066, 0.013244163244962692, 0.014065774157643318, 0.014887385070323944, 0.01570899598300457, 0.016530606895685196, 0.017352217808365822, 0.018173828721046448, 0.018995439633727074, 0.0198170505464077, 0.020638661459088326, 0.02146027237176895, 0.022281883284449577, 0.023103494197130203, 0.02392510510981083, 0.024746716022491455]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 7.0, 6.0, 9.0, 7.0, 7.0, 15.0, 24.0, 16.0, 17.0, 19.0, 30.0, 34.0, 30.0, 35.0, 32.0, 44.0, 47.0, 49.0, 44.0, 47.0, 55.0, 31.0, 38.0, 53.0, 48.0, 25.0, 28.0, 30.0, 30.0, 20.0, 20.0, 16.0, 13.0, 15.0, 19.0, 13.0, 7.0, 5.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.515625, -14.08349609375, -13.6513671875, -13.21923828125, -12.787109375, -12.35498046875, -11.9228515625, -11.49072265625, -11.05859375, -10.62646484375, -10.1943359375, -9.76220703125, -9.330078125, -8.89794921875, -8.4658203125, -8.03369140625, -7.6015625, -7.16943359375, -6.7373046875, -6.30517578125, -5.873046875, -5.44091796875, -5.0087890625, -4.57666015625, -4.14453125, -3.71240234375, -3.2802734375, -2.84814453125, -2.416015625, -1.98388671875, -1.5517578125, -1.11962890625, -0.6875, -0.25537109375, 0.1767578125, 0.60888671875, 1.041015625, 1.47314453125, 1.9052734375, 2.33740234375, 2.76953125, 3.20166015625, 3.6337890625, 4.06591796875, 4.498046875, 4.93017578125, 5.3623046875, 5.79443359375, 6.2265625, 6.65869140625, 7.0908203125, 7.52294921875, 7.955078125, 8.38720703125, 8.8193359375, 9.25146484375, 9.68359375, 10.11572265625, 10.5478515625, 10.97998046875, 11.412109375, 11.84423828125, 12.2763671875, 12.70849609375, 13.140625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 10.0, 17.0, 20.0, 26.0, 45.0, 46.0, 70.0, 100.0, 157.0, 227.0, 332.0, 639.0, 1069.0, 2064.0, 4333.0, 10008.0, 26216.0, 75178.0, 251741.0, 449274.0, 148791.0, 47257.0, 17170.0, 6853.0, 3075.0, 1561.0, 850.0, 498.0, 311.0, 174.0, 114.0, 93.0, 68.0, 49.0, 27.0, 17.0, 18.0, 14.0, 13.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.5390625, -7.298095703125, -7.05712890625, -6.816162109375, -6.5751953125, -6.334228515625, -6.09326171875, -5.852294921875, -5.611328125, -5.370361328125, -5.12939453125, -4.888427734375, -4.6474609375, -4.406494140625, -4.16552734375, -3.924560546875, -3.68359375, -3.442626953125, -3.20166015625, -2.960693359375, -2.7197265625, -2.478759765625, -2.23779296875, -1.996826171875, -1.755859375, -1.514892578125, -1.27392578125, -1.032958984375, -0.7919921875, -0.551025390625, -0.31005859375, -0.069091796875, 0.171875, 0.412841796875, 0.65380859375, 0.894775390625, 1.1357421875, 1.376708984375, 1.61767578125, 1.858642578125, 2.099609375, 2.340576171875, 2.58154296875, 2.822509765625, 3.0634765625, 3.304443359375, 3.54541015625, 3.786376953125, 4.02734375, 4.268310546875, 4.50927734375, 4.750244140625, 4.9912109375, 5.232177734375, 5.47314453125, 5.714111328125, 5.955078125, 6.196044921875, 6.43701171875, 6.677978515625, 6.9189453125, 7.159912109375, 7.40087890625, 7.641845703125, 7.8828125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 7.0, 7.0, 16.0, 16.0, 14.0, 21.0, 18.0, 21.0, 24.0, 24.0, 38.0, 32.0, 40.0, 52.0, 37.0, 49.0, 58.0, 130.0, 1807.0, 148.0, 76.0, 40.0, 35.0, 37.0, 33.0, 34.0, 36.0, 43.0, 27.0, 16.0, 14.0, 20.0, 9.0, 11.0, 14.0, 11.0, 8.0, 5.0, 4.0, 5.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.875, -36.5947265625, -35.314453125, -34.0341796875, -32.75390625, -31.4736328125, -30.193359375, -28.9130859375, -27.6328125, -26.3525390625, -25.072265625, -23.7919921875, -22.51171875, -21.2314453125, -19.951171875, -18.6708984375, -17.390625, -16.1103515625, -14.830078125, -13.5498046875, -12.26953125, -10.9892578125, -9.708984375, -8.4287109375, -7.1484375, -5.8681640625, -4.587890625, -3.3076171875, -2.02734375, -0.7470703125, 0.533203125, 1.8134765625, 3.09375, 4.3740234375, 5.654296875, 6.9345703125, 8.21484375, 9.4951171875, 10.775390625, 12.0556640625, 13.3359375, 14.6162109375, 15.896484375, 17.1767578125, 18.45703125, 19.7373046875, 21.017578125, 22.2978515625, 23.578125, 24.8583984375, 26.138671875, 27.4189453125, 28.69921875, 29.9794921875, 31.259765625, 32.5400390625, 33.8203125, 35.1005859375, 36.380859375, 37.6611328125, 38.94140625, 40.2216796875, 41.501953125, 42.7822265625, 44.0625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 7.0, 8.0, 9.0, 17.0, 30.0, 30.0, 46.0, 57.0, 123.0, 176.0, 242.0, 599.0, 1898.0, 16542.0, 3109646.0, 13283.0, 1714.0, 535.0, 243.0, 191.0, 105.0, 58.0, 42.0, 32.0, 29.0, 19.0, 10.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.75, -125.345703125, -120.94140625, -116.537109375, -112.1328125, -107.728515625, -103.32421875, -98.919921875, -94.515625, -90.111328125, -85.70703125, -81.302734375, -76.8984375, -72.494140625, -68.08984375, -63.685546875, -59.28125, -54.876953125, -50.47265625, -46.068359375, -41.6640625, -37.259765625, -32.85546875, -28.451171875, -24.046875, -19.642578125, -15.23828125, -10.833984375, -6.4296875, -2.025390625, 2.37890625, 6.783203125, 11.1875, 15.591796875, 19.99609375, 24.400390625, 28.8046875, 33.208984375, 37.61328125, 42.017578125, 46.421875, 50.826171875, 55.23046875, 59.634765625, 64.0390625, 68.443359375, 72.84765625, 77.251953125, 81.65625, 86.060546875, 90.46484375, 94.869140625, 99.2734375, 103.677734375, 108.08203125, 112.486328125, 116.890625, 121.294921875, 125.69921875, 130.103515625, 134.5078125, 138.912109375, 143.31640625, 147.720703125, 152.125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 33.0, 943.0, 45.0], "bins": [-1874.1378173828125, -1844.176513671875, -1814.215087890625, -1784.2537841796875, -1754.2923583984375, -1724.3310546875, -1694.36962890625, -1664.4083251953125, -1634.4468994140625, -1604.485595703125, -1574.524169921875, -1544.5628662109375, -1514.6014404296875, -1484.64013671875, -1454.6787109375, -1424.7174072265625, -1394.7559814453125, -1364.794677734375, -1334.833251953125, -1304.8719482421875, -1274.9105224609375, -1244.94921875, -1214.98779296875, -1185.0264892578125, -1155.0650634765625, -1125.103759765625, -1095.142333984375, -1065.1810302734375, -1035.2196044921875, -1005.2582397460938, -975.296875, -945.3355102539062, -915.3742065429688, -885.412841796875, -855.4514770507812, -825.4901123046875, -795.5287475585938, -765.5673828125, -735.6060180664062, -705.6446533203125, -675.683349609375, -645.7219848632812, -615.7606201171875, -585.7992553710938, -555.837890625, -525.8765258789062, -495.9151611328125, -465.95379638671875, -435.992431640625, -406.03106689453125, -376.0697021484375, -346.10833740234375, -316.14697265625, -286.18560791015625, -256.2242431640625, -226.2628936767578, -196.301513671875, -166.34014892578125, -136.3787841796875, -106.41742706298828, -76.45606231689453, -46.49470520019531, -16.533340454101562, 13.428024291992188, 43.38938903808594]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 9.0, 3.0, 12.0, 14.0, 18.0, 18.0, 16.0, 20.0, 24.0, 30.0, 22.0, 22.0, 32.0, 40.0, 35.0, 45.0, 51.0, 50.0, 43.0, 45.0, 43.0, 49.0, 40.0, 38.0, 33.0, 22.0, 34.0, 32.0, 20.0, 13.0, 27.0, 23.0, 16.0, 14.0, 13.0, 8.0, 7.0, 4.0, 5.0, 2.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-125.19329071044922, -121.64056396484375, -118.08784484863281, -114.53511810302734, -110.9823989868164, -107.42967224121094, -103.876953125, -100.32422637939453, -96.77149963378906, -93.2187728881836, -89.66605377197266, -86.11332702636719, -82.56060791015625, -79.00788116455078, -75.45515441894531, -71.90243530273438, -68.34971618652344, -64.79698944091797, -61.24427032470703, -57.69154357910156, -54.138824462890625, -50.586097717285156, -47.03337478637695, -43.48065185546875, -39.92792892456055, -36.375205993652344, -32.82248306274414, -29.269758224487305, -25.7170352935791, -22.1643123626709, -18.611587524414062, -15.05886459350586, -11.506134033203125, -7.953410625457764, -4.400687217712402, -0.8479633331298828, 2.7047595977783203, 6.257482528686523, 9.81020736694336, 13.362930297851562, 16.915653228759766, 20.46837615966797, 24.021099090576172, 27.573823928833008, 31.12654685974121, 34.67926788330078, 38.23199462890625, 41.78471755981445, 45.337440490722656, 48.89016342163086, 52.44288635253906, 55.99561309814453, 59.54833221435547, 63.10105895996094, 66.65377807617188, 70.20650482177734, 73.75923156738281, 77.31195831298828, 80.86467742919922, 84.41740417480469, 87.97012329101562, 91.5228500366211, 95.07557678222656, 98.6282958984375, 102.18101501464844]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 0.0, 3.0, 5.0, 15.0, 6.0, 10.0, 13.0, 16.0, 17.0, 13.0, 23.0, 23.0, 32.0, 28.0, 46.0, 36.0, 34.0, 45.0, 40.0, 51.0, 50.0, 51.0, 52.0, 40.0, 49.0, 28.0, 34.0, 26.0, 40.0, 23.0, 23.0, 22.0, 13.0, 23.0, 7.0, 19.0, 12.0, 10.0, 8.0, 5.0, 4.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-15.1875, -14.73974609375, -14.2919921875, -13.84423828125, -13.396484375, -12.94873046875, -12.5009765625, -12.05322265625, -11.60546875, -11.15771484375, -10.7099609375, -10.26220703125, -9.814453125, -9.36669921875, -8.9189453125, -8.47119140625, -8.0234375, -7.57568359375, -7.1279296875, -6.68017578125, -6.232421875, -5.78466796875, -5.3369140625, -4.88916015625, -4.44140625, -3.99365234375, -3.5458984375, -3.09814453125, -2.650390625, -2.20263671875, -1.7548828125, -1.30712890625, -0.859375, -0.41162109375, 0.0361328125, 0.48388671875, 0.931640625, 1.37939453125, 1.8271484375, 2.27490234375, 2.72265625, 3.17041015625, 3.6181640625, 4.06591796875, 4.513671875, 4.96142578125, 5.4091796875, 5.85693359375, 6.3046875, 6.75244140625, 7.2001953125, 7.64794921875, 8.095703125, 8.54345703125, 8.9912109375, 9.43896484375, 9.88671875, 10.33447265625, 10.7822265625, 11.22998046875, 11.677734375, 12.12548828125, 12.5732421875, 13.02099609375, 13.46875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 10.0, 13.0, 10.0, 21.0, 19.0, 26.0, 33.0, 31.0, 69.0, 91.0, 135.0, 199.0, 289.0, 486.0, 883.0, 1596.0, 3138.0, 6799.0, 16900.0, 118393.0, 3600812.0, 402175.0, 24394.0, 8973.0, 4035.0, 2040.0, 1046.0, 567.0, 362.0, 219.0, 162.0, 87.0, 56.0, 57.0, 31.0, 25.0, 32.0, 20.0, 16.0, 7.0, 11.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-58.46875, -56.78125, -55.09375, -53.40625, -51.71875, -50.03125, -48.34375, -46.65625, -44.96875, -43.28125, -41.59375, -39.90625, -38.21875, -36.53125, -34.84375, -33.15625, -31.46875, -29.78125, -28.09375, -26.40625, -24.71875, -23.03125, -21.34375, -19.65625, -17.96875, -16.28125, -14.59375, -12.90625, -11.21875, -9.53125, -7.84375, -6.15625, -4.46875, -2.78125, -1.09375, 0.59375, 2.28125, 3.96875, 5.65625, 7.34375, 9.03125, 10.71875, 12.40625, 14.09375, 15.78125, 17.46875, 19.15625, 20.84375, 22.53125, 24.21875, 25.90625, 27.59375, 29.28125, 30.96875, 32.65625, 34.34375, 36.03125, 37.71875, 39.40625, 41.09375, 42.78125, 44.46875, 46.15625, 47.84375, 49.53125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 2.0, 6.0, 7.0, 6.0, 5.0, 10.0, 9.0, 10.0, 18.0, 24.0, 32.0, 36.0, 63.0, 114.0, 225.0, 565.0, 1099.0, 946.0, 452.0, 172.0, 80.0, 47.0, 35.0, 24.0, 18.0, 16.0, 13.0, 19.0, 7.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.6875, -32.38623046875, -31.0849609375, -29.78369140625, -28.482421875, -27.18115234375, -25.8798828125, -24.57861328125, -23.27734375, -21.97607421875, -20.6748046875, -19.37353515625, -18.072265625, -16.77099609375, -15.4697265625, -14.16845703125, -12.8671875, -11.56591796875, -10.2646484375, -8.96337890625, -7.662109375, -6.36083984375, -5.0595703125, -3.75830078125, -2.45703125, -1.15576171875, 0.1455078125, 1.44677734375, 2.748046875, 4.04931640625, 5.3505859375, 6.65185546875, 7.953125, 9.25439453125, 10.5556640625, 11.85693359375, 13.158203125, 14.45947265625, 15.7607421875, 17.06201171875, 18.36328125, 19.66455078125, 20.9658203125, 22.26708984375, 23.568359375, 24.86962890625, 26.1708984375, 27.47216796875, 28.7734375, 30.07470703125, 31.3759765625, 32.67724609375, 33.978515625, 35.27978515625, 36.5810546875, 37.88232421875, 39.18359375, 40.48486328125, 41.7861328125, 43.08740234375, 44.388671875, 45.68994140625, 46.9912109375, 48.29248046875, 49.59375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 7.0, 4.0, 6.0, 13.0, 11.0, 29.0, 35.0, 64.0, 94.0, 162.0, 279.0, 460.0, 969.0, 1746.0, 3484.0, 7797.0, 19178.0, 61691.0, 1551409.0, 2439790.0, 70109.0, 20745.0, 8295.0, 3757.0, 1811.0, 939.0, 567.0, 314.0, 191.0, 106.0, 59.0, 45.0, 29.0, 30.0, 18.0, 9.0, 14.0, 4.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-79.0, -76.92333984375, -74.8466796875, -72.77001953125, -70.693359375, -68.61669921875, -66.5400390625, -64.46337890625, -62.38671875, -60.31005859375, -58.2333984375, -56.15673828125, -54.080078125, -52.00341796875, -49.9267578125, -47.85009765625, -45.7734375, -43.69677734375, -41.6201171875, -39.54345703125, -37.466796875, -35.39013671875, -33.3134765625, -31.23681640625, -29.16015625, -27.08349609375, -25.0068359375, -22.93017578125, -20.853515625, -18.77685546875, -16.7001953125, -14.62353515625, -12.546875, -10.47021484375, -8.3935546875, -6.31689453125, -4.240234375, -2.16357421875, -0.0869140625, 1.98974609375, 4.06640625, 6.14306640625, 8.2197265625, 10.29638671875, 12.373046875, 14.44970703125, 16.5263671875, 18.60302734375, 20.6796875, 22.75634765625, 24.8330078125, 26.90966796875, 28.986328125, 31.06298828125, 33.1396484375, 35.21630859375, 37.29296875, 39.36962890625, 41.4462890625, 43.52294921875, 45.599609375, 47.67626953125, 49.7529296875, 51.82958984375, 53.90625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 6.0, 4.0, 6.0, 7.0, 12.0, 14.0, 29.0, 23.0, 40.0, 55.0, 101.0, 131.0, 153.0, 143.0, 97.0, 57.0, 39.0, 21.0, 17.0, 15.0, 6.0, 12.0, 6.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.68331909179688, -90.7453842163086, -85.80744934082031, -80.86951446533203, -75.93157958984375, -70.99364471435547, -66.05570983886719, -61.117774963378906, -56.179840087890625, -51.241905212402344, -46.30397033691406, -41.36603546142578, -36.4281005859375, -31.49016571044922, -26.552230834960938, -21.614295959472656, -16.676361083984375, -11.738426208496094, -6.8004913330078125, -1.8625564575195312, 3.07537841796875, 8.013313293457031, 12.951248168945312, 17.889183044433594, 22.827117919921875, 27.765052795410156, 32.70298767089844, 37.64092254638672, 42.578857421875, 47.51679229736328, 52.45472717285156, 57.392662048339844, 62.330596923828125, 67.2685317993164, 72.20646667480469, 77.14440155029297, 82.08233642578125, 87.02027130126953, 91.95820617675781, 96.8961410522461, 101.83407592773438, 106.77201080322266, 111.70994567871094, 116.64788055419922, 121.5858154296875, 126.52375030517578, 131.46168518066406, 136.39962768554688, 141.33755493164062, 146.27548217773438, 151.2134246826172, 156.1513671875, 161.08929443359375, 166.0272216796875, 170.9651641845703, 175.90310668945312, 180.84103393554688, 185.77896118164062, 190.71690368652344, 195.65484619140625, 200.5927734375, 205.53070068359375, 210.46864318847656, 215.40658569335938, 220.34451293945312]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 5.0, 4.0, 3.0, 6.0, 4.0, 4.0, 9.0, 6.0, 10.0, 4.0, 13.0, 14.0, 18.0, 15.0, 22.0, 19.0, 25.0, 35.0, 26.0, 29.0, 28.0, 26.0, 27.0, 28.0, 32.0, 30.0, 34.0, 30.0, 26.0, 36.0, 28.0, 37.0, 39.0, 42.0, 29.0, 27.0, 21.0, 27.0, 25.0, 21.0, 23.0, 17.0, 14.0, 11.0, 13.0, 7.0, 18.0, 4.0, 13.0, 8.0, 7.0, 3.0, 1.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-71.44918060302734, -69.10608673095703, -66.76298522949219, -64.41989135742188, -62.07678985595703, -59.73369598388672, -57.39059829711914, -55.04750061035156, -52.704402923583984, -50.361305236816406, -48.01820755004883, -45.67510986328125, -43.33201599121094, -40.988914489746094, -38.64582061767578, -36.3027229309082, -33.959625244140625, -31.616527557373047, -29.27342987060547, -26.930334091186523, -24.587236404418945, -22.244138717651367, -19.901042938232422, -17.557945251464844, -15.214847564697266, -12.871749877929688, -10.528653144836426, -8.185556411743164, -5.842458724975586, -3.499361038208008, -1.156264305114746, 1.1868324279785156, 3.5299224853515625, 5.873019695281982, 8.216116905212402, 10.559213638305664, 12.902311325073242, 15.24540901184082, 17.588504791259766, 19.931602478027344, 22.274700164794922, 24.6177978515625, 26.960895538330078, 29.303991317749023, 31.6470890045166, 33.99018859863281, 36.333282470703125, 38.6763801574707, 41.01947784423828, 43.36257553100586, 45.70567321777344, 48.048770904541016, 50.391868591308594, 52.734962463378906, 55.078060150146484, 57.42115783691406, 59.76425552368164, 62.10735321044922, 64.45044708251953, 66.79354858398438, 69.13664245605469, 71.47974395751953, 73.82283782958984, 76.16593933105469, 78.509033203125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 3.0, 10.0, 4.0, 11.0, 11.0, 15.0, 20.0, 22.0, 18.0, 14.0, 30.0, 32.0, 37.0, 29.0, 40.0, 40.0, 41.0, 52.0, 44.0, 56.0, 32.0, 50.0, 34.0, 38.0, 49.0, 30.0, 32.0, 26.0, 33.0, 19.0, 18.0, 18.0, 14.0, 14.0, 9.0, 7.0, 14.0, 8.0, 8.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.1015625, -14.6640625, -14.2265625, -13.7890625, -13.3515625, -12.9140625, -12.4765625, -12.0390625, -11.6015625, -11.1640625, -10.7265625, -10.2890625, -9.8515625, -9.4140625, -8.9765625, -8.5390625, -8.1015625, -7.6640625, -7.2265625, -6.7890625, -6.3515625, -5.9140625, -5.4765625, -5.0390625, -4.6015625, -4.1640625, -3.7265625, -3.2890625, -2.8515625, -2.4140625, -1.9765625, -1.5390625, -1.1015625, -0.6640625, -0.2265625, 0.2109375, 0.6484375, 1.0859375, 1.5234375, 1.9609375, 2.3984375, 2.8359375, 3.2734375, 3.7109375, 4.1484375, 4.5859375, 5.0234375, 5.4609375, 5.8984375, 6.3359375, 6.7734375, 7.2109375, 7.6484375, 8.0859375, 8.5234375, 8.9609375, 9.3984375, 9.8359375, 10.2734375, 10.7109375, 11.1484375, 11.5859375, 12.0234375, 12.4609375, 12.8984375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 6.0, 10.0, 7.0, 11.0, 24.0, 47.0, 64.0, 80.0, 157.0, 187.0, 353.0, 542.0, 802.0, 1300.0, 2014.0, 3027.0, 4632.0, 6996.0, 10469.0, 16438.0, 26657.0, 44942.0, 80533.0, 153109.0, 256905.0, 193934.0, 101840.0, 55475.0, 32057.0, 19737.0, 12626.0, 8317.0, 5343.0, 3391.0, 2303.0, 1480.0, 928.0, 626.0, 429.0, 255.0, 168.0, 115.0, 82.0, 47.0, 31.0, 20.0, 17.0, 8.0, 6.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.578125, -1.5283203125, -1.478515625, -1.4287109375, -1.37890625, -1.3291015625, -1.279296875, -1.2294921875, -1.1796875, -1.1298828125, -1.080078125, -1.0302734375, -0.98046875, -0.9306640625, -0.880859375, -0.8310546875, -0.78125, -0.7314453125, -0.681640625, -0.6318359375, -0.58203125, -0.5322265625, -0.482421875, -0.4326171875, -0.3828125, -0.3330078125, -0.283203125, -0.2333984375, -0.18359375, -0.1337890625, -0.083984375, -0.0341796875, 0.015625, 0.0654296875, 0.115234375, 0.1650390625, 0.21484375, 0.2646484375, 0.314453125, 0.3642578125, 0.4140625, 0.4638671875, 0.513671875, 0.5634765625, 0.61328125, 0.6630859375, 0.712890625, 0.7626953125, 0.8125, 0.8623046875, 0.912109375, 0.9619140625, 1.01171875, 1.0615234375, 1.111328125, 1.1611328125, 1.2109375, 1.2607421875, 1.310546875, 1.3603515625, 1.41015625, 1.4599609375, 1.509765625, 1.5595703125, 1.609375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 9.0, 7.0, 17.0, 6.0, 16.0, 17.0, 16.0, 27.0, 27.0, 34.0, 22.0, 22.0, 36.0, 32.0, 30.0, 40.0, 36.0, 46.0, 38.0, 1067.0, 52.0, 32.0, 32.0, 36.0, 28.0, 30.0, 39.0, 28.0, 29.0, 23.0, 21.0, 10.0, 28.0, 17.0, 12.0, 13.0, 6.0, 9.0, 10.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-8.6171875, -8.35107421875, -8.0849609375, -7.81884765625, -7.552734375, -7.28662109375, -7.0205078125, -6.75439453125, -6.48828125, -6.22216796875, -5.9560546875, -5.68994140625, -5.423828125, -5.15771484375, -4.8916015625, -4.62548828125, -4.359375, -4.09326171875, -3.8271484375, -3.56103515625, -3.294921875, -3.02880859375, -2.7626953125, -2.49658203125, -2.23046875, -1.96435546875, -1.6982421875, -1.43212890625, -1.166015625, -0.89990234375, -0.6337890625, -0.36767578125, -0.1015625, 0.16455078125, 0.4306640625, 0.69677734375, 0.962890625, 1.22900390625, 1.4951171875, 1.76123046875, 2.02734375, 2.29345703125, 2.5595703125, 2.82568359375, 3.091796875, 3.35791015625, 3.6240234375, 3.89013671875, 4.15625, 4.42236328125, 4.6884765625, 4.95458984375, 5.220703125, 5.48681640625, 5.7529296875, 6.01904296875, 6.28515625, 6.55126953125, 6.8173828125, 7.08349609375, 7.349609375, 7.61572265625, 7.8818359375, 8.14794921875, 8.4140625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 1.0, 6.0, 13.0, 9.0, 21.0, 35.0, 61.0, 95.0, 120.0, 207.0, 333.0, 469.0, 725.0, 1115.0, 1558.0, 2436.0, 3623.0, 5558.0, 8203.0, 12869.0, 19744.0, 30939.0, 49893.0, 83158.0, 143531.0, 1257732.0, 191013.0, 109577.0, 64025.0, 38848.0, 24491.0, 16012.0, 10342.0, 6905.0, 4585.0, 3052.0, 1967.0, 1308.0, 844.0, 589.0, 373.0, 259.0, 153.0, 119.0, 70.0, 49.0, 35.0, 29.0, 12.0, 12.0, 6.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.77880859375, -0.7542800903320312, -0.7297515869140625, -0.7052230834960938, -0.680694580078125, -0.6561660766601562, -0.6316375732421875, -0.6071090698242188, -0.58258056640625, -0.5580520629882812, -0.5335235595703125, -0.5089950561523438, -0.484466552734375, -0.45993804931640625, -0.4354095458984375, -0.41088104248046875, -0.3863525390625, -0.36182403564453125, -0.3372955322265625, -0.31276702880859375, -0.288238525390625, -0.26371002197265625, -0.2391815185546875, -0.21465301513671875, -0.19012451171875, -0.16559600830078125, -0.1410675048828125, -0.11653900146484375, -0.092010498046875, -0.06748199462890625, -0.0429534912109375, -0.01842498779296875, 0.006103515625, 0.03063201904296875, 0.0551605224609375, 0.07968902587890625, 0.104217529296875, 0.12874603271484375, 0.1532745361328125, 0.17780303955078125, 0.20233154296875, 0.22686004638671875, 0.2513885498046875, 0.27591705322265625, 0.300445556640625, 0.32497406005859375, 0.3495025634765625, 0.37403106689453125, 0.3985595703125, 0.42308807373046875, 0.4476165771484375, 0.47214508056640625, 0.496673583984375, 0.5212020874023438, 0.5457305908203125, 0.5702590942382812, 0.59478759765625, 0.6193161010742188, 0.6438446044921875, 0.6683731079101562, 0.692901611328125, 0.7174301147460938, 0.7419586181640625, 0.7664871215820312, 0.791015625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 8.0, 6.0, 12.0, 18.0, 27.0, 39.0, 60.0, 83.0, 129.0, 183.0, 145.0, 90.0, 58.0, 28.0, 28.0, 14.0, 13.0, 11.0, 8.0, 6.0, 6.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04205322265625, -0.04076671600341797, -0.03948020935058594, -0.038193702697753906, -0.036907196044921875, -0.035620689392089844, -0.03433418273925781, -0.03304767608642578, -0.03176116943359375, -0.03047466278076172, -0.029188156127929688, -0.027901649475097656, -0.026615142822265625, -0.025328636169433594, -0.024042129516601562, -0.02275562286376953, -0.0214691162109375, -0.02018260955810547, -0.018896102905273438, -0.017609596252441406, -0.016323089599609375, -0.015036582946777344, -0.013750076293945312, -0.012463569641113281, -0.01117706298828125, -0.009890556335449219, -0.008604049682617188, -0.007317543029785156, -0.006031036376953125, -0.004744529724121094, -0.0034580230712890625, -0.0021715164184570312, -0.000885009765625, 0.00040149688720703125, 0.0016880035400390625, 0.0029745101928710938, 0.004261016845703125, 0.005547523498535156, 0.0068340301513671875, 0.008120536804199219, 0.00940704345703125, 0.010693550109863281, 0.011980056762695312, 0.013266563415527344, 0.014553070068359375, 0.015839576721191406, 0.017126083374023438, 0.01841259002685547, 0.0196990966796875, 0.02098560333251953, 0.022272109985351562, 0.023558616638183594, 0.024845123291015625, 0.026131629943847656, 0.027418136596679688, 0.02870464324951172, 0.02999114990234375, 0.03127765655517578, 0.03256416320800781, 0.033850669860839844, 0.035137176513671875, 0.036423683166503906, 0.03771018981933594, 0.03899669647216797, 0.040283203125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 8.0, 13.0, 13.0, 21.0, 43.0, 43.0, 97.0, 138.0, 372.0, 1727.0, 68309.0, 969309.0, 7228.0, 650.0, 259.0, 122.0, 72.0, 39.0, 19.0, 19.0, 13.0, 8.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.81298828125, -0.7869720458984375, -0.760955810546875, -0.7349395751953125, -0.70892333984375, -0.6829071044921875, -0.656890869140625, -0.6308746337890625, -0.6048583984375, -0.5788421630859375, -0.552825927734375, -0.5268096923828125, -0.50079345703125, -0.4747772216796875, -0.448760986328125, -0.4227447509765625, -0.396728515625, -0.3707122802734375, -0.344696044921875, -0.3186798095703125, -0.29266357421875, -0.2666473388671875, -0.240631103515625, -0.2146148681640625, -0.1885986328125, -0.1625823974609375, -0.136566162109375, -0.1105499267578125, -0.08453369140625, -0.0585174560546875, -0.032501220703125, -0.0064849853515625, 0.01953125, 0.0455474853515625, 0.071563720703125, 0.0975799560546875, 0.12359619140625, 0.1496124267578125, 0.175628662109375, 0.2016448974609375, 0.2276611328125, 0.2536773681640625, 0.279693603515625, 0.3057098388671875, 0.33172607421875, 0.3577423095703125, 0.383758544921875, 0.4097747802734375, 0.435791015625, 0.4618072509765625, 0.487823486328125, 0.5138397216796875, 0.53985595703125, 0.5658721923828125, 0.591888427734375, 0.6179046630859375, 0.6439208984375, 0.6699371337890625, 0.695953369140625, 0.7219696044921875, 0.74798583984375, 0.7740020751953125, 0.800018310546875, 0.8260345458984375, 0.85205078125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 8.0, 26.0, 92.0, 425.0, 315.0, 86.0, 30.0, 17.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12032121419906616, -0.1093047633767128, -0.09828831255435944, -0.08727185428142548, -0.07625540345907211, -0.06523895263671875, -0.05422249436378479, -0.04320604354143143, -0.032189592719078064, -0.02117314003407955, -0.01015668734908104, 0.0008597671985626221, 0.011876218020915985, 0.022892668843269348, 0.03390912711620331, 0.04492557793855667, 0.055942028760910034, 0.0669584795832634, 0.07797493040561676, 0.08899138867855072, 0.10000783950090408, 0.11102429032325745, 0.1220407485961914, 0.13305720686912537, 0.14407365024089813, 0.1550901085138321, 0.16610655188560486, 0.17712301015853882, 0.18813946843147278, 0.19915591180324554, 0.2101723700761795, 0.22118881344795227, 0.23220527172088623, 0.2432217299938202, 0.25423818826675415, 0.2652546167373657, 0.2762710750102997, 0.28728753328323364, 0.2983039915561676, 0.30932044982910156, 0.32033687829971313, 0.3313533365726471, 0.34236979484558105, 0.3533862233161926, 0.3644026815891266, 0.37541913986206055, 0.3864355981349945, 0.39745205640792847, 0.4084685146808624, 0.4194849729537964, 0.43050143122673035, 0.4415178894996643, 0.4525343179702759, 0.46355077624320984, 0.4745672345161438, 0.48558369278907776, 0.4966001510620117, 0.5076165795326233, 0.5186330676078796, 0.5296494960784912, 0.5406659841537476, 0.5516824126243591, 0.5626988410949707, 0.573715329170227, 0.5847317576408386]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 2.0, 9.0, 8.0, 13.0, 15.0, 10.0, 20.0, 27.0, 20.0, 26.0, 28.0, 19.0, 29.0, 27.0, 32.0, 32.0, 37.0, 27.0, 42.0, 33.0, 39.0, 44.0, 27.0, 38.0, 32.0, 56.0, 37.0, 42.0, 29.0, 30.0, 25.0, 19.0, 19.0, 19.0, 20.0, 16.0, 5.0, 9.0, 10.0, 6.0, 4.0, 3.0, 3.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.048168838024139404, -0.04663674533367157, -0.045104652643203735, -0.0435725562274456, -0.04204046353697777, -0.040508370846509933, -0.0389762744307518, -0.037444181740283966, -0.03591208904981613, -0.0343799963593483, -0.03284790366888046, -0.03131580725312233, -0.029783714562654495, -0.02825162187218666, -0.026719527319073677, -0.025187432765960693, -0.02365534007549286, -0.022123247385025024, -0.02059115283191204, -0.019059058278799057, -0.017526965588331223, -0.015994872897863388, -0.014462778344750404, -0.012930684722959995, -0.011398591101169586, -0.009866497479379177, -0.008334403857588768, -0.006802310235798359, -0.00527021661400795, -0.0037381229922175407, -0.0022060293704271317, -0.0006739357486367226, 0.0008581578731536865, 0.0023902514949440956, 0.003922345116734505, 0.005454438738524914, 0.006986532360315323, 0.008518625982105732, 0.010050719603896141, 0.01158281322568655, 0.01311490684747696, 0.014647000469267368, 0.016179094091057777, 0.01771118864417076, 0.019243281334638596, 0.02077537402510643, 0.022307468578219414, 0.023839563131332397, 0.025371655821800232, 0.026903748512268066, 0.02843584306538105, 0.029967937618494034, 0.03150003030896187, 0.0330321229994297, 0.034564219415187836, 0.03609631210565567, 0.037628404796123505, 0.03916049748659134, 0.040692590177059174, 0.042224686592817307, 0.04375677928328514, 0.045288871973752975, 0.04682096838951111, 0.04835306107997894, 0.04988515377044678]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 3.0, 10.0, 4.0, 12.0, 10.0, 17.0, 19.0, 22.0, 17.0, 14.0, 30.0, 32.0, 38.0, 28.0, 41.0, 40.0, 40.0, 52.0, 45.0, 55.0, 32.0, 50.0, 34.0, 38.0, 49.0, 30.0, 32.0, 26.0, 33.0, 19.0, 18.0, 18.0, 14.0, 14.0, 9.0, 7.0, 14.0, 8.0, 8.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.09375, -14.6563720703125, -14.218994140625, -13.7816162109375, -13.34423828125, -12.9068603515625, -12.469482421875, -12.0321044921875, -11.5947265625, -11.1573486328125, -10.719970703125, -10.2825927734375, -9.84521484375, -9.4078369140625, -8.970458984375, -8.5330810546875, -8.095703125, -7.6583251953125, -7.220947265625, -6.7835693359375, -6.34619140625, -5.9088134765625, -5.471435546875, -5.0340576171875, -4.5966796875, -4.1593017578125, -3.721923828125, -3.2845458984375, -2.84716796875, -2.4097900390625, -1.972412109375, -1.5350341796875, -1.09765625, -0.6602783203125, -0.222900390625, 0.2144775390625, 0.65185546875, 1.0892333984375, 1.526611328125, 1.9639892578125, 2.4013671875, 2.8387451171875, 3.276123046875, 3.7135009765625, 4.15087890625, 4.5882568359375, 5.025634765625, 5.4630126953125, 5.900390625, 6.3377685546875, 6.775146484375, 7.2125244140625, 7.64990234375, 8.0872802734375, 8.524658203125, 8.9620361328125, 9.3994140625, 9.8367919921875, 10.274169921875, 10.7115478515625, 11.14892578125, 11.5863037109375, 12.023681640625, 12.4610595703125, 12.8984375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 7.0, 5.0, 13.0, 14.0, 11.0, 11.0, 20.0, 20.0, 26.0, 36.0, 52.0, 71.0, 146.0, 260.0, 708.0, 1959.0, 7229.0, 29680.0, 142554.0, 573571.0, 230662.0, 46188.0, 10642.0, 2934.0, 878.0, 332.0, 180.0, 85.0, 71.0, 26.0, 37.0, 32.0, 20.0, 15.0, 17.0, 10.0, 4.0, 7.0, 4.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7734375, -8.4671630859375, -8.160888671875, -7.8546142578125, -7.54833984375, -7.2420654296875, -6.935791015625, -6.6295166015625, -6.3232421875, -6.0169677734375, -5.710693359375, -5.4044189453125, -5.09814453125, -4.7918701171875, -4.485595703125, -4.1793212890625, -3.873046875, -3.5667724609375, -3.260498046875, -2.9542236328125, -2.64794921875, -2.3416748046875, -2.035400390625, -1.7291259765625, -1.4228515625, -1.1165771484375, -0.810302734375, -0.5040283203125, -0.19775390625, 0.1085205078125, 0.414794921875, 0.7210693359375, 1.02734375, 1.3336181640625, 1.639892578125, 1.9461669921875, 2.25244140625, 2.5587158203125, 2.864990234375, 3.1712646484375, 3.4775390625, 3.7838134765625, 4.090087890625, 4.3963623046875, 4.70263671875, 5.0089111328125, 5.315185546875, 5.6214599609375, 5.927734375, 6.2340087890625, 6.540283203125, 6.8465576171875, 7.15283203125, 7.4591064453125, 7.765380859375, 8.0716552734375, 8.3779296875, 8.6842041015625, 8.990478515625, 9.2967529296875, 9.60302734375, 9.9093017578125, 10.215576171875, 10.5218505859375, 10.828125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 10.0, 7.0, 9.0, 14.0, 13.0, 19.0, 19.0, 21.0, 25.0, 32.0, 33.0, 40.0, 55.0, 50.0, 62.0, 78.0, 350.0, 1687.0, 85.0, 55.0, 52.0, 43.0, 39.0, 36.0, 18.0, 31.0, 27.0, 26.0, 23.0, 18.0, 12.0, 9.0, 12.0, 6.0, 7.0, 6.0, 6.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.71875, -46.318359375, -44.91796875, -43.517578125, -42.1171875, -40.716796875, -39.31640625, -37.916015625, -36.515625, -35.115234375, -33.71484375, -32.314453125, -30.9140625, -29.513671875, -28.11328125, -26.712890625, -25.3125, -23.912109375, -22.51171875, -21.111328125, -19.7109375, -18.310546875, -16.91015625, -15.509765625, -14.109375, -12.708984375, -11.30859375, -9.908203125, -8.5078125, -7.107421875, -5.70703125, -4.306640625, -2.90625, -1.505859375, -0.10546875, 1.294921875, 2.6953125, 4.095703125, 5.49609375, 6.896484375, 8.296875, 9.697265625, 11.09765625, 12.498046875, 13.8984375, 15.298828125, 16.69921875, 18.099609375, 19.5, 20.900390625, 22.30078125, 23.701171875, 25.1015625, 26.501953125, 27.90234375, 29.302734375, 30.703125, 32.103515625, 33.50390625, 34.904296875, 36.3046875, 37.705078125, 39.10546875, 40.505859375, 41.90625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 8.0, 5.0, 6.0, 7.0, 11.0, 7.0, 13.0, 14.0, 21.0, 31.0, 34.0, 54.0, 60.0, 75.0, 107.0, 132.0, 191.0, 300.0, 653.0, 3671.0, 3066963.0, 70334.0, 1642.0, 480.0, 236.0, 180.0, 112.0, 84.0, 67.0, 47.0, 37.0, 29.0, 24.0, 17.0, 14.0, 11.0, 6.0, 13.0, 5.0, 7.0, 5.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-90.6875, -87.64453125, -84.6015625, -81.55859375, -78.515625, -75.47265625, -72.4296875, -69.38671875, -66.34375, -63.30078125, -60.2578125, -57.21484375, -54.171875, -51.12890625, -48.0859375, -45.04296875, -42.0, -38.95703125, -35.9140625, -32.87109375, -29.828125, -26.78515625, -23.7421875, -20.69921875, -17.65625, -14.61328125, -11.5703125, -8.52734375, -5.484375, -2.44140625, 0.6015625, 3.64453125, 6.6875, 9.73046875, 12.7734375, 15.81640625, 18.859375, 21.90234375, 24.9453125, 27.98828125, 31.03125, 34.07421875, 37.1171875, 40.16015625, 43.203125, 46.24609375, 49.2890625, 52.33203125, 55.375, 58.41796875, 61.4609375, 64.50390625, 67.546875, 70.58984375, 73.6328125, 76.67578125, 79.71875, 82.76171875, 85.8046875, 88.84765625, 91.890625, 94.93359375, 97.9765625, 101.01953125, 104.0625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 28.0, 930.0, 60.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-753.763671875, -740.4360961914062, -727.1084594726562, -713.7808837890625, -700.4532470703125, -687.1256713867188, -673.7980346679688, -660.470458984375, -647.142822265625, -633.8152465820312, -620.4876098632812, -607.1600341796875, -593.8323974609375, -580.5048217773438, -567.1771850585938, -553.849609375, -540.5220336914062, -527.1944580078125, -513.8668212890625, -500.5392150878906, -487.21160888671875, -473.884033203125, -460.556396484375, -447.22882080078125, -433.90118408203125, -420.5735778808594, -407.2459716796875, -393.9183654785156, -380.59075927734375, -367.26318359375, -353.935546875, -340.60797119140625, -327.28033447265625, -313.9527282714844, -300.6251220703125, -287.2975158691406, -273.96990966796875, -260.642333984375, -247.31471252441406, -233.98712158203125, -220.65951538085938, -207.3319091796875, -194.00430297851562, -180.67669677734375, -167.34910583496094, -154.02149963378906, -140.6938934326172, -127.36629486083984, -114.03868865966797, -100.7110824584961, -87.38348388671875, -74.05587768554688, -60.728275299072266, -47.400672912597656, -34.07306671142578, -20.745468139648438, -7.4178619384765625, 5.909741401672363, 19.23734474182129, 32.56494903564453, 45.89255142211914, 59.22015380859375, 72.54776000976562, 85.87535858154297, 99.20296478271484]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 2.0, 11.0, 7.0, 10.0, 6.0, 14.0, 9.0, 15.0, 19.0, 18.0, 22.0, 20.0, 19.0, 27.0, 21.0, 22.0, 19.0, 17.0, 42.0, 29.0, 38.0, 45.0, 42.0, 41.0, 38.0, 43.0, 27.0, 35.0, 42.0, 34.0, 32.0, 24.0, 29.0, 31.0, 20.0, 21.0, 14.0, 25.0, 8.0, 8.0, 8.0, 8.0, 7.0, 8.0, 4.0, 4.0, 3.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-97.35313415527344, -93.98736572265625, -90.62159729003906, -87.25582885742188, -83.89006042480469, -80.5242919921875, -77.15852355957031, -73.79275512695312, -70.42698669433594, -67.06121826171875, -63.69544982910156, -60.329681396484375, -56.96391296386719, -53.59814453125, -50.23237228393555, -46.86660385131836, -43.500831604003906, -40.13506317138672, -36.76929473876953, -33.403526306152344, -30.037755966186523, -26.671987533569336, -23.306217193603516, -19.940448760986328, -16.57468032836914, -13.208911895751953, -9.84314250946045, -6.477373123168945, -3.111604690551758, 0.2541637420654297, 3.61993408203125, 6.9857025146484375, 10.351463317871094, 13.717231750488281, 17.08300018310547, 20.44877052307129, 23.814538955688477, 27.180307388305664, 30.546077728271484, 33.91184616088867, 37.27761459350586, 40.64338302612305, 44.009151458740234, 47.37492370605469, 50.740692138671875, 54.10646057128906, 57.47222900390625, 60.83799743652344, 64.20376586914062, 67.56953430175781, 70.935302734375, 74.30107116699219, 77.66683959960938, 81.03260803222656, 84.39837646484375, 87.76414489746094, 91.12991333007812, 94.49568176269531, 97.8614501953125, 101.22721862792969, 104.59298706054688, 107.95875549316406, 111.32452392578125, 114.69029235839844, 118.05606842041016]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 5.0, 12.0, 10.0, 14.0, 17.0, 16.0, 21.0, 19.0, 18.0, 34.0, 32.0, 29.0, 44.0, 37.0, 40.0, 45.0, 45.0, 52.0, 36.0, 46.0, 41.0, 43.0, 42.0, 43.0, 31.0, 35.0, 22.0, 19.0, 21.0, 17.0, 16.0, 17.0, 11.0, 7.0, 8.0, 15.0, 9.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.1171875, -14.673828125, -14.23046875, -13.787109375, -13.34375, -12.900390625, -12.45703125, -12.013671875, -11.5703125, -11.126953125, -10.68359375, -10.240234375, -9.796875, -9.353515625, -8.91015625, -8.466796875, -8.0234375, -7.580078125, -7.13671875, -6.693359375, -6.25, -5.806640625, -5.36328125, -4.919921875, -4.4765625, -4.033203125, -3.58984375, -3.146484375, -2.703125, -2.259765625, -1.81640625, -1.373046875, -0.9296875, -0.486328125, -0.04296875, 0.400390625, 0.84375, 1.287109375, 1.73046875, 2.173828125, 2.6171875, 3.060546875, 3.50390625, 3.947265625, 4.390625, 4.833984375, 5.27734375, 5.720703125, 6.1640625, 6.607421875, 7.05078125, 7.494140625, 7.9375, 8.380859375, 8.82421875, 9.267578125, 9.7109375, 10.154296875, 10.59765625, 11.041015625, 11.484375, 11.927734375, 12.37109375, 12.814453125, 13.2578125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 6.0, 4.0, 12.0, 11.0, 10.0, 19.0, 21.0, 30.0, 38.0, 37.0, 64.0, 79.0, 110.0, 214.0, 527.0, 1316.0, 3713.0, 11272.0, 132950.0, 3935442.0, 91584.0, 10679.0, 3646.0, 1341.0, 533.0, 213.0, 96.0, 63.0, 52.0, 42.0, 32.0, 33.0, 20.0, 17.0, 15.0, 12.0, 11.0, 7.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-83.625, -81.33203125, -79.0390625, -76.74609375, -74.453125, -72.16015625, -69.8671875, -67.57421875, -65.28125, -62.98828125, -60.6953125, -58.40234375, -56.109375, -53.81640625, -51.5234375, -49.23046875, -46.9375, -44.64453125, -42.3515625, -40.05859375, -37.765625, -35.47265625, -33.1796875, -30.88671875, -28.59375, -26.30078125, -24.0078125, -21.71484375, -19.421875, -17.12890625, -14.8359375, -12.54296875, -10.25, -7.95703125, -5.6640625, -3.37109375, -1.078125, 1.21484375, 3.5078125, 5.80078125, 8.09375, 10.38671875, 12.6796875, 14.97265625, 17.265625, 19.55859375, 21.8515625, 24.14453125, 26.4375, 28.73046875, 31.0234375, 33.31640625, 35.609375, 37.90234375, 40.1953125, 42.48828125, 44.78125, 47.07421875, 49.3671875, 51.66015625, 53.953125, 56.24609375, 58.5390625, 60.83203125, 63.125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 9.0, 7.0, 16.0, 25.0, 34.0, 44.0, 50.0, 91.0, 234.0, 558.0, 1073.0, 1000.0, 458.0, 202.0, 73.0, 61.0, 33.0, 22.0, 10.0, 17.0, 13.0, 9.0, 7.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.25, -38.94677734375, -37.6435546875, -36.34033203125, -35.037109375, -33.73388671875, -32.4306640625, -31.12744140625, -29.82421875, -28.52099609375, -27.2177734375, -25.91455078125, -24.611328125, -23.30810546875, -22.0048828125, -20.70166015625, -19.3984375, -18.09521484375, -16.7919921875, -15.48876953125, -14.185546875, -12.88232421875, -11.5791015625, -10.27587890625, -8.97265625, -7.66943359375, -6.3662109375, -5.06298828125, -3.759765625, -2.45654296875, -1.1533203125, 0.14990234375, 1.453125, 2.75634765625, 4.0595703125, 5.36279296875, 6.666015625, 7.96923828125, 9.2724609375, 10.57568359375, 11.87890625, 13.18212890625, 14.4853515625, 15.78857421875, 17.091796875, 18.39501953125, 19.6982421875, 21.00146484375, 22.3046875, 23.60791015625, 24.9111328125, 26.21435546875, 27.517578125, 28.82080078125, 30.1240234375, 31.42724609375, 32.73046875, 34.03369140625, 35.3369140625, 36.64013671875, 37.943359375, 39.24658203125, 40.5498046875, 41.85302734375, 43.15625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 5.0, 12.0, 16.0, 29.0, 40.0, 87.0, 195.0, 450.0, 986.0, 2660.0, 8852.0, 45940.0, 3670186.0, 431922.0, 24201.0, 5456.0, 1834.0, 712.0, 324.0, 170.0, 91.0, 42.0, 16.0, 13.0, 12.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-111.125, -107.83984375, -104.5546875, -101.26953125, -97.984375, -94.69921875, -91.4140625, -88.12890625, -84.84375, -81.55859375, -78.2734375, -74.98828125, -71.703125, -68.41796875, -65.1328125, -61.84765625, -58.5625, -55.27734375, -51.9921875, -48.70703125, -45.421875, -42.13671875, -38.8515625, -35.56640625, -32.28125, -28.99609375, -25.7109375, -22.42578125, -19.140625, -15.85546875, -12.5703125, -9.28515625, -6.0, -2.71484375, 0.5703125, 3.85546875, 7.140625, 10.42578125, 13.7109375, 16.99609375, 20.28125, 23.56640625, 26.8515625, 30.13671875, 33.421875, 36.70703125, 39.9921875, 43.27734375, 46.5625, 49.84765625, 53.1328125, 56.41796875, 59.703125, 62.98828125, 66.2734375, 69.55859375, 72.84375, 76.12890625, 79.4140625, 82.69921875, 85.984375, 89.26953125, 92.5546875, 95.83984375, 99.125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 7.0, 6.0, 13.0, 11.0, 16.0, 27.0, 20.0, 45.0, 59.0, 89.0, 102.0, 148.0, 131.0, 94.0, 73.0, 43.0, 27.0, 29.0, 13.0, 9.0, 13.0, 7.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-146.2808074951172, -142.3976287841797, -138.51443481445312, -134.63125610351562, -130.74807739257812, -126.86489868164062, -122.9817123413086, -119.09852600097656, -115.21534729003906, -111.33216857910156, -107.44898223876953, -103.5657958984375, -99.6826171875, -95.7994384765625, -91.91625213623047, -88.03306579589844, -84.14988708496094, -80.26670837402344, -76.3835220336914, -72.50033569335938, -68.61715698242188, -64.73397827148438, -60.850791931152344, -56.96760940551758, -53.08442687988281, -49.20124435424805, -45.31806182861328, -41.434879302978516, -37.55169677734375, -33.668514251708984, -29.78533172607422, -25.902149200439453, -22.018959045410156, -18.13577651977539, -14.252593994140625, -10.36941146850586, -6.486228942871094, -2.603046417236328, 1.2801361083984375, 5.163318634033203, 9.046501159667969, 12.929683685302734, 16.8128662109375, 20.696048736572266, 24.57923126220703, 28.462413787841797, 32.34559631347656, 36.22877883911133, 40.111961364746094, 43.99514389038086, 47.878326416015625, 51.76150894165039, 55.644691467285156, 59.52787399291992, 63.41105651855469, 67.29423522949219, 71.17742156982422, 75.06060791015625, 78.94378662109375, 82.82696533203125, 86.71015167236328, 90.59333801269531, 94.47651672363281, 98.35969543457031, 102.24288177490234]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 10.0, 10.0, 7.0, 8.0, 18.0, 26.0, 17.0, 21.0, 22.0, 26.0, 36.0, 23.0, 38.0, 48.0, 40.0, 38.0, 32.0, 34.0, 41.0, 41.0, 44.0, 43.0, 37.0, 40.0, 39.0, 28.0, 30.0, 31.0, 19.0, 21.0, 12.0, 25.0, 19.0, 11.0, 14.0, 10.0, 9.0, 7.0, 4.0, 6.0, 3.0, 7.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.97794342041016, -72.29045104980469, -69.60296630859375, -66.91548156738281, -64.22798919677734, -61.54050064086914, -58.85301208496094, -56.165523529052734, -53.47803497314453, -50.79054641723633, -48.103057861328125, -45.41556930541992, -42.72808074951172, -40.040592193603516, -37.35310363769531, -34.66561508178711, -31.978126525878906, -29.290637969970703, -26.6031494140625, -23.915660858154297, -21.228172302246094, -18.54068374633789, -15.853195190429688, -13.165706634521484, -10.478218078613281, -7.790729522705078, -5.103240966796875, -2.415752410888672, 0.27173614501953125, 2.9592247009277344, 5.6467132568359375, 8.33420181274414, 11.021697998046875, 13.709186553955078, 16.39667510986328, 19.084163665771484, 21.771652221679688, 24.45914077758789, 27.146629333496094, 29.834117889404297, 32.5216064453125, 35.2090950012207, 37.896583557128906, 40.58407211303711, 43.27156066894531, 45.959049224853516, 48.64653778076172, 51.33402633666992, 54.021514892578125, 56.70900344848633, 59.39649200439453, 62.083980560302734, 64.77146911621094, 67.45895385742188, 70.14644622802734, 72.83393859863281, 75.52142333984375, 78.20890808105469, 80.89640045166016, 83.58389282226562, 86.27137756347656, 88.9588623046875, 91.64635467529297, 94.33384704589844, 97.02133178710938]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 8.0, 10.0, 4.0, 12.0, 10.0, 12.0, 21.0, 19.0, 28.0, 31.0, 39.0, 41.0, 37.0, 44.0, 45.0, 46.0, 38.0, 44.0, 53.0, 59.0, 41.0, 45.0, 41.0, 36.0, 31.0, 30.0, 33.0, 32.0, 15.0, 16.0, 13.0, 18.0, 10.0, 11.0, 9.0, 5.0, 6.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.71875, -16.22802734375, -15.7373046875, -15.24658203125, -14.755859375, -14.26513671875, -13.7744140625, -13.28369140625, -12.79296875, -12.30224609375, -11.8115234375, -11.32080078125, -10.830078125, -10.33935546875, -9.8486328125, -9.35791015625, -8.8671875, -8.37646484375, -7.8857421875, -7.39501953125, -6.904296875, -6.41357421875, -5.9228515625, -5.43212890625, -4.94140625, -4.45068359375, -3.9599609375, -3.46923828125, -2.978515625, -2.48779296875, -1.9970703125, -1.50634765625, -1.015625, -0.52490234375, -0.0341796875, 0.45654296875, 0.947265625, 1.43798828125, 1.9287109375, 2.41943359375, 2.91015625, 3.40087890625, 3.8916015625, 4.38232421875, 4.873046875, 5.36376953125, 5.8544921875, 6.34521484375, 6.8359375, 7.32666015625, 7.8173828125, 8.30810546875, 8.798828125, 9.28955078125, 9.7802734375, 10.27099609375, 10.76171875, 11.25244140625, 11.7431640625, 12.23388671875, 12.724609375, 13.21533203125, 13.7060546875, 14.19677734375, 14.6875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 10.0, 20.0, 21.0, 20.0, 36.0, 49.0, 55.0, 72.0, 146.0, 209.0, 292.0, 468.0, 763.0, 1097.0, 1780.0, 2777.0, 4194.0, 6669.0, 10935.0, 17791.0, 29223.0, 48866.0, 84949.0, 155109.0, 248800.0, 185444.0, 102381.0, 58099.0, 33934.0, 20425.0, 12413.0, 7886.0, 5008.0, 3044.0, 2005.0, 1199.0, 814.0, 565.0, 344.0, 243.0, 141.0, 96.0, 40.0, 40.0, 14.0, 22.0, 11.0, 13.0, 7.0, 4.0, 1.0, 5.0, 5.0, 2.0, 7.0, 0.0, 1.0, 2.0], "bins": [-1.57421875, -1.522857666015625, -1.47149658203125, -1.420135498046875, -1.3687744140625, -1.317413330078125, -1.26605224609375, -1.214691162109375, -1.163330078125, -1.111968994140625, -1.06060791015625, -1.009246826171875, -0.9578857421875, -0.906524658203125, -0.85516357421875, -0.803802490234375, -0.75244140625, -0.701080322265625, -0.64971923828125, -0.598358154296875, -0.5469970703125, -0.495635986328125, -0.44427490234375, -0.392913818359375, -0.341552734375, -0.290191650390625, -0.23883056640625, -0.187469482421875, -0.1361083984375, -0.084747314453125, -0.03338623046875, 0.017974853515625, 0.0693359375, 0.120697021484375, 0.17205810546875, 0.223419189453125, 0.2747802734375, 0.326141357421875, 0.37750244140625, 0.428863525390625, 0.480224609375, 0.531585693359375, 0.58294677734375, 0.634307861328125, 0.6856689453125, 0.737030029296875, 0.78839111328125, 0.839752197265625, 0.89111328125, 0.942474365234375, 0.99383544921875, 1.045196533203125, 1.0965576171875, 1.147918701171875, 1.19927978515625, 1.250640869140625, 1.302001953125, 1.353363037109375, 1.40472412109375, 1.456085205078125, 1.5074462890625, 1.558807373046875, 1.61016845703125, 1.661529541015625, 1.712890625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 5.0, 5.0, 4.0, 8.0, 10.0, 12.0, 7.0, 14.0, 17.0, 17.0, 24.0, 22.0, 28.0, 38.0, 20.0, 29.0, 38.0, 44.0, 36.0, 39.0, 34.0, 43.0, 1071.0, 45.0, 39.0, 44.0, 29.0, 32.0, 35.0, 38.0, 32.0, 20.0, 24.0, 20.0, 16.0, 10.0, 17.0, 15.0, 10.0, 10.0, 7.0, 4.0, 6.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.0625, -7.78564453125, -7.5087890625, -7.23193359375, -6.955078125, -6.67822265625, -6.4013671875, -6.12451171875, -5.84765625, -5.57080078125, -5.2939453125, -5.01708984375, -4.740234375, -4.46337890625, -4.1865234375, -3.90966796875, -3.6328125, -3.35595703125, -3.0791015625, -2.80224609375, -2.525390625, -2.24853515625, -1.9716796875, -1.69482421875, -1.41796875, -1.14111328125, -0.8642578125, -0.58740234375, -0.310546875, -0.03369140625, 0.2431640625, 0.52001953125, 0.796875, 1.07373046875, 1.3505859375, 1.62744140625, 1.904296875, 2.18115234375, 2.4580078125, 2.73486328125, 3.01171875, 3.28857421875, 3.5654296875, 3.84228515625, 4.119140625, 4.39599609375, 4.6728515625, 4.94970703125, 5.2265625, 5.50341796875, 5.7802734375, 6.05712890625, 6.333984375, 6.61083984375, 6.8876953125, 7.16455078125, 7.44140625, 7.71826171875, 7.9951171875, 8.27197265625, 8.548828125, 8.82568359375, 9.1025390625, 9.37939453125, 9.65625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 9.0, 12.0, 14.0, 26.0, 41.0, 51.0, 85.0, 171.0, 246.0, 389.0, 612.0, 932.0, 1436.0, 2379.0, 3807.0, 6178.0, 9881.0, 16273.0, 26850.0, 47361.0, 88540.0, 170944.0, 1310818.0, 187683.0, 96220.0, 51404.0, 29115.0, 17288.0, 10674.0, 6416.0, 4214.0, 2703.0, 1580.0, 1011.0, 645.0, 429.0, 241.0, 156.0, 91.0, 79.0, 35.0, 37.0, 22.0, 14.0, 13.0, 7.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.98193359375, -0.9517822265625, -0.921630859375, -0.8914794921875, -0.861328125, -0.8311767578125, -0.801025390625, -0.7708740234375, -0.74072265625, -0.7105712890625, -0.680419921875, -0.6502685546875, -0.6201171875, -0.5899658203125, -0.559814453125, -0.5296630859375, -0.49951171875, -0.4693603515625, -0.439208984375, -0.4090576171875, -0.37890625, -0.3487548828125, -0.318603515625, -0.2884521484375, -0.25830078125, -0.2281494140625, -0.197998046875, -0.1678466796875, -0.1376953125, -0.1075439453125, -0.077392578125, -0.0472412109375, -0.01708984375, 0.0130615234375, 0.043212890625, 0.0733642578125, 0.103515625, 0.1336669921875, 0.163818359375, 0.1939697265625, 0.22412109375, 0.2542724609375, 0.284423828125, 0.3145751953125, 0.3447265625, 0.3748779296875, 0.405029296875, 0.4351806640625, 0.46533203125, 0.4954833984375, 0.525634765625, 0.5557861328125, 0.5859375, 0.6160888671875, 0.646240234375, 0.6763916015625, 0.70654296875, 0.7366943359375, 0.766845703125, 0.7969970703125, 0.8271484375, 0.8572998046875, 0.887451171875, 0.9176025390625, 0.94775390625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 5.0, 7.0, 12.0, 6.0, 17.0, 16.0, 14.0, 19.0, 30.0, 43.0, 57.0, 80.0, 139.0, 160.0, 131.0, 66.0, 49.0, 29.0, 24.0, 16.0, 14.0, 11.0, 16.0, 4.0, 5.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05169677734375, -0.05014657974243164, -0.04859638214111328, -0.04704618453979492, -0.04549598693847656, -0.0439457893371582, -0.042395591735839844, -0.040845394134521484, -0.039295196533203125, -0.037744998931884766, -0.036194801330566406, -0.03464460372924805, -0.03309440612792969, -0.03154420852661133, -0.02999401092529297, -0.02844381332397461, -0.02689361572265625, -0.02534341812133789, -0.02379322052001953, -0.022243022918701172, -0.020692825317382812, -0.019142627716064453, -0.017592430114746094, -0.016042232513427734, -0.014492034912109375, -0.012941837310791016, -0.011391639709472656, -0.009841442108154297, -0.008291244506835938, -0.006741046905517578, -0.005190849304199219, -0.0036406517028808594, -0.0020904541015625, -0.0005402565002441406, 0.0010099411010742188, 0.002560138702392578, 0.0041103363037109375, 0.005660533905029297, 0.007210731506347656, 0.008760929107666016, 0.010311126708984375, 0.011861324310302734, 0.013411521911621094, 0.014961719512939453, 0.016511917114257812, 0.018062114715576172, 0.01961231231689453, 0.02116250991821289, 0.02271270751953125, 0.02426290512084961, 0.02581310272216797, 0.027363300323486328, 0.028913497924804688, 0.030463695526123047, 0.032013893127441406, 0.033564090728759766, 0.035114288330078125, 0.036664485931396484, 0.038214683532714844, 0.0397648811340332, 0.04131507873535156, 0.04286527633666992, 0.04441547393798828, 0.04596567153930664, 0.047515869140625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 2.0, 6.0, 11.0, 18.0, 15.0, 33.0, 48.0, 61.0, 123.0, 227.0, 835.0, 11543.0, 984434.0, 48648.0, 1809.0, 313.0, 150.0, 84.0, 55.0, 30.0, 26.0, 21.0, 12.0, 8.0, 9.0, 7.0, 8.0, 2.0, 6.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.044921875, -1.0108642578125, -0.976806640625, -0.9427490234375, -0.90869140625, -0.8746337890625, -0.840576171875, -0.8065185546875, -0.7724609375, -0.7384033203125, -0.704345703125, -0.6702880859375, -0.63623046875, -0.6021728515625, -0.568115234375, -0.5340576171875, -0.5, -0.4659423828125, -0.431884765625, -0.3978271484375, -0.36376953125, -0.3297119140625, -0.295654296875, -0.2615966796875, -0.2275390625, -0.1934814453125, -0.159423828125, -0.1253662109375, -0.09130859375, -0.0572509765625, -0.023193359375, 0.0108642578125, 0.044921875, 0.0789794921875, 0.113037109375, 0.1470947265625, 0.18115234375, 0.2152099609375, 0.249267578125, 0.2833251953125, 0.3173828125, 0.3514404296875, 0.385498046875, 0.4195556640625, 0.45361328125, 0.4876708984375, 0.521728515625, 0.5557861328125, 0.58984375, 0.6239013671875, 0.657958984375, 0.6920166015625, 0.72607421875, 0.7601318359375, 0.794189453125, 0.8282470703125, 0.8623046875, 0.8963623046875, 0.930419921875, 0.9644775390625, 0.99853515625, 1.0325927734375, 1.066650390625, 1.1007080078125, 1.134765625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 10.0, 13.0, 42.0, 96.0, 476.0, 221.0, 89.0, 39.0, 16.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42249006032943726, -0.4096030294895172, -0.39671602845191956, -0.3838289976119995, -0.37094199657440186, -0.3580549657344818, -0.34516793489456177, -0.3322809338569641, -0.31939390301704407, -0.306506872177124, -0.29361987113952637, -0.2807328402996063, -0.26784583926200867, -0.2549588084220886, -0.24207179248332977, -0.22918477654457092, -0.21629776060581207, -0.20341074466705322, -0.19052372872829437, -0.17763671278953552, -0.16474968194961548, -0.15186266601085663, -0.13897565007209778, -0.12608861923217773, -0.11320161074399948, -0.10031459480524063, -0.08742757141590118, -0.07454055547714233, -0.061653535813093185, -0.04876651614904404, -0.03587950021028519, -0.02299247682094574, -0.01010546088218689, 0.0027815578505396843, 0.015668576583266258, 0.028555594384670258, 0.041442614048719406, 0.054329633712768555, 0.0672166496515274, 0.08010367304086685, 0.0929906889796257, 0.10587770491838455, 0.118764728307724, 0.13165174424648285, 0.1445387601852417, 0.15742579102516174, 0.1703127920627594, 0.18319982290267944, 0.1960868388414383, 0.20897385478019714, 0.221860870718956, 0.23474788665771484, 0.2476349174976349, 0.26052194833755493, 0.2734089493751526, 0.28629598021507263, 0.2991829812526703, 0.31207001209259033, 0.324957013130188, 0.33784404397010803, 0.3507310450077057, 0.36361807584762573, 0.3765050768852234, 0.38939210772514343, 0.4022791385650635]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 9.0, 5.0, 5.0, 6.0, 16.0, 7.0, 19.0, 15.0, 16.0, 24.0, 12.0, 27.0, 24.0, 30.0, 28.0, 31.0, 34.0, 44.0, 28.0, 38.0, 39.0, 37.0, 36.0, 45.0, 33.0, 36.0, 43.0, 34.0, 34.0, 43.0, 23.0, 20.0, 24.0, 21.0, 24.0, 11.0, 15.0, 8.0, 11.0, 12.0, 3.0, 9.0, 3.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.05724400281906128, -0.05544813722372055, -0.05365227162837982, -0.051856402307748795, -0.050060536712408066, -0.04826467111706734, -0.04646880179643631, -0.04467293620109558, -0.04287707060575485, -0.041081205010414124, -0.039285339415073395, -0.03748947009444237, -0.03569360449910164, -0.03389773890376091, -0.03210186958312988, -0.030306003987789154, -0.028510138392448425, -0.026714272797107697, -0.02491840533912182, -0.02312253788113594, -0.021326672285795212, -0.019530806690454483, -0.017734939232468605, -0.015939071774482727, -0.014143206179141998, -0.012347339652478695, -0.010551473125815392, -0.008755606599152088, -0.006959740072488785, -0.005163873545825481, -0.003368007019162178, -0.0015721404924988747, 0.0002237260341644287, 0.002019592560827732, 0.0038154590874910355, 0.005611325614154339, 0.007407192140817642, 0.009203058667480946, 0.010998925194144249, 0.012794791720807552, 0.014590658247470856, 0.016386523842811584, 0.018182391300797462, 0.01997825875878334, 0.02177412435412407, 0.023569989949464798, 0.025365857407450676, 0.027161724865436554, 0.028957590460777283, 0.03075345605611801, 0.03254932165145874, 0.03434519097208977, 0.036141056567430496, 0.037936922162771225, 0.03973279148340225, 0.04152865707874298, 0.04332452267408371, 0.04512038826942444, 0.04691625386476517, 0.048712123185396194, 0.05050798878073692, 0.05230385437607765, 0.05409972369670868, 0.05589558929204941, 0.05769145488739014]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 8.0, 10.0, 4.0, 12.0, 10.0, 12.0, 21.0, 19.0, 28.0, 33.0, 37.0, 41.0, 38.0, 43.0, 45.0, 46.0, 38.0, 44.0, 54.0, 58.0, 41.0, 45.0, 41.0, 36.0, 30.0, 31.0, 33.0, 32.0, 15.0, 16.0, 13.0, 18.0, 10.0, 11.0, 9.0, 5.0, 6.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.71875, -16.22802734375, -15.7373046875, -15.24658203125, -14.755859375, -14.26513671875, -13.7744140625, -13.28369140625, -12.79296875, -12.30224609375, -11.8115234375, -11.32080078125, -10.830078125, -10.33935546875, -9.8486328125, -9.35791015625, -8.8671875, -8.37646484375, -7.8857421875, -7.39501953125, -6.904296875, -6.41357421875, -5.9228515625, -5.43212890625, -4.94140625, -4.45068359375, -3.9599609375, -3.46923828125, -2.978515625, -2.48779296875, -1.9970703125, -1.50634765625, -1.015625, -0.52490234375, -0.0341796875, 0.45654296875, 0.947265625, 1.43798828125, 1.9287109375, 2.41943359375, 2.91015625, 3.40087890625, 3.8916015625, 4.38232421875, 4.873046875, 5.36376953125, 5.8544921875, 6.34521484375, 6.8359375, 7.32666015625, 7.8173828125, 8.30810546875, 8.798828125, 9.28955078125, 9.7802734375, 10.27099609375, 10.76171875, 11.25244140625, 11.7431640625, 12.23388671875, 12.724609375, 13.21533203125, 13.7060546875, 14.19677734375, 14.6875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 8.0, 12.0, 18.0, 20.0, 27.0, 41.0, 57.0, 77.0, 138.0, 199.0, 312.0, 524.0, 797.0, 1228.0, 1913.0, 3359.0, 7987.0, 29222.0, 172196.0, 646635.0, 142970.0, 25304.0, 7222.0, 3160.0, 1811.0, 1157.0, 749.0, 484.0, 314.0, 188.0, 147.0, 84.0, 62.0, 32.0, 35.0, 22.0, 16.0, 8.0, 7.0, 1.0, 3.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.484375, -11.1304931640625, -10.776611328125, -10.4227294921875, -10.06884765625, -9.7149658203125, -9.361083984375, -9.0072021484375, -8.6533203125, -8.2994384765625, -7.945556640625, -7.5916748046875, -7.23779296875, -6.8839111328125, -6.530029296875, -6.1761474609375, -5.822265625, -5.4683837890625, -5.114501953125, -4.7606201171875, -4.40673828125, -4.0528564453125, -3.698974609375, -3.3450927734375, -2.9912109375, -2.6373291015625, -2.283447265625, -1.9295654296875, -1.57568359375, -1.2218017578125, -0.867919921875, -0.5140380859375, -0.16015625, 0.1937255859375, 0.547607421875, 0.9014892578125, 1.25537109375, 1.6092529296875, 1.963134765625, 2.3170166015625, 2.6708984375, 3.0247802734375, 3.378662109375, 3.7325439453125, 4.08642578125, 4.4403076171875, 4.794189453125, 5.1480712890625, 5.501953125, 5.8558349609375, 6.209716796875, 6.5635986328125, 6.91748046875, 7.2713623046875, 7.625244140625, 7.9791259765625, 8.3330078125, 8.6868896484375, 9.040771484375, 9.3946533203125, 9.74853515625, 10.1024169921875, 10.456298828125, 10.8101806640625, 11.1640625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 4.0, 9.0, 7.0, 13.0, 9.0, 12.0, 21.0, 18.0, 28.0, 22.0, 40.0, 30.0, 38.0, 37.0, 33.0, 45.0, 59.0, 83.0, 1756.0, 268.0, 75.0, 43.0, 39.0, 40.0, 49.0, 38.0, 29.0, 27.0, 25.0, 20.0, 20.0, 19.0, 12.0, 16.0, 11.0, 13.0, 8.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.375, -33.1806640625, -31.986328125, -30.7919921875, -29.59765625, -28.4033203125, -27.208984375, -26.0146484375, -24.8203125, -23.6259765625, -22.431640625, -21.2373046875, -20.04296875, -18.8486328125, -17.654296875, -16.4599609375, -15.265625, -14.0712890625, -12.876953125, -11.6826171875, -10.48828125, -9.2939453125, -8.099609375, -6.9052734375, -5.7109375, -4.5166015625, -3.322265625, -2.1279296875, -0.93359375, 0.2607421875, 1.455078125, 2.6494140625, 3.84375, 5.0380859375, 6.232421875, 7.4267578125, 8.62109375, 9.8154296875, 11.009765625, 12.2041015625, 13.3984375, 14.5927734375, 15.787109375, 16.9814453125, 18.17578125, 19.3701171875, 20.564453125, 21.7587890625, 22.953125, 24.1474609375, 25.341796875, 26.5361328125, 27.73046875, 28.9248046875, 30.119140625, 31.3134765625, 32.5078125, 33.7021484375, 34.896484375, 36.0908203125, 37.28515625, 38.4794921875, 39.673828125, 40.8681640625, 42.0625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 6.0, 6.0, 12.0, 19.0, 22.0, 27.0, 34.0, 42.0, 60.0, 79.0, 87.0, 124.0, 157.0, 223.0, 327.0, 864.0, 9252.0, 3121293.0, 10928.0, 885.0, 320.0, 218.0, 149.0, 140.0, 87.0, 82.0, 57.0, 48.0, 36.0, 22.0, 21.0, 14.0, 10.0, 15.0, 9.0, 11.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-98.3125, -95.3798828125, -92.447265625, -89.5146484375, -86.58203125, -83.6494140625, -80.716796875, -77.7841796875, -74.8515625, -71.9189453125, -68.986328125, -66.0537109375, -63.12109375, -60.1884765625, -57.255859375, -54.3232421875, -51.390625, -48.4580078125, -45.525390625, -42.5927734375, -39.66015625, -36.7275390625, -33.794921875, -30.8623046875, -27.9296875, -24.9970703125, -22.064453125, -19.1318359375, -16.19921875, -13.2666015625, -10.333984375, -7.4013671875, -4.46875, -1.5361328125, 1.396484375, 4.3291015625, 7.26171875, 10.1943359375, 13.126953125, 16.0595703125, 18.9921875, 21.9248046875, 24.857421875, 27.7900390625, 30.72265625, 33.6552734375, 36.587890625, 39.5205078125, 42.453125, 45.3857421875, 48.318359375, 51.2509765625, 54.18359375, 57.1162109375, 60.048828125, 62.9814453125, 65.9140625, 68.8466796875, 71.779296875, 74.7119140625, 77.64453125, 80.5771484375, 83.509765625, 86.4423828125, 89.375]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 23.0, 134.0, 426.0, 329.0, 89.0, 12.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.34568214416504, -17.37533950805664, -14.404998779296875, -11.434657096862793, -8.464315414428711, -5.493973731994629, -2.523632049560547, 0.44671058654785156, 3.417051315307617, 6.387392997741699, 9.357734680175781, 12.328076362609863, 15.298418045043945, 18.268760681152344, 21.23910140991211, 24.209444046020508, 27.179784774780273, 30.150127410888672, 33.12046813964844, 36.0908088684082, 39.06114959716797, 42.031494140625, 45.001834869384766, 47.97217559814453, 50.94252014160156, 53.91286087036133, 56.883201599121094, 59.853546142578125, 62.82388687133789, 65.79422760009766, 68.76457214355469, 71.73490905761719, 74.70524597167969, 77.67559051513672, 80.64592742919922, 83.61627197265625, 86.58660888671875, 89.55695343017578, 92.52729797363281, 95.49763488769531, 98.46797943115234, 101.43832397460938, 104.40866088867188, 107.3790054321289, 110.34934997558594, 113.31968688964844, 116.29003143310547, 119.2603759765625, 122.230712890625, 125.20105743408203, 128.17140197753906, 131.14173889160156, 134.11207580566406, 137.08242797851562, 140.05276489257812, 143.02310180664062, 145.99343872070312, 148.96377563476562, 151.9341278076172, 154.9044647216797, 157.8748016357422, 160.84515380859375, 163.81549072265625, 166.78582763671875, 169.7561798095703]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 7.0, 5.0, 5.0, 11.0, 7.0, 6.0, 14.0, 15.0, 16.0, 17.0, 35.0, 20.0, 38.0, 22.0, 38.0, 32.0, 42.0, 41.0, 34.0, 50.0, 49.0, 37.0, 56.0, 33.0, 36.0, 44.0, 29.0, 28.0, 35.0, 30.0, 31.0, 26.0, 22.0, 21.0, 12.0, 11.0, 8.0, 7.0, 7.0, 9.0, 8.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-108.66925811767578, -105.16291809082031, -101.65657043457031, -98.15023040771484, -94.64389038085938, -91.13754272460938, -87.6312026977539, -84.12486267089844, -80.61851501464844, -77.11217498779297, -73.60582733154297, -70.0994873046875, -66.59314727783203, -63.0868034362793, -59.58045959472656, -56.074119567871094, -52.567779541015625, -49.06143569946289, -45.55509567260742, -42.04875183105469, -38.54241180419922, -35.036067962646484, -31.52972412109375, -28.02338218688965, -24.517040252685547, -21.010698318481445, -17.504356384277344, -13.99801254272461, -10.491670608520508, -6.985328674316406, -3.478984832763672, 0.027357101440429688, 3.53369140625, 7.04003381729126, 10.54637622833252, 14.052719116210938, 17.55906105041504, 21.06540298461914, 24.571746826171875, 28.078088760375977, 31.584430694580078, 35.09077453613281, 38.59711456298828, 42.103458404541016, 45.60980224609375, 49.11614227294922, 52.62248611450195, 56.12882995605469, 59.635169982910156, 63.14151382446289, 66.64785766601562, 70.1541976928711, 73.66053771972656, 77.16688537597656, 80.67322540283203, 84.1795654296875, 87.6859130859375, 91.19225311279297, 94.69860076904297, 98.20494079589844, 101.7112808227539, 105.21762084960938, 108.72396850585938, 112.23030853271484, 115.73664855957031]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 7.0, 8.0, 4.0, 11.0, 11.0, 12.0, 19.0, 18.0, 30.0, 21.0, 40.0, 36.0, 33.0, 49.0, 45.0, 44.0, 45.0, 45.0, 49.0, 58.0, 39.0, 41.0, 44.0, 41.0, 33.0, 39.0, 28.0, 28.0, 20.0, 17.0, 14.0, 10.0, 18.0, 7.0, 14.0, 6.0, 5.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.03125, -16.536376953125, -16.04150390625, -15.546630859375, -15.0517578125, -14.556884765625, -14.06201171875, -13.567138671875, -13.072265625, -12.577392578125, -12.08251953125, -11.587646484375, -11.0927734375, -10.597900390625, -10.10302734375, -9.608154296875, -9.11328125, -8.618408203125, -8.12353515625, -7.628662109375, -7.1337890625, -6.638916015625, -6.14404296875, -5.649169921875, -5.154296875, -4.659423828125, -4.16455078125, -3.669677734375, -3.1748046875, -2.679931640625, -2.18505859375, -1.690185546875, -1.1953125, -0.700439453125, -0.20556640625, 0.289306640625, 0.7841796875, 1.279052734375, 1.77392578125, 2.268798828125, 2.763671875, 3.258544921875, 3.75341796875, 4.248291015625, 4.7431640625, 5.238037109375, 5.73291015625, 6.227783203125, 6.72265625, 7.217529296875, 7.71240234375, 8.207275390625, 8.7021484375, 9.197021484375, 9.69189453125, 10.186767578125, 10.681640625, 11.176513671875, 11.67138671875, 12.166259765625, 12.6611328125, 13.156005859375, 13.65087890625, 14.145751953125, 14.640625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 11.0, 20.0, 23.0, 26.0, 32.0, 55.0, 74.0, 92.0, 134.0, 243.0, 332.0, 554.0, 1051.0, 2062.0, 4452.0, 10937.0, 111921.0, 3753620.0, 282946.0, 14641.0, 5390.0, 2503.0, 1255.0, 683.0, 411.0, 256.0, 166.0, 123.0, 69.0, 52.0, 45.0, 32.0, 24.0, 16.0, 8.0, 13.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-64.375, -62.56689453125, -60.7587890625, -58.95068359375, -57.142578125, -55.33447265625, -53.5263671875, -51.71826171875, -49.91015625, -48.10205078125, -46.2939453125, -44.48583984375, -42.677734375, -40.86962890625, -39.0615234375, -37.25341796875, -35.4453125, -33.63720703125, -31.8291015625, -30.02099609375, -28.212890625, -26.40478515625, -24.5966796875, -22.78857421875, -20.98046875, -19.17236328125, -17.3642578125, -15.55615234375, -13.748046875, -11.93994140625, -10.1318359375, -8.32373046875, -6.515625, -4.70751953125, -2.8994140625, -1.09130859375, 0.716796875, 2.52490234375, 4.3330078125, 6.14111328125, 7.94921875, 9.75732421875, 11.5654296875, 13.37353515625, 15.181640625, 16.98974609375, 18.7978515625, 20.60595703125, 22.4140625, 24.22216796875, 26.0302734375, 27.83837890625, 29.646484375, 31.45458984375, 33.2626953125, 35.07080078125, 36.87890625, 38.68701171875, 40.4951171875, 42.30322265625, 44.111328125, 45.91943359375, 47.7275390625, 49.53564453125, 51.34375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 3.0, 3.0, 4.0, 7.0, 7.0, 2.0, 15.0, 14.0, 15.0, 15.0, 21.0, 27.0, 51.0, 92.0, 157.0, 367.0, 581.0, 893.0, 733.0, 465.0, 243.0, 102.0, 70.0, 39.0, 42.0, 20.0, 12.0, 14.0, 6.0, 9.0, 3.0, 7.0, 6.0, 5.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.21875, -28.267333984375, -27.31591796875, -26.364501953125, -25.4130859375, -24.461669921875, -23.51025390625, -22.558837890625, -21.607421875, -20.656005859375, -19.70458984375, -18.753173828125, -17.8017578125, -16.850341796875, -15.89892578125, -14.947509765625, -13.99609375, -13.044677734375, -12.09326171875, -11.141845703125, -10.1904296875, -9.239013671875, -8.28759765625, -7.336181640625, -6.384765625, -5.433349609375, -4.48193359375, -3.530517578125, -2.5791015625, -1.627685546875, -0.67626953125, 0.275146484375, 1.2265625, 2.177978515625, 3.12939453125, 4.080810546875, 5.0322265625, 5.983642578125, 6.93505859375, 7.886474609375, 8.837890625, 9.789306640625, 10.74072265625, 11.692138671875, 12.6435546875, 13.594970703125, 14.54638671875, 15.497802734375, 16.44921875, 17.400634765625, 18.35205078125, 19.303466796875, 20.2548828125, 21.206298828125, 22.15771484375, 23.109130859375, 24.060546875, 25.011962890625, 25.96337890625, 26.914794921875, 27.8662109375, 28.817626953125, 29.76904296875, 30.720458984375, 31.671875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 6.0, 6.0, 6.0, 1.0, 9.0, 9.0, 14.0, 8.0, 21.0, 27.0, 44.0, 86.0, 143.0, 251.0, 543.0, 1259.0, 2961.0, 8229.0, 26313.0, 285671.0, 3774374.0, 70076.0, 15186.0, 5221.0, 2041.0, 837.0, 415.0, 198.0, 102.0, 62.0, 44.0, 28.0, 22.0, 15.0, 14.0, 10.0, 2.0, 4.0, 8.0, 8.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.625, -79.1728515625, -76.720703125, -74.2685546875, -71.81640625, -69.3642578125, -66.912109375, -64.4599609375, -62.0078125, -59.5556640625, -57.103515625, -54.6513671875, -52.19921875, -49.7470703125, -47.294921875, -44.8427734375, -42.390625, -39.9384765625, -37.486328125, -35.0341796875, -32.58203125, -30.1298828125, -27.677734375, -25.2255859375, -22.7734375, -20.3212890625, -17.869140625, -15.4169921875, -12.96484375, -10.5126953125, -8.060546875, -5.6083984375, -3.15625, -0.7041015625, 1.748046875, 4.2001953125, 6.65234375, 9.1044921875, 11.556640625, 14.0087890625, 16.4609375, 18.9130859375, 21.365234375, 23.8173828125, 26.26953125, 28.7216796875, 31.173828125, 33.6259765625, 36.078125, 38.5302734375, 40.982421875, 43.4345703125, 45.88671875, 48.3388671875, 50.791015625, 53.2431640625, 55.6953125, 58.1474609375, 60.599609375, 63.0517578125, 65.50390625, 67.9560546875, 70.408203125, 72.8603515625, 75.3125]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 8.0, 7.0, 21.0, 36.0, 60.0, 147.0, 274.0, 238.0, 100.0, 46.0, 30.0, 19.0, 11.0, 9.0, 3.0, 1.0, 2.0], "bins": [-413.81341552734375, -406.13128662109375, -398.44915771484375, -390.76702880859375, -383.08489990234375, -375.40277099609375, -367.72064208984375, -360.03851318359375, -352.35638427734375, -344.67425537109375, -336.99212646484375, -329.30999755859375, -321.62786865234375, -313.94573974609375, -306.26361083984375, -298.58148193359375, -290.8993835449219, -283.2172546386719, -275.5351257324219, -267.8529968261719, -260.1708679199219, -252.48873901367188, -244.80661010742188, -237.12449645996094, -229.44235229492188, -221.76022338867188, -214.07809448242188, -206.39596557617188, -198.71383666992188, -191.03170776367188, -183.34957885742188, -175.66746520996094, -167.98533630371094, -160.30320739746094, -152.62107849121094, -144.93894958496094, -137.25682067871094, -129.57470703125, -121.89257049560547, -114.21044921875, -106.5283203125, -98.84619140625, -91.1640625, -83.48193359375, -75.79981231689453, -68.11768341064453, -60.43555450439453, -52.7534294128418, -45.07129669189453, -37.38916778564453, -29.707042694091797, -22.024913787841797, -14.34278678894043, -6.6606597900390625, 1.0214691162109375, 8.703594207763672, 16.385723114013672, 24.06785011291504, 31.749977111816406, 39.432106018066406, 47.114234924316406, 54.79636001586914, 62.47848892211914, 70.16061401367188, 77.84274291992188]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 5.0, 13.0, 7.0, 7.0, 11.0, 6.0, 6.0, 19.0, 19.0, 21.0, 28.0, 23.0, 30.0, 33.0, 37.0, 39.0, 41.0, 40.0, 47.0, 34.0, 43.0, 36.0, 38.0, 30.0, 34.0, 31.0, 34.0, 29.0, 39.0, 26.0, 21.0, 20.0, 19.0, 25.0, 17.0, 22.0, 10.0, 10.0, 7.0, 5.0, 11.0, 7.0, 4.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-72.63909912109375, -70.26516723632812, -67.8912353515625, -65.51730346679688, -63.143367767333984, -60.76943588256836, -58.39550018310547, -56.021568298339844, -53.64763641357422, -51.273704528808594, -48.89977264404297, -46.52583694458008, -44.15190505981445, -41.77797317504883, -39.40403747558594, -37.03010559082031, -34.65617370605469, -32.28224182128906, -29.908308029174805, -27.534374237060547, -25.160442352294922, -22.786510467529297, -20.41257667541504, -18.03864288330078, -15.664710998535156, -13.290778160095215, -10.916845321655273, -8.542912483215332, -6.168979644775391, -3.795046806335449, -1.4211139678955078, 0.95281982421875, 3.326751708984375, 5.700684547424316, 8.074617385864258, 10.4485502243042, 12.82248306274414, 15.196415901184082, 17.570348739624023, 19.94428253173828, 22.318214416503906, 24.69214630126953, 27.06608009338379, 29.440013885498047, 31.813945770263672, 34.1878776550293, 36.56181335449219, 38.93574523925781, 41.30967712402344, 43.68360900878906, 46.05754089355469, 48.43147659301758, 50.8054084777832, 53.17934036254883, 55.55327606201172, 57.927207946777344, 60.30113983154297, 62.675071716308594, 65.04900360107422, 67.42293548583984, 69.796875, 72.17080688476562, 74.54473876953125, 76.91867065429688, 79.2926025390625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 6.0, 5.0, 8.0, 12.0, 7.0, 15.0, 21.0, 28.0, 32.0, 33.0, 33.0, 32.0, 36.0, 48.0, 38.0, 48.0, 46.0, 41.0, 41.0, 47.0, 39.0, 52.0, 45.0, 46.0, 29.0, 28.0, 35.0, 22.0, 19.0, 22.0, 16.0, 22.0, 15.0, 7.0, 7.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-17.265625, -16.776123046875, -16.28662109375, -15.797119140625, -15.3076171875, -14.818115234375, -14.32861328125, -13.839111328125, -13.349609375, -12.860107421875, -12.37060546875, -11.881103515625, -11.3916015625, -10.902099609375, -10.41259765625, -9.923095703125, -9.43359375, -8.944091796875, -8.45458984375, -7.965087890625, -7.4755859375, -6.986083984375, -6.49658203125, -6.007080078125, -5.517578125, -5.028076171875, -4.53857421875, -4.049072265625, -3.5595703125, -3.070068359375, -2.58056640625, -2.091064453125, -1.6015625, -1.112060546875, -0.62255859375, -0.133056640625, 0.3564453125, 0.845947265625, 1.33544921875, 1.824951171875, 2.314453125, 2.803955078125, 3.29345703125, 3.782958984375, 4.2724609375, 4.761962890625, 5.25146484375, 5.740966796875, 6.23046875, 6.719970703125, 7.20947265625, 7.698974609375, 8.1884765625, 8.677978515625, 9.16748046875, 9.656982421875, 10.146484375, 10.635986328125, 11.12548828125, 11.614990234375, 12.1044921875, 12.593994140625, 13.08349609375, 13.572998046875, 14.0625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 8.0, 5.0, 11.0, 15.0, 29.0, 20.0, 34.0, 55.0, 84.0, 115.0, 212.0, 363.0, 599.0, 1031.0, 1705.0, 2989.0, 5123.0, 8803.0, 15294.0, 26289.0, 46211.0, 85184.0, 165906.0, 268557.0, 194419.0, 99739.0, 53834.0, 30074.0, 17503.0, 10105.0, 5849.0, 3417.0, 2015.0, 1198.0, 673.0, 424.0, 255.0, 162.0, 90.0, 57.0, 39.0, 19.0, 16.0, 11.0, 7.0, 3.0, 5.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5732421875, -1.518280029296875, -1.46331787109375, -1.408355712890625, -1.3533935546875, -1.298431396484375, -1.24346923828125, -1.188507080078125, -1.133544921875, -1.078582763671875, -1.02362060546875, -0.968658447265625, -0.9136962890625, -0.858734130859375, -0.80377197265625, -0.748809814453125, -0.69384765625, -0.638885498046875, -0.58392333984375, -0.528961181640625, -0.4739990234375, -0.419036865234375, -0.36407470703125, -0.309112548828125, -0.254150390625, -0.199188232421875, -0.14422607421875, -0.089263916015625, -0.0343017578125, 0.020660400390625, 0.07562255859375, 0.130584716796875, 0.185546875, 0.240509033203125, 0.29547119140625, 0.350433349609375, 0.4053955078125, 0.460357666015625, 0.51531982421875, 0.570281982421875, 0.625244140625, 0.680206298828125, 0.73516845703125, 0.790130615234375, 0.8450927734375, 0.900054931640625, 0.95501708984375, 1.009979248046875, 1.06494140625, 1.119903564453125, 1.17486572265625, 1.229827880859375, 1.2847900390625, 1.339752197265625, 1.39471435546875, 1.449676513671875, 1.504638671875, 1.559600830078125, 1.61456298828125, 1.669525146484375, 1.7244873046875, 1.779449462890625, 1.83441162109375, 1.889373779296875, 1.9443359375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 5.0, 8.0, 3.0, 7.0, 11.0, 4.0, 8.0, 9.0, 11.0, 13.0, 23.0, 17.0, 20.0, 23.0, 34.0, 43.0, 30.0, 26.0, 30.0, 32.0, 28.0, 42.0, 41.0, 1056.0, 36.0, 32.0, 30.0, 36.0, 35.0, 26.0, 40.0, 22.0, 32.0, 23.0, 23.0, 29.0, 23.0, 12.0, 22.0, 18.0, 13.0, 7.0, 10.0, 6.0, 10.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 3.0], "bins": [-8.75, -8.50531005859375, -8.2606201171875, -8.01593017578125, -7.771240234375, -7.52655029296875, -7.2818603515625, -7.03717041015625, -6.79248046875, -6.54779052734375, -6.3031005859375, -6.05841064453125, -5.813720703125, -5.56903076171875, -5.3243408203125, -5.07965087890625, -4.8349609375, -4.59027099609375, -4.3455810546875, -4.10089111328125, -3.856201171875, -3.61151123046875, -3.3668212890625, -3.12213134765625, -2.87744140625, -2.63275146484375, -2.3880615234375, -2.14337158203125, -1.898681640625, -1.65399169921875, -1.4093017578125, -1.16461181640625, -0.919921875, -0.67523193359375, -0.4305419921875, -0.18585205078125, 0.058837890625, 0.30352783203125, 0.5482177734375, 0.79290771484375, 1.03759765625, 1.28228759765625, 1.5269775390625, 1.77166748046875, 2.016357421875, 2.26104736328125, 2.5057373046875, 2.75042724609375, 2.9951171875, 3.23980712890625, 3.4844970703125, 3.72918701171875, 3.973876953125, 4.21856689453125, 4.4632568359375, 4.70794677734375, 4.95263671875, 5.19732666015625, 5.4420166015625, 5.68670654296875, 5.931396484375, 6.17608642578125, 6.4207763671875, 6.66546630859375, 6.91015625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 13.0, 17.0, 29.0, 32.0, 67.0, 100.0, 148.0, 239.0, 378.0, 567.0, 851.0, 1315.0, 1965.0, 3017.0, 4505.0, 6672.0, 10281.0, 15328.0, 24063.0, 38290.0, 63832.0, 108523.0, 182786.0, 1256414.0, 148022.0, 87460.0, 51897.0, 31899.0, 20022.0, 12958.0, 8563.0, 5598.0, 3839.0, 2485.0, 1710.0, 1146.0, 721.0, 464.0, 322.0, 221.0, 118.0, 81.0, 64.0, 39.0, 20.0, 15.0, 8.0, 9.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.83154296875, -0.8065719604492188, -0.7816009521484375, -0.7566299438476562, -0.731658935546875, -0.7066879272460938, -0.6817169189453125, -0.6567459106445312, -0.63177490234375, -0.6068038940429688, -0.5818328857421875, -0.5568618774414062, -0.531890869140625, -0.5069198608398438, -0.4819488525390625, -0.45697784423828125, -0.4320068359375, -0.40703582763671875, -0.3820648193359375, -0.35709381103515625, -0.332122802734375, -0.30715179443359375, -0.2821807861328125, -0.25720977783203125, -0.23223876953125, -0.20726776123046875, -0.1822967529296875, -0.15732574462890625, -0.132354736328125, -0.10738372802734375, -0.0824127197265625, -0.05744171142578125, -0.032470703125, -0.00749969482421875, 0.0174713134765625, 0.04244232177734375, 0.067413330078125, 0.09238433837890625, 0.1173553466796875, 0.14232635498046875, 0.16729736328125, 0.19226837158203125, 0.2172393798828125, 0.24221038818359375, 0.267181396484375, 0.29215240478515625, 0.3171234130859375, 0.34209442138671875, 0.3670654296875, 0.39203643798828125, 0.4170074462890625, 0.44197845458984375, 0.466949462890625, 0.49192047119140625, 0.5168914794921875, 0.5418624877929688, 0.56683349609375, 0.5918045043945312, 0.6167755126953125, 0.6417465209960938, 0.666717529296875, 0.6916885375976562, 0.7166595458984375, 0.7416305541992188, 0.7666015625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 3.0, 1.0, 6.0, 10.0, 14.0, 9.0, 22.0, 14.0, 29.0, 31.0, 46.0, 53.0, 86.0, 135.0, 152.0, 117.0, 67.0, 41.0, 38.0, 32.0, 19.0, 14.0, 10.0, 9.0, 11.0, 10.0, 7.0, 5.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0419921875, -0.04059648513793945, -0.039200782775878906, -0.03780508041381836, -0.03640937805175781, -0.035013675689697266, -0.03361797332763672, -0.03222227096557617, -0.030826568603515625, -0.029430866241455078, -0.02803516387939453, -0.026639461517333984, -0.025243759155273438, -0.02384805679321289, -0.022452354431152344, -0.021056652069091797, -0.01966094970703125, -0.018265247344970703, -0.016869544982910156, -0.01547384262084961, -0.014078140258789062, -0.012682437896728516, -0.011286735534667969, -0.009891033172607422, -0.008495330810546875, -0.007099628448486328, -0.005703926086425781, -0.004308223724365234, -0.0029125213623046875, -0.0015168190002441406, -0.00012111663818359375, 0.0012745857238769531, 0.0026702880859375, 0.004065990447998047, 0.005461692810058594, 0.006857395172119141, 0.008253097534179688, 0.009648799896240234, 0.011044502258300781, 0.012440204620361328, 0.013835906982421875, 0.015231609344482422, 0.01662731170654297, 0.018023014068603516, 0.019418716430664062, 0.02081441879272461, 0.022210121154785156, 0.023605823516845703, 0.02500152587890625, 0.026397228240966797, 0.027792930603027344, 0.02918863296508789, 0.030584335327148438, 0.031980037689208984, 0.03337574005126953, 0.03477144241333008, 0.036167144775390625, 0.03756284713745117, 0.03895854949951172, 0.040354251861572266, 0.04174995422363281, 0.04314565658569336, 0.044541358947753906, 0.04593706130981445, 0.047332763671875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 10.0, 8.0, 7.0, 7.0, 17.0, 18.0, 20.0, 19.0, 47.0, 67.0, 117.0, 284.0, 1967.0, 785502.0, 258488.0, 1393.0, 280.0, 103.0, 59.0, 39.0, 26.0, 24.0, 13.0, 15.0, 11.0, 7.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1171875, -1.0842742919921875, -1.051361083984375, -1.0184478759765625, -0.98553466796875, -0.9526214599609375, -0.919708251953125, -0.8867950439453125, -0.8538818359375, -0.8209686279296875, -0.788055419921875, -0.7551422119140625, -0.72222900390625, -0.6893157958984375, -0.656402587890625, -0.6234893798828125, -0.590576171875, -0.5576629638671875, -0.524749755859375, -0.4918365478515625, -0.45892333984375, -0.4260101318359375, -0.393096923828125, -0.3601837158203125, -0.3272705078125, -0.2943572998046875, -0.261444091796875, -0.2285308837890625, -0.19561767578125, -0.1627044677734375, -0.129791259765625, -0.0968780517578125, -0.06396484375, -0.0310516357421875, 0.001861572265625, 0.0347747802734375, 0.06768798828125, 0.1006011962890625, 0.133514404296875, 0.1664276123046875, 0.1993408203125, 0.2322540283203125, 0.265167236328125, 0.2980804443359375, 0.33099365234375, 0.3639068603515625, 0.396820068359375, 0.4297332763671875, 0.462646484375, 0.4955596923828125, 0.528472900390625, 0.5613861083984375, 0.59429931640625, 0.6272125244140625, 0.660125732421875, 0.6930389404296875, 0.7259521484375, 0.7588653564453125, 0.791778564453125, 0.8246917724609375, 0.85760498046875, 0.8905181884765625, 0.923431396484375, 0.9563446044921875, 0.9892578125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 13.0, 41.0, 70.0, 196.0, 383.0, 168.0, 63.0, 25.0, 23.0, 8.0, 2.0, 9.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07136602699756622, -0.0644640251994133, -0.05756201595067978, -0.050660014152526855, -0.04375800862908363, -0.03685600310564041, -0.029954001307487488, -0.023051995784044266, -0.016149990260601044, -0.009247985668480396, -0.002345981076359749, 0.004556022584438324, 0.011458028107881546, 0.018360033631324768, 0.02526203542947769, 0.032164040952920914, 0.039066046476364136, 0.04596805199980736, 0.05287005752325058, 0.0597720593214035, 0.06667406857013702, 0.07357607036828995, 0.08047807216644287, 0.08738008141517639, 0.09428208321332932, 0.10118408501148224, 0.10808609426021576, 0.11498809605836868, 0.1218900978565216, 0.12879210710525513, 0.13569411635398865, 0.14259611070156097, 0.1494981050491333, 0.15640011429786682, 0.16330210864543915, 0.17020411789417267, 0.1771061271429062, 0.18400812149047852, 0.19091013073921204, 0.19781213998794556, 0.20471414923667908, 0.2116161584854126, 0.21851815283298492, 0.22542016208171844, 0.23232217133045197, 0.2392241656780243, 0.2461261749267578, 0.25302818417549133, 0.25993019342422485, 0.2668322026729584, 0.2737342119216919, 0.280636191368103, 0.28753820061683655, 0.29444020986557007, 0.3013422191143036, 0.3082442283630371, 0.31514620780944824, 0.32204821705818176, 0.3289502263069153, 0.3358522057533264, 0.34275421500205994, 0.34965622425079346, 0.356558233499527, 0.3634602427482605, 0.370362251996994]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 6.0, 6.0, 10.0, 13.0, 25.0, 16.0, 23.0, 33.0, 19.0, 27.0, 23.0, 26.0, 50.0, 36.0, 29.0, 52.0, 37.0, 52.0, 32.0, 48.0, 49.0, 34.0, 46.0, 47.0, 31.0, 39.0, 35.0, 23.0, 26.0, 29.0, 26.0, 11.0, 7.0, 10.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06251299381256104, -0.060667648911476135, -0.05882230028510094, -0.05697695165872574, -0.05513160675764084, -0.05328626185655594, -0.05144091323018074, -0.04959556460380554, -0.04775021970272064, -0.04590487480163574, -0.044059526175260544, -0.042214177548885345, -0.040368832647800446, -0.038523487746715546, -0.03667813912034035, -0.03483279049396515, -0.03298744559288025, -0.0311420988291502, -0.02929675206542015, -0.0274514053016901, -0.025606058537960052, -0.023760711774230003, -0.021915365010499954, -0.020070018246769905, -0.018224671483039856, -0.016379324719309807, -0.014533977955579758, -0.012688631191849709, -0.01084328442811966, -0.00899793766438961, -0.007152590900659561, -0.005307244136929512, -0.003461897373199463, -0.0016165506094694138, 0.00022879615426063538, 0.0020741429179906845, 0.003919489681720734, 0.005764836445450783, 0.007610183209180832, 0.009455529972910881, 0.01130087673664093, 0.01314622350037098, 0.014991570264101028, 0.016836917027831078, 0.018682263791561127, 0.020527610555291176, 0.022372957319021225, 0.024218304082751274, 0.026063650846481323, 0.027908997610211372, 0.02975434437394142, 0.03159969300031662, 0.03344503790140152, 0.03529038280248642, 0.03713573142886162, 0.038981080055236816, 0.040826424956321716, 0.042671769857406616, 0.044517118483781815, 0.04636246711015701, 0.04820781201124191, 0.05005315691232681, 0.05189850553870201, 0.05374385416507721, 0.05558919906616211]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 7.0, 6.0, 5.0, 8.0, 12.0, 7.0, 16.0, 19.0, 29.0, 32.0, 33.0, 33.0, 32.0, 36.0, 48.0, 38.0, 48.0, 46.0, 40.0, 42.0, 47.0, 39.0, 53.0, 44.0, 46.0, 29.0, 28.0, 34.0, 23.0, 20.0, 21.0, 16.0, 22.0, 15.0, 7.0, 7.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-17.265625, -16.776123046875, -16.28662109375, -15.797119140625, -15.3076171875, -14.818115234375, -14.32861328125, -13.839111328125, -13.349609375, -12.860107421875, -12.37060546875, -11.881103515625, -11.3916015625, -10.902099609375, -10.41259765625, -9.923095703125, -9.43359375, -8.944091796875, -8.45458984375, -7.965087890625, -7.4755859375, -6.986083984375, -6.49658203125, -6.007080078125, -5.517578125, -5.028076171875, -4.53857421875, -4.049072265625, -3.5595703125, -3.070068359375, -2.58056640625, -2.091064453125, -1.6015625, -1.112060546875, -0.62255859375, -0.133056640625, 0.3564453125, 0.845947265625, 1.33544921875, 1.824951171875, 2.314453125, 2.803955078125, 3.29345703125, 3.782958984375, 4.2724609375, 4.761962890625, 5.25146484375, 5.740966796875, 6.23046875, 6.719970703125, 7.20947265625, 7.698974609375, 8.1884765625, 8.677978515625, 9.16748046875, 9.656982421875, 10.146484375, 10.635986328125, 11.12548828125, 11.614990234375, 12.1044921875, 12.593994140625, 13.08349609375, 13.572998046875, 14.0625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 8.0, 6.0, 10.0, 14.0, 11.0, 18.0, 32.0, 47.0, 65.0, 78.0, 124.0, 159.0, 309.0, 567.0, 1421.0, 4979.0, 24291.0, 222755.0, 709317.0, 68524.0, 11145.0, 2647.0, 915.0, 422.0, 212.0, 145.0, 100.0, 52.0, 40.0, 33.0, 25.0, 27.0, 18.0, 9.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-16.078125, -15.6221923828125, -15.166259765625, -14.7103271484375, -14.25439453125, -13.7984619140625, -13.342529296875, -12.8865966796875, -12.4306640625, -11.9747314453125, -11.518798828125, -11.0628662109375, -10.60693359375, -10.1510009765625, -9.695068359375, -9.2391357421875, -8.783203125, -8.3272705078125, -7.871337890625, -7.4154052734375, -6.95947265625, -6.5035400390625, -6.047607421875, -5.5916748046875, -5.1357421875, -4.6798095703125, -4.223876953125, -3.7679443359375, -3.31201171875, -2.8560791015625, -2.400146484375, -1.9442138671875, -1.48828125, -1.0323486328125, -0.576416015625, -0.1204833984375, 0.33544921875, 0.7913818359375, 1.247314453125, 1.7032470703125, 2.1591796875, 2.6151123046875, 3.071044921875, 3.5269775390625, 3.98291015625, 4.4388427734375, 4.894775390625, 5.3507080078125, 5.806640625, 6.2625732421875, 6.718505859375, 7.1744384765625, 7.63037109375, 8.0863037109375, 8.542236328125, 8.9981689453125, 9.4541015625, 9.9100341796875, 10.365966796875, 10.8218994140625, 11.27783203125, 11.7337646484375, 12.189697265625, 12.6456298828125, 13.1015625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 8.0, 3.0, 12.0, 12.0, 16.0, 12.0, 10.0, 18.0, 30.0, 23.0, 29.0, 26.0, 31.0, 27.0, 36.0, 41.0, 33.0, 41.0, 50.0, 192.0, 1886.0, 81.0, 34.0, 43.0, 46.0, 28.0, 32.0, 40.0, 28.0, 19.0, 18.0, 20.0, 13.0, 19.0, 16.0, 13.0, 13.0, 12.0, 6.0, 4.0, 5.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.59375, -34.45654296875, -33.3193359375, -32.18212890625, -31.044921875, -29.90771484375, -28.7705078125, -27.63330078125, -26.49609375, -25.35888671875, -24.2216796875, -23.08447265625, -21.947265625, -20.81005859375, -19.6728515625, -18.53564453125, -17.3984375, -16.26123046875, -15.1240234375, -13.98681640625, -12.849609375, -11.71240234375, -10.5751953125, -9.43798828125, -8.30078125, -7.16357421875, -6.0263671875, -4.88916015625, -3.751953125, -2.61474609375, -1.4775390625, -0.34033203125, 0.796875, 1.93408203125, 3.0712890625, 4.20849609375, 5.345703125, 6.48291015625, 7.6201171875, 8.75732421875, 9.89453125, 11.03173828125, 12.1689453125, 13.30615234375, 14.443359375, 15.58056640625, 16.7177734375, 17.85498046875, 18.9921875, 20.12939453125, 21.2666015625, 22.40380859375, 23.541015625, 24.67822265625, 25.8154296875, 26.95263671875, 28.08984375, 29.22705078125, 30.3642578125, 31.50146484375, 32.638671875, 33.77587890625, 34.9130859375, 36.05029296875, 37.1875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 10.0, 7.0, 5.0, 4.0, 14.0, 16.0, 14.0, 18.0, 23.0, 19.0, 30.0, 42.0, 55.0, 79.0, 102.0, 110.0, 140.0, 214.0, 316.0, 693.0, 3998.0, 3116559.0, 20711.0, 1087.0, 398.0, 243.0, 173.0, 125.0, 104.0, 89.0, 55.0, 53.0, 36.0, 37.0, 24.0, 20.0, 21.0, 12.0, 18.0, 10.0, 5.0, 6.0, 5.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-78.25, -75.85546875, -73.4609375, -71.06640625, -68.671875, -66.27734375, -63.8828125, -61.48828125, -59.09375, -56.69921875, -54.3046875, -51.91015625, -49.515625, -47.12109375, -44.7265625, -42.33203125, -39.9375, -37.54296875, -35.1484375, -32.75390625, -30.359375, -27.96484375, -25.5703125, -23.17578125, -20.78125, -18.38671875, -15.9921875, -13.59765625, -11.203125, -8.80859375, -6.4140625, -4.01953125, -1.625, 0.76953125, 3.1640625, 5.55859375, 7.953125, 10.34765625, 12.7421875, 15.13671875, 17.53125, 19.92578125, 22.3203125, 24.71484375, 27.109375, 29.50390625, 31.8984375, 34.29296875, 36.6875, 39.08203125, 41.4765625, 43.87109375, 46.265625, 48.66015625, 51.0546875, 53.44921875, 55.84375, 58.23828125, 60.6328125, 63.02734375, 65.421875, 67.81640625, 70.2109375, 72.60546875, 75.0]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [7.0, 51.0, 376.0, 502.0, 83.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.273372650146484, -6.994553565979004, -3.7157340049743652, -0.43691444396972656, 2.841904640197754, 6.120723724365234, 9.399543762207031, 12.678361892700195, 15.957181930541992, 19.23600196838379, 22.514820098876953, 25.79364013671875, 29.072460174560547, 32.351280212402344, 35.630096435546875, 38.90891647338867, 42.18773651123047, 45.466556549072266, 48.74537658691406, 52.024192810058594, 55.30301284790039, 58.58183288574219, 61.860652923583984, 65.13947296142578, 68.41828918457031, 71.69710540771484, 74.9759292602539, 78.25474548339844, 81.5335693359375, 84.81238555908203, 88.09120178222656, 91.37002563476562, 94.64884185791016, 97.92765808105469, 101.20648193359375, 104.48529815673828, 107.76412200927734, 111.04293823242188, 114.32176208496094, 117.60057830810547, 120.87939453125, 124.15821075439453, 127.4370346069336, 130.71585083007812, 133.9946746826172, 137.27349853515625, 140.55230712890625, 143.8311309814453, 147.10995483398438, 150.38877868652344, 153.66758728027344, 156.9464111328125, 160.22523498535156, 163.50405883789062, 166.78286743164062, 170.0616912841797, 173.3404998779297, 176.61932373046875, 179.89813232421875, 183.1769561767578, 186.45578002929688, 189.73458862304688, 193.01341247558594, 196.292236328125, 199.57106018066406]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 10.0, 6.0, 4.0, 11.0, 17.0, 15.0, 21.0, 15.0, 28.0, 23.0, 28.0, 33.0, 34.0, 43.0, 37.0, 31.0, 46.0, 42.0, 59.0, 45.0, 35.0, 39.0, 38.0, 40.0, 39.0, 48.0, 35.0, 27.0, 22.0, 19.0, 21.0, 16.0, 13.0, 11.0, 9.0, 7.0, 10.0, 6.0, 3.0, 3.0, 5.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-119.44609832763672, -115.95172119140625, -112.45734405517578, -108.96296691894531, -105.46858978271484, -101.97421264648438, -98.47984313964844, -94.98545837402344, -91.4910888671875, -87.99671173095703, -84.50233459472656, -81.0079574584961, -77.51358032226562, -74.01920318603516, -70.52482604980469, -67.03045654296875, -63.53607177734375, -60.04169464111328, -56.54731750488281, -53.052940368652344, -49.558563232421875, -46.064186096191406, -42.5698127746582, -39.075435638427734, -35.581058502197266, -32.0866813659668, -28.592304229736328, -25.097929000854492, -21.603551864624023, -18.109174728393555, -14.614799499511719, -11.12042236328125, -7.6260528564453125, -4.131676197052002, -0.6372995376586914, 2.857076644897461, 6.35145378112793, 9.845830917358398, 13.340206146240234, 16.834583282470703, 20.328960418701172, 23.82333755493164, 27.31771469116211, 30.812089920043945, 34.30646514892578, 37.80084228515625, 41.29521942138672, 44.78959655761719, 48.283973693847656, 51.778350830078125, 55.272727966308594, 58.76710510253906, 62.26148223876953, 65.755859375, 69.25022888183594, 72.74461364746094, 76.23898315429688, 79.73336029052734, 83.22773742675781, 86.72211456298828, 90.21649169921875, 93.71086883544922, 97.20524597167969, 100.69961547851562, 104.19400024414062]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 4.0, 12.0, 13.0, 7.0, 17.0, 24.0, 24.0, 33.0, 36.0, 35.0, 31.0, 35.0, 46.0, 43.0, 40.0, 47.0, 35.0, 53.0, 40.0, 48.0, 45.0, 48.0, 39.0, 28.0, 29.0, 31.0, 26.0, 21.0, 18.0, 19.0, 18.0, 13.0, 10.0, 8.0, 5.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-17.078125, -16.59130859375, -16.1044921875, -15.61767578125, -15.130859375, -14.64404296875, -14.1572265625, -13.67041015625, -13.18359375, -12.69677734375, -12.2099609375, -11.72314453125, -11.236328125, -10.74951171875, -10.2626953125, -9.77587890625, -9.2890625, -8.80224609375, -8.3154296875, -7.82861328125, -7.341796875, -6.85498046875, -6.3681640625, -5.88134765625, -5.39453125, -4.90771484375, -4.4208984375, -3.93408203125, -3.447265625, -2.96044921875, -2.4736328125, -1.98681640625, -1.5, -1.01318359375, -0.5263671875, -0.03955078125, 0.447265625, 0.93408203125, 1.4208984375, 1.90771484375, 2.39453125, 2.88134765625, 3.3681640625, 3.85498046875, 4.341796875, 4.82861328125, 5.3154296875, 5.80224609375, 6.2890625, 6.77587890625, 7.2626953125, 7.74951171875, 8.236328125, 8.72314453125, 9.2099609375, 9.69677734375, 10.18359375, 10.67041015625, 11.1572265625, 11.64404296875, 12.130859375, 12.61767578125, 13.1044921875, 13.59130859375, 14.078125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 10.0, 16.0, 29.0, 33.0, 37.0, 74.0, 101.0, 123.0, 165.0, 253.0, 356.0, 524.0, 781.0, 1157.0, 1786.0, 3200.0, 5471.0, 10970.0, 61006.0, 1049730.0, 2836047.0, 187401.0, 17036.0, 7198.0, 3879.0, 2288.0, 1437.0, 964.0, 620.0, 429.0, 330.0, 208.0, 159.0, 117.0, 93.0, 73.0, 46.0, 41.0, 28.0, 19.0, 11.0, 10.0, 5.0, 5.0, 6.0, 4.0, 1.0, 2.0], "bins": [-38.78125, -37.710205078125, -36.63916015625, -35.568115234375, -34.4970703125, -33.426025390625, -32.35498046875, -31.283935546875, -30.212890625, -29.141845703125, -28.07080078125, -26.999755859375, -25.9287109375, -24.857666015625, -23.78662109375, -22.715576171875, -21.64453125, -20.573486328125, -19.50244140625, -18.431396484375, -17.3603515625, -16.289306640625, -15.21826171875, -14.147216796875, -13.076171875, -12.005126953125, -10.93408203125, -9.863037109375, -8.7919921875, -7.720947265625, -6.64990234375, -5.578857421875, -4.5078125, -3.436767578125, -2.36572265625, -1.294677734375, -0.2236328125, 0.847412109375, 1.91845703125, 2.989501953125, 4.060546875, 5.131591796875, 6.20263671875, 7.273681640625, 8.3447265625, 9.415771484375, 10.48681640625, 11.557861328125, 12.62890625, 13.699951171875, 14.77099609375, 15.842041015625, 16.9130859375, 17.984130859375, 19.05517578125, 20.126220703125, 21.197265625, 22.268310546875, 23.33935546875, 24.410400390625, 25.4814453125, 26.552490234375, 27.62353515625, 28.694580078125, 29.765625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 7.0, 7.0, 8.0, 11.0, 7.0, 15.0, 15.0, 17.0, 25.0, 37.0, 62.0, 104.0, 183.0, 369.0, 599.0, 949.0, 660.0, 412.0, 234.0, 115.0, 62.0, 42.0, 26.0, 27.0, 16.0, 13.0, 11.0, 8.0, 7.0, 4.0, 3.0, 4.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-29.40625, -28.503662109375, -27.60107421875, -26.698486328125, -25.7958984375, -24.893310546875, -23.99072265625, -23.088134765625, -22.185546875, -21.282958984375, -20.38037109375, -19.477783203125, -18.5751953125, -17.672607421875, -16.77001953125, -15.867431640625, -14.96484375, -14.062255859375, -13.15966796875, -12.257080078125, -11.3544921875, -10.451904296875, -9.54931640625, -8.646728515625, -7.744140625, -6.841552734375, -5.93896484375, -5.036376953125, -4.1337890625, -3.231201171875, -2.32861328125, -1.426025390625, -0.5234375, 0.379150390625, 1.28173828125, 2.184326171875, 3.0869140625, 3.989501953125, 4.89208984375, 5.794677734375, 6.697265625, 7.599853515625, 8.50244140625, 9.405029296875, 10.3076171875, 11.210205078125, 12.11279296875, 13.015380859375, 13.91796875, 14.820556640625, 15.72314453125, 16.625732421875, 17.5283203125, 18.430908203125, 19.33349609375, 20.236083984375, 21.138671875, 22.041259765625, 22.94384765625, 23.846435546875, 24.7490234375, 25.651611328125, 26.55419921875, 27.456787109375, 28.359375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 1.0, 6.0, 6.0, 13.0, 18.0, 22.0, 28.0, 40.0, 48.0, 98.0, 198.0, 511.0, 1429.0, 5719.0, 35389.0, 3839211.0, 291125.0, 15584.0, 3169.0, 890.0, 361.0, 175.0, 71.0, 44.0, 33.0, 14.0, 21.0, 13.0, 11.0, 8.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-105.5, -102.07421875, -98.6484375, -95.22265625, -91.796875, -88.37109375, -84.9453125, -81.51953125, -78.09375, -74.66796875, -71.2421875, -67.81640625, -64.390625, -60.96484375, -57.5390625, -54.11328125, -50.6875, -47.26171875, -43.8359375, -40.41015625, -36.984375, -33.55859375, -30.1328125, -26.70703125, -23.28125, -19.85546875, -16.4296875, -13.00390625, -9.578125, -6.15234375, -2.7265625, 0.69921875, 4.125, 7.55078125, 10.9765625, 14.40234375, 17.828125, 21.25390625, 24.6796875, 28.10546875, 31.53125, 34.95703125, 38.3828125, 41.80859375, 45.234375, 48.66015625, 52.0859375, 55.51171875, 58.9375, 62.36328125, 65.7890625, 69.21484375, 72.640625, 76.06640625, 79.4921875, 82.91796875, 86.34375, 89.76953125, 93.1953125, 96.62109375, 100.046875, 103.47265625, 106.8984375, 110.32421875, 113.75]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 11.0, 27.0, 50.0, 103.0, 242.0, 304.0, 159.0, 50.0, 25.0, 20.0, 6.0, 5.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-186.51565551757812, -179.0924835205078, -171.6693115234375, -164.2461395263672, -156.82296752929688, -149.3997802734375, -141.9766082763672, -134.55343627929688, -127.13026428222656, -119.70709228515625, -112.28392028808594, -104.8607406616211, -97.43756866455078, -90.01439666748047, -82.59121704101562, -75.16804504394531, -67.744873046875, -60.32170104980469, -52.89852523803711, -45.47534942626953, -38.05217742919922, -30.629005432128906, -23.205829620361328, -15.78265380859375, -8.359481811523438, -0.9363079071044922, 6.486865997314453, 13.910039901733398, 21.333213806152344, 28.756385803222656, 36.179561614990234, 43.60273742675781, 51.025909423828125, 58.44908142089844, 65.87225341796875, 73.2954330444336, 80.7186050415039, 88.14177703857422, 95.56495666503906, 102.98812866210938, 110.41130065917969, 117.83447265625, 125.25764465332031, 132.68081665039062, 140.10400390625, 147.52716064453125, 154.95034790039062, 162.37351989746094, 169.79669189453125, 177.21986389160156, 184.64303588867188, 192.0662078857422, 199.4893798828125, 206.91256713867188, 214.3357391357422, 221.7589111328125, 229.1820831298828, 236.60525512695312, 244.02842712402344, 251.45159912109375, 258.8747863769531, 266.2979431152344, 273.72113037109375, 281.144287109375, 288.5674743652344]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 2.0, 3.0, 12.0, 8.0, 4.0, 13.0, 12.0, 17.0, 21.0, 18.0, 19.0, 27.0, 24.0, 22.0, 28.0, 36.0, 39.0, 41.0, 34.0, 43.0, 39.0, 31.0, 45.0, 50.0, 37.0, 29.0, 38.0, 32.0, 31.0, 32.0, 23.0, 27.0, 26.0, 16.0, 26.0, 21.0, 15.0, 9.0, 5.0, 12.0, 7.0, 8.0, 3.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.77050018310547, -64.57345581054688, -62.37641906738281, -60.179378509521484, -57.982337951660156, -55.78529739379883, -53.5882568359375, -51.39121627807617, -49.194175720214844, -46.997135162353516, -44.80009460449219, -42.60305404663086, -40.40601348876953, -38.2089729309082, -36.011932373046875, -33.81489181518555, -31.61785125732422, -29.42081069946289, -27.223770141601562, -25.026729583740234, -22.829689025878906, -20.632648468017578, -18.43560791015625, -16.238567352294922, -14.041526794433594, -11.844486236572266, -9.647445678710938, -7.450405120849609, -5.253364562988281, -3.056324005126953, -0.859283447265625, 1.3377571105957031, 3.5348052978515625, 5.731845855712891, 7.928886413574219, 10.125926971435547, 12.322967529296875, 14.520008087158203, 16.71704864501953, 18.91408920288086, 21.111129760742188, 23.308170318603516, 25.505210876464844, 27.702251434326172, 29.8992919921875, 32.09633255004883, 34.293373107910156, 36.490413665771484, 38.68745422363281, 40.88449478149414, 43.08153533935547, 45.2785758972168, 47.475616455078125, 49.67265701293945, 51.86969757080078, 54.06673812866211, 56.26377868652344, 58.460819244384766, 60.657859802246094, 62.85490036010742, 65.05194091796875, 67.24897766113281, 69.4460220336914, 71.64306640625, 73.84010314941406]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 10.0, 2.0, 13.0, 17.0, 16.0, 21.0, 21.0, 14.0, 30.0, 30.0, 36.0, 25.0, 42.0, 40.0, 39.0, 46.0, 41.0, 44.0, 33.0, 41.0, 47.0, 37.0, 35.0, 44.0, 37.0, 28.0, 29.0, 23.0, 26.0, 21.0, 14.0, 23.0, 16.0, 6.0, 12.0, 5.0, 10.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0], "bins": [-15.5078125, -15.05712890625, -14.6064453125, -14.15576171875, -13.705078125, -13.25439453125, -12.8037109375, -12.35302734375, -11.90234375, -11.45166015625, -11.0009765625, -10.55029296875, -10.099609375, -9.64892578125, -9.1982421875, -8.74755859375, -8.296875, -7.84619140625, -7.3955078125, -6.94482421875, -6.494140625, -6.04345703125, -5.5927734375, -5.14208984375, -4.69140625, -4.24072265625, -3.7900390625, -3.33935546875, -2.888671875, -2.43798828125, -1.9873046875, -1.53662109375, -1.0859375, -0.63525390625, -0.1845703125, 0.26611328125, 0.716796875, 1.16748046875, 1.6181640625, 2.06884765625, 2.51953125, 2.97021484375, 3.4208984375, 3.87158203125, 4.322265625, 4.77294921875, 5.2236328125, 5.67431640625, 6.125, 6.57568359375, 7.0263671875, 7.47705078125, 7.927734375, 8.37841796875, 8.8291015625, 9.27978515625, 9.73046875, 10.18115234375, 10.6318359375, 11.08251953125, 11.533203125, 11.98388671875, 12.4345703125, 12.88525390625, 13.3359375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 6.0, 7.0, 9.0, 16.0, 21.0, 60.0, 67.0, 112.0, 179.0, 267.0, 424.0, 672.0, 1006.0, 1576.0, 2409.0, 4022.0, 6631.0, 10590.0, 17131.0, 28886.0, 48958.0, 87852.0, 160691.0, 245979.0, 187165.0, 102853.0, 56345.0, 32985.0, 19904.0, 12085.0, 7445.0, 4542.0, 2870.0, 1717.0, 1092.0, 694.0, 443.0, 259.0, 201.0, 126.0, 101.0, 52.0, 45.0, 16.0, 16.0, 10.0, 10.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.6201171875, -1.573333740234375, -1.52655029296875, -1.479766845703125, -1.4329833984375, -1.386199951171875, -1.33941650390625, -1.292633056640625, -1.245849609375, -1.199066162109375, -1.15228271484375, -1.105499267578125, -1.0587158203125, -1.011932373046875, -0.96514892578125, -0.918365478515625, -0.87158203125, -0.824798583984375, -0.77801513671875, -0.731231689453125, -0.6844482421875, -0.637664794921875, -0.59088134765625, -0.544097900390625, -0.497314453125, -0.450531005859375, -0.40374755859375, -0.356964111328125, -0.3101806640625, -0.263397216796875, -0.21661376953125, -0.169830322265625, -0.123046875, -0.076263427734375, -0.02947998046875, 0.017303466796875, 0.0640869140625, 0.110870361328125, 0.15765380859375, 0.204437255859375, 0.251220703125, 0.298004150390625, 0.34478759765625, 0.391571044921875, 0.4383544921875, 0.485137939453125, 0.53192138671875, 0.578704833984375, 0.62548828125, 0.672271728515625, 0.71905517578125, 0.765838623046875, 0.8126220703125, 0.859405517578125, 0.90618896484375, 0.952972412109375, 0.999755859375, 1.046539306640625, 1.09332275390625, 1.140106201171875, 1.1868896484375, 1.233673095703125, 1.28045654296875, 1.327239990234375, 1.3740234375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 6.0, 6.0, 10.0, 5.0, 8.0, 13.0, 17.0, 20.0, 18.0, 27.0, 19.0, 24.0, 26.0, 26.0, 35.0, 33.0, 27.0, 30.0, 54.0, 41.0, 45.0, 1061.0, 38.0, 35.0, 44.0, 44.0, 42.0, 37.0, 34.0, 25.0, 19.0, 21.0, 23.0, 18.0, 18.0, 14.0, 16.0, 9.0, 14.0, 7.0, 4.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.4609375, -9.17529296875, -8.8896484375, -8.60400390625, -8.318359375, -8.03271484375, -7.7470703125, -7.46142578125, -7.17578125, -6.89013671875, -6.6044921875, -6.31884765625, -6.033203125, -5.74755859375, -5.4619140625, -5.17626953125, -4.890625, -4.60498046875, -4.3193359375, -4.03369140625, -3.748046875, -3.46240234375, -3.1767578125, -2.89111328125, -2.60546875, -2.31982421875, -2.0341796875, -1.74853515625, -1.462890625, -1.17724609375, -0.8916015625, -0.60595703125, -0.3203125, -0.03466796875, 0.2509765625, 0.53662109375, 0.822265625, 1.10791015625, 1.3935546875, 1.67919921875, 1.96484375, 2.25048828125, 2.5361328125, 2.82177734375, 3.107421875, 3.39306640625, 3.6787109375, 3.96435546875, 4.25, 4.53564453125, 4.8212890625, 5.10693359375, 5.392578125, 5.67822265625, 5.9638671875, 6.24951171875, 6.53515625, 6.82080078125, 7.1064453125, 7.39208984375, 7.677734375, 7.96337890625, 8.2490234375, 8.53466796875, 8.8203125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 11.0, 10.0, 16.0, 35.0, 64.0, 71.0, 101.0, 141.0, 248.0, 395.0, 579.0, 884.0, 1398.0, 2110.0, 3416.0, 5117.0, 8038.0, 12141.0, 19383.0, 31642.0, 53554.0, 94284.0, 170547.0, 1291756.0, 169470.0, 93207.0, 53342.0, 31380.0, 19408.0, 11856.0, 7876.0, 5095.0, 3377.0, 2169.0, 1393.0, 942.0, 619.0, 378.0, 227.0, 141.0, 100.0, 79.0, 46.0, 30.0, 29.0, 12.0, 9.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.88232421875, -0.85430908203125, -0.8262939453125, -0.79827880859375, -0.770263671875, -0.74224853515625, -0.7142333984375, -0.68621826171875, -0.658203125, -0.63018798828125, -0.6021728515625, -0.57415771484375, -0.546142578125, -0.51812744140625, -0.4901123046875, -0.46209716796875, -0.43408203125, -0.40606689453125, -0.3780517578125, -0.35003662109375, -0.322021484375, -0.29400634765625, -0.2659912109375, -0.23797607421875, -0.2099609375, -0.18194580078125, -0.1539306640625, -0.12591552734375, -0.097900390625, -0.06988525390625, -0.0418701171875, -0.01385498046875, 0.01416015625, 0.04217529296875, 0.0701904296875, 0.09820556640625, 0.126220703125, 0.15423583984375, 0.1822509765625, 0.21026611328125, 0.23828125, 0.26629638671875, 0.2943115234375, 0.32232666015625, 0.350341796875, 0.37835693359375, 0.4063720703125, 0.43438720703125, 0.46240234375, 0.49041748046875, 0.5184326171875, 0.54644775390625, 0.574462890625, 0.60247802734375, 0.6304931640625, 0.65850830078125, 0.6865234375, 0.71453857421875, 0.7425537109375, 0.77056884765625, 0.798583984375, 0.82659912109375, 0.8546142578125, 0.88262939453125, 0.91064453125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 12.0, 37.0, 36.0, 64.0, 99.0, 126.0, 148.0, 149.0, 112.0, 75.0, 58.0, 29.0, 21.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0391845703125, -0.03802061080932617, -0.036856651306152344, -0.035692691802978516, -0.03452873229980469, -0.03336477279663086, -0.03220081329345703, -0.031036853790283203, -0.029872894287109375, -0.028708934783935547, -0.02754497528076172, -0.02638101577758789, -0.025217056274414062, -0.024053096771240234, -0.022889137268066406, -0.021725177764892578, -0.02056121826171875, -0.019397258758544922, -0.018233299255371094, -0.017069339752197266, -0.015905380249023438, -0.01474142074584961, -0.013577461242675781, -0.012413501739501953, -0.011249542236328125, -0.010085582733154297, -0.008921623229980469, -0.007757663726806641, -0.0065937042236328125, -0.005429744720458984, -0.004265785217285156, -0.003101825714111328, -0.0019378662109375, -0.0007739067077636719, 0.00039005279541015625, 0.0015540122985839844, 0.0027179718017578125, 0.0038819313049316406, 0.005045890808105469, 0.006209850311279297, 0.007373809814453125, 0.008537769317626953, 0.009701728820800781, 0.01086568832397461, 0.012029647827148438, 0.013193607330322266, 0.014357566833496094, 0.015521526336669922, 0.01668548583984375, 0.017849445343017578, 0.019013404846191406, 0.020177364349365234, 0.021341323852539062, 0.02250528335571289, 0.02366924285888672, 0.024833202362060547, 0.025997161865234375, 0.027161121368408203, 0.02832508087158203, 0.02948904037475586, 0.030652999877929688, 0.031816959381103516, 0.032980918884277344, 0.03414487838745117, 0.035308837890625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 5.0, 3.0, 3.0, 8.0, 11.0, 16.0, 38.0, 80.0, 160.0, 359.0, 4417.0, 1037842.0, 4938.0, 356.0, 151.0, 70.0, 46.0, 10.0, 16.0, 5.0, 2.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.765625, -0.7405319213867188, -0.7154388427734375, -0.6903457641601562, -0.665252685546875, -0.6401596069335938, -0.6150665283203125, -0.5899734497070312, -0.56488037109375, -0.5397872924804688, -0.5146942138671875, -0.48960113525390625, -0.464508056640625, -0.43941497802734375, -0.4143218994140625, -0.38922882080078125, -0.3641357421875, -0.33904266357421875, -0.3139495849609375, -0.28885650634765625, -0.263763427734375, -0.23867034912109375, -0.2135772705078125, -0.18848419189453125, -0.16339111328125, -0.13829803466796875, -0.1132049560546875, -0.08811187744140625, -0.063018798828125, -0.03792572021484375, -0.0128326416015625, 0.01226043701171875, 0.037353515625, 0.06244659423828125, 0.0875396728515625, 0.11263275146484375, 0.137725830078125, 0.16281890869140625, 0.1879119873046875, 0.21300506591796875, 0.23809814453125, 0.26319122314453125, 0.2882843017578125, 0.31337738037109375, 0.338470458984375, 0.36356353759765625, 0.3886566162109375, 0.41374969482421875, 0.4388427734375, 0.46393585205078125, 0.4890289306640625, 0.5141220092773438, 0.539215087890625, 0.5643081665039062, 0.5894012451171875, 0.6144943237304688, 0.63958740234375, 0.6646804809570312, 0.6897735595703125, 0.7148666381835938, 0.739959716796875, 0.7650527954101562, 0.7901458740234375, 0.8152389526367188, 0.84033203125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 35.0, 146.0, 600.0, 165.0, 39.0, 17.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025875117629766464, -0.02000894397497177, -0.014142771251499653, -0.008276598528027534, -0.0024104248732328415, 0.0034557487815618515, 0.009321920573711395, 0.015188094228506088, 0.02105426788330078, 0.026920441538095474, 0.03278661519289017, 0.03865278512239456, 0.04451896250247955, 0.05038513243198395, 0.05625130608677864, 0.062117479741573334, 0.06798365712165833, 0.07384982705116272, 0.07971600443124771, 0.0855821743607521, 0.0914483517408371, 0.09731452167034149, 0.10318069159984589, 0.10904686897993088, 0.11491303890943527, 0.12077920883893967, 0.12664538621902466, 0.13251155614852905, 0.13837772607803345, 0.14424391090869904, 0.15011008083820343, 0.15597625076770782, 0.16184242069721222, 0.1677085906267166, 0.173574760556221, 0.1794409453868866, 0.185307115316391, 0.19117328524589539, 0.19703945517539978, 0.20290562510490417, 0.20877180993556976, 0.21463797986507416, 0.22050414979457855, 0.22637033462524414, 0.23223650455474854, 0.23810267448425293, 0.24396884441375732, 0.24983501434326172, 0.2557011842727661, 0.2615673542022705, 0.2674335241317749, 0.2732996940612793, 0.2791658639907837, 0.2850320637226105, 0.29089823365211487, 0.29676440358161926, 0.30263057351112366, 0.30849674344062805, 0.31436291337013245, 0.32022908329963684, 0.32609525322914124, 0.331961452960968, 0.3378276228904724, 0.3436937928199768, 0.3495599627494812]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 8.0, 9.0, 8.0, 11.0, 14.0, 11.0, 13.0, 13.0, 14.0, 21.0, 15.0, 23.0, 24.0, 26.0, 28.0, 26.0, 32.0, 30.0, 31.0, 36.0, 29.0, 34.0, 31.0, 41.0, 48.0, 31.0, 42.0, 43.0, 26.0, 31.0, 34.0, 32.0, 29.0, 22.0, 21.0, 19.0, 15.0, 18.0, 16.0, 14.0, 6.0, 5.0, 6.0, 3.0, 7.0, 1.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0], "bins": [-0.030151307582855225, -0.02926386147737503, -0.028376417234539986, -0.02748897299170494, -0.026601526886224747, -0.025714080780744553, -0.024826636537909508, -0.023939192295074463, -0.02305174618959427, -0.022164300084114075, -0.02127685584127903, -0.020389411598443985, -0.01950196549296379, -0.018614519387483597, -0.017727075144648552, -0.016839630901813507, -0.015952184796333313, -0.015064739622175694, -0.014177294448018074, -0.013289849273860455, -0.012402404099702835, -0.011514958925545216, -0.010627513751387596, -0.009740068577229977, -0.008852623403072357, -0.007965178228914738, -0.007077733054757118, -0.006190287880599499, -0.005302842706441879, -0.00441539753228426, -0.0035279523581266403, -0.002640507183969021, -0.0017530620098114014, -0.0008656168356537819, 2.1828338503837585e-05, 0.0009092735126614571, 0.0017967186868190765, 0.002684163860976696, 0.0035716090351343155, 0.004459054209291935, 0.0053464993834495544, 0.006233944557607174, 0.007121389731764793, 0.008008834905922413, 0.008896280080080032, 0.009783725254237652, 0.010671170428395271, 0.01155861560255289, 0.01244606077671051, 0.01333350595086813, 0.01422095112502575, 0.015108396299183369, 0.015995841473340988, 0.016883287578821182, 0.017770731821656227, 0.018658176064491272, 0.019545622169971466, 0.02043306827545166, 0.021320512518286705, 0.02220795676112175, 0.023095402866601944, 0.023982848972082138, 0.024870293214917183, 0.025757737457752228, 0.026645183563232422]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 10.0, 2.0, 13.0, 17.0, 16.0, 21.0, 21.0, 14.0, 30.0, 30.0, 36.0, 25.0, 42.0, 40.0, 39.0, 46.0, 41.0, 44.0, 33.0, 41.0, 47.0, 37.0, 35.0, 44.0, 37.0, 28.0, 29.0, 24.0, 25.0, 21.0, 14.0, 23.0, 16.0, 6.0, 12.0, 5.0, 10.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0], "bins": [-15.5078125, -15.05712890625, -14.6064453125, -14.15576171875, -13.705078125, -13.25439453125, -12.8037109375, -12.35302734375, -11.90234375, -11.45166015625, -11.0009765625, -10.55029296875, -10.099609375, -9.64892578125, -9.1982421875, -8.74755859375, -8.296875, -7.84619140625, -7.3955078125, -6.94482421875, -6.494140625, -6.04345703125, -5.5927734375, -5.14208984375, -4.69140625, -4.24072265625, -3.7900390625, -3.33935546875, -2.888671875, -2.43798828125, -1.9873046875, -1.53662109375, -1.0859375, -0.63525390625, -0.1845703125, 0.26611328125, 0.716796875, 1.16748046875, 1.6181640625, 2.06884765625, 2.51953125, 2.97021484375, 3.4208984375, 3.87158203125, 4.322265625, 4.77294921875, 5.2236328125, 5.67431640625, 6.125, 6.57568359375, 7.0263671875, 7.47705078125, 7.927734375, 8.37841796875, 8.8291015625, 9.27978515625, 9.73046875, 10.18115234375, 10.6318359375, 11.08251953125, 11.533203125, 11.98388671875, 12.4345703125, 12.88525390625, 13.3359375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 6.0, 9.0, 10.0, 15.0, 21.0, 30.0, 38.0, 52.0, 107.0, 120.0, 186.0, 253.0, 380.0, 657.0, 1056.0, 1894.0, 3259.0, 6343.0, 13059.0, 29137.0, 70294.0, 188489.0, 418975.0, 187956.0, 69596.0, 29076.0, 13193.0, 6322.0, 3240.0, 1843.0, 1067.0, 617.0, 395.0, 275.0, 164.0, 118.0, 92.0, 57.0, 40.0, 35.0, 23.0, 16.0, 13.0, 8.0, 7.0, 4.0, 4.0, 6.0, 4.0, 4.0, 1.0], "bins": [-6.91796875, -6.72308349609375, -6.5281982421875, -6.33331298828125, -6.138427734375, -5.94354248046875, -5.7486572265625, -5.55377197265625, -5.35888671875, -5.16400146484375, -4.9691162109375, -4.77423095703125, -4.579345703125, -4.38446044921875, -4.1895751953125, -3.99468994140625, -3.7998046875, -3.60491943359375, -3.4100341796875, -3.21514892578125, -3.020263671875, -2.82537841796875, -2.6304931640625, -2.43560791015625, -2.24072265625, -2.04583740234375, -1.8509521484375, -1.65606689453125, -1.461181640625, -1.26629638671875, -1.0714111328125, -0.87652587890625, -0.681640625, -0.48675537109375, -0.2918701171875, -0.09698486328125, 0.097900390625, 0.29278564453125, 0.4876708984375, 0.68255615234375, 0.87744140625, 1.07232666015625, 1.2672119140625, 1.46209716796875, 1.656982421875, 1.85186767578125, 2.0467529296875, 2.24163818359375, 2.4365234375, 2.63140869140625, 2.8262939453125, 3.02117919921875, 3.216064453125, 3.41094970703125, 3.6058349609375, 3.80072021484375, 3.99560546875, 4.19049072265625, 4.3853759765625, 4.58026123046875, 4.775146484375, 4.97003173828125, 5.1649169921875, 5.35980224609375, 5.5546875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 7.0, 9.0, 11.0, 12.0, 19.0, 15.0, 27.0, 32.0, 30.0, 34.0, 45.0, 39.0, 38.0, 42.0, 60.0, 105.0, 1847.0, 188.0, 73.0, 58.0, 38.0, 43.0, 42.0, 39.0, 24.0, 29.0, 19.0, 23.0, 19.0, 11.0, 14.0, 8.0, 13.0, 3.0, 7.0, 7.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-49.625, -48.2705078125, -46.916015625, -45.5615234375, -44.20703125, -42.8525390625, -41.498046875, -40.1435546875, -38.7890625, -37.4345703125, -36.080078125, -34.7255859375, -33.37109375, -32.0166015625, -30.662109375, -29.3076171875, -27.953125, -26.5986328125, -25.244140625, -23.8896484375, -22.53515625, -21.1806640625, -19.826171875, -18.4716796875, -17.1171875, -15.7626953125, -14.408203125, -13.0537109375, -11.69921875, -10.3447265625, -8.990234375, -7.6357421875, -6.28125, -4.9267578125, -3.572265625, -2.2177734375, -0.86328125, 0.4912109375, 1.845703125, 3.2001953125, 4.5546875, 5.9091796875, 7.263671875, 8.6181640625, 9.97265625, 11.3271484375, 12.681640625, 14.0361328125, 15.390625, 16.7451171875, 18.099609375, 19.4541015625, 20.80859375, 22.1630859375, 23.517578125, 24.8720703125, 26.2265625, 27.5810546875, 28.935546875, 30.2900390625, 31.64453125, 32.9990234375, 34.353515625, 35.7080078125, 37.0625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 10.0, 4.0, 8.0, 13.0, 13.0, 21.0, 27.0, 30.0, 40.0, 57.0, 68.0, 89.0, 121.0, 158.0, 252.0, 421.0, 1104.0, 18260.0, 3117897.0, 5152.0, 782.0, 354.0, 218.0, 152.0, 114.0, 85.0, 57.0, 43.0, 44.0, 19.0, 21.0, 16.0, 12.0, 8.0, 6.0, 4.0, 6.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-87.9375, -84.7236328125, -81.509765625, -78.2958984375, -75.08203125, -71.8681640625, -68.654296875, -65.4404296875, -62.2265625, -59.0126953125, -55.798828125, -52.5849609375, -49.37109375, -46.1572265625, -42.943359375, -39.7294921875, -36.515625, -33.3017578125, -30.087890625, -26.8740234375, -23.66015625, -20.4462890625, -17.232421875, -14.0185546875, -10.8046875, -7.5908203125, -4.376953125, -1.1630859375, 2.05078125, 5.2646484375, 8.478515625, 11.6923828125, 14.90625, 18.1201171875, 21.333984375, 24.5478515625, 27.76171875, 30.9755859375, 34.189453125, 37.4033203125, 40.6171875, 43.8310546875, 47.044921875, 50.2587890625, 53.47265625, 56.6865234375, 59.900390625, 63.1142578125, 66.328125, 69.5419921875, 72.755859375, 75.9697265625, 79.18359375, 82.3974609375, 85.611328125, 88.8251953125, 92.0390625, 95.2529296875, 98.466796875, 101.6806640625, 104.89453125, 108.1083984375, 111.322265625, 114.5361328125, 117.75]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 7.0, 132.0, 604.0, 255.0, 15.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.84003829956055, -27.916202545166016, -22.99236488342285, -18.068527221679688, -13.144691467285156, -8.220855712890625, -3.297018051147461, 1.6268196105957031, 6.550655364990234, 11.474492073059082, 16.39832878112793, 21.322166442871094, 26.246002197265625, 31.169837951660156, 36.09367370605469, 41.017513275146484, 45.941349029541016, 50.86518478393555, 55.789024353027344, 60.712860107421875, 65.6366958618164, 70.56053161621094, 75.48436737060547, 80.408203125, 85.33204650878906, 90.2558822631836, 95.17971801757812, 100.10355377197266, 105.02738952636719, 109.95123291015625, 114.87506866455078, 119.79890441894531, 124.72274780273438, 129.64659118652344, 134.57041931152344, 139.4942626953125, 144.4180908203125, 149.34193420410156, 154.26576232910156, 159.18960571289062, 164.11343383789062, 169.0372772216797, 173.9611053466797, 178.88494873046875, 183.80877685546875, 188.7326202392578, 193.6564483642578, 198.58029174804688, 203.50413513183594, 208.427978515625, 213.351806640625, 218.27565002441406, 223.19947814941406, 228.12332153320312, 233.04714965820312, 237.9709930419922, 242.89483642578125, 247.8186798095703, 252.7425079345703, 257.6663513183594, 262.5901794433594, 267.5140075683594, 272.4378662109375, 277.3616943359375, 282.2855224609375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 8.0, 2.0, 6.0, 12.0, 5.0, 12.0, 14.0, 25.0, 21.0, 21.0, 26.0, 30.0, 21.0, 37.0, 32.0, 30.0, 28.0, 42.0, 36.0, 42.0, 42.0, 42.0, 56.0, 40.0, 32.0, 47.0, 28.0, 32.0, 32.0, 33.0, 24.0, 20.0, 22.0, 17.0, 13.0, 10.0, 18.0, 10.0, 9.0, 6.0, 5.0, 4.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-114.08296203613281, -110.76636505126953, -107.44976043701172, -104.13316345214844, -100.81655883789062, -97.49996185302734, -94.18336486816406, -90.86676025390625, -87.55016326904297, -84.23356628417969, -80.91696166992188, -77.6003646850586, -74.28376770019531, -70.9671630859375, -67.65056610107422, -64.33396911621094, -61.017364501953125, -57.70076370239258, -54.38416290283203, -51.06756591796875, -47.7509651184082, -44.434364318847656, -41.117767333984375, -37.80116653442383, -34.48456573486328, -31.167964935302734, -27.85136604309082, -24.534767150878906, -21.21816635131836, -17.901565551757812, -14.584966659545898, -11.268367767333984, -7.9517669677734375, -4.635167121887207, -1.3185672760009766, 1.998032569885254, 5.314632415771484, 8.631233215332031, 11.947832107543945, 15.26443099975586, 18.581031799316406, 21.897632598876953, 25.214231491088867, 28.53083038330078, 31.847431182861328, 35.164031982421875, 38.480628967285156, 41.7972297668457, 45.11383056640625, 48.4304313659668, 51.747032165527344, 55.063629150390625, 58.38022994995117, 61.69683074951172, 65.013427734375, 68.33003234863281, 71.6466293334961, 74.96322631835938, 78.27983093261719, 81.59642791748047, 84.91302490234375, 88.22962951660156, 91.54622650146484, 94.86282348632812, 98.17942810058594]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 6.0, 8.0, 12.0, 13.0, 12.0, 25.0, 17.0, 15.0, 34.0, 25.0, 34.0, 25.0, 39.0, 45.0, 45.0, 37.0, 46.0, 43.0, 35.0, 43.0, 33.0, 36.0, 41.0, 41.0, 39.0, 33.0, 30.0, 30.0, 17.0, 26.0, 12.0, 19.0, 18.0, 6.0, 15.0, 12.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0], "bins": [-15.6796875, -15.227783203125, -14.77587890625, -14.323974609375, -13.8720703125, -13.420166015625, -12.96826171875, -12.516357421875, -12.064453125, -11.612548828125, -11.16064453125, -10.708740234375, -10.2568359375, -9.804931640625, -9.35302734375, -8.901123046875, -8.44921875, -7.997314453125, -7.54541015625, -7.093505859375, -6.6416015625, -6.189697265625, -5.73779296875, -5.285888671875, -4.833984375, -4.382080078125, -3.93017578125, -3.478271484375, -3.0263671875, -2.574462890625, -2.12255859375, -1.670654296875, -1.21875, -0.766845703125, -0.31494140625, 0.136962890625, 0.5888671875, 1.040771484375, 1.49267578125, 1.944580078125, 2.396484375, 2.848388671875, 3.30029296875, 3.752197265625, 4.2041015625, 4.656005859375, 5.10791015625, 5.559814453125, 6.01171875, 6.463623046875, 6.91552734375, 7.367431640625, 7.8193359375, 8.271240234375, 8.72314453125, 9.175048828125, 9.626953125, 10.078857421875, 10.53076171875, 10.982666015625, 11.4345703125, 11.886474609375, 12.33837890625, 12.790283203125, 13.2421875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 9.0, 6.0, 11.0, 15.0, 23.0, 37.0, 47.0, 75.0, 84.0, 122.0, 193.0, 268.0, 400.0, 595.0, 911.0, 1514.0, 3256.0, 8152.0, 54044.0, 2263617.0, 1811089.0, 34622.0, 7438.0, 3292.0, 1586.0, 925.0, 570.0, 379.0, 270.0, 185.0, 142.0, 101.0, 81.0, 63.0, 24.0, 39.0, 30.0, 21.0, 14.0, 9.0, 7.0, 4.0, 4.0, 0.0, 2.0, 4.0, 4.0, 2.0, 1.0], "bins": [-50.65625, -49.20751953125, -47.7587890625, -46.31005859375, -44.861328125, -43.41259765625, -41.9638671875, -40.51513671875, -39.06640625, -37.61767578125, -36.1689453125, -34.72021484375, -33.271484375, -31.82275390625, -30.3740234375, -28.92529296875, -27.4765625, -26.02783203125, -24.5791015625, -23.13037109375, -21.681640625, -20.23291015625, -18.7841796875, -17.33544921875, -15.88671875, -14.43798828125, -12.9892578125, -11.54052734375, -10.091796875, -8.64306640625, -7.1943359375, -5.74560546875, -4.296875, -2.84814453125, -1.3994140625, 0.04931640625, 1.498046875, 2.94677734375, 4.3955078125, 5.84423828125, 7.29296875, 8.74169921875, 10.1904296875, 11.63916015625, 13.087890625, 14.53662109375, 15.9853515625, 17.43408203125, 18.8828125, 20.33154296875, 21.7802734375, 23.22900390625, 24.677734375, 26.12646484375, 27.5751953125, 29.02392578125, 30.47265625, 31.92138671875, 33.3701171875, 34.81884765625, 36.267578125, 37.71630859375, 39.1650390625, 40.61376953125, 42.0625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 8.0, 4.0, 10.0, 6.0, 15.0, 17.0, 18.0, 19.0, 43.0, 61.0, 117.0, 242.0, 481.0, 880.0, 983.0, 579.0, 239.0, 133.0, 63.0, 38.0, 26.0, 15.0, 19.0, 14.0, 12.0, 7.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-38.8125, -37.79296875, -36.7734375, -35.75390625, -34.734375, -33.71484375, -32.6953125, -31.67578125, -30.65625, -29.63671875, -28.6171875, -27.59765625, -26.578125, -25.55859375, -24.5390625, -23.51953125, -22.5, -21.48046875, -20.4609375, -19.44140625, -18.421875, -17.40234375, -16.3828125, -15.36328125, -14.34375, -13.32421875, -12.3046875, -11.28515625, -10.265625, -9.24609375, -8.2265625, -7.20703125, -6.1875, -5.16796875, -4.1484375, -3.12890625, -2.109375, -1.08984375, -0.0703125, 0.94921875, 1.96875, 2.98828125, 4.0078125, 5.02734375, 6.046875, 7.06640625, 8.0859375, 9.10546875, 10.125, 11.14453125, 12.1640625, 13.18359375, 14.203125, 15.22265625, 16.2421875, 17.26171875, 18.28125, 19.30078125, 20.3203125, 21.33984375, 22.359375, 23.37890625, 24.3984375, 25.41796875, 26.4375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 8.0, 12.0, 25.0, 21.0, 33.0, 64.0, 86.0, 198.0, 514.0, 1657.0, 8029.0, 83561.0, 4046108.0, 46147.0, 5669.0, 1288.0, 417.0, 179.0, 78.0, 52.0, 38.0, 26.0, 10.0, 10.0, 9.0, 8.0, 11.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.6875, -99.7607421875, -95.833984375, -91.9072265625, -87.98046875, -84.0537109375, -80.126953125, -76.2001953125, -72.2734375, -68.3466796875, -64.419921875, -60.4931640625, -56.56640625, -52.6396484375, -48.712890625, -44.7861328125, -40.859375, -36.9326171875, -33.005859375, -29.0791015625, -25.15234375, -21.2255859375, -17.298828125, -13.3720703125, -9.4453125, -5.5185546875, -1.591796875, 2.3349609375, 6.26171875, 10.1884765625, 14.115234375, 18.0419921875, 21.96875, 25.8955078125, 29.822265625, 33.7490234375, 37.67578125, 41.6025390625, 45.529296875, 49.4560546875, 53.3828125, 57.3095703125, 61.236328125, 65.1630859375, 69.08984375, 73.0166015625, 76.943359375, 80.8701171875, 84.796875, 88.7236328125, 92.650390625, 96.5771484375, 100.50390625, 104.4306640625, 108.357421875, 112.2841796875, 116.2109375, 120.1376953125, 124.064453125, 127.9912109375, 131.91796875, 135.8447265625, 139.771484375, 143.6982421875, 147.625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 8.0, 5.0, 16.0, 27.0, 46.0, 84.0, 190.0, 259.0, 182.0, 91.0, 43.0, 25.0, 7.0, 10.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.24630737304688, -155.5892333984375, -149.93214416503906, -144.2750701904297, -138.6179962158203, -132.96090698242188, -127.3038330078125, -121.64675903320312, -115.98967742919922, -110.33259582519531, -104.67552185058594, -99.01844024658203, -93.36135864257812, -87.70428466796875, -82.04720306396484, -76.39012145996094, -70.73304748535156, -65.07596588134766, -59.41889190673828, -53.761810302734375, -48.104732513427734, -42.447654724121094, -36.79057312011719, -31.133495330810547, -25.476417541503906, -19.819339752197266, -14.162260055541992, -8.505180358886719, -2.848102569580078, 2.8089752197265625, 8.466056823730469, 14.12313461303711, 19.780227661132812, 25.437305450439453, 31.094385147094727, 36.75146484375, 42.40854263305664, 48.06562042236328, 53.72270202636719, 59.37977981567383, 65.03685760498047, 70.69393920898438, 76.35101318359375, 82.00809478759766, 87.66517639160156, 93.32225036621094, 98.97933197021484, 104.63641357421875, 110.29348754882812, 115.95056915283203, 121.6076431274414, 127.26472473144531, 132.9217987060547, 138.57888793945312, 144.2359619140625, 149.89303588867188, 155.55010986328125, 161.20718383789062, 166.86427307128906, 172.52134704589844, 178.1784210205078, 183.83551025390625, 189.49258422851562, 195.149658203125, 200.80674743652344]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 8.0, 0.0, 4.0, 8.0, 13.0, 8.0, 21.0, 10.0, 13.0, 10.0, 16.0, 22.0, 19.0, 35.0, 25.0, 25.0, 39.0, 30.0, 28.0, 41.0, 39.0, 40.0, 31.0, 40.0, 40.0, 24.0, 47.0, 40.0, 32.0, 36.0, 25.0, 29.0, 27.0, 15.0, 25.0, 22.0, 18.0, 9.0, 16.0, 10.0, 9.0, 10.0, 7.0, 9.0, 10.0, 4.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-61.555450439453125, -59.51859664916992, -57.481746673583984, -55.44489288330078, -53.408042907714844, -51.37118911743164, -49.33433532714844, -47.2974853515625, -45.2606315612793, -43.223777770996094, -41.186927795410156, -39.15007400512695, -37.11322021484375, -35.07637023925781, -33.03951644897461, -31.00266456604004, -28.96581268310547, -26.9289608001709, -24.892108917236328, -22.855255126953125, -20.818403244018555, -18.781551361083984, -16.74469757080078, -14.707845687866211, -12.67099380493164, -10.63414192199707, -8.597289085388184, -6.560436725616455, -4.523584365844727, -2.4867324829101562, -0.44987964630126953, 1.5869731903076172, 3.6238250732421875, 5.660677433013916, 7.6975297927856445, 9.734382629394531, 11.771234512329102, 13.808086395263672, 15.844939231872559, 17.881792068481445, 19.918643951416016, 21.955495834350586, 23.992347717285156, 26.02920150756836, 28.06605339050293, 30.1029052734375, 32.1397590637207, 34.176612854003906, 36.213462829589844, 38.25031661987305, 40.287166595458984, 42.32402038574219, 44.360870361328125, 46.39772415161133, 48.43457794189453, 50.47142791748047, 52.50828170776367, 54.545135498046875, 56.58198547363281, 58.618839263916016, 60.65569305419922, 62.692543029785156, 64.7293930053711, 66.76625061035156, 68.8031005859375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 1.0, 4.0, 9.0, 10.0, 12.0, 13.0, 12.0, 21.0, 30.0, 16.0, 27.0, 28.0, 37.0, 24.0, 16.0, 45.0, 46.0, 34.0, 51.0, 35.0, 48.0, 38.0, 33.0, 40.0, 34.0, 27.0, 34.0, 27.0, 40.0, 28.0, 28.0, 18.0, 24.0, 19.0, 13.0, 16.0, 14.0, 8.0, 11.0, 7.0, 9.0, 5.0, 4.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.7734375, -13.3431396484375, -12.912841796875, -12.4825439453125, -12.05224609375, -11.6219482421875, -11.191650390625, -10.7613525390625, -10.3310546875, -9.9007568359375, -9.470458984375, -9.0401611328125, -8.60986328125, -8.1795654296875, -7.749267578125, -7.3189697265625, -6.888671875, -6.4583740234375, -6.028076171875, -5.5977783203125, -5.16748046875, -4.7371826171875, -4.306884765625, -3.8765869140625, -3.4462890625, -3.0159912109375, -2.585693359375, -2.1553955078125, -1.72509765625, -1.2947998046875, -0.864501953125, -0.4342041015625, -0.00390625, 0.4263916015625, 0.856689453125, 1.2869873046875, 1.71728515625, 2.1475830078125, 2.577880859375, 3.0081787109375, 3.4384765625, 3.8687744140625, 4.299072265625, 4.7293701171875, 5.15966796875, 5.5899658203125, 6.020263671875, 6.4505615234375, 6.880859375, 7.3111572265625, 7.741455078125, 8.1717529296875, 8.60205078125, 9.0323486328125, 9.462646484375, 9.8929443359375, 10.3232421875, 10.7535400390625, 11.183837890625, 11.6141357421875, 12.04443359375, 12.4747314453125, 12.905029296875, 13.3353271484375, 13.765625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 8.0, 11.0, 17.0, 42.0, 49.0, 78.0, 117.0, 138.0, 246.0, 358.0, 631.0, 940.0, 1439.0, 2209.0, 3396.0, 5431.0, 8680.0, 13729.0, 21931.0, 35402.0, 58075.0, 100568.0, 177974.0, 237592.0, 155526.0, 87870.0, 51425.0, 31761.0, 19473.0, 12170.0, 7757.0, 5011.0, 3120.0, 1905.0, 1218.0, 762.0, 507.0, 340.0, 219.0, 147.0, 95.0, 66.0, 44.0, 22.0, 20.0, 6.0, 6.0, 9.0, 6.0, 8.0, 1.0, 0.0, 2.0], "bins": [-1.53125, -1.4867095947265625, -1.442169189453125, -1.3976287841796875, -1.35308837890625, -1.3085479736328125, -1.264007568359375, -1.2194671630859375, -1.1749267578125, -1.1303863525390625, -1.085845947265625, -1.0413055419921875, -0.99676513671875, -0.9522247314453125, -0.907684326171875, -0.8631439208984375, -0.818603515625, -0.7740631103515625, -0.729522705078125, -0.6849822998046875, -0.64044189453125, -0.5959014892578125, -0.551361083984375, -0.5068206787109375, -0.4622802734375, -0.4177398681640625, -0.373199462890625, -0.3286590576171875, -0.28411865234375, -0.2395782470703125, -0.195037841796875, -0.1504974365234375, -0.10595703125, -0.0614166259765625, -0.016876220703125, 0.0276641845703125, 0.07220458984375, 0.1167449951171875, 0.161285400390625, 0.2058258056640625, 0.2503662109375, 0.2949066162109375, 0.339447021484375, 0.3839874267578125, 0.42852783203125, 0.4730682373046875, 0.517608642578125, 0.5621490478515625, 0.606689453125, 0.6512298583984375, 0.695770263671875, 0.7403106689453125, 0.78485107421875, 0.8293914794921875, 0.873931884765625, 0.9184722900390625, 0.9630126953125, 1.0075531005859375, 1.052093505859375, 1.0966339111328125, 1.14117431640625, 1.1857147216796875, 1.230255126953125, 1.2747955322265625, 1.3193359375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 4.0, 6.0, 7.0, 24.0, 18.0, 11.0, 14.0, 19.0, 29.0, 20.0, 31.0, 29.0, 29.0, 29.0, 39.0, 39.0, 45.0, 38.0, 38.0, 1062.0, 37.0, 50.0, 43.0, 32.0, 36.0, 38.0, 30.0, 36.0, 25.0, 27.0, 14.0, 14.0, 25.0, 9.0, 17.0, 13.0, 8.0, 10.0, 8.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.375, -8.0994873046875, -7.823974609375, -7.5484619140625, -7.27294921875, -6.9974365234375, -6.721923828125, -6.4464111328125, -6.1708984375, -5.8953857421875, -5.619873046875, -5.3443603515625, -5.06884765625, -4.7933349609375, -4.517822265625, -4.2423095703125, -3.966796875, -3.6912841796875, -3.415771484375, -3.1402587890625, -2.86474609375, -2.5892333984375, -2.313720703125, -2.0382080078125, -1.7626953125, -1.4871826171875, -1.211669921875, -0.9361572265625, -0.66064453125, -0.3851318359375, -0.109619140625, 0.1658935546875, 0.44140625, 0.7169189453125, 0.992431640625, 1.2679443359375, 1.54345703125, 1.8189697265625, 2.094482421875, 2.3699951171875, 2.6455078125, 2.9210205078125, 3.196533203125, 3.4720458984375, 3.74755859375, 4.0230712890625, 4.298583984375, 4.5740966796875, 4.849609375, 5.1251220703125, 5.400634765625, 5.6761474609375, 5.95166015625, 6.2271728515625, 6.502685546875, 6.7781982421875, 7.0537109375, 7.3292236328125, 7.604736328125, 7.8802490234375, 8.15576171875, 8.4312744140625, 8.706787109375, 8.9822998046875, 9.2578125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 7.0, 13.0, 20.0, 28.0, 32.0, 93.0, 116.0, 167.0, 261.0, 401.0, 562.0, 888.0, 1375.0, 2069.0, 3192.0, 4884.0, 7660.0, 12195.0, 19286.0, 31544.0, 54478.0, 95248.0, 172042.0, 1285713.0, 170968.0, 95191.0, 53792.0, 31456.0, 19506.0, 11935.0, 7802.0, 4970.0, 3230.0, 2021.0, 1421.0, 867.0, 560.0, 355.0, 258.0, 202.0, 107.0, 75.0, 54.0, 21.0, 8.0, 16.0, 20.0, 13.0, 5.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.90087890625, -0.8739852905273438, -0.8470916748046875, -0.8201980590820312, -0.793304443359375, -0.7664108276367188, -0.7395172119140625, -0.7126235961914062, -0.68572998046875, -0.6588363647460938, -0.6319427490234375, -0.6050491333007812, -0.578155517578125, -0.5512619018554688, -0.5243682861328125, -0.49747467041015625, -0.4705810546875, -0.44368743896484375, -0.4167938232421875, -0.38990020751953125, -0.363006591796875, -0.33611297607421875, -0.3092193603515625, -0.28232574462890625, -0.25543212890625, -0.22853851318359375, -0.2016448974609375, -0.17475128173828125, -0.147857666015625, -0.12096405029296875, -0.0940704345703125, -0.06717681884765625, -0.040283203125, -0.01338958740234375, 0.0135040283203125, 0.04039764404296875, 0.067291259765625, 0.09418487548828125, 0.1210784912109375, 0.14797210693359375, 0.17486572265625, 0.20175933837890625, 0.2286529541015625, 0.25554656982421875, 0.282440185546875, 0.30933380126953125, 0.3362274169921875, 0.36312103271484375, 0.3900146484375, 0.41690826416015625, 0.4438018798828125, 0.47069549560546875, 0.497589111328125, 0.5244827270507812, 0.5513763427734375, 0.5782699584960938, 0.60516357421875, 0.6320571899414062, 0.6589508056640625, 0.6858444213867188, 0.712738037109375, 0.7396316528320312, 0.7665252685546875, 0.7934188842773438, 0.8203125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 6.0, 7.0, 6.0, 4.0, 13.0, 4.0, 14.0, 15.0, 24.0, 20.0, 24.0, 24.0, 30.0, 30.0, 30.0, 52.0, 68.0, 77.0, 92.0, 78.0, 60.0, 45.0, 36.0, 32.0, 39.0, 25.0, 25.0, 17.0, 18.0, 13.0, 10.0, 9.0, 10.0, 6.0, 5.0, 2.0, 5.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0145721435546875, -0.01407313346862793, -0.01357412338256836, -0.013075113296508789, -0.012576103210449219, -0.012077093124389648, -0.011578083038330078, -0.011079072952270508, -0.010580062866210938, -0.010081052780151367, -0.009582042694091797, -0.009083032608032227, -0.008584022521972656, -0.008085012435913086, -0.007586002349853516, -0.007086992263793945, -0.006587982177734375, -0.006088972091674805, -0.005589962005615234, -0.005090951919555664, -0.004591941833496094, -0.0040929317474365234, -0.003593921661376953, -0.003094911575317383, -0.0025959014892578125, -0.002096891403198242, -0.0015978813171386719, -0.0010988712310791016, -0.0005998611450195312, -0.00010085105895996094, 0.0003981590270996094, 0.0008971691131591797, 0.00139617919921875, 0.0018951892852783203, 0.0023941993713378906, 0.002893209457397461, 0.0033922195434570312, 0.0038912296295166016, 0.004390239715576172, 0.004889249801635742, 0.0053882598876953125, 0.005887269973754883, 0.006386280059814453, 0.0068852901458740234, 0.007384300231933594, 0.007883310317993164, 0.008382320404052734, 0.008881330490112305, 0.009380340576171875, 0.009879350662231445, 0.010378360748291016, 0.010877370834350586, 0.011376380920410156, 0.011875391006469727, 0.012374401092529297, 0.012873411178588867, 0.013372421264648438, 0.013871431350708008, 0.014370441436767578, 0.014869451522827148, 0.015368461608886719, 0.01586747169494629, 0.01636648178100586, 0.01686549186706543, 0.017364501953125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 9.0, 7.0, 9.0, 7.0, 13.0, 14.0, 14.0, 22.0, 15.0, 15.0, 30.0, 44.0, 64.0, 72.0, 95.0, 186.0, 283.0, 1037.0, 19707.0, 991344.0, 33322.0, 1336.0, 304.0, 155.0, 109.0, 75.0, 50.0, 39.0, 36.0, 30.0, 18.0, 24.0, 10.0, 5.0, 12.0, 7.0, 5.0, 11.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.34716796875, -0.336822509765625, -0.32647705078125, -0.316131591796875, -0.3057861328125, -0.295440673828125, -0.28509521484375, -0.274749755859375, -0.264404296875, -0.254058837890625, -0.24371337890625, -0.233367919921875, -0.2230224609375, -0.212677001953125, -0.20233154296875, -0.191986083984375, -0.181640625, -0.171295166015625, -0.16094970703125, -0.150604248046875, -0.1402587890625, -0.129913330078125, -0.11956787109375, -0.109222412109375, -0.098876953125, -0.088531494140625, -0.07818603515625, -0.067840576171875, -0.0574951171875, -0.047149658203125, -0.03680419921875, -0.026458740234375, -0.01611328125, -0.005767822265625, 0.00457763671875, 0.014923095703125, 0.0252685546875, 0.035614013671875, 0.04595947265625, 0.056304931640625, 0.066650390625, 0.076995849609375, 0.08734130859375, 0.097686767578125, 0.1080322265625, 0.118377685546875, 0.12872314453125, 0.139068603515625, 0.1494140625, 0.159759521484375, 0.17010498046875, 0.180450439453125, 0.1907958984375, 0.201141357421875, 0.21148681640625, 0.221832275390625, 0.232177734375, 0.242523193359375, 0.25286865234375, 0.263214111328125, 0.2735595703125, 0.283905029296875, 0.29425048828125, 0.304595947265625, 0.31494140625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 20.0, 130.0, 664.0, 146.0, 44.0, 9.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04348637908697128, -0.037645310163497925, -0.031804244965314865, -0.025963177904486656, -0.020122110843658447, -0.014281043782830238, -0.00843997672200203, -0.0025989115238189697, 0.0032421573996543884, 0.009083224460482597, 0.014924291521310806, 0.020765358582139015, 0.026606425642967224, 0.03244749456644058, 0.03828855976462364, 0.0441296249628067, 0.04997069388628006, 0.05581176280975342, 0.06165282800793648, 0.06749389320611954, 0.0733349621295929, 0.07917603105306625, 0.08501709997653961, 0.09085816144943237, 0.09669923037290573, 0.10254029929637909, 0.10838136076927185, 0.11422242969274521, 0.12006349861621857, 0.12590456008911133, 0.13174563646316528, 0.13758669793605804, 0.1434277594089508, 0.14926882088184357, 0.15510989725589752, 0.16095095872879028, 0.16679203510284424, 0.172633096575737, 0.17847415804862976, 0.18431523442268372, 0.19015629589557648, 0.19599735736846924, 0.2018384337425232, 0.20767949521541595, 0.21352055668830872, 0.21936163306236267, 0.22520269453525543, 0.2310437560081482, 0.23688483238220215, 0.2427258938550949, 0.24856697022914886, 0.2544080317020416, 0.2602491080760956, 0.26609015464782715, 0.2719312310218811, 0.27777230739593506, 0.283613383769989, 0.28945446014404297, 0.29529550671577454, 0.3011365830898285, 0.30697765946388245, 0.312818706035614, 0.31865978240966797, 0.3245008587837219, 0.3303419053554535]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 9.0, 7.0, 9.0, 10.0, 10.0, 13.0, 18.0, 18.0, 26.0, 31.0, 24.0, 24.0, 32.0, 33.0, 28.0, 33.0, 43.0, 44.0, 49.0, 39.0, 46.0, 43.0, 51.0, 43.0, 36.0, 33.0, 38.0, 27.0, 25.0, 22.0, 29.0, 21.0, 20.0, 16.0, 8.0, 11.0, 8.0, 3.0, 8.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02180624008178711, -0.021124038845300674, -0.02044183947145939, -0.019759640097618103, -0.019077438861131668, -0.018395237624645233, -0.017713038250803947, -0.017030838876962662, -0.016348637640476227, -0.015666436403989792, -0.014984237030148506, -0.014302036724984646, -0.013619836419820786, -0.012937636114656925, -0.012255435809493065, -0.011573235504329205, -0.010891035199165344, -0.010208834894001484, -0.009526634588837624, -0.008844434283673763, -0.008162233978509903, -0.007480033673346043, -0.006797833368182182, -0.006115633063018322, -0.005433432757854462, -0.004751232452690601, -0.004069032147526741, -0.0033868318423628807, -0.0027046315371990204, -0.00202243123203516, -0.0013402309268712997, -0.0006580306217074394, 2.41696834564209e-05, 0.0007063699886202812, 0.0013885702937841415, 0.002070770598948002, 0.002752970904111862, 0.0034351712092757225, 0.004117371514439583, 0.004799571819603443, 0.0054817721247673035, 0.006163972429931164, 0.006846172735095024, 0.007528373040258884, 0.008210573345422745, 0.008892773650586605, 0.009574973955750465, 0.010257174260914326, 0.010939374566078186, 0.011621574871242046, 0.012303775176405907, 0.012985975481569767, 0.013668175786733627, 0.014350376091897488, 0.015032576397061348, 0.015714775770902634, 0.01639697700738907, 0.017079178243875504, 0.01776137761771679, 0.018443576991558075, 0.01912577822804451, 0.019807979464530945, 0.02049017883837223, 0.021172378212213516, 0.02185457944869995]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 1.0, 4.0, 9.0, 10.0, 12.0, 13.0, 12.0, 21.0, 30.0, 16.0, 27.0, 28.0, 37.0, 24.0, 16.0, 44.0, 47.0, 34.0, 51.0, 35.0, 48.0, 38.0, 33.0, 40.0, 34.0, 27.0, 35.0, 25.0, 41.0, 28.0, 28.0, 18.0, 24.0, 19.0, 13.0, 16.0, 14.0, 8.0, 11.0, 7.0, 9.0, 5.0, 4.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.7734375, -13.3431396484375, -12.912841796875, -12.4825439453125, -12.05224609375, -11.6219482421875, -11.191650390625, -10.7613525390625, -10.3310546875, -9.9007568359375, -9.470458984375, -9.0401611328125, -8.60986328125, -8.1795654296875, -7.749267578125, -7.3189697265625, -6.888671875, -6.4583740234375, -6.028076171875, -5.5977783203125, -5.16748046875, -4.7371826171875, -4.306884765625, -3.8765869140625, -3.4462890625, -3.0159912109375, -2.585693359375, -2.1553955078125, -1.72509765625, -1.2947998046875, -0.864501953125, -0.4342041015625, -0.00390625, 0.4263916015625, 0.856689453125, 1.2869873046875, 1.71728515625, 2.1475830078125, 2.577880859375, 3.0081787109375, 3.4384765625, 3.8687744140625, 4.299072265625, 4.7293701171875, 5.15966796875, 5.5899658203125, 6.020263671875, 6.4505615234375, 6.880859375, 7.3111572265625, 7.741455078125, 8.1717529296875, 8.60205078125, 9.0323486328125, 9.462646484375, 9.8929443359375, 10.3232421875, 10.7535400390625, 11.183837890625, 11.6141357421875, 12.04443359375, 12.4747314453125, 12.905029296875, 13.3353271484375, 13.765625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 4.0, 3.0, 15.0, 14.0, 20.0, 21.0, 48.0, 41.0, 71.0, 91.0, 106.0, 186.0, 263.0, 355.0, 528.0, 777.0, 1205.0, 2070.0, 3838.0, 9849.0, 44511.0, 345375.0, 549715.0, 65372.0, 12964.0, 4767.0, 2388.0, 1328.0, 897.0, 503.0, 342.0, 229.0, 163.0, 120.0, 92.0, 67.0, 53.0, 45.0, 24.0, 25.0, 20.0, 11.0, 9.0, 8.0, 9.0, 7.0, 6.0, 6.0, 3.0, 1.0, 0.0, 2.0], "bins": [-16.96875, -16.47119140625, -15.9736328125, -15.47607421875, -14.978515625, -14.48095703125, -13.9833984375, -13.48583984375, -12.98828125, -12.49072265625, -11.9931640625, -11.49560546875, -10.998046875, -10.50048828125, -10.0029296875, -9.50537109375, -9.0078125, -8.51025390625, -8.0126953125, -7.51513671875, -7.017578125, -6.52001953125, -6.0224609375, -5.52490234375, -5.02734375, -4.52978515625, -4.0322265625, -3.53466796875, -3.037109375, -2.53955078125, -2.0419921875, -1.54443359375, -1.046875, -0.54931640625, -0.0517578125, 0.44580078125, 0.943359375, 1.44091796875, 1.9384765625, 2.43603515625, 2.93359375, 3.43115234375, 3.9287109375, 4.42626953125, 4.923828125, 5.42138671875, 5.9189453125, 6.41650390625, 6.9140625, 7.41162109375, 7.9091796875, 8.40673828125, 8.904296875, 9.40185546875, 9.8994140625, 10.39697265625, 10.89453125, 11.39208984375, 11.8896484375, 12.38720703125, 12.884765625, 13.38232421875, 13.8798828125, 14.37744140625, 14.875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 8.0, 8.0, 9.0, 12.0, 17.0, 18.0, 18.0, 17.0, 23.0, 11.0, 22.0, 42.0, 34.0, 41.0, 52.0, 42.0, 78.0, 108.0, 1855.0, 146.0, 52.0, 72.0, 36.0, 42.0, 33.0, 36.0, 29.0, 30.0, 21.0, 29.0, 23.0, 14.0, 17.0, 8.0, 10.0, 4.0, 5.0, 9.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.6875, -35.52685546875, -34.3662109375, -33.20556640625, -32.044921875, -30.88427734375, -29.7236328125, -28.56298828125, -27.40234375, -26.24169921875, -25.0810546875, -23.92041015625, -22.759765625, -21.59912109375, -20.4384765625, -19.27783203125, -18.1171875, -16.95654296875, -15.7958984375, -14.63525390625, -13.474609375, -12.31396484375, -11.1533203125, -9.99267578125, -8.83203125, -7.67138671875, -6.5107421875, -5.35009765625, -4.189453125, -3.02880859375, -1.8681640625, -0.70751953125, 0.453125, 1.61376953125, 2.7744140625, 3.93505859375, 5.095703125, 6.25634765625, 7.4169921875, 8.57763671875, 9.73828125, 10.89892578125, 12.0595703125, 13.22021484375, 14.380859375, 15.54150390625, 16.7021484375, 17.86279296875, 19.0234375, 20.18408203125, 21.3447265625, 22.50537109375, 23.666015625, 24.82666015625, 25.9873046875, 27.14794921875, 28.30859375, 29.46923828125, 30.6298828125, 31.79052734375, 32.951171875, 34.11181640625, 35.2724609375, 36.43310546875, 37.59375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 9.0, 5.0, 17.0, 19.0, 36.0, 78.0, 137.0, 335.0, 728.0, 9750.0, 3129398.0, 4076.0, 593.0, 256.0, 110.0, 64.0, 44.0, 22.0, 13.0, 9.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-170.25, -164.25390625, -158.2578125, -152.26171875, -146.265625, -140.26953125, -134.2734375, -128.27734375, -122.28125, -116.28515625, -110.2890625, -104.29296875, -98.296875, -92.30078125, -86.3046875, -80.30859375, -74.3125, -68.31640625, -62.3203125, -56.32421875, -50.328125, -44.33203125, -38.3359375, -32.33984375, -26.34375, -20.34765625, -14.3515625, -8.35546875, -2.359375, 3.63671875, 9.6328125, 15.62890625, 21.625, 27.62109375, 33.6171875, 39.61328125, 45.609375, 51.60546875, 57.6015625, 63.59765625, 69.59375, 75.58984375, 81.5859375, 87.58203125, 93.578125, 99.57421875, 105.5703125, 111.56640625, 117.5625, 123.55859375, 129.5546875, 135.55078125, 141.546875, 147.54296875, 153.5390625, 159.53515625, 165.53125, 171.52734375, 177.5234375, 183.51953125, 189.515625, 195.51171875, 201.5078125, 207.50390625, 213.5]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 30.0, 265.0, 542.0, 146.0, 20.0, 7.0], "bins": [-374.1932678222656, -367.989501953125, -361.7857666015625, -355.5820007324219, -349.3782653808594, -343.17449951171875, -336.9707336425781, -330.7669982910156, -324.563232421875, -318.3594665527344, -312.1557312011719, -305.95196533203125, -299.74822998046875, -293.5444641113281, -287.3406982421875, -281.136962890625, -274.9331970214844, -268.72943115234375, -262.52569580078125, -256.3219299316406, -250.11817932128906, -243.9144287109375, -237.71067810058594, -231.50692749023438, -225.3031768798828, -219.09942626953125, -212.8956756591797, -206.69190979003906, -200.4881591796875, -194.28440856933594, -188.08065795898438, -181.87689208984375, -175.6731414794922, -169.46939086914062, -163.26564025878906, -157.06187438964844, -150.85812377929688, -144.6543731689453, -138.45062255859375, -132.24685668945312, -126.0431137084961, -119.83936309814453, -113.63560485839844, -107.43185424804688, -101.22809600830078, -95.02434539794922, -88.82058715820312, -82.61683654785156, -76.41307830810547, -70.2093276977539, -64.00556945800781, -57.80181884765625, -51.598060607910156, -45.394309997558594, -39.190555572509766, -32.98680114746094, -26.783048629760742, -20.579294204711914, -14.375540733337402, -8.17178726196289, -1.9680328369140625, 4.235721588134766, 10.439474105834961, 16.64322853088379, 22.846982955932617]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 9.0, 4.0, 14.0, 20.0, 11.0, 18.0, 18.0, 16.0, 18.0, 28.0, 26.0, 37.0, 29.0, 37.0, 55.0, 38.0, 33.0, 40.0, 65.0, 44.0, 36.0, 30.0, 37.0, 30.0, 33.0, 35.0, 33.0, 34.0, 21.0, 24.0, 20.0, 21.0, 14.0, 14.0, 15.0, 9.0, 7.0, 8.0, 7.0, 2.0, 5.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-106.68331146240234, -103.46924591064453, -100.25518035888672, -97.0411148071289, -93.8270492553711, -90.61298370361328, -87.39892578125, -84.18486022949219, -80.97079467773438, -77.75672912597656, -74.54266357421875, -71.32859802246094, -68.11453247070312, -64.90046691894531, -61.686405181884766, -58.47233963012695, -55.258270263671875, -52.04420471191406, -48.83013916015625, -45.61607360839844, -42.402008056640625, -39.18794250488281, -35.973880767822266, -32.75981521606445, -29.54574966430664, -26.331684112548828, -23.117618560791016, -19.903554916381836, -16.689489364624023, -13.475423812866211, -10.261360168457031, -7.047294616699219, -3.8332366943359375, -0.6191716194152832, 2.594893455505371, 5.808958053588867, 9.02302360534668, 12.237089157104492, 15.451152801513672, 18.665218353271484, 21.879283905029297, 25.09334945678711, 28.307415008544922, 31.5214786529541, 34.73554229736328, 37.949607849121094, 41.163673400878906, 44.37773895263672, 47.59180450439453, 50.805870056152344, 54.019935607910156, 57.23400115966797, 60.44806671142578, 63.662132263183594, 66.87619018554688, 70.09025573730469, 73.3043212890625, 76.51838684082031, 79.73245239257812, 82.94651794433594, 86.16058349609375, 89.37464904785156, 92.58871459960938, 95.80278015136719, 99.016845703125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 8.0, 9.0, 8.0, 19.0, 19.0, 21.0, 25.0, 31.0, 14.0, 34.0, 37.0, 30.0, 33.0, 37.0, 41.0, 55.0, 37.0, 26.0, 45.0, 35.0, 54.0, 35.0, 40.0, 35.0, 25.0, 30.0, 23.0, 27.0, 26.0, 26.0, 16.0, 19.0, 15.0, 9.0, 11.0, 14.0, 4.0, 5.0, 6.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.7265625, -14.269287109375, -13.81201171875, -13.354736328125, -12.8974609375, -12.440185546875, -11.98291015625, -11.525634765625, -11.068359375, -10.611083984375, -10.15380859375, -9.696533203125, -9.2392578125, -8.781982421875, -8.32470703125, -7.867431640625, -7.41015625, -6.952880859375, -6.49560546875, -6.038330078125, -5.5810546875, -5.123779296875, -4.66650390625, -4.209228515625, -3.751953125, -3.294677734375, -2.83740234375, -2.380126953125, -1.9228515625, -1.465576171875, -1.00830078125, -0.551025390625, -0.09375, 0.363525390625, 0.82080078125, 1.278076171875, 1.7353515625, 2.192626953125, 2.64990234375, 3.107177734375, 3.564453125, 4.021728515625, 4.47900390625, 4.936279296875, 5.3935546875, 5.850830078125, 6.30810546875, 6.765380859375, 7.22265625, 7.679931640625, 8.13720703125, 8.594482421875, 9.0517578125, 9.509033203125, 9.96630859375, 10.423583984375, 10.880859375, 11.338134765625, 11.79541015625, 12.252685546875, 12.7099609375, 13.167236328125, 13.62451171875, 14.081787109375, 14.5390625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 7.0, 7.0, 8.0, 11.0, 20.0, 25.0, 27.0, 39.0, 48.0, 79.0, 140.0, 253.0, 481.0, 882.0, 1786.0, 3367.0, 7261.0, 39342.0, 2579382.0, 1524498.0, 23037.0, 6514.0, 3038.0, 1714.0, 948.0, 520.0, 311.0, 184.0, 115.0, 77.0, 36.0, 33.0, 18.0, 17.0, 17.0, 8.0, 8.0, 4.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-54.5, -52.84521484375, -51.1904296875, -49.53564453125, -47.880859375, -46.22607421875, -44.5712890625, -42.91650390625, -41.26171875, -39.60693359375, -37.9521484375, -36.29736328125, -34.642578125, -32.98779296875, -31.3330078125, -29.67822265625, -28.0234375, -26.36865234375, -24.7138671875, -23.05908203125, -21.404296875, -19.74951171875, -18.0947265625, -16.43994140625, -14.78515625, -13.13037109375, -11.4755859375, -9.82080078125, -8.166015625, -6.51123046875, -4.8564453125, -3.20166015625, -1.546875, 0.10791015625, 1.7626953125, 3.41748046875, 5.072265625, 6.72705078125, 8.3818359375, 10.03662109375, 11.69140625, 13.34619140625, 15.0009765625, 16.65576171875, 18.310546875, 19.96533203125, 21.6201171875, 23.27490234375, 24.9296875, 26.58447265625, 28.2392578125, 29.89404296875, 31.548828125, 33.20361328125, 34.8583984375, 36.51318359375, 38.16796875, 39.82275390625, 41.4775390625, 43.13232421875, 44.787109375, 46.44189453125, 48.0966796875, 49.75146484375, 51.40625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 11.0, 8.0, 8.0, 9.0, 9.0, 16.0, 18.0, 24.0, 39.0, 65.0, 124.0, 218.0, 484.0, 783.0, 947.0, 626.0, 305.0, 145.0, 79.0, 35.0, 27.0, 17.0, 20.0, 10.0, 6.0, 4.0, 5.0, 6.0, 4.0, 3.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.59375, -31.6396484375, -30.685546875, -29.7314453125, -28.77734375, -27.8232421875, -26.869140625, -25.9150390625, -24.9609375, -24.0068359375, -23.052734375, -22.0986328125, -21.14453125, -20.1904296875, -19.236328125, -18.2822265625, -17.328125, -16.3740234375, -15.419921875, -14.4658203125, -13.51171875, -12.5576171875, -11.603515625, -10.6494140625, -9.6953125, -8.7412109375, -7.787109375, -6.8330078125, -5.87890625, -4.9248046875, -3.970703125, -3.0166015625, -2.0625, -1.1083984375, -0.154296875, 0.7998046875, 1.75390625, 2.7080078125, 3.662109375, 4.6162109375, 5.5703125, 6.5244140625, 7.478515625, 8.4326171875, 9.38671875, 10.3408203125, 11.294921875, 12.2490234375, 13.203125, 14.1572265625, 15.111328125, 16.0654296875, 17.01953125, 17.9736328125, 18.927734375, 19.8818359375, 20.8359375, 21.7900390625, 22.744140625, 23.6982421875, 24.65234375, 25.6064453125, 26.560546875, 27.5146484375, 28.46875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 3.0, 2.0, 8.0, 3.0, 7.0, 11.0, 14.0, 16.0, 35.0, 58.0, 84.0, 190.0, 422.0, 1450.0, 6925.0, 64026.0, 4069577.0, 43877.0, 5578.0, 1191.0, 379.0, 162.0, 77.0, 57.0, 38.0, 21.0, 14.0, 9.0, 7.0, 12.0, 7.0, 9.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.4375, -121.1767578125, -116.916015625, -112.6552734375, -108.39453125, -104.1337890625, -99.873046875, -95.6123046875, -91.3515625, -87.0908203125, -82.830078125, -78.5693359375, -74.30859375, -70.0478515625, -65.787109375, -61.5263671875, -57.265625, -53.0048828125, -48.744140625, -44.4833984375, -40.22265625, -35.9619140625, -31.701171875, -27.4404296875, -23.1796875, -18.9189453125, -14.658203125, -10.3974609375, -6.13671875, -1.8759765625, 2.384765625, 6.6455078125, 10.90625, 15.1669921875, 19.427734375, 23.6884765625, 27.94921875, 32.2099609375, 36.470703125, 40.7314453125, 44.9921875, 49.2529296875, 53.513671875, 57.7744140625, 62.03515625, 66.2958984375, 70.556640625, 74.8173828125, 79.078125, 83.3388671875, 87.599609375, 91.8603515625, 96.12109375, 100.3818359375, 104.642578125, 108.9033203125, 113.1640625, 117.4248046875, 121.685546875, 125.9462890625, 130.20703125, 134.4677734375, 138.728515625, 142.9892578125, 147.25]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 4.0, 7.0, 3.0, 11.0, 9.0, 14.0, 16.0, 31.0, 36.0, 44.0, 75.0, 121.0, 120.0, 141.0, 98.0, 74.0, 55.0, 33.0, 26.0, 23.0, 14.0, 14.0, 10.0, 3.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-116.70932006835938, -113.93148803710938, -111.15364837646484, -108.37581634521484, -105.59797668457031, -102.82014465332031, -100.04231262207031, -97.26447296142578, -94.48663330078125, -91.70880126953125, -88.93096160888672, -86.15312957763672, -83.37528991699219, -80.59745788574219, -77.81962585449219, -75.04178619384766, -72.26395416259766, -69.48612213134766, -66.70828247070312, -63.930450439453125, -61.152610778808594, -58.374778747558594, -55.59694290161133, -52.81910705566406, -50.0412712097168, -47.26343536376953, -44.485599517822266, -41.707763671875, -38.929931640625, -36.15209197998047, -33.37425994873047, -30.596424102783203, -27.818580627441406, -25.04074478149414, -22.262908935546875, -19.485074996948242, -16.707239151000977, -13.929403305053711, -11.151569366455078, -8.373733520507812, -5.595897674560547, -2.8180623054504395, -0.04022693634033203, 2.737607955932617, 5.515443801879883, 8.293279647827148, 11.071113586425781, 13.848949432373047, 16.626785278320312, 19.404621124267578, 22.182456970214844, 24.960290908813477, 27.738126754760742, 30.515962600708008, 33.29379653930664, 36.071632385253906, 38.84946823120117, 41.62730407714844, 44.4051399230957, 47.18297576904297, 49.96080780029297, 52.7386474609375, 55.5164794921875, 58.294315338134766, 61.07215118408203]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 6.0, 7.0, 7.0, 10.0, 11.0, 13.0, 13.0, 11.0, 14.0, 21.0, 15.0, 25.0, 27.0, 29.0, 28.0, 29.0, 28.0, 19.0, 37.0, 31.0, 34.0, 36.0, 47.0, 53.0, 43.0, 44.0, 39.0, 30.0, 19.0, 29.0, 24.0, 39.0, 20.0, 27.0, 26.0, 17.0, 20.0, 10.0, 14.0, 13.0, 8.0, 5.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-63.53112030029297, -61.490440368652344, -59.44975662231445, -57.40907669067383, -55.36839294433594, -53.32771301269531, -51.28703308105469, -49.24635314941406, -47.20566940307617, -45.16498947143555, -43.124305725097656, -41.08362579345703, -39.042945861816406, -37.002262115478516, -34.96158218383789, -32.9208984375, -30.880218505859375, -28.839536666870117, -26.79885482788086, -24.758174896240234, -22.717493057250977, -20.67681121826172, -18.636131286621094, -16.595449447631836, -14.554767608642578, -12.51408576965332, -10.473404884338379, -8.432723999023438, -6.39204216003418, -4.351360321044922, -2.3106794357299805, -0.26999855041503906, 1.7706756591796875, 3.811357021331787, 5.852038383483887, 7.892719745635986, 9.933401107788086, 11.974082946777344, 14.014763832092285, 16.055444717407227, 18.096126556396484, 20.136808395385742, 22.177490234375, 24.218170166015625, 26.258852005004883, 28.29953384399414, 30.340213775634766, 32.380897521972656, 34.42157745361328, 36.462257385253906, 38.5029411315918, 40.54362106323242, 42.58430480957031, 44.62498474121094, 46.66566467285156, 48.70634460449219, 50.74702835083008, 52.7877082824707, 54.828392028808594, 56.86907196044922, 58.909751892089844, 60.950435638427734, 62.99111557006836, 65.03179931640625, 67.07247924804688]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 8.0, 4.0, 6.0, 9.0, 10.0, 7.0, 17.0, 13.0, 15.0, 30.0, 21.0, 20.0, 23.0, 42.0, 30.0, 30.0, 36.0, 40.0, 31.0, 46.0, 44.0, 54.0, 26.0, 38.0, 41.0, 44.0, 22.0, 28.0, 33.0, 22.0, 25.0, 34.0, 25.0, 16.0, 23.0, 15.0, 10.0, 19.0, 11.0, 5.0, 5.0, 5.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-14.0078125, -13.567138671875, -13.12646484375, -12.685791015625, -12.2451171875, -11.804443359375, -11.36376953125, -10.923095703125, -10.482421875, -10.041748046875, -9.60107421875, -9.160400390625, -8.7197265625, -8.279052734375, -7.83837890625, -7.397705078125, -6.95703125, -6.516357421875, -6.07568359375, -5.635009765625, -5.1943359375, -4.753662109375, -4.31298828125, -3.872314453125, -3.431640625, -2.990966796875, -2.55029296875, -2.109619140625, -1.6689453125, -1.228271484375, -0.78759765625, -0.346923828125, 0.09375, 0.534423828125, 0.97509765625, 1.415771484375, 1.8564453125, 2.297119140625, 2.73779296875, 3.178466796875, 3.619140625, 4.059814453125, 4.50048828125, 4.941162109375, 5.3818359375, 5.822509765625, 6.26318359375, 6.703857421875, 7.14453125, 7.585205078125, 8.02587890625, 8.466552734375, 8.9072265625, 9.347900390625, 9.78857421875, 10.229248046875, 10.669921875, 11.110595703125, 11.55126953125, 11.991943359375, 12.4326171875, 12.873291015625, 13.31396484375, 13.754638671875, 14.1953125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 9.0, 5.0, 14.0, 25.0, 39.0, 79.0, 69.0, 142.0, 186.0, 292.0, 491.0, 786.0, 1312.0, 2064.0, 3266.0, 5161.0, 8408.0, 13775.0, 22336.0, 38546.0, 68898.0, 127093.0, 230479.0, 231079.0, 127808.0, 68982.0, 38884.0, 22626.0, 13638.0, 8588.0, 5125.0, 3149.0, 1926.0, 1240.0, 729.0, 452.0, 279.0, 198.0, 135.0, 72.0, 61.0, 32.0, 37.0, 15.0, 11.0, 6.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6943359375, -1.639678955078125, -1.58502197265625, -1.530364990234375, -1.4757080078125, -1.421051025390625, -1.36639404296875, -1.311737060546875, -1.257080078125, -1.202423095703125, -1.14776611328125, -1.093109130859375, -1.0384521484375, -0.983795166015625, -0.92913818359375, -0.874481201171875, -0.81982421875, -0.765167236328125, -0.71051025390625, -0.655853271484375, -0.6011962890625, -0.546539306640625, -0.49188232421875, -0.437225341796875, -0.382568359375, -0.327911376953125, -0.27325439453125, -0.218597412109375, -0.1639404296875, -0.109283447265625, -0.05462646484375, 3.0517578125e-05, 0.0546875, 0.109344482421875, 0.16400146484375, 0.218658447265625, 0.2733154296875, 0.327972412109375, 0.38262939453125, 0.437286376953125, 0.491943359375, 0.546600341796875, 0.60125732421875, 0.655914306640625, 0.7105712890625, 0.765228271484375, 0.81988525390625, 0.874542236328125, 0.92919921875, 0.983856201171875, 1.03851318359375, 1.093170166015625, 1.1478271484375, 1.202484130859375, 1.25714111328125, 1.311798095703125, 1.366455078125, 1.421112060546875, 1.47576904296875, 1.530426025390625, 1.5850830078125, 1.639739990234375, 1.69439697265625, 1.749053955078125, 1.8037109375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 9.0, 7.0, 10.0, 24.0, 20.0, 18.0, 29.0, 34.0, 32.0, 36.0, 28.0, 47.0, 50.0, 41.0, 42.0, 55.0, 1077.0, 46.0, 57.0, 38.0, 40.0, 38.0, 43.0, 40.0, 22.0, 20.0, 23.0, 21.0, 14.0, 11.0, 10.0, 12.0, 8.0, 10.0, 1.0, 2.0, 0.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.7578125, -12.40869140625, -12.0595703125, -11.71044921875, -11.361328125, -11.01220703125, -10.6630859375, -10.31396484375, -9.96484375, -9.61572265625, -9.2666015625, -8.91748046875, -8.568359375, -8.21923828125, -7.8701171875, -7.52099609375, -7.171875, -6.82275390625, -6.4736328125, -6.12451171875, -5.775390625, -5.42626953125, -5.0771484375, -4.72802734375, -4.37890625, -4.02978515625, -3.6806640625, -3.33154296875, -2.982421875, -2.63330078125, -2.2841796875, -1.93505859375, -1.5859375, -1.23681640625, -0.8876953125, -0.53857421875, -0.189453125, 0.15966796875, 0.5087890625, 0.85791015625, 1.20703125, 1.55615234375, 1.9052734375, 2.25439453125, 2.603515625, 2.95263671875, 3.3017578125, 3.65087890625, 4.0, 4.34912109375, 4.6982421875, 5.04736328125, 5.396484375, 5.74560546875, 6.0947265625, 6.44384765625, 6.79296875, 7.14208984375, 7.4912109375, 7.84033203125, 8.189453125, 8.53857421875, 8.8876953125, 9.23681640625, 9.5859375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 3.0, 6.0, 4.0, 10.0, 16.0, 21.0, 28.0, 42.0, 65.0, 95.0, 192.0, 326.0, 551.0, 973.0, 1722.0, 3121.0, 5675.0, 10432.0, 19693.0, 39379.0, 81452.0, 179045.0, 1363997.0, 204800.0, 92700.0, 44281.0, 22203.0, 11837.0, 6463.0, 3571.0, 1865.0, 1069.0, 596.0, 351.0, 210.0, 94.0, 72.0, 45.0, 43.0, 29.0, 21.0, 11.0, 6.0, 6.0, 5.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.193359375, -1.151611328125, -1.10986328125, -1.068115234375, -1.0263671875, -0.984619140625, -0.94287109375, -0.901123046875, -0.859375, -0.817626953125, -0.77587890625, -0.734130859375, -0.6923828125, -0.650634765625, -0.60888671875, -0.567138671875, -0.525390625, -0.483642578125, -0.44189453125, -0.400146484375, -0.3583984375, -0.316650390625, -0.27490234375, -0.233154296875, -0.19140625, -0.149658203125, -0.10791015625, -0.066162109375, -0.0244140625, 0.017333984375, 0.05908203125, 0.100830078125, 0.142578125, 0.184326171875, 0.22607421875, 0.267822265625, 0.3095703125, 0.351318359375, 0.39306640625, 0.434814453125, 0.4765625, 0.518310546875, 0.56005859375, 0.601806640625, 0.6435546875, 0.685302734375, 0.72705078125, 0.768798828125, 0.810546875, 0.852294921875, 0.89404296875, 0.935791015625, 0.9775390625, 1.019287109375, 1.06103515625, 1.102783203125, 1.14453125, 1.186279296875, 1.22802734375, 1.269775390625, 1.3115234375, 1.353271484375, 1.39501953125, 1.436767578125, 1.478515625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 5.0, 1.0, 4.0, 3.0, 6.0, 1.0, 6.0, 4.0, 5.0, 11.0, 6.0, 12.0, 23.0, 27.0, 41.0, 38.0, 34.0, 58.0, 72.0, 55.0, 114.0, 98.0, 81.0, 44.0, 40.0, 40.0, 36.0, 31.0, 25.0, 17.0, 12.0, 13.0, 9.0, 7.0, 10.0, 3.0, 6.0, 2.0, 2.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.07080078125, -0.06871604919433594, -0.06663131713867188, -0.06454658508300781, -0.06246185302734375, -0.06037712097167969, -0.058292388916015625, -0.05620765686035156, -0.0541229248046875, -0.05203819274902344, -0.049953460693359375, -0.04786872863769531, -0.04578399658203125, -0.04369926452636719, -0.041614532470703125, -0.03952980041503906, -0.037445068359375, -0.03536033630371094, -0.033275604248046875, -0.031190872192382812, -0.02910614013671875, -0.027021408081054688, -0.024936676025390625, -0.022851943969726562, -0.0207672119140625, -0.018682479858398438, -0.016597747802734375, -0.014513015747070312, -0.01242828369140625, -0.010343551635742188, -0.008258819580078125, -0.0061740875244140625, -0.00408935546875, -0.0020046234130859375, 8.0108642578125e-05, 0.0021648406982421875, 0.00424957275390625, 0.0063343048095703125, 0.008419036865234375, 0.010503768920898438, 0.0125885009765625, 0.014673233032226562, 0.016757965087890625, 0.018842697143554688, 0.02092742919921875, 0.023012161254882812, 0.025096893310546875, 0.027181625366210938, 0.029266357421875, 0.03135108947753906, 0.033435821533203125, 0.03552055358886719, 0.03760528564453125, 0.03969001770019531, 0.041774749755859375, 0.04385948181152344, 0.0459442138671875, 0.04802894592285156, 0.050113677978515625, 0.05219841003417969, 0.05428314208984375, 0.05636787414550781, 0.058452606201171875, 0.06053733825683594, 0.0626220703125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 5.0, 7.0, 8.0, 14.0, 10.0, 17.0, 24.0, 22.0, 38.0, 56.0, 72.0, 98.0, 136.0, 256.0, 950.0, 21276.0, 1004926.0, 18970.0, 836.0, 280.0, 154.0, 99.0, 72.0, 60.0, 30.0, 35.0, 20.0, 12.0, 15.0, 7.0, 8.0, 8.0, 6.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.353515625, -1.3105316162109375, -1.267547607421875, -1.2245635986328125, -1.18157958984375, -1.1385955810546875, -1.095611572265625, -1.0526275634765625, -1.0096435546875, -0.9666595458984375, -0.923675537109375, -0.8806915283203125, -0.83770751953125, -0.7947235107421875, -0.751739501953125, -0.7087554931640625, -0.665771484375, -0.6227874755859375, -0.579803466796875, -0.5368194580078125, -0.49383544921875, -0.4508514404296875, -0.407867431640625, -0.3648834228515625, -0.3218994140625, -0.2789154052734375, -0.235931396484375, -0.1929473876953125, -0.14996337890625, -0.1069793701171875, -0.063995361328125, -0.0210113525390625, 0.02197265625, 0.0649566650390625, 0.107940673828125, 0.1509246826171875, 0.19390869140625, 0.2368927001953125, 0.279876708984375, 0.3228607177734375, 0.3658447265625, 0.4088287353515625, 0.451812744140625, 0.4947967529296875, 0.53778076171875, 0.5807647705078125, 0.623748779296875, 0.6667327880859375, 0.709716796875, 0.7527008056640625, 0.795684814453125, 0.8386688232421875, 0.88165283203125, 0.9246368408203125, 0.967620849609375, 1.0106048583984375, 1.0535888671875, 1.0965728759765625, 1.139556884765625, 1.1825408935546875, 1.22552490234375, 1.2685089111328125, 1.311492919921875, 1.3544769287109375, 1.3974609375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 17.0, 89.0, 729.0, 153.0, 25.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4743356704711914, -1.4370964765548706, -1.3998572826385498, -1.362618088722229, -1.3253788948059082, -1.288139820098877, -1.2509005069732666, -1.2136614322662354, -1.1764222383499146, -1.1391830444335938, -1.101943850517273, -1.0647046566009521, -1.0274654626846313, -0.9902263283729553, -0.9529871344566345, -0.9157480001449585, -0.8785087466239929, -0.8412695527076721, -0.8040303587913513, -0.7667912244796753, -0.7295520305633545, -0.6923128366470337, -0.6550736427307129, -0.6178344488143921, -0.5805952548980713, -0.5433560609817505, -0.5061168670654297, -0.4688777029514313, -0.43163853883743286, -0.39439934492111206, -0.35716015100479126, -0.31992098689079285, -0.2826818823814392, -0.2454427033662796, -0.20820352435112, -0.1709643304347992, -0.1337251514196396, -0.09648597240447998, -0.05924677848815918, -0.022007614374160767, 0.015231579542160034, 0.05247076228260994, 0.08970994502305984, 0.12694913148880005, 0.16418831050395966, 0.20142748951911926, 0.23866668343544006, 0.2759058475494385, 0.3131450414657593, 0.3503842353820801, 0.3876233994960785, 0.4248625934123993, 0.4621017575263977, 0.4993409514427185, 0.5365801453590393, 0.5738192796707153, 0.6110584735870361, 0.6482976675033569, 0.6855368614196777, 0.7227760553359985, 0.7600151896476746, 0.7972543835639954, 0.8344935774803162, 0.8717327117919922, 0.9089719653129578]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 8.0, 6.0, 7.0, 5.0, 7.0, 15.0, 12.0, 25.0, 17.0, 18.0, 19.0, 40.0, 32.0, 33.0, 45.0, 44.0, 39.0, 49.0, 33.0, 48.0, 45.0, 49.0, 40.0, 43.0, 38.0, 40.0, 33.0, 26.0, 29.0, 34.0, 23.0, 24.0, 19.0, 16.0, 9.0, 11.0, 8.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1353248953819275, -0.1309289038181305, -0.1265329122543335, -0.1221369281411171, -0.1177409365773201, -0.1133449450135231, -0.1089489609003067, -0.1045529693365097, -0.10015697777271271, -0.09576098620891571, -0.09136499464511871, -0.08696901053190231, -0.08257301896810532, -0.07817702740430832, -0.07378104329109192, -0.06938505172729492, -0.06498906016349792, -0.06059306859970093, -0.05619708076119423, -0.05180109292268753, -0.04740510135889053, -0.043009109795093536, -0.03861312195658684, -0.03421713411808014, -0.029821142554283142, -0.025425152853131294, -0.021029163151979446, -0.0166331734508276, -0.01223718374967575, -0.007841194048523903, -0.003445204347372055, 0.0009507853537797928, 0.005346775054931641, 0.009742764756083488, 0.014138754457235336, 0.018534744158387184, 0.022930733859539032, 0.02732672356069088, 0.03172271326184273, 0.036118701100349426, 0.04051469266414642, 0.04491068422794342, 0.04930667206645012, 0.05370265990495682, 0.058098651468753815, 0.06249464303255081, 0.06689062714576721, 0.07128661870956421, 0.0756826102733612, 0.0800786018371582, 0.0844745934009552, 0.0888705775141716, 0.0932665690779686, 0.0976625606417656, 0.102058544754982, 0.10645453631877899, 0.11085052788257599, 0.11524651944637299, 0.11964251101016998, 0.12403849512338638, 0.12843447923660278, 0.13283047080039978, 0.13722646236419678, 0.14162245392799377, 0.14601844549179077]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 8.0, 4.0, 7.0, 8.0, 10.0, 7.0, 17.0, 13.0, 15.0, 30.0, 21.0, 20.0, 23.0, 40.0, 32.0, 31.0, 35.0, 40.0, 31.0, 45.0, 44.0, 56.0, 25.0, 36.0, 40.0, 47.0, 21.0, 29.0, 33.0, 22.0, 25.0, 34.0, 25.0, 16.0, 23.0, 15.0, 10.0, 19.0, 11.0, 5.0, 5.0, 5.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-14.0078125, -13.5672607421875, -13.126708984375, -12.6861572265625, -12.24560546875, -11.8050537109375, -11.364501953125, -10.9239501953125, -10.4833984375, -10.0428466796875, -9.602294921875, -9.1617431640625, -8.72119140625, -8.2806396484375, -7.840087890625, -7.3995361328125, -6.958984375, -6.5184326171875, -6.077880859375, -5.6373291015625, -5.19677734375, -4.7562255859375, -4.315673828125, -3.8751220703125, -3.4345703125, -2.9940185546875, -2.553466796875, -2.1129150390625, -1.67236328125, -1.2318115234375, -0.791259765625, -0.3507080078125, 0.08984375, 0.5303955078125, 0.970947265625, 1.4114990234375, 1.85205078125, 2.2926025390625, 2.733154296875, 3.1737060546875, 3.6142578125, 4.0548095703125, 4.495361328125, 4.9359130859375, 5.37646484375, 5.8170166015625, 6.257568359375, 6.6981201171875, 7.138671875, 7.5792236328125, 8.019775390625, 8.4603271484375, 8.90087890625, 9.3414306640625, 9.781982421875, 10.2225341796875, 10.6630859375, 11.1036376953125, 11.544189453125, 11.9847412109375, 12.42529296875, 12.8658447265625, 13.306396484375, 13.7469482421875, 14.1875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 8.0, 6.0, 10.0, 10.0, 14.0, 15.0, 27.0, 29.0, 37.0, 62.0, 55.0, 94.0, 112.0, 181.0, 249.0, 434.0, 707.0, 1264.0, 2504.0, 6432.0, 35287.0, 762145.0, 214454.0, 15709.0, 4246.0, 1875.0, 943.0, 514.0, 362.0, 211.0, 133.0, 112.0, 78.0, 47.0, 42.0, 29.0, 24.0, 27.0, 18.0, 7.0, 8.0, 9.0, 6.0, 10.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-23.96875, -23.215087890625, -22.46142578125, -21.707763671875, -20.9541015625, -20.200439453125, -19.44677734375, -18.693115234375, -17.939453125, -17.185791015625, -16.43212890625, -15.678466796875, -14.9248046875, -14.171142578125, -13.41748046875, -12.663818359375, -11.91015625, -11.156494140625, -10.40283203125, -9.649169921875, -8.8955078125, -8.141845703125, -7.38818359375, -6.634521484375, -5.880859375, -5.127197265625, -4.37353515625, -3.619873046875, -2.8662109375, -2.112548828125, -1.35888671875, -0.605224609375, 0.1484375, 0.902099609375, 1.65576171875, 2.409423828125, 3.1630859375, 3.916748046875, 4.67041015625, 5.424072265625, 6.177734375, 6.931396484375, 7.68505859375, 8.438720703125, 9.1923828125, 9.946044921875, 10.69970703125, 11.453369140625, 12.20703125, 12.960693359375, 13.71435546875, 14.468017578125, 15.2216796875, 15.975341796875, 16.72900390625, 17.482666015625, 18.236328125, 18.989990234375, 19.74365234375, 20.497314453125, 21.2509765625, 22.004638671875, 22.75830078125, 23.511962890625, 24.265625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 11.0, 6.0, 9.0, 14.0, 17.0, 14.0, 23.0, 22.0, 22.0, 26.0, 28.0, 44.0, 41.0, 42.0, 54.0, 50.0, 80.0, 182.0, 1830.0, 93.0, 50.0, 50.0, 45.0, 40.0, 29.0, 30.0, 27.0, 21.0, 22.0, 19.0, 13.0, 15.0, 18.0, 8.0, 8.0, 8.0, 7.0, 5.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.03125, -31.81640625, -30.6015625, -29.38671875, -28.171875, -26.95703125, -25.7421875, -24.52734375, -23.3125, -22.09765625, -20.8828125, -19.66796875, -18.453125, -17.23828125, -16.0234375, -14.80859375, -13.59375, -12.37890625, -11.1640625, -9.94921875, -8.734375, -7.51953125, -6.3046875, -5.08984375, -3.875, -2.66015625, -1.4453125, -0.23046875, 0.984375, 2.19921875, 3.4140625, 4.62890625, 5.84375, 7.05859375, 8.2734375, 9.48828125, 10.703125, 11.91796875, 13.1328125, 14.34765625, 15.5625, 16.77734375, 17.9921875, 19.20703125, 20.421875, 21.63671875, 22.8515625, 24.06640625, 25.28125, 26.49609375, 27.7109375, 28.92578125, 30.140625, 31.35546875, 32.5703125, 33.78515625, 35.0, 36.21484375, 37.4296875, 38.64453125, 39.859375, 41.07421875, 42.2890625, 43.50390625, 44.71875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 5.0, 5.0, 10.0, 8.0, 6.0, 16.0, 16.0, 14.0, 21.0, 19.0, 26.0, 26.0, 49.0, 50.0, 94.0, 132.0, 203.0, 451.0, 2084.0, 2880214.0, 259496.0, 1598.0, 421.0, 222.0, 117.0, 87.0, 68.0, 41.0, 33.0, 21.0, 27.0, 22.0, 18.0, 16.0, 17.0, 9.0, 4.0, 9.0, 8.0, 5.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0], "bins": [-130.625, -127.0888671875, -123.552734375, -120.0166015625, -116.48046875, -112.9443359375, -109.408203125, -105.8720703125, -102.3359375, -98.7998046875, -95.263671875, -91.7275390625, -88.19140625, -84.6552734375, -81.119140625, -77.5830078125, -74.046875, -70.5107421875, -66.974609375, -63.4384765625, -59.90234375, -56.3662109375, -52.830078125, -49.2939453125, -45.7578125, -42.2216796875, -38.685546875, -35.1494140625, -31.61328125, -28.0771484375, -24.541015625, -21.0048828125, -17.46875, -13.9326171875, -10.396484375, -6.8603515625, -3.32421875, 0.2119140625, 3.748046875, 7.2841796875, 10.8203125, 14.3564453125, 17.892578125, 21.4287109375, 24.96484375, 28.5009765625, 32.037109375, 35.5732421875, 39.109375, 42.6455078125, 46.181640625, 49.7177734375, 53.25390625, 56.7900390625, 60.326171875, 63.8623046875, 67.3984375, 70.9345703125, 74.470703125, 78.0068359375, 81.54296875, 85.0791015625, 88.615234375, 92.1513671875, 95.6875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 81.0, 542.0, 359.0, 31.0], "bins": [-239.0032501220703, -235.13783264160156, -231.2724151611328, -227.40699768066406, -223.54159545898438, -219.67617797851562, -215.81076049804688, -211.94534301757812, -208.07992553710938, -204.21450805664062, -200.34909057617188, -196.48367309570312, -192.61825561523438, -188.7528533935547, -184.88743591308594, -181.0220184326172, -177.15660095214844, -173.2911834716797, -169.42576599121094, -165.5603485107422, -161.6949462890625, -157.82952880859375, -153.964111328125, -150.09869384765625, -146.2332763671875, -142.36785888671875, -138.50244140625, -134.63702392578125, -130.7716064453125, -126.90619659423828, -123.04078674316406, -119.17536926269531, -115.30994415283203, -111.44452667236328, -107.57911682128906, -103.71369934082031, -99.84828186035156, -95.98286437988281, -92.11744689941406, -88.25203704833984, -84.3866195678711, -80.52120208740234, -76.65579223632812, -72.79037475585938, -68.92495727539062, -65.05953979492188, -61.19412612915039, -57.328712463378906, -53.463294982910156, -49.597877502441406, -45.73246383666992, -41.86705017089844, -38.00163269042969, -34.13621520996094, -30.270801544189453, -26.405385971069336, -22.53997039794922, -18.6745548248291, -14.809139251708984, -10.943723678588867, -7.07830810546875, -3.212892532348633, 0.6525230407714844, 4.517938613891602, 8.383353233337402]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 11.0, 10.0, 9.0, 18.0, 17.0, 20.0, 17.0, 20.0, 28.0, 39.0, 22.0, 33.0, 37.0, 45.0, 41.0, 44.0, 44.0, 40.0, 45.0, 42.0, 47.0, 37.0, 45.0, 32.0, 32.0, 38.0, 37.0, 15.0, 19.0, 14.0, 14.0, 17.0, 14.0, 10.0, 8.0, 12.0, 3.0, 6.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-117.60169219970703, -114.11853790283203, -110.63538360595703, -107.15222930908203, -103.66907501220703, -100.18592071533203, -96.7027587890625, -93.2196044921875, -89.7364501953125, -86.2532958984375, -82.7701416015625, -79.2869873046875, -75.8038330078125, -72.3206787109375, -68.8375244140625, -65.3543701171875, -61.8712158203125, -58.3880615234375, -54.9049072265625, -51.4217529296875, -47.9385986328125, -44.4554443359375, -40.972286224365234, -37.489131927490234, -34.005977630615234, -30.522823333740234, -27.039669036865234, -23.5565128326416, -20.0733585357666, -16.5902042388916, -13.107048034667969, -9.623893737792969, -6.1407318115234375, -2.6575770378112793, 0.8255777359008789, 4.308732986450195, 7.791887283325195, 11.275041580200195, 14.758197784423828, 18.241352081298828, 21.724506378173828, 25.207660675048828, 28.690814971923828, 32.173973083496094, 35.657127380371094, 39.140281677246094, 42.623435974121094, 46.106590270996094, 49.589744567871094, 53.072898864746094, 56.556053161621094, 60.039207458496094, 63.522361755371094, 67.0055160522461, 70.48867797851562, 73.97183227539062, 77.45498657226562, 80.93814086914062, 84.42129516601562, 87.90444946289062, 91.38760375976562, 94.87075805664062, 98.35391235351562, 101.83706665039062, 105.32022094726562]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 9.0, 7.0, 9.0, 8.0, 12.0, 15.0, 16.0, 19.0, 28.0, 14.0, 25.0, 25.0, 36.0, 26.0, 37.0, 40.0, 32.0, 37.0, 42.0, 42.0, 36.0, 42.0, 37.0, 38.0, 42.0, 25.0, 31.0, 23.0, 24.0, 28.0, 25.0, 22.0, 27.0, 16.0, 13.0, 18.0, 14.0, 9.0, 15.0, 5.0, 2.0, 5.0, 4.0, 6.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0], "bins": [-13.7265625, -13.29345703125, -12.8603515625, -12.42724609375, -11.994140625, -11.56103515625, -11.1279296875, -10.69482421875, -10.26171875, -9.82861328125, -9.3955078125, -8.96240234375, -8.529296875, -8.09619140625, -7.6630859375, -7.22998046875, -6.796875, -6.36376953125, -5.9306640625, -5.49755859375, -5.064453125, -4.63134765625, -4.1982421875, -3.76513671875, -3.33203125, -2.89892578125, -2.4658203125, -2.03271484375, -1.599609375, -1.16650390625, -0.7333984375, -0.30029296875, 0.1328125, 0.56591796875, 0.9990234375, 1.43212890625, 1.865234375, 2.29833984375, 2.7314453125, 3.16455078125, 3.59765625, 4.03076171875, 4.4638671875, 4.89697265625, 5.330078125, 5.76318359375, 6.1962890625, 6.62939453125, 7.0625, 7.49560546875, 7.9287109375, 8.36181640625, 8.794921875, 9.22802734375, 9.6611328125, 10.09423828125, 10.52734375, 10.96044921875, 11.3935546875, 11.82666015625, 12.259765625, 12.69287109375, 13.1259765625, 13.55908203125, 13.9921875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 9.0, 8.0, 5.0, 18.0, 28.0, 21.0, 40.0, 55.0, 72.0, 121.0, 129.0, 207.0, 330.0, 495.0, 758.0, 1164.0, 1899.0, 3121.0, 5497.0, 9304.0, 26234.0, 234277.0, 2488211.0, 1296852.0, 90545.0, 14695.0, 7375.0, 4566.0, 2765.0, 1720.0, 1186.0, 805.0, 498.0, 339.0, 245.0, 175.0, 148.0, 96.0, 71.0, 51.0, 34.0, 38.0, 16.0, 19.0, 7.0, 15.0, 4.0, 6.0, 4.0, 2.0, 4.0, 9.0], "bins": [-34.15625, -33.17578125, -32.1953125, -31.21484375, -30.234375, -29.25390625, -28.2734375, -27.29296875, -26.3125, -25.33203125, -24.3515625, -23.37109375, -22.390625, -21.41015625, -20.4296875, -19.44921875, -18.46875, -17.48828125, -16.5078125, -15.52734375, -14.546875, -13.56640625, -12.5859375, -11.60546875, -10.625, -9.64453125, -8.6640625, -7.68359375, -6.703125, -5.72265625, -4.7421875, -3.76171875, -2.78125, -1.80078125, -0.8203125, 0.16015625, 1.140625, 2.12109375, 3.1015625, 4.08203125, 5.0625, 6.04296875, 7.0234375, 8.00390625, 8.984375, 9.96484375, 10.9453125, 11.92578125, 12.90625, 13.88671875, 14.8671875, 15.84765625, 16.828125, 17.80859375, 18.7890625, 19.76953125, 20.75, 21.73046875, 22.7109375, 23.69140625, 24.671875, 25.65234375, 26.6328125, 27.61328125, 28.59375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 10.0, 9.0, 13.0, 21.0, 18.0, 37.0, 56.0, 101.0, 203.0, 516.0, 1003.0, 1045.0, 544.0, 242.0, 102.0, 58.0, 20.0, 20.0, 19.0, 11.0, 7.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.28125, -38.94091796875, -37.6005859375, -36.26025390625, -34.919921875, -33.57958984375, -32.2392578125, -30.89892578125, -29.55859375, -28.21826171875, -26.8779296875, -25.53759765625, -24.197265625, -22.85693359375, -21.5166015625, -20.17626953125, -18.8359375, -17.49560546875, -16.1552734375, -14.81494140625, -13.474609375, -12.13427734375, -10.7939453125, -9.45361328125, -8.11328125, -6.77294921875, -5.4326171875, -4.09228515625, -2.751953125, -1.41162109375, -0.0712890625, 1.26904296875, 2.609375, 3.94970703125, 5.2900390625, 6.63037109375, 7.970703125, 9.31103515625, 10.6513671875, 11.99169921875, 13.33203125, 14.67236328125, 16.0126953125, 17.35302734375, 18.693359375, 20.03369140625, 21.3740234375, 22.71435546875, 24.0546875, 25.39501953125, 26.7353515625, 28.07568359375, 29.416015625, 30.75634765625, 32.0966796875, 33.43701171875, 34.77734375, 36.11767578125, 37.4580078125, 38.79833984375, 40.138671875, 41.47900390625, 42.8193359375, 44.15966796875, 45.5]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 10.0, 8.0, 15.0, 17.0, 39.0, 91.0, 161.0, 355.0, 881.0, 2906.0, 18016.0, 3249942.0, 904265.0, 13719.0, 2437.0, 773.0, 309.0, 149.0, 71.0, 47.0, 32.0, 10.0, 13.0, 8.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.25, -135.9921875, -131.734375, -127.4765625, -123.21875, -118.9609375, -114.703125, -110.4453125, -106.1875, -101.9296875, -97.671875, -93.4140625, -89.15625, -84.8984375, -80.640625, -76.3828125, -72.125, -67.8671875, -63.609375, -59.3515625, -55.09375, -50.8359375, -46.578125, -42.3203125, -38.0625, -33.8046875, -29.546875, -25.2890625, -21.03125, -16.7734375, -12.515625, -8.2578125, -4.0, 0.2578125, 4.515625, 8.7734375, 13.03125, 17.2890625, 21.546875, 25.8046875, 30.0625, 34.3203125, 38.578125, 42.8359375, 47.09375, 51.3515625, 55.609375, 59.8671875, 64.125, 68.3828125, 72.640625, 76.8984375, 81.15625, 85.4140625, 89.671875, 93.9296875, 98.1875, 102.4453125, 106.703125, 110.9609375, 115.21875, 119.4765625, 123.734375, 127.9921875, 132.25]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 17.0, 134.0, 651.0, 177.0, 31.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1150.5255126953125, -1130.531982421875, -1110.5384521484375, -1090.544921875, -1070.551513671875, -1050.5579833984375, -1030.564453125, -1010.5709228515625, -990.577392578125, -970.5838623046875, -950.59033203125, -930.5968627929688, -910.6033325195312, -890.6098022460938, -870.6163330078125, -850.622802734375, -830.6292724609375, -810.6357421875, -790.6422119140625, -770.6487426757812, -750.6552124023438, -730.6616821289062, -710.668212890625, -690.6746826171875, -670.68115234375, -650.6876220703125, -630.694091796875, -610.7006225585938, -590.7070922851562, -570.7135620117188, -550.7200927734375, -530.7265625, -510.7330322265625, -490.739501953125, -470.7460021972656, -450.75250244140625, -430.75897216796875, -410.76544189453125, -390.7719421386719, -370.7784423828125, -350.784912109375, -330.7913818359375, -310.7978820800781, -290.80438232421875, -270.81085205078125, -250.8173370361328, -230.82382202148438, -210.83030700683594, -190.83680725097656, -170.84329223632812, -150.8497772216797, -130.85626220703125, -110.86274719238281, -90.86923217773438, -70.87571716308594, -50.8822021484375, -30.888687133789062, -10.895172119140625, 9.098342895507812, 29.09185791015625, 49.08537292480469, 69.07888793945312, 89.07240295410156, 109.06591796875, 129.05943298339844]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 9.0, 10.0, 6.0, 2.0, 12.0, 12.0, 17.0, 15.0, 15.0, 19.0, 35.0, 21.0, 32.0, 28.0, 28.0, 40.0, 27.0, 42.0, 35.0, 56.0, 39.0, 41.0, 37.0, 52.0, 33.0, 36.0, 40.0, 23.0, 30.0, 24.0, 36.0, 26.0, 19.0, 10.0, 27.0, 17.0, 12.0, 9.0, 5.0, 7.0, 10.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.24681091308594, -72.58232116699219, -69.91783142089844, -67.25334930419922, -64.58885955810547, -61.92436981201172, -59.25988006591797, -56.595394134521484, -53.930908203125, -51.26641845703125, -48.601932525634766, -45.937442779541016, -43.27295684814453, -40.60846710205078, -37.94397735595703, -35.27949142456055, -32.6150016784668, -29.95051383972168, -27.286026000976562, -24.621536254882812, -21.957050323486328, -19.292560577392578, -16.62807273864746, -13.963584899902344, -11.299097061157227, -8.63460922241211, -5.970120906829834, -3.3056325912475586, -0.6411447525024414, 2.023343086242676, 4.687831878662109, 7.352319717407227, 10.016807556152344, 12.681295394897461, 15.345783233642578, 18.010272979736328, 20.674758911132812, 23.339248657226562, 26.00373649597168, 28.668224334716797, 31.332712173461914, 33.99720001220703, 36.66168975830078, 39.326175689697266, 41.990665435791016, 44.6551513671875, 47.31964111328125, 49.984130859375, 52.648616790771484, 55.313106536865234, 57.97759246826172, 60.64208221435547, 63.30656814575195, 65.97105407714844, 68.63554382324219, 71.30003356933594, 73.96452331542969, 76.62901306152344, 79.29350280761719, 81.9579849243164, 84.62247467041016, 87.2869644165039, 89.95145416259766, 92.61593627929688, 95.28042602539062]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 2.0, 5.0, 11.0, 12.0, 14.0, 11.0, 15.0, 14.0, 17.0, 20.0, 22.0, 34.0, 36.0, 36.0, 32.0, 33.0, 37.0, 35.0, 34.0, 40.0, 43.0, 34.0, 40.0, 46.0, 31.0, 34.0, 39.0, 30.0, 27.0, 29.0, 22.0, 21.0, 17.0, 15.0, 22.0, 13.0, 8.0, 11.0, 10.0, 11.0, 8.0, 3.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.53125, -13.0953369140625, -12.659423828125, -12.2235107421875, -11.78759765625, -11.3516845703125, -10.915771484375, -10.4798583984375, -10.0439453125, -9.6080322265625, -9.172119140625, -8.7362060546875, -8.30029296875, -7.8643798828125, -7.428466796875, -6.9925537109375, -6.556640625, -6.1207275390625, -5.684814453125, -5.2489013671875, -4.81298828125, -4.3770751953125, -3.941162109375, -3.5052490234375, -3.0693359375, -2.6334228515625, -2.197509765625, -1.7615966796875, -1.32568359375, -0.8897705078125, -0.453857421875, -0.0179443359375, 0.41796875, 0.8538818359375, 1.289794921875, 1.7257080078125, 2.16162109375, 2.5975341796875, 3.033447265625, 3.4693603515625, 3.9052734375, 4.3411865234375, 4.777099609375, 5.2130126953125, 5.64892578125, 6.0848388671875, 6.520751953125, 6.9566650390625, 7.392578125, 7.8284912109375, 8.264404296875, 8.7003173828125, 9.13623046875, 9.5721435546875, 10.008056640625, 10.4439697265625, 10.8798828125, 11.3157958984375, 11.751708984375, 12.1876220703125, 12.62353515625, 13.0594482421875, 13.495361328125, 13.9312744140625, 14.3671875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 6.0, 17.0, 23.0, 31.0, 49.0, 52.0, 80.0, 106.0, 158.0, 225.0, 329.0, 523.0, 804.0, 1201.0, 1852.0, 2654.0, 4044.0, 6028.0, 9039.0, 14282.0, 22323.0, 35359.0, 57702.0, 99588.0, 172832.0, 225357.0, 158613.0, 90612.0, 52813.0, 32557.0, 20423.0, 13487.0, 8526.0, 5690.0, 3761.0, 2375.0, 1632.0, 1067.0, 707.0, 518.0, 338.0, 218.0, 200.0, 118.0, 85.0, 52.0, 28.0, 16.0, 20.0, 7.0, 7.0, 6.0, 4.0, 5.0, 5.0, 2.0, 3.0], "bins": [-1.412109375, -1.3685455322265625, -1.324981689453125, -1.2814178466796875, -1.23785400390625, -1.1942901611328125, -1.150726318359375, -1.1071624755859375, -1.0635986328125, -1.0200347900390625, -0.976470947265625, -0.9329071044921875, -0.88934326171875, -0.8457794189453125, -0.802215576171875, -0.7586517333984375, -0.715087890625, -0.6715240478515625, -0.627960205078125, -0.5843963623046875, -0.54083251953125, -0.4972686767578125, -0.453704833984375, -0.4101409912109375, -0.3665771484375, -0.3230133056640625, -0.279449462890625, -0.2358856201171875, -0.19232177734375, -0.1487579345703125, -0.105194091796875, -0.0616302490234375, -0.01806640625, 0.0254974365234375, 0.069061279296875, 0.1126251220703125, 0.15618896484375, 0.1997528076171875, 0.243316650390625, 0.2868804931640625, 0.3304443359375, 0.3740081787109375, 0.417572021484375, 0.4611358642578125, 0.50469970703125, 0.5482635498046875, 0.591827392578125, 0.6353912353515625, 0.678955078125, 0.7225189208984375, 0.766082763671875, 0.8096466064453125, 0.85321044921875, 0.8967742919921875, 0.940338134765625, 0.9839019775390625, 1.0274658203125, 1.0710296630859375, 1.114593505859375, 1.1581573486328125, 1.20172119140625, 1.2452850341796875, 1.288848876953125, 1.3324127197265625, 1.3759765625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 9.0, 7.0, 6.0, 8.0, 7.0, 6.0, 13.0, 18.0, 19.0, 12.0, 18.0, 28.0, 27.0, 23.0, 32.0, 35.0, 40.0, 35.0, 31.0, 44.0, 37.0, 37.0, 1064.0, 51.0, 35.0, 24.0, 28.0, 29.0, 34.0, 34.0, 32.0, 32.0, 24.0, 27.0, 16.0, 17.0, 22.0, 14.0, 10.0, 5.0, 3.0, 8.0, 10.0, 5.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.8046875, -9.519775390625, -9.23486328125, -8.949951171875, -8.6650390625, -8.380126953125, -8.09521484375, -7.810302734375, -7.525390625, -7.240478515625, -6.95556640625, -6.670654296875, -6.3857421875, -6.100830078125, -5.81591796875, -5.531005859375, -5.24609375, -4.961181640625, -4.67626953125, -4.391357421875, -4.1064453125, -3.821533203125, -3.53662109375, -3.251708984375, -2.966796875, -2.681884765625, -2.39697265625, -2.112060546875, -1.8271484375, -1.542236328125, -1.25732421875, -0.972412109375, -0.6875, -0.402587890625, -0.11767578125, 0.167236328125, 0.4521484375, 0.737060546875, 1.02197265625, 1.306884765625, 1.591796875, 1.876708984375, 2.16162109375, 2.446533203125, 2.7314453125, 3.016357421875, 3.30126953125, 3.586181640625, 3.87109375, 4.156005859375, 4.44091796875, 4.725830078125, 5.0107421875, 5.295654296875, 5.58056640625, 5.865478515625, 6.150390625, 6.435302734375, 6.72021484375, 7.005126953125, 7.2900390625, 7.574951171875, 7.85986328125, 8.144775390625, 8.4296875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 9.0, 10.0, 20.0, 20.0, 31.0, 48.0, 73.0, 104.0, 190.0, 335.0, 476.0, 671.0, 984.0, 1596.0, 2376.0, 3612.0, 5473.0, 8504.0, 13286.0, 20977.0, 33131.0, 53987.0, 90250.0, 154340.0, 1264957.0, 174459.0, 103169.0, 61633.0, 37325.0, 23043.0, 14643.0, 9583.0, 6059.0, 4064.0, 2684.0, 1694.0, 1077.0, 804.0, 517.0, 307.0, 231.0, 137.0, 91.0, 44.0, 36.0, 29.0, 17.0, 8.0, 11.0, 9.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8525390625, -0.8246994018554688, -0.7968597412109375, -0.7690200805664062, -0.741180419921875, -0.7133407592773438, -0.6855010986328125, -0.6576614379882812, -0.62982177734375, -0.6019821166992188, -0.5741424560546875, -0.5463027954101562, -0.518463134765625, -0.49062347412109375, -0.4627838134765625, -0.43494415283203125, -0.4071044921875, -0.37926483154296875, -0.3514251708984375, -0.32358551025390625, -0.295745849609375, -0.26790618896484375, -0.2400665283203125, -0.21222686767578125, -0.18438720703125, -0.15654754638671875, -0.1287078857421875, -0.10086822509765625, -0.073028564453125, -0.04518890380859375, -0.0173492431640625, 0.01049041748046875, 0.038330078125, 0.06616973876953125, 0.0940093994140625, 0.12184906005859375, 0.149688720703125, 0.17752838134765625, 0.2053680419921875, 0.23320770263671875, 0.26104736328125, 0.28888702392578125, 0.3167266845703125, 0.34456634521484375, 0.372406005859375, 0.40024566650390625, 0.4280853271484375, 0.45592498779296875, 0.4837646484375, 0.5116043090820312, 0.5394439697265625, 0.5672836303710938, 0.595123291015625, 0.6229629516601562, 0.6508026123046875, 0.6786422729492188, 0.70648193359375, 0.7343215942382812, 0.7621612548828125, 0.7900009155273438, 0.817840576171875, 0.8456802368164062, 0.8735198974609375, 0.9013595581054688, 0.92919921875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 1.0, 3.0, 6.0, 7.0, 11.0, 5.0, 7.0, 14.0, 15.0, 11.0, 13.0, 20.0, 19.0, 40.0, 42.0, 65.0, 95.0, 126.0, 134.0, 95.0, 80.0, 41.0, 34.0, 22.0, 12.0, 18.0, 13.0, 15.0, 11.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.03857421875, -0.03747081756591797, -0.03636741638183594, -0.035264015197753906, -0.034160614013671875, -0.033057212829589844, -0.03195381164550781, -0.03085041046142578, -0.02974700927734375, -0.02864360809326172, -0.027540206909179688, -0.026436805725097656, -0.025333404541015625, -0.024230003356933594, -0.023126602172851562, -0.02202320098876953, -0.0209197998046875, -0.01981639862060547, -0.018712997436523438, -0.017609596252441406, -0.016506195068359375, -0.015402793884277344, -0.014299392700195312, -0.013195991516113281, -0.01209259033203125, -0.010989189147949219, -0.009885787963867188, -0.008782386779785156, -0.007678985595703125, -0.006575584411621094, -0.0054721832275390625, -0.004368782043457031, -0.003265380859375, -0.0021619796752929688, -0.0010585784912109375, 4.482269287109375e-05, 0.001148223876953125, 0.0022516250610351562, 0.0033550262451171875, 0.004458427429199219, 0.00556182861328125, 0.006665229797363281, 0.0077686309814453125, 0.008872032165527344, 0.009975433349609375, 0.011078834533691406, 0.012182235717773438, 0.013285636901855469, 0.0143890380859375, 0.015492439270019531, 0.016595840454101562, 0.017699241638183594, 0.018802642822265625, 0.019906044006347656, 0.021009445190429688, 0.02211284637451172, 0.02321624755859375, 0.02431964874267578, 0.025423049926757812, 0.026526451110839844, 0.027629852294921875, 0.028733253479003906, 0.029836654663085938, 0.03094005584716797, 0.03204345703125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 4.0, 9.0, 14.0, 15.0, 22.0, 25.0, 32.0, 32.0, 71.0, 84.0, 197.0, 541.0, 7681.0, 974562.0, 63152.0, 1405.0, 242.0, 118.0, 87.0, 53.0, 42.0, 31.0, 27.0, 12.0, 19.0, 9.0, 12.0, 9.0, 10.0, 6.0, 5.0, 5.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70263671875, -0.6790084838867188, -0.6553802490234375, -0.6317520141601562, -0.608123779296875, -0.5844955444335938, -0.5608673095703125, -0.5372390747070312, -0.51361083984375, -0.48998260498046875, -0.4663543701171875, -0.44272613525390625, -0.419097900390625, -0.39546966552734375, -0.3718414306640625, -0.34821319580078125, -0.3245849609375, -0.30095672607421875, -0.2773284912109375, -0.25370025634765625, -0.230072021484375, -0.20644378662109375, -0.1828155517578125, -0.15918731689453125, -0.13555908203125, -0.11193084716796875, -0.0883026123046875, -0.06467437744140625, -0.041046142578125, -0.01741790771484375, 0.0062103271484375, 0.02983856201171875, 0.053466796875, 0.07709503173828125, 0.1007232666015625, 0.12435150146484375, 0.147979736328125, 0.17160797119140625, 0.1952362060546875, 0.21886444091796875, 0.24249267578125, 0.26612091064453125, 0.2897491455078125, 0.31337738037109375, 0.337005615234375, 0.36063385009765625, 0.3842620849609375, 0.40789031982421875, 0.4315185546875, 0.45514678955078125, 0.4787750244140625, 0.5024032592773438, 0.526031494140625, 0.5496597290039062, 0.5732879638671875, 0.5969161987304688, 0.62054443359375, 0.6441726684570312, 0.6678009033203125, 0.6914291381835938, 0.715057373046875, 0.7386856079101562, 0.7623138427734375, 0.7859420776367188, 0.8095703125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 30.0, 104.0, 576.0, 227.0, 51.0, 10.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3132428526878357, -0.3014827072620392, -0.2897225618362427, -0.27796244621276855, -0.26620230078697205, -0.25444215536117554, -0.24268202483654022, -0.2309218943119049, -0.2191617488861084, -0.2074016034603119, -0.19564147293567657, -0.18388134241104126, -0.17212119698524475, -0.16036105155944824, -0.14860092103481293, -0.1368407905101776, -0.1250806450843811, -0.11332050710916519, -0.10156036913394928, -0.08980023115873337, -0.07804009318351746, -0.06627995520830154, -0.05451981723308563, -0.04275967925786972, -0.03099954128265381, -0.019239403307437897, -0.007479265332221985, 0.004280872642993927, 0.01604101061820984, 0.02780114859342575, 0.03956128656864166, 0.051321424543857574, 0.06308159232139587, 0.07484173029661179, 0.0866018682718277, 0.09836200624704361, 0.11012214422225952, 0.12188228219747543, 0.13364242017269135, 0.14540255069732666, 0.15716269612312317, 0.16892284154891968, 0.180682972073555, 0.1924431025981903, 0.20420324802398682, 0.21596339344978333, 0.22772352397441864, 0.23948365449905396, 0.25124379992485046, 0.263003945350647, 0.2747640609741211, 0.2865242063999176, 0.2982843518257141, 0.3100444972515106, 0.32180464267730713, 0.33356475830078125, 0.34532490372657776, 0.35708504915237427, 0.3688451647758484, 0.3806053102016449, 0.3923654556274414, 0.4041256010532379, 0.4158857464790344, 0.42764586210250854, 0.43940600752830505]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 3.0, 6.0, 8.0, 10.0, 6.0, 12.0, 21.0, 22.0, 18.0, 24.0, 38.0, 34.0, 28.0, 43.0, 43.0, 36.0, 39.0, 33.0, 47.0, 47.0, 36.0, 44.0, 45.0, 40.0, 47.0, 40.0, 31.0, 31.0, 26.0, 22.0, 24.0, 19.0, 18.0, 16.0, 3.0, 10.0, 10.0, 4.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04542136192321777, -0.04374955594539642, -0.042077746242284775, -0.040405936539173126, -0.038734130561351776, -0.037062324583530426, -0.03539051488041878, -0.03371870517730713, -0.03204689919948578, -0.03037509135901928, -0.02870328351855278, -0.02703147567808628, -0.02535966783761978, -0.023687859997153282, -0.022016052156686783, -0.020344244316220284, -0.018672436475753784, -0.017000628635287285, -0.015328820794820786, -0.013657012954354286, -0.011985205113887787, -0.010313397273421288, -0.008641589432954788, -0.006969781592488289, -0.0052979737520217896, -0.0036261659115552902, -0.001954358071088791, -0.00028255023062229156, 0.0013892576098442078, 0.003061065450310707, 0.004732873290777206, 0.006404681131243706, 0.008076488971710205, 0.009748296812176704, 0.011420104652643204, 0.013091912493109703, 0.014763720333576202, 0.0164355281740427, 0.0181073360145092, 0.0197791438549757, 0.0214509516954422, 0.0231227595359087, 0.0247945673763752, 0.026466375216841698, 0.028138183057308197, 0.029809990897774696, 0.031481798738241196, 0.033153608441352844, 0.034825414419174194, 0.036497220396995544, 0.03816903010010719, 0.03984083980321884, 0.04151264578104019, 0.04318445175886154, 0.04485626146197319, 0.04652807116508484, 0.04819987714290619, 0.04987168312072754, 0.05154349282383919, 0.053215302526950836, 0.054887108504772186, 0.056558914482593536, 0.058230724185705185, 0.059902533888816833, 0.061574339866638184]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 2.0, 5.0, 12.0, 11.0, 14.0, 11.0, 15.0, 14.0, 17.0, 20.0, 22.0, 34.0, 36.0, 36.0, 32.0, 33.0, 37.0, 35.0, 34.0, 41.0, 42.0, 35.0, 39.0, 46.0, 32.0, 33.0, 39.0, 30.0, 27.0, 29.0, 22.0, 22.0, 16.0, 15.0, 22.0, 13.0, 8.0, 11.0, 10.0, 11.0, 8.0, 3.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.53125, -13.09521484375, -12.6591796875, -12.22314453125, -11.787109375, -11.35107421875, -10.9150390625, -10.47900390625, -10.04296875, -9.60693359375, -9.1708984375, -8.73486328125, -8.298828125, -7.86279296875, -7.4267578125, -6.99072265625, -6.5546875, -6.11865234375, -5.6826171875, -5.24658203125, -4.810546875, -4.37451171875, -3.9384765625, -3.50244140625, -3.06640625, -2.63037109375, -2.1943359375, -1.75830078125, -1.322265625, -0.88623046875, -0.4501953125, -0.01416015625, 0.421875, 0.85791015625, 1.2939453125, 1.72998046875, 2.166015625, 2.60205078125, 3.0380859375, 3.47412109375, 3.91015625, 4.34619140625, 4.7822265625, 5.21826171875, 5.654296875, 6.09033203125, 6.5263671875, 6.96240234375, 7.3984375, 7.83447265625, 8.2705078125, 8.70654296875, 9.142578125, 9.57861328125, 10.0146484375, 10.45068359375, 10.88671875, 11.32275390625, 11.7587890625, 12.19482421875, 12.630859375, 13.06689453125, 13.5029296875, 13.93896484375, 14.375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 7.0, 7.0, 15.0, 10.0, 25.0, 18.0, 35.0, 43.0, 38.0, 80.0, 94.0, 183.0, 266.0, 444.0, 778.0, 1567.0, 3197.0, 8605.0, 28732.0, 115311.0, 511916.0, 285972.0, 63427.0, 17201.0, 5452.0, 2356.0, 1080.0, 620.0, 386.0, 199.0, 134.0, 94.0, 62.0, 45.0, 34.0, 22.0, 16.0, 21.0, 12.0, 12.0, 6.0, 4.0, 6.0, 6.0, 4.0, 1.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.7421875, -12.328369140625, -11.91455078125, -11.500732421875, -11.0869140625, -10.673095703125, -10.25927734375, -9.845458984375, -9.431640625, -9.017822265625, -8.60400390625, -8.190185546875, -7.7763671875, -7.362548828125, -6.94873046875, -6.534912109375, -6.12109375, -5.707275390625, -5.29345703125, -4.879638671875, -4.4658203125, -4.052001953125, -3.63818359375, -3.224365234375, -2.810546875, -2.396728515625, -1.98291015625, -1.569091796875, -1.1552734375, -0.741455078125, -0.32763671875, 0.086181640625, 0.5, 0.913818359375, 1.32763671875, 1.741455078125, 2.1552734375, 2.569091796875, 2.98291015625, 3.396728515625, 3.810546875, 4.224365234375, 4.63818359375, 5.052001953125, 5.4658203125, 5.879638671875, 6.29345703125, 6.707275390625, 7.12109375, 7.534912109375, 7.94873046875, 8.362548828125, 8.7763671875, 9.190185546875, 9.60400390625, 10.017822265625, 10.431640625, 10.845458984375, 11.25927734375, 11.673095703125, 12.0869140625, 12.500732421875, 12.91455078125, 13.328369140625, 13.7421875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 7.0, 1.0, 9.0, 13.0, 10.0, 14.0, 11.0, 10.0, 15.0, 21.0, 29.0, 20.0, 31.0, 36.0, 34.0, 38.0, 44.0, 55.0, 84.0, 309.0, 1680.0, 98.0, 79.0, 49.0, 44.0, 40.0, 36.0, 25.0, 31.0, 35.0, 18.0, 19.0, 20.0, 13.0, 10.0, 9.0, 18.0, 9.0, 11.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.5, -34.24072265625, -32.9814453125, -31.72216796875, -30.462890625, -29.20361328125, -27.9443359375, -26.68505859375, -25.42578125, -24.16650390625, -22.9072265625, -21.64794921875, -20.388671875, -19.12939453125, -17.8701171875, -16.61083984375, -15.3515625, -14.09228515625, -12.8330078125, -11.57373046875, -10.314453125, -9.05517578125, -7.7958984375, -6.53662109375, -5.27734375, -4.01806640625, -2.7587890625, -1.49951171875, -0.240234375, 1.01904296875, 2.2783203125, 3.53759765625, 4.796875, 6.05615234375, 7.3154296875, 8.57470703125, 9.833984375, 11.09326171875, 12.3525390625, 13.61181640625, 14.87109375, 16.13037109375, 17.3896484375, 18.64892578125, 19.908203125, 21.16748046875, 22.4267578125, 23.68603515625, 24.9453125, 26.20458984375, 27.4638671875, 28.72314453125, 29.982421875, 31.24169921875, 32.5009765625, 33.76025390625, 35.01953125, 36.27880859375, 37.5380859375, 38.79736328125, 40.056640625, 41.31591796875, 42.5751953125, 43.83447265625, 45.09375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 11.0, 10.0, 10.0, 12.0, 15.0, 16.0, 15.0, 23.0, 37.0, 38.0, 82.0, 84.0, 73.0, 128.0, 127.0, 236.0, 342.0, 782.0, 5367.0, 2787641.0, 345786.0, 3152.0, 661.0, 282.0, 194.0, 139.0, 101.0, 90.0, 52.0, 52.0, 35.0, 24.0, 18.0, 12.0, 17.0, 8.0, 12.0, 9.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-76.25, -74.1259765625, -72.001953125, -69.8779296875, -67.75390625, -65.6298828125, -63.505859375, -61.3818359375, -59.2578125, -57.1337890625, -55.009765625, -52.8857421875, -50.76171875, -48.6376953125, -46.513671875, -44.3896484375, -42.265625, -40.1416015625, -38.017578125, -35.8935546875, -33.76953125, -31.6455078125, -29.521484375, -27.3974609375, -25.2734375, -23.1494140625, -21.025390625, -18.9013671875, -16.77734375, -14.6533203125, -12.529296875, -10.4052734375, -8.28125, -6.1572265625, -4.033203125, -1.9091796875, 0.21484375, 2.3388671875, 4.462890625, 6.5869140625, 8.7109375, 10.8349609375, 12.958984375, 15.0830078125, 17.20703125, 19.3310546875, 21.455078125, 23.5791015625, 25.703125, 27.8271484375, 29.951171875, 32.0751953125, 34.19921875, 36.3232421875, 38.447265625, 40.5712890625, 42.6953125, 44.8193359375, 46.943359375, 49.0673828125, 51.19140625, 53.3154296875, 55.439453125, 57.5634765625, 59.6875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [203.0, 807.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.93674373626709, -2.113966941833496, 7.708809852600098, 17.531585693359375, 27.35436248779297, 37.17713928222656, 46.999916076660156, 56.82269287109375, 66.64546966552734, 76.46824645996094, 86.29102325439453, 96.11380004882812, 105.93657684326172, 115.75935363769531, 125.5821304321289, 135.4049072265625, 145.22769165039062, 155.05047607421875, 164.8732452392578, 174.69601440429688, 184.518798828125, 194.34158325195312, 204.1643524169922, 213.98712158203125, 223.80990600585938, 233.6326904296875, 243.45545959472656, 253.27822875976562, 263.10101318359375, 272.9237976074219, 282.74658203125, 292.5693359375, 302.39208984375, 312.2148742675781, 322.03765869140625, 331.86041259765625, 341.6831970214844, 351.5059814453125, 361.3287353515625, 371.1515197753906, 380.97430419921875, 390.7970886230469, 400.619873046875, 410.442626953125, 420.2654113769531, 430.08819580078125, 439.91094970703125, 449.7337341308594, 459.5565185546875, 469.3793029785156, 479.20208740234375, 489.02484130859375, 498.8476257324219, 508.67041015625, 518.4931640625, 528.3159790039062, 538.1387329101562, 547.9614868164062, 557.7843017578125, 567.6070556640625, 577.4298095703125, 587.2526245117188, 597.0753784179688, 606.898193359375, 616.720947265625]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 6.0, 2.0, 6.0, 9.0, 16.0, 14.0, 23.0, 20.0, 27.0, 35.0, 32.0, 31.0, 39.0, 42.0, 36.0, 38.0, 53.0, 59.0, 33.0, 44.0, 35.0, 49.0, 37.0, 39.0, 36.0, 27.0, 21.0, 29.0, 22.0, 26.0, 16.0, 25.0, 15.0, 13.0, 8.0, 8.0, 8.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-99.80734252929688, -96.58840942382812, -93.3694839477539, -90.15055084228516, -86.9316177368164, -83.71269226074219, -80.49375915527344, -77.27482604980469, -74.05590057373047, -70.83696746826172, -67.6180419921875, -64.39910888671875, -61.180179595947266, -57.96125030517578, -54.74231719970703, -51.52338790893555, -48.3044548034668, -45.08552551269531, -41.86659240722656, -38.64766311645508, -35.428733825683594, -32.209800720214844, -28.99087142944336, -25.771942138671875, -22.553010940551758, -19.33407974243164, -16.115150451660156, -12.896219253540039, -9.677289009094238, -6.4583587646484375, -3.2394275665283203, -0.020498275756835938, 3.1984329223632812, 6.417363166809082, 9.636293411254883, 12.855224609375, 16.074153900146484, 19.2930850982666, 22.51201629638672, 25.730945587158203, 28.94987678527832, 32.16880798339844, 35.38773727416992, 38.606666564941406, 41.825599670410156, 45.04452896118164, 48.263458251953125, 51.482391357421875, 54.70132064819336, 57.920249938964844, 61.139183044433594, 64.35810852050781, 67.57704162597656, 70.79597473144531, 74.01490783691406, 77.23383331298828, 80.45276641845703, 83.67169952392578, 86.890625, 90.10955810546875, 93.3284912109375, 96.54741668701172, 99.76634979248047, 102.98527526855469, 106.20420837402344]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 2.0, 4.0, 4.0, 14.0, 7.0, 15.0, 8.0, 13.0, 14.0, 20.0, 21.0, 29.0, 29.0, 33.0, 39.0, 27.0, 33.0, 43.0, 41.0, 33.0, 42.0, 40.0, 29.0, 33.0, 47.0, 52.0, 30.0, 35.0, 29.0, 32.0, 20.0, 27.0, 18.0, 14.0, 17.0, 24.0, 11.0, 15.0, 12.0, 8.0, 7.0, 7.0, 6.0, 2.0, 7.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-13.6953125, -13.2537841796875, -12.812255859375, -12.3707275390625, -11.92919921875, -11.4876708984375, -11.046142578125, -10.6046142578125, -10.1630859375, -9.7215576171875, -9.280029296875, -8.8385009765625, -8.39697265625, -7.9554443359375, -7.513916015625, -7.0723876953125, -6.630859375, -6.1893310546875, -5.747802734375, -5.3062744140625, -4.86474609375, -4.4232177734375, -3.981689453125, -3.5401611328125, -3.0986328125, -2.6571044921875, -2.215576171875, -1.7740478515625, -1.33251953125, -0.8909912109375, -0.449462890625, -0.0079345703125, 0.43359375, 0.8751220703125, 1.316650390625, 1.7581787109375, 2.19970703125, 2.6412353515625, 3.082763671875, 3.5242919921875, 3.9658203125, 4.4073486328125, 4.848876953125, 5.2904052734375, 5.73193359375, 6.1734619140625, 6.614990234375, 7.0565185546875, 7.498046875, 7.9395751953125, 8.381103515625, 8.8226318359375, 9.26416015625, 9.7056884765625, 10.147216796875, 10.5887451171875, 11.0302734375, 11.4718017578125, 11.913330078125, 12.3548583984375, 12.79638671875, 13.2379150390625, 13.679443359375, 14.1209716796875, 14.5625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 6.0, 9.0, 17.0, 15.0, 22.0, 47.0, 51.0, 57.0, 109.0, 155.0, 172.0, 240.0, 379.0, 567.0, 868.0, 1394.0, 2152.0, 3603.0, 6416.0, 11777.0, 35894.0, 644258.0, 3312807.0, 134022.0, 17523.0, 8507.0, 4757.0, 2791.0, 1800.0, 1181.0, 768.0, 533.0, 379.0, 259.0, 178.0, 144.0, 112.0, 66.0, 63.0, 41.0, 42.0, 20.0, 22.0, 10.0, 19.0, 14.0, 4.0, 4.0, 3.0, 1.0, 0.0, 5.0, 2.0, 0.0, 2.0], "bins": [-43.09375, -41.7158203125, -40.337890625, -38.9599609375, -37.58203125, -36.2041015625, -34.826171875, -33.4482421875, -32.0703125, -30.6923828125, -29.314453125, -27.9365234375, -26.55859375, -25.1806640625, -23.802734375, -22.4248046875, -21.046875, -19.6689453125, -18.291015625, -16.9130859375, -15.53515625, -14.1572265625, -12.779296875, -11.4013671875, -10.0234375, -8.6455078125, -7.267578125, -5.8896484375, -4.51171875, -3.1337890625, -1.755859375, -0.3779296875, 1.0, 2.3779296875, 3.755859375, 5.1337890625, 6.51171875, 7.8896484375, 9.267578125, 10.6455078125, 12.0234375, 13.4013671875, 14.779296875, 16.1572265625, 17.53515625, 18.9130859375, 20.291015625, 21.6689453125, 23.046875, 24.4248046875, 25.802734375, 27.1806640625, 28.55859375, 29.9365234375, 31.314453125, 32.6923828125, 34.0703125, 35.4482421875, 36.826171875, 38.2041015625, 39.58203125, 40.9599609375, 42.337890625, 43.7158203125, 45.09375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 0.0, 2.0, 1.0, 11.0, 9.0, 6.0, 7.0, 14.0, 13.0, 18.0, 16.0, 28.0, 46.0, 89.0, 200.0, 402.0, 907.0, 1146.0, 556.0, 278.0, 137.0, 46.0, 42.0, 32.0, 19.0, 13.0, 7.0, 10.0, 8.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.625, -29.40869140625, -28.1923828125, -26.97607421875, -25.759765625, -24.54345703125, -23.3271484375, -22.11083984375, -20.89453125, -19.67822265625, -18.4619140625, -17.24560546875, -16.029296875, -14.81298828125, -13.5966796875, -12.38037109375, -11.1640625, -9.94775390625, -8.7314453125, -7.51513671875, -6.298828125, -5.08251953125, -3.8662109375, -2.64990234375, -1.43359375, -0.21728515625, 0.9990234375, 2.21533203125, 3.431640625, 4.64794921875, 5.8642578125, 7.08056640625, 8.296875, 9.51318359375, 10.7294921875, 11.94580078125, 13.162109375, 14.37841796875, 15.5947265625, 16.81103515625, 18.02734375, 19.24365234375, 20.4599609375, 21.67626953125, 22.892578125, 24.10888671875, 25.3251953125, 26.54150390625, 27.7578125, 28.97412109375, 30.1904296875, 31.40673828125, 32.623046875, 33.83935546875, 35.0556640625, 36.27197265625, 37.48828125, 38.70458984375, 39.9208984375, 41.13720703125, 42.353515625, 43.56982421875, 44.7861328125, 46.00244140625, 47.21875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 3.0, 6.0, 11.0, 19.0, 25.0, 45.0, 77.0, 139.0, 255.0, 477.0, 1139.0, 3008.0, 9798.0, 44884.0, 3789779.0, 313598.0, 21512.0, 5883.0, 2066.0, 735.0, 347.0, 185.0, 95.0, 54.0, 41.0, 25.0, 24.0, 11.0, 10.0, 9.0, 6.0, 1.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-133.125, -129.693359375, -126.26171875, -122.830078125, -119.3984375, -115.966796875, -112.53515625, -109.103515625, -105.671875, -102.240234375, -98.80859375, -95.376953125, -91.9453125, -88.513671875, -85.08203125, -81.650390625, -78.21875, -74.787109375, -71.35546875, -67.923828125, -64.4921875, -61.060546875, -57.62890625, -54.197265625, -50.765625, -47.333984375, -43.90234375, -40.470703125, -37.0390625, -33.607421875, -30.17578125, -26.744140625, -23.3125, -19.880859375, -16.44921875, -13.017578125, -9.5859375, -6.154296875, -2.72265625, 0.708984375, 4.140625, 7.572265625, 11.00390625, 14.435546875, 17.8671875, 21.298828125, 24.73046875, 28.162109375, 31.59375, 35.025390625, 38.45703125, 41.888671875, 45.3203125, 48.751953125, 52.18359375, 55.615234375, 59.046875, 62.478515625, 65.91015625, 69.341796875, 72.7734375, 76.205078125, 79.63671875, 83.068359375, 86.5]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 1.0, 3.0, 4.0, 7.0, 3.0, 11.0, 12.0, 9.0, 8.0, 13.0, 21.0, 43.0, 58.0, 70.0, 119.0, 122.0, 136.0, 115.0, 65.0, 50.0, 40.0, 27.0, 19.0, 13.0, 5.0, 4.0, 14.0, 6.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.74673461914062, -79.55815887451172, -76.36959075927734, -73.18101501464844, -69.99243927001953, -66.80386352539062, -63.61529541015625, -60.426719665527344, -57.2381477355957, -54.04957580566406, -50.861000061035156, -47.672428131103516, -44.483856201171875, -41.29528045654297, -38.10670852661133, -34.91813659667969, -31.72956085205078, -28.540987014770508, -25.352413177490234, -22.163841247558594, -18.97526741027832, -15.786693572998047, -12.598121643066406, -9.409547805786133, -6.220973968505859, -3.032400608062744, 0.1561727523803711, 3.344745635986328, 6.533319473266602, 9.721893310546875, 12.910465240478516, 16.09903907775879, 19.28760528564453, 22.476179122924805, 25.664752960205078, 28.85332489013672, 32.041900634765625, 35.230472564697266, 38.419044494628906, 41.60762023925781, 44.79619216918945, 47.984764099121094, 51.17333984375, 54.36191177368164, 57.55048370361328, 60.73905944824219, 63.92763137817383, 67.11620330810547, 70.30477905273438, 73.49335479736328, 76.68192291259766, 79.87049865722656, 83.05907440185547, 86.24765014648438, 89.43621826171875, 92.62479400634766, 95.81336975097656, 99.00194549560547, 102.19051361083984, 105.37908935546875, 108.56766510009766, 111.75624084472656, 114.94480895996094, 118.13338470458984, 121.32195281982422]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 4.0, 8.0, 8.0, 3.0, 20.0, 18.0, 11.0, 14.0, 18.0, 15.0, 23.0, 23.0, 20.0, 24.0, 38.0, 29.0, 21.0, 33.0, 38.0, 45.0, 33.0, 47.0, 44.0, 49.0, 34.0, 36.0, 46.0, 38.0, 28.0, 24.0, 28.0, 29.0, 20.0, 22.0, 18.0, 14.0, 13.0, 9.0, 7.0, 7.0, 7.0, 6.0, 9.0, 3.0, 7.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0], "bins": [-87.6893310546875, -85.1355209350586, -82.58171081542969, -80.02790069580078, -77.47409057617188, -74.92028045654297, -72.36647033691406, -69.81266021728516, -67.25885009765625, -64.70503997802734, -62.15122985839844, -59.59741973876953, -57.043609619140625, -54.48979949951172, -51.93598937988281, -49.382179260253906, -46.828369140625, -44.274559020996094, -41.72074890136719, -39.16693878173828, -36.613128662109375, -34.05931854248047, -31.505508422851562, -28.951698303222656, -26.39788818359375, -23.844078063964844, -21.290267944335938, -18.73645782470703, -16.182647705078125, -13.628837585449219, -11.075027465820312, -8.521217346191406, -5.9674072265625, -3.4135971069335938, -0.8597869873046875, 1.6940231323242188, 4.247833251953125, 6.801643371582031, 9.355453491210938, 11.909263610839844, 14.46307373046875, 17.016883850097656, 19.570693969726562, 22.12450408935547, 24.678314208984375, 27.23212432861328, 29.785934448242188, 32.339744567871094, 34.8935546875, 37.447364807128906, 40.00117492675781, 42.55498504638672, 45.108795166015625, 47.66260528564453, 50.21641540527344, 52.770225524902344, 55.32403564453125, 57.877845764160156, 60.43165588378906, 62.98546600341797, 65.53927612304688, 68.09308624267578, 70.64689636230469, 73.2007064819336, 75.7545166015625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 2.0, 5.0, 9.0, 7.0, 11.0, 19.0, 18.0, 16.0, 20.0, 15.0, 44.0, 27.0, 41.0, 44.0, 29.0, 41.0, 37.0, 35.0, 47.0, 50.0, 28.0, 41.0, 42.0, 35.0, 26.0, 36.0, 37.0, 34.0, 24.0, 24.0, 20.0, 27.0, 16.0, 12.0, 10.0, 13.0, 9.0, 10.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.671875, -13.199462890625, -12.72705078125, -12.254638671875, -11.7822265625, -11.309814453125, -10.83740234375, -10.364990234375, -9.892578125, -9.420166015625, -8.94775390625, -8.475341796875, -8.0029296875, -7.530517578125, -7.05810546875, -6.585693359375, -6.11328125, -5.640869140625, -5.16845703125, -4.696044921875, -4.2236328125, -3.751220703125, -3.27880859375, -2.806396484375, -2.333984375, -1.861572265625, -1.38916015625, -0.916748046875, -0.4443359375, 0.028076171875, 0.50048828125, 0.972900390625, 1.4453125, 1.917724609375, 2.39013671875, 2.862548828125, 3.3349609375, 3.807373046875, 4.27978515625, 4.752197265625, 5.224609375, 5.697021484375, 6.16943359375, 6.641845703125, 7.1142578125, 7.586669921875, 8.05908203125, 8.531494140625, 9.00390625, 9.476318359375, 9.94873046875, 10.421142578125, 10.8935546875, 11.365966796875, 11.83837890625, 12.310791015625, 12.783203125, 13.255615234375, 13.72802734375, 14.200439453125, 14.6728515625, 15.145263671875, 15.61767578125, 16.090087890625, 16.5625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 17.0, 12.0, 20.0, 21.0, 55.0, 66.0, 101.0, 126.0, 208.0, 300.0, 428.0, 614.0, 851.0, 1348.0, 1912.0, 2938.0, 4329.0, 6731.0, 10152.0, 15813.0, 25121.0, 40856.0, 67392.0, 115292.0, 192308.0, 213042.0, 137765.0, 80315.0, 47702.0, 29584.0, 18251.0, 11729.0, 7733.0, 5089.0, 3230.0, 2245.0, 1569.0, 1039.0, 699.0, 511.0, 350.0, 210.0, 159.0, 111.0, 86.0, 47.0, 31.0, 17.0, 17.0, 6.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1.41796875, -1.375213623046875, -1.33245849609375, -1.289703369140625, -1.2469482421875, -1.204193115234375, -1.16143798828125, -1.118682861328125, -1.075927734375, -1.033172607421875, -0.99041748046875, -0.947662353515625, -0.9049072265625, -0.862152099609375, -0.81939697265625, -0.776641845703125, -0.73388671875, -0.691131591796875, -0.64837646484375, -0.605621337890625, -0.5628662109375, -0.520111083984375, -0.47735595703125, -0.434600830078125, -0.391845703125, -0.349090576171875, -0.30633544921875, -0.263580322265625, -0.2208251953125, -0.178070068359375, -0.13531494140625, -0.092559814453125, -0.0498046875, -0.007049560546875, 0.03570556640625, 0.078460693359375, 0.1212158203125, 0.163970947265625, 0.20672607421875, 0.249481201171875, 0.292236328125, 0.334991455078125, 0.37774658203125, 0.420501708984375, 0.4632568359375, 0.506011962890625, 0.54876708984375, 0.591522216796875, 0.63427734375, 0.677032470703125, 0.71978759765625, 0.762542724609375, 0.8052978515625, 0.848052978515625, 0.89080810546875, 0.933563232421875, 0.976318359375, 1.019073486328125, 1.06182861328125, 1.104583740234375, 1.1473388671875, 1.190093994140625, 1.23284912109375, 1.275604248046875, 1.318359375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 7.0, 6.0, 4.0, 7.0, 8.0, 11.0, 15.0, 21.0, 18.0, 25.0, 23.0, 24.0, 27.0, 25.0, 34.0, 53.0, 37.0, 39.0, 37.0, 37.0, 1070.0, 33.0, 31.0, 39.0, 40.0, 41.0, 45.0, 21.0, 33.0, 24.0, 23.0, 17.0, 21.0, 16.0, 13.0, 18.0, 17.0, 15.0, 9.0, 6.0, 11.0, 5.0, 1.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.6640625, -8.3651123046875, -8.066162109375, -7.7672119140625, -7.46826171875, -7.1693115234375, -6.870361328125, -6.5714111328125, -6.2724609375, -5.9735107421875, -5.674560546875, -5.3756103515625, -5.07666015625, -4.7777099609375, -4.478759765625, -4.1798095703125, -3.880859375, -3.5819091796875, -3.282958984375, -2.9840087890625, -2.68505859375, -2.3861083984375, -2.087158203125, -1.7882080078125, -1.4892578125, -1.1903076171875, -0.891357421875, -0.5924072265625, -0.29345703125, 0.0054931640625, 0.304443359375, 0.6033935546875, 0.90234375, 1.2012939453125, 1.500244140625, 1.7991943359375, 2.09814453125, 2.3970947265625, 2.696044921875, 2.9949951171875, 3.2939453125, 3.5928955078125, 3.891845703125, 4.1907958984375, 4.48974609375, 4.7886962890625, 5.087646484375, 5.3865966796875, 5.685546875, 5.9844970703125, 6.283447265625, 6.5823974609375, 6.88134765625, 7.1802978515625, 7.479248046875, 7.7781982421875, 8.0771484375, 8.3760986328125, 8.675048828125, 8.9739990234375, 9.27294921875, 9.5718994140625, 9.870849609375, 10.1697998046875, 10.46875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 10.0, 11.0, 15.0, 24.0, 51.0, 64.0, 113.0, 145.0, 217.0, 374.0, 531.0, 802.0, 1195.0, 1794.0, 2867.0, 4254.0, 6304.0, 9799.0, 14847.0, 23022.0, 35995.0, 59865.0, 102566.0, 172255.0, 1267219.0, 154451.0, 91146.0, 53887.0, 32700.0, 20929.0, 13567.0, 9096.0, 5772.0, 3866.0, 2546.0, 1668.0, 1145.0, 646.0, 481.0, 311.0, 201.0, 149.0, 93.0, 51.0, 40.0, 17.0, 12.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.92724609375, -0.89862060546875, -0.8699951171875, -0.84136962890625, -0.812744140625, -0.78411865234375, -0.7554931640625, -0.72686767578125, -0.6982421875, -0.66961669921875, -0.6409912109375, -0.61236572265625, -0.583740234375, -0.55511474609375, -0.5264892578125, -0.49786376953125, -0.46923828125, -0.44061279296875, -0.4119873046875, -0.38336181640625, -0.354736328125, -0.32611083984375, -0.2974853515625, -0.26885986328125, -0.240234375, -0.21160888671875, -0.1829833984375, -0.15435791015625, -0.125732421875, -0.09710693359375, -0.0684814453125, -0.03985595703125, -0.01123046875, 0.01739501953125, 0.0460205078125, 0.07464599609375, 0.103271484375, 0.13189697265625, 0.1605224609375, 0.18914794921875, 0.2177734375, 0.24639892578125, 0.2750244140625, 0.30364990234375, 0.332275390625, 0.36090087890625, 0.3895263671875, 0.41815185546875, 0.44677734375, 0.47540283203125, 0.5040283203125, 0.53265380859375, 0.561279296875, 0.58990478515625, 0.6185302734375, 0.64715576171875, 0.67578125, 0.70440673828125, 0.7330322265625, 0.76165771484375, 0.790283203125, 0.81890869140625, 0.8475341796875, 0.87615966796875, 0.90478515625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 4.0, 6.0, 5.0, 6.0, 5.0, 18.0, 14.0, 19.0, 21.0, 29.0, 37.0, 33.0, 43.0, 75.0, 75.0, 106.0, 124.0, 85.0, 58.0, 42.0, 37.0, 25.0, 27.0, 23.0, 16.0, 13.0, 16.0, 5.0, 5.0, 10.0, 10.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.027130126953125, -0.02639603614807129, -0.025661945343017578, -0.024927854537963867, -0.024193763732910156, -0.023459672927856445, -0.022725582122802734, -0.021991491317749023, -0.021257400512695312, -0.0205233097076416, -0.01978921890258789, -0.01905512809753418, -0.01832103729248047, -0.017586946487426758, -0.016852855682373047, -0.016118764877319336, -0.015384674072265625, -0.014650583267211914, -0.013916492462158203, -0.013182401657104492, -0.012448310852050781, -0.01171422004699707, -0.01098012924194336, -0.010246038436889648, -0.009511947631835938, -0.008777856826782227, -0.008043766021728516, -0.007309675216674805, -0.006575584411621094, -0.005841493606567383, -0.005107402801513672, -0.004373311996459961, -0.00363922119140625, -0.002905130386352539, -0.002171039581298828, -0.0014369487762451172, -0.0007028579711914062, 3.123283386230469e-05, 0.0007653236389160156, 0.0014994144439697266, 0.0022335052490234375, 0.0029675960540771484, 0.0037016868591308594, 0.00443577766418457, 0.005169868469238281, 0.005903959274291992, 0.006638050079345703, 0.007372140884399414, 0.008106231689453125, 0.008840322494506836, 0.009574413299560547, 0.010308504104614258, 0.011042594909667969, 0.01177668571472168, 0.01251077651977539, 0.013244867324829102, 0.013978958129882812, 0.014713048934936523, 0.015447139739990234, 0.016181230545043945, 0.016915321350097656, 0.017649412155151367, 0.018383502960205078, 0.01911759376525879, 0.0198516845703125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 5.0, 8.0, 8.0, 10.0, 9.0, 10.0, 20.0, 20.0, 25.0, 38.0, 41.0, 58.0, 109.0, 185.0, 459.0, 1652.0, 10564.0, 820204.0, 207076.0, 5964.0, 1213.0, 349.0, 158.0, 93.0, 65.0, 43.0, 40.0, 24.0, 25.0, 14.0, 12.0, 11.0, 9.0, 8.0, 6.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.374755859375, -0.3608131408691406, -0.34687042236328125, -0.3329277038574219, -0.3189849853515625, -0.3050422668457031, -0.29109954833984375, -0.2771568298339844, -0.263214111328125, -0.24927139282226562, -0.23532867431640625, -0.22138595581054688, -0.2074432373046875, -0.19350051879882812, -0.17955780029296875, -0.16561508178710938, -0.15167236328125, -0.13772964477539062, -0.12378692626953125, -0.10984420776367188, -0.0959014892578125, -0.08195877075195312, -0.06801605224609375, -0.054073333740234375, -0.040130615234375, -0.026187896728515625, -0.01224517822265625, 0.001697540283203125, 0.0156402587890625, 0.029582977294921875, 0.04352569580078125, 0.057468414306640625, 0.0714111328125, 0.08535385131835938, 0.09929656982421875, 0.11323928833007812, 0.1271820068359375, 0.14112472534179688, 0.15506744384765625, 0.16901016235351562, 0.182952880859375, 0.19689559936523438, 0.21083831787109375, 0.22478103637695312, 0.2387237548828125, 0.2526664733886719, 0.26660919189453125, 0.2805519104003906, 0.29449462890625, 0.3084373474121094, 0.32238006591796875, 0.3363227844238281, 0.3502655029296875, 0.3642082214355469, 0.37815093994140625, 0.3920936584472656, 0.406036376953125, 0.4199790954589844, 0.43392181396484375, 0.4478645324707031, 0.4618072509765625, 0.4757499694824219, 0.48969268798828125, 0.5036354064941406, 0.517578125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 5.0, 5.0, 7.0, 26.0, 51.0, 146.0, 386.0, 225.0, 85.0, 43.0, 13.0, 12.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034176044166088104, -0.029731385409832, -0.025286724790930748, -0.020842064172029495, -0.01639740541577339, -0.011952746659517288, -0.0075080860406160355, -0.0030634254217147827, 0.0013812333345413208, 0.005825893022119999, 0.010270552709698677, 0.014715212397277355, 0.019159872084856033, 0.023604530841112137, 0.02804919146001339, 0.03249385207891464, 0.036938510835170746, 0.04138316959142685, 0.04582782834768295, 0.050272490829229355, 0.05471714958548546, 0.05916180834174156, 0.06360647082328796, 0.06805112957954407, 0.07249578833580017, 0.07694044709205627, 0.08138510584831238, 0.08582976460456848, 0.09027442336082458, 0.09471908211708069, 0.09916374832391739, 0.10360840708017349, 0.108053058385849, 0.1124977171421051, 0.1169423758983612, 0.12138703465461731, 0.1258316934108734, 0.13027635216712952, 0.13472101092338562, 0.13916566967964172, 0.14361032843589783, 0.14805498719215393, 0.15249964594841003, 0.15694430470466614, 0.16138896346092224, 0.16583362221717834, 0.17027828097343445, 0.17472293972969055, 0.17916761338710785, 0.18361227214336395, 0.18805693089962006, 0.19250158965587616, 0.19694624841213226, 0.20139090716838837, 0.20583556592464447, 0.21028023958206177, 0.21472489833831787, 0.21916955709457397, 0.22361421585083008, 0.22805887460708618, 0.23250353336334229, 0.2369481921195984, 0.2413928508758545, 0.2458375096321106, 0.2502821683883667]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 6.0, 3.0, 5.0, 7.0, 10.0, 10.0, 10.0, 12.0, 27.0, 16.0, 19.0, 21.0, 26.0, 27.0, 22.0, 43.0, 29.0, 26.0, 38.0, 49.0, 47.0, 43.0, 45.0, 39.0, 42.0, 42.0, 41.0, 40.0, 41.0, 24.0, 18.0, 24.0, 30.0, 25.0, 16.0, 19.0, 15.0, 12.0, 12.0, 9.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024921059608459473, -0.02416166290640831, -0.023402266204357147, -0.022642869502305984, -0.021883472800254822, -0.02112407609820366, -0.020364679396152496, -0.019605282694101334, -0.01884588599205017, -0.018086489289999008, -0.017327092587947845, -0.016567695885896683, -0.01580829918384552, -0.015048902481794357, -0.014289505779743195, -0.013530109077692032, -0.01277071237564087, -0.012011315673589706, -0.011251918971538544, -0.010492522269487381, -0.009733125567436218, -0.008973728865385056, -0.008214332163333893, -0.00745493546128273, -0.006695538759231567, -0.005936142057180405, -0.005176745355129242, -0.004417348653078079, -0.0036579519510269165, -0.002898555248975754, -0.002139158546924591, -0.0013797618448734283, -0.0006203651428222656, 0.0001390315592288971, 0.0008984282612800598, 0.0016578249633312225, 0.0024172216653823853, 0.003176618367433548, 0.003936015069484711, 0.004695411771535873, 0.005454808473587036, 0.006214205175638199, 0.006973601877689362, 0.007732998579740524, 0.008492395281791687, 0.00925179198384285, 0.010011188685894012, 0.010770585387945175, 0.011529982089996338, 0.0122893787920475, 0.013048775494098663, 0.013808172196149826, 0.014567568898200989, 0.015326965600252151, 0.016086362302303314, 0.016845759004354477, 0.01760515570640564, 0.018364552408456802, 0.019123949110507965, 0.019883345812559128, 0.02064274251461029, 0.021402139216661453, 0.022161535918712616, 0.02292093262076378, 0.02368032932281494]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 2.0, 5.0, 9.0, 7.0, 11.0, 18.0, 19.0, 16.0, 20.0, 15.0, 44.0, 27.0, 41.0, 44.0, 28.0, 42.0, 37.0, 35.0, 47.0, 49.0, 29.0, 40.0, 43.0, 34.0, 26.0, 37.0, 36.0, 35.0, 24.0, 24.0, 20.0, 26.0, 17.0, 11.0, 11.0, 13.0, 9.0, 10.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.6796875, -13.2071533203125, -12.734619140625, -12.2620849609375, -11.78955078125, -11.3170166015625, -10.844482421875, -10.3719482421875, -9.8994140625, -9.4268798828125, -8.954345703125, -8.4818115234375, -8.00927734375, -7.5367431640625, -7.064208984375, -6.5916748046875, -6.119140625, -5.6466064453125, -5.174072265625, -4.7015380859375, -4.22900390625, -3.7564697265625, -3.283935546875, -2.8114013671875, -2.3388671875, -1.8663330078125, -1.393798828125, -0.9212646484375, -0.44873046875, 0.0238037109375, 0.496337890625, 0.9688720703125, 1.44140625, 1.9139404296875, 2.386474609375, 2.8590087890625, 3.33154296875, 3.8040771484375, 4.276611328125, 4.7491455078125, 5.2216796875, 5.6942138671875, 6.166748046875, 6.6392822265625, 7.11181640625, 7.5843505859375, 8.056884765625, 8.5294189453125, 9.001953125, 9.4744873046875, 9.947021484375, 10.4195556640625, 10.89208984375, 11.3646240234375, 11.837158203125, 12.3096923828125, 12.7822265625, 13.2547607421875, 13.727294921875, 14.1998291015625, 14.67236328125, 15.1448974609375, 15.617431640625, 16.0899658203125, 16.5625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 4.0, 8.0, 9.0, 13.0, 14.0, 19.0, 31.0, 28.0, 40.0, 41.0, 79.0, 77.0, 123.0, 193.0, 276.0, 589.0, 1366.0, 4357.0, 24323.0, 459637.0, 523852.0, 25985.0, 4483.0, 1400.0, 562.0, 335.0, 198.0, 117.0, 85.0, 67.0, 50.0, 40.0, 27.0, 19.0, 19.0, 18.0, 11.0, 14.0, 8.0, 8.0, 5.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.109375, -26.175048828125, -25.24072265625, -24.306396484375, -23.3720703125, -22.437744140625, -21.50341796875, -20.569091796875, -19.634765625, -18.700439453125, -17.76611328125, -16.831787109375, -15.8974609375, -14.963134765625, -14.02880859375, -13.094482421875, -12.16015625, -11.225830078125, -10.29150390625, -9.357177734375, -8.4228515625, -7.488525390625, -6.55419921875, -5.619873046875, -4.685546875, -3.751220703125, -2.81689453125, -1.882568359375, -0.9482421875, -0.013916015625, 0.92041015625, 1.854736328125, 2.7890625, 3.723388671875, 4.65771484375, 5.592041015625, 6.5263671875, 7.460693359375, 8.39501953125, 9.329345703125, 10.263671875, 11.197998046875, 12.13232421875, 13.066650390625, 14.0009765625, 14.935302734375, 15.86962890625, 16.803955078125, 17.73828125, 18.672607421875, 19.60693359375, 20.541259765625, 21.4755859375, 22.409912109375, 23.34423828125, 24.278564453125, 25.212890625, 26.147216796875, 27.08154296875, 28.015869140625, 28.9501953125, 29.884521484375, 30.81884765625, 31.753173828125, 32.6875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 3.0, 7.0, 17.0, 17.0, 13.0, 19.0, 23.0, 29.0, 28.0, 35.0, 34.0, 45.0, 46.0, 46.0, 56.0, 80.0, 1538.0, 483.0, 82.0, 63.0, 39.0, 53.0, 35.0, 35.0, 40.0, 35.0, 31.0, 19.0, 18.0, 17.0, 13.0, 8.0, 9.0, 12.0, 3.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.03125, -44.63525390625, -43.2392578125, -41.84326171875, -40.447265625, -39.05126953125, -37.6552734375, -36.25927734375, -34.86328125, -33.46728515625, -32.0712890625, -30.67529296875, -29.279296875, -27.88330078125, -26.4873046875, -25.09130859375, -23.6953125, -22.29931640625, -20.9033203125, -19.50732421875, -18.111328125, -16.71533203125, -15.3193359375, -13.92333984375, -12.52734375, -11.13134765625, -9.7353515625, -8.33935546875, -6.943359375, -5.54736328125, -4.1513671875, -2.75537109375, -1.359375, 0.03662109375, 1.4326171875, 2.82861328125, 4.224609375, 5.62060546875, 7.0166015625, 8.41259765625, 9.80859375, 11.20458984375, 12.6005859375, 13.99658203125, 15.392578125, 16.78857421875, 18.1845703125, 19.58056640625, 20.9765625, 22.37255859375, 23.7685546875, 25.16455078125, 26.560546875, 27.95654296875, 29.3525390625, 30.74853515625, 32.14453125, 33.54052734375, 34.9365234375, 36.33251953125, 37.728515625, 39.12451171875, 40.5205078125, 41.91650390625, 43.3125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 5.0, 9.0, 9.0, 10.0, 14.0, 20.0, 12.0, 30.0, 34.0, 36.0, 46.0, 74.0, 94.0, 143.0, 250.0, 719.0, 2670.0, 163846.0, 2970994.0, 4839.0, 957.0, 305.0, 165.0, 100.0, 69.0, 49.0, 50.0, 38.0, 22.0, 21.0, 14.0, 21.0, 13.0, 6.0, 3.0, 8.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-99.375, -96.1826171875, -92.990234375, -89.7978515625, -86.60546875, -83.4130859375, -80.220703125, -77.0283203125, -73.8359375, -70.6435546875, -67.451171875, -64.2587890625, -61.06640625, -57.8740234375, -54.681640625, -51.4892578125, -48.296875, -45.1044921875, -41.912109375, -38.7197265625, -35.52734375, -32.3349609375, -29.142578125, -25.9501953125, -22.7578125, -19.5654296875, -16.373046875, -13.1806640625, -9.98828125, -6.7958984375, -3.603515625, -0.4111328125, 2.78125, 5.9736328125, 9.166015625, 12.3583984375, 15.55078125, 18.7431640625, 21.935546875, 25.1279296875, 28.3203125, 31.5126953125, 34.705078125, 37.8974609375, 41.08984375, 44.2822265625, 47.474609375, 50.6669921875, 53.859375, 57.0517578125, 60.244140625, 63.4365234375, 66.62890625, 69.8212890625, 73.013671875, 76.2060546875, 79.3984375, 82.5908203125, 85.783203125, 88.9755859375, 92.16796875, 95.3603515625, 98.552734375, 101.7451171875, 104.9375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 48.0, 670.0, 282.0, 15.0], "bins": [-483.9574279785156, -476.1205749511719, -468.28375244140625, -460.4468994140625, -452.61004638671875, -444.7732238769531, -436.9363708496094, -429.0995178222656, -421.2626953125, -413.42584228515625, -405.5890197753906, -397.7521667480469, -389.9153137207031, -382.0784912109375, -374.24163818359375, -366.40478515625, -358.56793212890625, -350.7310791015625, -342.8942565917969, -335.0574035644531, -327.2205505371094, -319.38372802734375, -311.546875, -303.71002197265625, -295.8731994628906, -288.0363464355469, -280.19952392578125, -272.3626708984375, -264.52581787109375, -256.6889953613281, -248.85214233398438, -241.0153045654297, -233.178466796875, -225.3416290283203, -217.50477600097656, -209.66793823242188, -201.8311004638672, -193.9942626953125, -186.15740966796875, -178.32057189941406, -170.4837188720703, -162.64688110351562, -154.81002807617188, -146.9731903076172, -139.1363525390625, -131.29949951171875, -123.46266174316406, -115.62582397460938, -107.78898620605469, -99.95214080810547, -92.11530303955078, -84.27845764160156, -76.44161987304688, -68.60477447509766, -60.76792907714844, -52.931087493896484, -45.09424591064453, -37.25740432739258, -29.420560836791992, -21.583717346191406, -13.746875762939453, -5.9100341796875, 1.9268112182617188, 9.763652801513672, 17.600496292114258]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 8.0, 5.0, 6.0, 6.0, 8.0, 13.0, 12.0, 12.0, 18.0, 20.0, 25.0, 18.0, 20.0, 27.0, 37.0, 26.0, 25.0, 36.0, 44.0, 32.0, 37.0, 41.0, 39.0, 50.0, 45.0, 33.0, 40.0, 34.0, 42.0, 25.0, 34.0, 25.0, 19.0, 23.0, 21.0, 14.0, 9.0, 9.0, 11.0, 9.0, 13.0, 6.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-89.78470611572266, -86.94556427001953, -84.10641479492188, -81.26727294921875, -78.42813110351562, -75.58898162841797, -72.74983978271484, -69.91069030761719, -67.07154846191406, -64.23240661621094, -61.39325714111328, -58.554115295410156, -55.714969635009766, -52.875823974609375, -50.03668212890625, -47.19753646850586, -44.35839080810547, -41.51924514770508, -38.68009948730469, -35.84095764160156, -33.00181198120117, -30.16266632080078, -27.323522567749023, -24.484378814697266, -21.645233154296875, -18.806087493896484, -15.966943740844727, -13.127799034118652, -10.288654327392578, -7.449509620666504, -4.61036491394043, -1.7712211608886719, 1.0679168701171875, 3.9070615768432617, 6.746206283569336, 9.58535099029541, 12.424495697021484, 15.263640403747559, 18.102785110473633, 20.94192886352539, 23.78107452392578, 26.620220184326172, 29.45936393737793, 32.29850769042969, 35.13765335083008, 37.97679901123047, 40.815940856933594, 43.655086517333984, 46.494232177734375, 49.333377838134766, 52.172523498535156, 55.01166534423828, 57.85081100463867, 60.68995666503906, 63.52909851074219, 66.36824035644531, 69.20738983154297, 72.0465316772461, 74.88568115234375, 77.72482299804688, 80.56396484375, 83.40311431884766, 86.24225616455078, 89.08140563964844, 91.92054748535156]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 4.0, 14.0, 14.0, 12.0, 25.0, 21.0, 22.0, 18.0, 39.0, 32.0, 43.0, 31.0, 44.0, 36.0, 50.0, 37.0, 42.0, 51.0, 45.0, 29.0, 40.0, 41.0, 38.0, 33.0, 33.0, 26.0, 24.0, 25.0, 22.0, 12.0, 13.0, 12.0, 14.0, 6.0, 9.0, 11.0, 5.0, 3.0, 4.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.53125, -14.0341796875, -13.537109375, -13.0400390625, -12.54296875, -12.0458984375, -11.548828125, -11.0517578125, -10.5546875, -10.0576171875, -9.560546875, -9.0634765625, -8.56640625, -8.0693359375, -7.572265625, -7.0751953125, -6.578125, -6.0810546875, -5.583984375, -5.0869140625, -4.58984375, -4.0927734375, -3.595703125, -3.0986328125, -2.6015625, -2.1044921875, -1.607421875, -1.1103515625, -0.61328125, -0.1162109375, 0.380859375, 0.8779296875, 1.375, 1.8720703125, 2.369140625, 2.8662109375, 3.36328125, 3.8603515625, 4.357421875, 4.8544921875, 5.3515625, 5.8486328125, 6.345703125, 6.8427734375, 7.33984375, 7.8369140625, 8.333984375, 8.8310546875, 9.328125, 9.8251953125, 10.322265625, 10.8193359375, 11.31640625, 11.8134765625, 12.310546875, 12.8076171875, 13.3046875, 13.8017578125, 14.298828125, 14.7958984375, 15.29296875, 15.7900390625, 16.287109375, 16.7841796875, 17.28125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 11.0, 21.0, 32.0, 40.0, 66.0, 85.0, 106.0, 159.0, 236.0, 329.0, 470.0, 683.0, 988.0, 1484.0, 2304.0, 3622.0, 6171.0, 11434.0, 30881.0, 435719.0, 3427722.0, 223826.0, 22039.0, 10135.0, 5557.0, 3337.0, 2119.0, 1402.0, 945.0, 675.0, 453.0, 351.0, 222.0, 189.0, 121.0, 85.0, 74.0, 52.0, 40.0, 24.0, 22.0, 15.0, 11.0, 9.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.28125, -42.87109375, -41.4609375, -40.05078125, -38.640625, -37.23046875, -35.8203125, -34.41015625, -33.0, -31.58984375, -30.1796875, -28.76953125, -27.359375, -25.94921875, -24.5390625, -23.12890625, -21.71875, -20.30859375, -18.8984375, -17.48828125, -16.078125, -14.66796875, -13.2578125, -11.84765625, -10.4375, -9.02734375, -7.6171875, -6.20703125, -4.796875, -3.38671875, -1.9765625, -0.56640625, 0.84375, 2.25390625, 3.6640625, 5.07421875, 6.484375, 7.89453125, 9.3046875, 10.71484375, 12.125, 13.53515625, 14.9453125, 16.35546875, 17.765625, 19.17578125, 20.5859375, 21.99609375, 23.40625, 24.81640625, 26.2265625, 27.63671875, 29.046875, 30.45703125, 31.8671875, 33.27734375, 34.6875, 36.09765625, 37.5078125, 38.91796875, 40.328125, 41.73828125, 43.1484375, 44.55859375, 45.96875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 7.0, 7.0, 4.0, 8.0, 7.0, 5.0, 14.0, 17.0, 30.0, 44.0, 74.0, 117.0, 262.0, 568.0, 1033.0, 907.0, 446.0, 191.0, 106.0, 61.0, 40.0, 28.0, 16.0, 24.0, 14.0, 9.0, 9.0, 7.0, 5.0, 4.0, 5.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.0, -34.8701171875, -33.740234375, -32.6103515625, -31.48046875, -30.3505859375, -29.220703125, -28.0908203125, -26.9609375, -25.8310546875, -24.701171875, -23.5712890625, -22.44140625, -21.3115234375, -20.181640625, -19.0517578125, -17.921875, -16.7919921875, -15.662109375, -14.5322265625, -13.40234375, -12.2724609375, -11.142578125, -10.0126953125, -8.8828125, -7.7529296875, -6.623046875, -5.4931640625, -4.36328125, -3.2333984375, -2.103515625, -0.9736328125, 0.15625, 1.2861328125, 2.416015625, 3.5458984375, 4.67578125, 5.8056640625, 6.935546875, 8.0654296875, 9.1953125, 10.3251953125, 11.455078125, 12.5849609375, 13.71484375, 14.8447265625, 15.974609375, 17.1044921875, 18.234375, 19.3642578125, 20.494140625, 21.6240234375, 22.75390625, 23.8837890625, 25.013671875, 26.1435546875, 27.2734375, 28.4033203125, 29.533203125, 30.6630859375, 31.79296875, 32.9228515625, 34.052734375, 35.1826171875, 36.3125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 6.0, 6.0, 8.0, 24.0, 27.0, 34.0, 52.0, 81.0, 120.0, 164.0, 268.0, 440.0, 739.0, 1366.0, 2609.0, 5369.0, 12553.0, 33772.0, 216700.0, 3723575.0, 145125.0, 29649.0, 11207.0, 4873.0, 2374.0, 1312.0, 705.0, 390.0, 250.0, 150.0, 103.0, 65.0, 52.0, 32.0, 20.0, 21.0, 9.0, 10.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.25, -63.23828125, -61.2265625, -59.21484375, -57.203125, -55.19140625, -53.1796875, -51.16796875, -49.15625, -47.14453125, -45.1328125, -43.12109375, -41.109375, -39.09765625, -37.0859375, -35.07421875, -33.0625, -31.05078125, -29.0390625, -27.02734375, -25.015625, -23.00390625, -20.9921875, -18.98046875, -16.96875, -14.95703125, -12.9453125, -10.93359375, -8.921875, -6.91015625, -4.8984375, -2.88671875, -0.875, 1.13671875, 3.1484375, 5.16015625, 7.171875, 9.18359375, 11.1953125, 13.20703125, 15.21875, 17.23046875, 19.2421875, 21.25390625, 23.265625, 25.27734375, 27.2890625, 29.30078125, 31.3125, 33.32421875, 35.3359375, 37.34765625, 39.359375, 41.37109375, 43.3828125, 45.39453125, 47.40625, 49.41796875, 51.4296875, 53.44140625, 55.453125, 57.46484375, 59.4765625, 61.48828125, 63.5]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 6.0, 18.0, 18.0, 18.0, 48.0, 91.0, 189.0, 237.0, 173.0, 80.0, 55.0, 28.0, 16.0, 11.0, 4.0, 7.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-263.5518798828125, -258.11639404296875, -252.68087768554688, -247.24539184570312, -241.8098907470703, -236.3743896484375, -230.9388885498047, -225.50338745117188, -220.06788635253906, -214.63238525390625, -209.19688415527344, -203.76138305664062, -198.32589721679688, -192.89039611816406, -187.45489501953125, -182.01939392089844, -176.58389282226562, -171.1483917236328, -165.712890625, -160.27740478515625, -154.84190368652344, -149.40640258789062, -143.9709014892578, -138.535400390625, -133.09991455078125, -127.66441345214844, -122.22891998291016, -116.79341888427734, -111.35791778564453, -105.92242431640625, -100.48692321777344, -95.05142211914062, -89.61591339111328, -84.18041229248047, -78.74491882324219, -73.30941772460938, -67.87391662597656, -62.438419342041016, -57.00292205810547, -51.567420959472656, -46.13192367553711, -40.69642639160156, -35.26092529296875, -29.825428009033203, -24.389928817749023, -18.954429626464844, -13.518932342529297, -8.083431243896484, -2.6479339599609375, 2.787564754486084, 8.223063468933105, 13.658561706542969, 19.09406089782715, 24.529560089111328, 29.965057373046875, 35.40055847167969, 40.836055755615234, 46.27155303955078, 51.707054138183594, 57.14255142211914, 62.57804870605469, 68.0135498046875, 73.44905090332031, 78.88455200195312, 84.3200454711914]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 6.0, 5.0, 4.0, 3.0, 8.0, 11.0, 12.0, 12.0, 18.0, 11.0, 21.0, 26.0, 33.0, 31.0, 26.0, 41.0, 34.0, 33.0, 33.0, 44.0, 44.0, 39.0, 41.0, 38.0, 34.0, 39.0, 22.0, 39.0, 46.0, 36.0, 23.0, 28.0, 24.0, 22.0, 18.0, 11.0, 18.0, 11.0, 9.0, 9.0, 4.0, 8.0, 5.0, 9.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-76.08663940429688, -73.7289810180664, -71.37132263183594, -69.01365661621094, -66.65599822998047, -64.29833984375, -61.94068145751953, -59.5830192565918, -57.22535705566406, -54.867698669433594, -52.51003646850586, -50.15237808227539, -47.794715881347656, -45.43705749511719, -43.07939910888672, -40.721736907958984, -38.364078521728516, -36.00642013549805, -33.64875793457031, -31.291099548339844, -28.93343734741211, -26.57577896118164, -24.21811866760254, -21.860458374023438, -19.502798080444336, -17.145137786865234, -14.787477493286133, -12.429818153381348, -10.072157859802246, -7.7144975662231445, -5.356838226318359, -2.999177932739258, -0.6415176391601562, 1.7161424160003662, 4.073802471160889, 6.431462287902832, 8.789122581481934, 11.146782875061035, 13.50444221496582, 15.862102508544922, 18.219762802124023, 20.577423095703125, 22.935083389282227, 25.292743682861328, 27.650402069091797, 30.00806427001953, 32.36572265625, 34.72338104248047, 37.0810432434082, 39.43870162963867, 41.796363830566406, 44.154022216796875, 46.51168441772461, 48.86934280395508, 51.22700500488281, 53.58466339111328, 55.94232177734375, 58.29998016357422, 60.65764236450195, 63.01530075073242, 65.37296295166016, 67.73062133789062, 70.0882797241211, 72.44593811035156, 74.80360412597656]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 10.0, 9.0, 10.0, 12.0, 14.0, 15.0, 19.0, 19.0, 35.0, 21.0, 27.0, 36.0, 30.0, 54.0, 41.0, 54.0, 38.0, 66.0, 39.0, 36.0, 46.0, 35.0, 33.0, 38.0, 29.0, 31.0, 27.0, 25.0, 28.0, 11.0, 19.0, 18.0, 15.0, 11.0, 8.0, 11.0, 6.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.375, -14.84765625, -14.3203125, -13.79296875, -13.265625, -12.73828125, -12.2109375, -11.68359375, -11.15625, -10.62890625, -10.1015625, -9.57421875, -9.046875, -8.51953125, -7.9921875, -7.46484375, -6.9375, -6.41015625, -5.8828125, -5.35546875, -4.828125, -4.30078125, -3.7734375, -3.24609375, -2.71875, -2.19140625, -1.6640625, -1.13671875, -0.609375, -0.08203125, 0.4453125, 0.97265625, 1.5, 2.02734375, 2.5546875, 3.08203125, 3.609375, 4.13671875, 4.6640625, 5.19140625, 5.71875, 6.24609375, 6.7734375, 7.30078125, 7.828125, 8.35546875, 8.8828125, 9.41015625, 9.9375, 10.46484375, 10.9921875, 11.51953125, 12.046875, 12.57421875, 13.1015625, 13.62890625, 14.15625, 14.68359375, 15.2109375, 15.73828125, 16.265625, 16.79296875, 17.3203125, 17.84765625, 18.375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 8.0, 4.0, 7.0, 15.0, 19.0, 25.0, 44.0, 82.0, 85.0, 130.0, 209.0, 287.0, 451.0, 628.0, 965.0, 1451.0, 2218.0, 3282.0, 4880.0, 7854.0, 12262.0, 19500.0, 31677.0, 53839.0, 94914.0, 167898.0, 238075.0, 170552.0, 96226.0, 54066.0, 32359.0, 19536.0, 12206.0, 7868.0, 5001.0, 3319.0, 2161.0, 1463.0, 957.0, 654.0, 464.0, 281.0, 200.0, 146.0, 87.0, 67.0, 46.0, 32.0, 19.0, 11.0, 19.0, 8.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.3193359375, -1.276092529296875, -1.23284912109375, -1.189605712890625, -1.1463623046875, -1.103118896484375, -1.05987548828125, -1.016632080078125, -0.973388671875, -0.930145263671875, -0.88690185546875, -0.843658447265625, -0.8004150390625, -0.757171630859375, -0.71392822265625, -0.670684814453125, -0.62744140625, -0.584197998046875, -0.54095458984375, -0.497711181640625, -0.4544677734375, -0.411224365234375, -0.36798095703125, -0.324737548828125, -0.281494140625, -0.238250732421875, -0.19500732421875, -0.151763916015625, -0.1085205078125, -0.065277099609375, -0.02203369140625, 0.021209716796875, 0.064453125, 0.107696533203125, 0.15093994140625, 0.194183349609375, 0.2374267578125, 0.280670166015625, 0.32391357421875, 0.367156982421875, 0.410400390625, 0.453643798828125, 0.49688720703125, 0.540130615234375, 0.5833740234375, 0.626617431640625, 0.66986083984375, 0.713104248046875, 0.75634765625, 0.799591064453125, 0.84283447265625, 0.886077880859375, 0.9293212890625, 0.972564697265625, 1.01580810546875, 1.059051513671875, 1.102294921875, 1.145538330078125, 1.18878173828125, 1.232025146484375, 1.2752685546875, 1.318511962890625, 1.36175537109375, 1.404998779296875, 1.4482421875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 9.0, 6.0, 10.0, 13.0, 9.0, 17.0, 16.0, 19.0, 19.0, 21.0, 32.0, 21.0, 25.0, 43.0, 38.0, 38.0, 30.0, 29.0, 37.0, 1071.0, 37.0, 55.0, 56.0, 31.0, 35.0, 40.0, 31.0, 25.0, 26.0, 23.0, 20.0, 21.0, 16.0, 23.0, 13.0, 13.0, 8.0, 12.0, 3.0, 4.0, 9.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-10.875, -10.5626220703125, -10.250244140625, -9.9378662109375, -9.62548828125, -9.3131103515625, -9.000732421875, -8.6883544921875, -8.3759765625, -8.0635986328125, -7.751220703125, -7.4388427734375, -7.12646484375, -6.8140869140625, -6.501708984375, -6.1893310546875, -5.876953125, -5.5645751953125, -5.252197265625, -4.9398193359375, -4.62744140625, -4.3150634765625, -4.002685546875, -3.6903076171875, -3.3779296875, -3.0655517578125, -2.753173828125, -2.4407958984375, -2.12841796875, -1.8160400390625, -1.503662109375, -1.1912841796875, -0.87890625, -0.5665283203125, -0.254150390625, 0.0582275390625, 0.37060546875, 0.6829833984375, 0.995361328125, 1.3077392578125, 1.6201171875, 1.9324951171875, 2.244873046875, 2.5572509765625, 2.86962890625, 3.1820068359375, 3.494384765625, 3.8067626953125, 4.119140625, 4.4315185546875, 4.743896484375, 5.0562744140625, 5.36865234375, 5.6810302734375, 5.993408203125, 6.3057861328125, 6.6181640625, 6.9305419921875, 7.242919921875, 7.5552978515625, 7.86767578125, 8.1800537109375, 8.492431640625, 8.8048095703125, 9.1171875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 6.0, 4.0, 18.0, 22.0, 25.0, 44.0, 71.0, 89.0, 114.0, 178.0, 307.0, 369.0, 596.0, 842.0, 1234.0, 1854.0, 2676.0, 4073.0, 6158.0, 9350.0, 14124.0, 21754.0, 34670.0, 56338.0, 94814.0, 159783.0, 1261147.0, 166306.0, 99157.0, 58575.0, 36074.0, 22768.0, 14614.0, 9510.0, 6340.0, 4188.0, 2855.0, 1980.0, 1284.0, 900.0, 637.0, 408.0, 302.0, 178.0, 127.0, 95.0, 56.0, 40.0, 36.0, 14.0, 7.0, 14.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.83935546875, -0.810943603515625, -0.78253173828125, -0.754119873046875, -0.7257080078125, -0.697296142578125, -0.66888427734375, -0.640472412109375, -0.612060546875, -0.583648681640625, -0.55523681640625, -0.526824951171875, -0.4984130859375, -0.470001220703125, -0.44158935546875, -0.413177490234375, -0.384765625, -0.356353759765625, -0.32794189453125, -0.299530029296875, -0.2711181640625, -0.242706298828125, -0.21429443359375, -0.185882568359375, -0.157470703125, -0.129058837890625, -0.10064697265625, -0.072235107421875, -0.0438232421875, -0.015411376953125, 0.01300048828125, 0.041412353515625, 0.06982421875, 0.098236083984375, 0.12664794921875, 0.155059814453125, 0.1834716796875, 0.211883544921875, 0.24029541015625, 0.268707275390625, 0.297119140625, 0.325531005859375, 0.35394287109375, 0.382354736328125, 0.4107666015625, 0.439178466796875, 0.46759033203125, 0.496002197265625, 0.5244140625, 0.552825927734375, 0.58123779296875, 0.609649658203125, 0.6380615234375, 0.666473388671875, 0.69488525390625, 0.723297119140625, 0.751708984375, 0.780120849609375, 0.80853271484375, 0.836944580078125, 0.8653564453125, 0.893768310546875, 0.92218017578125, 0.950592041015625, 0.97900390625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 4.0, 6.0, 7.0, 9.0, 7.0, 13.0, 16.0, 15.0, 19.0, 23.0, 39.0, 65.0, 62.0, 71.0, 83.0, 85.0, 84.0, 79.0, 52.0, 44.0, 39.0, 33.0, 21.0, 8.0, 11.0, 19.0, 13.0, 15.0, 6.0, 8.0, 3.0, 6.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.01629638671875, -0.015798449516296387, -0.015300512313842773, -0.01480257511138916, -0.014304637908935547, -0.013806700706481934, -0.01330876350402832, -0.012810826301574707, -0.012312889099121094, -0.01181495189666748, -0.011317014694213867, -0.010819077491760254, -0.01032114028930664, -0.009823203086853027, -0.009325265884399414, -0.0088273286819458, -0.008329391479492188, -0.007831454277038574, -0.007333517074584961, -0.006835579872131348, -0.006337642669677734, -0.005839705467224121, -0.005341768264770508, -0.0048438310623168945, -0.004345893859863281, -0.003847956657409668, -0.0033500194549560547, -0.0028520822525024414, -0.002354145050048828, -0.0018562078475952148, -0.0013582706451416016, -0.0008603334426879883, -0.000362396240234375, 0.00013554096221923828, 0.0006334781646728516, 0.0011314153671264648, 0.0016293525695800781, 0.0021272897720336914, 0.0026252269744873047, 0.003123164176940918, 0.0036211013793945312, 0.0041190385818481445, 0.004616975784301758, 0.005114912986755371, 0.005612850189208984, 0.006110787391662598, 0.006608724594116211, 0.007106661796569824, 0.0076045989990234375, 0.00810253620147705, 0.008600473403930664, 0.009098410606384277, 0.00959634780883789, 0.010094285011291504, 0.010592222213745117, 0.01109015941619873, 0.011588096618652344, 0.012086033821105957, 0.01258397102355957, 0.013081908226013184, 0.013579845428466797, 0.01407778263092041, 0.014575719833374023, 0.015073657035827637, 0.01557159423828125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 4.0, 12.0, 5.0, 11.0, 8.0, 16.0, 12.0, 22.0, 16.0, 28.0, 24.0, 30.0, 68.0, 109.0, 142.0, 265.0, 1319.0, 104703.0, 936137.0, 4583.0, 414.0, 189.0, 114.0, 79.0, 51.0, 47.0, 28.0, 21.0, 18.0, 8.0, 17.0, 8.0, 12.0, 4.0, 4.0, 7.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.3623046875, -0.35105133056640625, -0.3397979736328125, -0.32854461669921875, -0.317291259765625, -0.30603790283203125, -0.2947845458984375, -0.28353118896484375, -0.27227783203125, -0.26102447509765625, -0.2497711181640625, -0.23851776123046875, -0.227264404296875, -0.21601104736328125, -0.2047576904296875, -0.19350433349609375, -0.1822509765625, -0.17099761962890625, -0.1597442626953125, -0.14849090576171875, -0.137237548828125, -0.12598419189453125, -0.1147308349609375, -0.10347747802734375, -0.09222412109375, -0.08097076416015625, -0.0697174072265625, -0.05846405029296875, -0.047210693359375, -0.03595733642578125, -0.0247039794921875, -0.01345062255859375, -0.002197265625, 0.00905609130859375, 0.0203094482421875, 0.03156280517578125, 0.042816162109375, 0.05406951904296875, 0.0653228759765625, 0.07657623291015625, 0.08782958984375, 0.09908294677734375, 0.1103363037109375, 0.12158966064453125, 0.132843017578125, 0.14409637451171875, 0.1553497314453125, 0.16660308837890625, 0.1778564453125, 0.18910980224609375, 0.2003631591796875, 0.21161651611328125, 0.222869873046875, 0.23412322998046875, 0.2453765869140625, 0.25662994384765625, 0.26788330078125, 0.27913665771484375, 0.2903900146484375, 0.30164337158203125, 0.312896728515625, 0.32415008544921875, 0.3354034423828125, 0.34665679931640625, 0.35791015625]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 43.0, 446.0, 461.0, 50.0, 10.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0415981188416481, -0.03640041500329971, -0.031202707439661026, -0.026005001738667488, -0.02080729603767395, -0.015609590336680412, -0.010411884635686874, -0.005214177072048187, -1.6473233699798584e-05, 0.005181232467293739, 0.010378938168287277, 0.015576643869280815, 0.020774349570274353, 0.02597205527126789, 0.03116976097226143, 0.036367468535900116, 0.041565172374248505, 0.04676287621259689, 0.05196058377623558, 0.05715829133987427, 0.062355995178222656, 0.06755369901657104, 0.07275140285491943, 0.07794911414384842, 0.08314681798219681, 0.0883445218205452, 0.09354223310947418, 0.09873993694782257, 0.10393764078617096, 0.10913534462451935, 0.11433304846286774, 0.11953075975179672, 0.12472847104072571, 0.1299261748790741, 0.13512387871742249, 0.14032158255577087, 0.14551928639411926, 0.15071700513362885, 0.15591470897197723, 0.16111241281032562, 0.166310116648674, 0.1715078204870224, 0.1767055243253708, 0.18190322816371918, 0.18710094690322876, 0.19229865074157715, 0.19749635457992554, 0.20269405841827393, 0.20789176225662231, 0.2130894660949707, 0.2182871699333191, 0.22348487377166748, 0.22868257761001587, 0.23388029634952545, 0.23907800018787384, 0.24427570402622223, 0.24947340786457062, 0.2546711266040802, 0.2598688304424286, 0.265066534280777, 0.27026423811912537, 0.27546194195747375, 0.28065964579582214, 0.28585734963417053, 0.2910550534725189]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 12.0, 13.0, 8.0, 13.0, 13.0, 16.0, 19.0, 18.0, 30.0, 31.0, 37.0, 34.0, 35.0, 40.0, 45.0, 47.0, 46.0, 38.0, 44.0, 51.0, 53.0, 41.0, 46.0, 39.0, 31.0, 21.0, 23.0, 24.0, 29.0, 19.0, 18.0, 16.0, 8.0, 4.0, 9.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021617889404296875, -0.020996319130063057, -0.02037474885582924, -0.01975317858159542, -0.019131608307361603, -0.018510038033127785, -0.017888467758893967, -0.01726689748466015, -0.01664532721042633, -0.016023756936192513, -0.015402186661958694, -0.014780616387724876, -0.014159046113491058, -0.01353747583925724, -0.012915905565023422, -0.012294335290789604, -0.011672765016555786, -0.011051194742321968, -0.01042962446808815, -0.009808054193854332, -0.009186483919620514, -0.008564913645386696, -0.007943343371152878, -0.00732177309691906, -0.006700202822685242, -0.006078632548451424, -0.005457062274217606, -0.0048354919999837875, -0.0042139217257499695, -0.0035923514515161514, -0.0029707811772823334, -0.0023492109030485153, -0.0017276406288146973, -0.0011060703545808792, -0.00048450008034706116, 0.0001370701938867569, 0.000758640468120575, 0.001380210742354393, 0.002001781016588211, 0.002623351290822029, 0.003244921565055847, 0.0038664918392896652, 0.004488062113523483, 0.005109632387757301, 0.005731202661991119, 0.0063527729362249374, 0.0069743432104587555, 0.0075959134846925735, 0.008217483758926392, 0.00883905403316021, 0.009460624307394028, 0.010082194581627846, 0.010703764855861664, 0.011325335130095482, 0.0119469054043293, 0.012568475678563118, 0.013190045952796936, 0.013811616227030754, 0.014433186501264572, 0.01505475677549839, 0.015676327049732208, 0.016297897323966026, 0.016919467598199844, 0.017541037872433662, 0.01816260814666748]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 10.0, 9.0, 10.0, 12.0, 14.0, 15.0, 19.0, 19.0, 35.0, 21.0, 27.0, 36.0, 30.0, 54.0, 41.0, 54.0, 38.0, 66.0, 39.0, 36.0, 46.0, 35.0, 33.0, 38.0, 29.0, 31.0, 27.0, 25.0, 28.0, 11.0, 19.0, 18.0, 15.0, 11.0, 8.0, 11.0, 6.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.375, -14.84765625, -14.3203125, -13.79296875, -13.265625, -12.73828125, -12.2109375, -11.68359375, -11.15625, -10.62890625, -10.1015625, -9.57421875, -9.046875, -8.51953125, -7.9921875, -7.46484375, -6.9375, -6.41015625, -5.8828125, -5.35546875, -4.828125, -4.30078125, -3.7734375, -3.24609375, -2.71875, -2.19140625, -1.6640625, -1.13671875, -0.609375, -0.08203125, 0.4453125, 0.97265625, 1.5, 2.02734375, 2.5546875, 3.08203125, 3.609375, 4.13671875, 4.6640625, 5.19140625, 5.71875, 6.24609375, 6.7734375, 7.30078125, 7.828125, 8.35546875, 8.8828125, 9.41015625, 9.9375, 10.46484375, 10.9921875, 11.51953125, 12.046875, 12.57421875, 13.1015625, 13.62890625, 14.15625, 14.68359375, 15.2109375, 15.73828125, 16.265625, 16.79296875, 17.3203125, 17.84765625, 18.375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 6.0, 14.0, 18.0, 17.0, 26.0, 26.0, 33.0, 46.0, 60.0, 91.0, 126.0, 176.0, 263.0, 402.0, 604.0, 1109.0, 2096.0, 4891.0, 16219.0, 202429.0, 781536.0, 25821.0, 6502.0, 2583.0, 1268.0, 717.0, 444.0, 282.0, 207.0, 142.0, 96.0, 64.0, 55.0, 30.0, 37.0, 23.0, 20.0, 17.0, 11.0, 11.0, 6.0, 8.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-36.75, -35.48876953125, -34.2275390625, -32.96630859375, -31.705078125, -30.44384765625, -29.1826171875, -27.92138671875, -26.66015625, -25.39892578125, -24.1376953125, -22.87646484375, -21.615234375, -20.35400390625, -19.0927734375, -17.83154296875, -16.5703125, -15.30908203125, -14.0478515625, -12.78662109375, -11.525390625, -10.26416015625, -9.0029296875, -7.74169921875, -6.48046875, -5.21923828125, -3.9580078125, -2.69677734375, -1.435546875, -0.17431640625, 1.0869140625, 2.34814453125, 3.609375, 4.87060546875, 6.1318359375, 7.39306640625, 8.654296875, 9.91552734375, 11.1767578125, 12.43798828125, 13.69921875, 14.96044921875, 16.2216796875, 17.48291015625, 18.744140625, 20.00537109375, 21.2666015625, 22.52783203125, 23.7890625, 25.05029296875, 26.3115234375, 27.57275390625, 28.833984375, 30.09521484375, 31.3564453125, 32.61767578125, 33.87890625, 35.14013671875, 36.4013671875, 37.66259765625, 38.923828125, 40.18505859375, 41.4462890625, 42.70751953125, 43.96875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 2.0, 7.0, 8.0, 3.0, 11.0, 8.0, 11.0, 10.0, 19.0, 16.0, 15.0, 22.0, 29.0, 21.0, 31.0, 42.0, 37.0, 38.0, 44.0, 69.0, 92.0, 1605.0, 382.0, 100.0, 52.0, 44.0, 35.0, 36.0, 30.0, 30.0, 32.0, 26.0, 22.0, 20.0, 26.0, 21.0, 13.0, 12.0, 6.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.5625, -35.341796875, -34.12109375, -32.900390625, -31.6796875, -30.458984375, -29.23828125, -28.017578125, -26.796875, -25.576171875, -24.35546875, -23.134765625, -21.9140625, -20.693359375, -19.47265625, -18.251953125, -17.03125, -15.810546875, -14.58984375, -13.369140625, -12.1484375, -10.927734375, -9.70703125, -8.486328125, -7.265625, -6.044921875, -4.82421875, -3.603515625, -2.3828125, -1.162109375, 0.05859375, 1.279296875, 2.5, 3.720703125, 4.94140625, 6.162109375, 7.3828125, 8.603515625, 9.82421875, 11.044921875, 12.265625, 13.486328125, 14.70703125, 15.927734375, 17.1484375, 18.369140625, 19.58984375, 20.810546875, 22.03125, 23.251953125, 24.47265625, 25.693359375, 26.9140625, 28.134765625, 29.35546875, 30.576171875, 31.796875, 33.017578125, 34.23828125, 35.458984375, 36.6796875, 37.900390625, 39.12109375, 40.341796875, 41.5625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 6.0, 1.0, 12.0, 5.0, 10.0, 12.0, 16.0, 20.0, 32.0, 24.0, 15.0, 40.0, 37.0, 57.0, 47.0, 82.0, 140.0, 265.0, 747.0, 4257.0, 125838.0, 3002292.0, 9512.0, 1250.0, 332.0, 173.0, 108.0, 66.0, 64.0, 44.0, 22.0, 26.0, 16.0, 17.0, 17.0, 20.0, 14.0, 9.0, 12.0, 9.0, 8.0, 5.0, 4.0, 7.0, 1.0, 6.0, 1.0, 2.0, 4.0], "bins": [-107.4375, -104.4677734375, -101.498046875, -98.5283203125, -95.55859375, -92.5888671875, -89.619140625, -86.6494140625, -83.6796875, -80.7099609375, -77.740234375, -74.7705078125, -71.80078125, -68.8310546875, -65.861328125, -62.8916015625, -59.921875, -56.9521484375, -53.982421875, -51.0126953125, -48.04296875, -45.0732421875, -42.103515625, -39.1337890625, -36.1640625, -33.1943359375, -30.224609375, -27.2548828125, -24.28515625, -21.3154296875, -18.345703125, -15.3759765625, -12.40625, -9.4365234375, -6.466796875, -3.4970703125, -0.52734375, 2.4423828125, 5.412109375, 8.3818359375, 11.3515625, 14.3212890625, 17.291015625, 20.2607421875, 23.23046875, 26.2001953125, 29.169921875, 32.1396484375, 35.109375, 38.0791015625, 41.048828125, 44.0185546875, 46.98828125, 49.9580078125, 52.927734375, 55.8974609375, 58.8671875, 61.8369140625, 64.806640625, 67.7763671875, 70.74609375, 73.7158203125, 76.685546875, 79.6552734375, 82.625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 18.0, 19.0, 52.0, 95.0, 171.0, 178.0, 191.0, 116.0, 73.0, 42.0, 30.0, 8.0, 9.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.6999626159668, -51.271575927734375, -49.84318923950195, -48.41480255126953, -46.986419677734375, -45.55803298950195, -44.12964630126953, -42.70125961303711, -41.27287292480469, -39.844486236572266, -38.416099548339844, -36.98771286010742, -35.559326171875, -34.130943298339844, -32.70255661010742, -31.274169921875, -29.845783233642578, -28.417396545410156, -26.989009857177734, -25.560625076293945, -24.132238388061523, -22.7038516998291, -21.275466918945312, -19.84708023071289, -18.41869354248047, -16.990306854248047, -15.561921119689941, -14.133535385131836, -12.705148696899414, -11.276762008666992, -9.848376274108887, -8.419990539550781, -6.991600036621094, -5.56321382522583, -4.134827613830566, -2.7064414024353027, -1.278055191040039, 0.1503310203552246, 1.5787172317504883, 3.0071029663085938, 4.435489654541016, 5.863875865936279, 7.292262077331543, 8.720647811889648, 10.14903450012207, 11.577421188354492, 13.005806922912598, 14.434192657470703, 15.862579345703125, 17.290966033935547, 18.71935272216797, 20.147737503051758, 21.57612419128418, 23.0045108795166, 24.43289566040039, 25.861282348632812, 27.289669036865234, 28.718055725097656, 30.146442413330078, 31.574827194213867, 33.003211975097656, 34.43159866333008, 35.8599853515625, 37.28837203979492, 38.716758728027344]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 13.0, 3.0, 17.0, 17.0, 9.0, 19.0, 20.0, 24.0, 25.0, 27.0, 24.0, 32.0, 51.0, 33.0, 50.0, 42.0, 60.0, 58.0, 49.0, 48.0, 56.0, 37.0, 45.0, 35.0, 33.0, 30.0, 18.0, 24.0, 24.0, 17.0, 18.0, 11.0, 7.0, 4.0, 11.0, 8.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.44855499267578, -112.91067504882812, -109.37279510498047, -105.83491516113281, -102.29703521728516, -98.7591552734375, -95.22127532958984, -91.68339538574219, -88.14551544189453, -84.60763549804688, -81.06975555419922, -77.53187561035156, -73.9939956665039, -70.45611572265625, -66.9182357788086, -63.38035583496094, -59.84247589111328, -56.304595947265625, -52.76671600341797, -49.22883605957031, -45.690956115722656, -42.153076171875, -38.615196228027344, -35.07731628417969, -31.53943634033203, -28.001556396484375, -24.46367645263672, -20.925796508789062, -17.387916564941406, -13.85003662109375, -10.312156677246094, -6.7742767333984375, -3.2363967895507812, 0.301483154296875, 3.8393630981445312, 7.3772430419921875, 10.915122985839844, 14.4530029296875, 17.990882873535156, 21.528762817382812, 25.06664276123047, 28.604522705078125, 32.14240264892578, 35.68028259277344, 39.218162536621094, 42.75604248046875, 46.293922424316406, 49.83180236816406, 53.36968231201172, 56.907562255859375, 60.44544219970703, 63.98332214355469, 67.52120208740234, 71.05908203125, 74.59696197509766, 78.13484191894531, 81.67272186279297, 85.21060180664062, 88.74848175048828, 92.28636169433594, 95.8242416381836, 99.36212158203125, 102.9000015258789, 106.43788146972656, 109.97576141357422]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 8.0, 9.0, 8.0, 8.0, 18.0, 18.0, 15.0, 22.0, 25.0, 26.0, 25.0, 34.0, 30.0, 58.0, 43.0, 52.0, 56.0, 57.0, 41.0, 35.0, 40.0, 39.0, 33.0, 30.0, 39.0, 34.0, 31.0, 21.0, 18.0, 25.0, 22.0, 15.0, 9.0, 8.0, 12.0, 5.0, 8.0, 4.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7109375, -15.1717529296875, -14.632568359375, -14.0933837890625, -13.55419921875, -13.0150146484375, -12.475830078125, -11.9366455078125, -11.3974609375, -10.8582763671875, -10.319091796875, -9.7799072265625, -9.24072265625, -8.7015380859375, -8.162353515625, -7.6231689453125, -7.083984375, -6.5447998046875, -6.005615234375, -5.4664306640625, -4.92724609375, -4.3880615234375, -3.848876953125, -3.3096923828125, -2.7705078125, -2.2313232421875, -1.692138671875, -1.1529541015625, -0.61376953125, -0.0745849609375, 0.464599609375, 1.0037841796875, 1.54296875, 2.0821533203125, 2.621337890625, 3.1605224609375, 3.69970703125, 4.2388916015625, 4.778076171875, 5.3172607421875, 5.8564453125, 6.3956298828125, 6.934814453125, 7.4739990234375, 8.01318359375, 8.5523681640625, 9.091552734375, 9.6307373046875, 10.169921875, 10.7091064453125, 11.248291015625, 11.7874755859375, 12.32666015625, 12.8658447265625, 13.405029296875, 13.9442138671875, 14.4833984375, 15.0225830078125, 15.561767578125, 16.1009521484375, 16.64013671875, 17.1793212890625, 17.718505859375, 18.2576904296875, 18.796875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 5.0, 17.0, 19.0, 35.0, 43.0, 60.0, 78.0, 131.0, 211.0, 235.0, 401.0, 577.0, 762.0, 1144.0, 1702.0, 2490.0, 3921.0, 6220.0, 10670.0, 21423.0, 125635.0, 2499357.0, 1402652.0, 72797.0, 17484.0, 9533.0, 5612.0, 3583.0, 2280.0, 1575.0, 1058.0, 763.0, 498.0, 373.0, 291.0, 181.0, 124.0, 92.0, 79.0, 43.0, 29.0, 26.0, 24.0, 19.0, 5.0, 14.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.4375, -36.14208984375, -34.8466796875, -33.55126953125, -32.255859375, -30.96044921875, -29.6650390625, -28.36962890625, -27.07421875, -25.77880859375, -24.4833984375, -23.18798828125, -21.892578125, -20.59716796875, -19.3017578125, -18.00634765625, -16.7109375, -15.41552734375, -14.1201171875, -12.82470703125, -11.529296875, -10.23388671875, -8.9384765625, -7.64306640625, -6.34765625, -5.05224609375, -3.7568359375, -2.46142578125, -1.166015625, 0.12939453125, 1.4248046875, 2.72021484375, 4.015625, 5.31103515625, 6.6064453125, 7.90185546875, 9.197265625, 10.49267578125, 11.7880859375, 13.08349609375, 14.37890625, 15.67431640625, 16.9697265625, 18.26513671875, 19.560546875, 20.85595703125, 22.1513671875, 23.44677734375, 24.7421875, 26.03759765625, 27.3330078125, 28.62841796875, 29.923828125, 31.21923828125, 32.5146484375, 33.81005859375, 35.10546875, 36.40087890625, 37.6962890625, 38.99169921875, 40.287109375, 41.58251953125, 42.8779296875, 44.17333984375, 45.46875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 10.0, 13.0, 21.0, 25.0, 29.0, 30.0, 43.0, 109.0, 228.0, 451.0, 899.0, 1006.0, 576.0, 267.0, 124.0, 46.0, 41.0, 22.0, 17.0, 17.0, 10.0, 19.0, 10.0, 6.0, 5.0, 5.0, 1.0, 7.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-38.9375, -37.7978515625, -36.658203125, -35.5185546875, -34.37890625, -33.2392578125, -32.099609375, -30.9599609375, -29.8203125, -28.6806640625, -27.541015625, -26.4013671875, -25.26171875, -24.1220703125, -22.982421875, -21.8427734375, -20.703125, -19.5634765625, -18.423828125, -17.2841796875, -16.14453125, -15.0048828125, -13.865234375, -12.7255859375, -11.5859375, -10.4462890625, -9.306640625, -8.1669921875, -7.02734375, -5.8876953125, -4.748046875, -3.6083984375, -2.46875, -1.3291015625, -0.189453125, 0.9501953125, 2.08984375, 3.2294921875, 4.369140625, 5.5087890625, 6.6484375, 7.7880859375, 8.927734375, 10.0673828125, 11.20703125, 12.3466796875, 13.486328125, 14.6259765625, 15.765625, 16.9052734375, 18.044921875, 19.1845703125, 20.32421875, 21.4638671875, 22.603515625, 23.7431640625, 24.8828125, 26.0224609375, 27.162109375, 28.3017578125, 29.44140625, 30.5810546875, 31.720703125, 32.8603515625, 34.0]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 7.0, 8.0, 7.0, 8.0, 27.0, 30.0, 65.0, 83.0, 152.0, 287.0, 456.0, 891.0, 1724.0, 3470.0, 8036.0, 22015.0, 96617.0, 3747038.0, 260475.0, 32777.0, 10853.0, 4566.0, 2206.0, 1084.0, 621.0, 333.0, 163.0, 104.0, 62.0, 46.0, 21.0, 14.0, 7.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-76.5, -74.083984375, -71.66796875, -69.251953125, -66.8359375, -64.419921875, -62.00390625, -59.587890625, -57.171875, -54.755859375, -52.33984375, -49.923828125, -47.5078125, -45.091796875, -42.67578125, -40.259765625, -37.84375, -35.427734375, -33.01171875, -30.595703125, -28.1796875, -25.763671875, -23.34765625, -20.931640625, -18.515625, -16.099609375, -13.68359375, -11.267578125, -8.8515625, -6.435546875, -4.01953125, -1.603515625, 0.8125, 3.228515625, 5.64453125, 8.060546875, 10.4765625, 12.892578125, 15.30859375, 17.724609375, 20.140625, 22.556640625, 24.97265625, 27.388671875, 29.8046875, 32.220703125, 34.63671875, 37.052734375, 39.46875, 41.884765625, 44.30078125, 46.716796875, 49.1328125, 51.548828125, 53.96484375, 56.380859375, 58.796875, 61.212890625, 63.62890625, 66.044921875, 68.4609375, 70.876953125, 73.29296875, 75.708984375, 78.125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 50.0, 829.0, 127.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1635.44873046875, -1597.9898681640625, -1560.531005859375, -1523.072265625, -1485.6134033203125, -1448.154541015625, -1410.69580078125, -1373.2369384765625, -1335.778076171875, -1298.3192138671875, -1260.8603515625, -1223.401611328125, -1185.9427490234375, -1148.48388671875, -1111.025146484375, -1073.5662841796875, -1036.107421875, -998.6485595703125, -961.1897583007812, -923.73095703125, -886.2720947265625, -848.813232421875, -811.3544311523438, -773.8956298828125, -736.436767578125, -698.9779052734375, -661.5191040039062, -624.060302734375, -586.6014404296875, -549.142578125, -511.68377685546875, -474.2249450683594, -436.7659912109375, -399.3071594238281, -361.84832763671875, -324.3894958496094, -286.9306640625, -249.47183227539062, -212.01300048828125, -174.55416870117188, -137.0953369140625, -99.63650512695312, -62.17767333984375, -24.718841552734375, 12.739990234375, 50.198822021484375, 87.65765380859375, 125.11648559570312, 162.5753173828125, 200.03414916992188, 237.49298095703125, 274.9518127441406, 312.41064453125, 349.8694763183594, 387.32830810546875, 424.7871398925781, 462.2459716796875, 499.7048034667969, 537.1636352539062, 574.6224365234375, 612.081298828125, 649.5401611328125, 686.9989624023438, 724.457763671875, 761.9166259765625]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 6.0, 3.0, 1.0, 13.0, 15.0, 24.0, 11.0, 22.0, 20.0, 20.0, 23.0, 25.0, 28.0, 40.0, 34.0, 36.0, 45.0, 39.0, 50.0, 38.0, 44.0, 36.0, 42.0, 48.0, 31.0, 42.0, 24.0, 28.0, 37.0, 35.0, 20.0, 30.0, 20.0, 17.0, 14.0, 19.0, 10.0, 7.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.83078002929688, -72.99639129638672, -70.16200256347656, -67.32760620117188, -64.49321746826172, -61.65882873535156, -58.824440002441406, -55.99005126953125, -53.15565872192383, -50.32126998901367, -47.48687744140625, -44.652488708496094, -41.81809997558594, -38.983707427978516, -36.14931869506836, -33.31492614746094, -30.48053741455078, -27.646146774291992, -24.811756134033203, -21.977367401123047, -19.142976760864258, -16.30858612060547, -13.474197387695312, -10.639806747436523, -7.805416107177734, -4.9710259437561035, -2.1366357803344727, 0.69775390625, 3.532144546508789, 6.366535186767578, 9.200923919677734, 12.035314559936523, 14.869705200195312, 17.7040958404541, 20.53848648071289, 23.372875213623047, 26.207265853881836, 29.041656494140625, 31.87604522705078, 34.71043395996094, 37.54482650756836, 40.379215240478516, 43.21360778808594, 46.047996520996094, 48.88238525390625, 51.71677780151367, 54.55116653442383, 57.38555908203125, 60.219947814941406, 63.05433654785156, 65.88872528076172, 68.72311401367188, 71.55751037597656, 74.39189910888672, 77.22628784179688, 80.06067657470703, 82.89506530761719, 85.72945404052734, 88.5638427734375, 91.39823913574219, 94.23262786865234, 97.0670166015625, 99.90140533447266, 102.73579406738281, 105.5701904296875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 10.0, 4.0, 11.0, 6.0, 15.0, 21.0, 15.0, 26.0, 28.0, 38.0, 34.0, 36.0, 38.0, 41.0, 56.0, 47.0, 48.0, 41.0, 55.0, 37.0, 34.0, 37.0, 29.0, 29.0, 34.0, 31.0, 33.0, 20.0, 24.0, 25.0, 18.0, 17.0, 14.0, 9.0, 8.0, 4.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.0, -16.428955078125, -15.85791015625, -15.286865234375, -14.7158203125, -14.144775390625, -13.57373046875, -13.002685546875, -12.431640625, -11.860595703125, -11.28955078125, -10.718505859375, -10.1474609375, -9.576416015625, -9.00537109375, -8.434326171875, -7.86328125, -7.292236328125, -6.72119140625, -6.150146484375, -5.5791015625, -5.008056640625, -4.43701171875, -3.865966796875, -3.294921875, -2.723876953125, -2.15283203125, -1.581787109375, -1.0107421875, -0.439697265625, 0.13134765625, 0.702392578125, 1.2734375, 1.844482421875, 2.41552734375, 2.986572265625, 3.5576171875, 4.128662109375, 4.69970703125, 5.270751953125, 5.841796875, 6.412841796875, 6.98388671875, 7.554931640625, 8.1259765625, 8.697021484375, 9.26806640625, 9.839111328125, 10.41015625, 10.981201171875, 11.55224609375, 12.123291015625, 12.6943359375, 13.265380859375, 13.83642578125, 14.407470703125, 14.978515625, 15.549560546875, 16.12060546875, 16.691650390625, 17.2626953125, 17.833740234375, 18.40478515625, 18.975830078125, 19.546875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 15.0, 18.0, 46.0, 48.0, 71.0, 124.0, 168.0, 230.0, 381.0, 638.0, 940.0, 1517.0, 2458.0, 4013.0, 6551.0, 10620.0, 18128.0, 30339.0, 52715.0, 94724.0, 175377.0, 249634.0, 175765.0, 95123.0, 52520.0, 30402.0, 18007.0, 10777.0, 6476.0, 3963.0, 2450.0, 1579.0, 988.0, 605.0, 415.0, 219.0, 171.0, 93.0, 70.0, 43.0, 45.0, 32.0, 17.0, 13.0, 8.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-1.732421875, -1.6807098388671875, -1.628997802734375, -1.5772857666015625, -1.52557373046875, -1.4738616943359375, -1.422149658203125, -1.3704376220703125, -1.3187255859375, -1.2670135498046875, -1.215301513671875, -1.1635894775390625, -1.11187744140625, -1.0601654052734375, -1.008453369140625, -0.9567413330078125, -0.905029296875, -0.8533172607421875, -0.801605224609375, -0.7498931884765625, -0.69818115234375, -0.6464691162109375, -0.594757080078125, -0.5430450439453125, -0.4913330078125, -0.4396209716796875, -0.387908935546875, -0.3361968994140625, -0.28448486328125, -0.2327728271484375, -0.181060791015625, -0.1293487548828125, -0.07763671875, -0.0259246826171875, 0.025787353515625, 0.0774993896484375, 0.12921142578125, 0.1809234619140625, 0.232635498046875, 0.2843475341796875, 0.3360595703125, 0.3877716064453125, 0.439483642578125, 0.4911956787109375, 0.54290771484375, 0.5946197509765625, 0.646331787109375, 0.6980438232421875, 0.749755859375, 0.8014678955078125, 0.853179931640625, 0.9048919677734375, 0.95660400390625, 1.0083160400390625, 1.060028076171875, 1.1117401123046875, 1.1634521484375, 1.2151641845703125, 1.266876220703125, 1.3185882568359375, 1.37030029296875, 1.4220123291015625, 1.473724365234375, 1.5254364013671875, 1.5771484375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 2.0, 11.0, 11.0, 8.0, 10.0, 8.0, 16.0, 14.0, 19.0, 13.0, 23.0, 18.0, 21.0, 20.0, 29.0, 32.0, 26.0, 38.0, 35.0, 38.0, 44.0, 39.0, 1053.0, 42.0, 48.0, 35.0, 28.0, 31.0, 34.0, 31.0, 27.0, 24.0, 24.0, 23.0, 15.0, 18.0, 12.0, 6.0, 18.0, 22.0, 18.0, 9.0, 7.0, 6.0, 8.0, 1.0, 2.0, 1.0, 4.0], "bins": [-11.2734375, -10.9713134765625, -10.669189453125, -10.3670654296875, -10.06494140625, -9.7628173828125, -9.460693359375, -9.1585693359375, -8.8564453125, -8.5543212890625, -8.252197265625, -7.9500732421875, -7.64794921875, -7.3458251953125, -7.043701171875, -6.7415771484375, -6.439453125, -6.1373291015625, -5.835205078125, -5.5330810546875, -5.23095703125, -4.9288330078125, -4.626708984375, -4.3245849609375, -4.0224609375, -3.7203369140625, -3.418212890625, -3.1160888671875, -2.81396484375, -2.5118408203125, -2.209716796875, -1.9075927734375, -1.60546875, -1.3033447265625, -1.001220703125, -0.6990966796875, -0.39697265625, -0.0948486328125, 0.207275390625, 0.5093994140625, 0.8115234375, 1.1136474609375, 1.415771484375, 1.7178955078125, 2.02001953125, 2.3221435546875, 2.624267578125, 2.9263916015625, 3.228515625, 3.5306396484375, 3.832763671875, 4.1348876953125, 4.43701171875, 4.7391357421875, 5.041259765625, 5.3433837890625, 5.6455078125, 5.9476318359375, 6.249755859375, 6.5518798828125, 6.85400390625, 7.1561279296875, 7.458251953125, 7.7603759765625, 8.0625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 13.0, 27.0, 27.0, 34.0, 54.0, 81.0, 141.0, 220.0, 343.0, 522.0, 837.0, 1266.0, 1989.0, 3107.0, 4716.0, 7361.0, 11002.0, 16892.0, 26878.0, 43223.0, 72961.0, 125473.0, 556828.0, 901353.0, 127222.0, 74001.0, 44220.0, 27248.0, 17078.0, 11029.0, 7285.0, 4732.0, 3177.0, 2074.0, 1339.0, 846.0, 586.0, 334.0, 215.0, 145.0, 72.0, 57.0, 37.0, 35.0, 14.0, 13.0, 9.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.0029296875, -0.9716033935546875, -0.940277099609375, -0.9089508056640625, -0.87762451171875, -0.8462982177734375, -0.814971923828125, -0.7836456298828125, -0.7523193359375, -0.7209930419921875, -0.689666748046875, -0.6583404541015625, -0.62701416015625, -0.5956878662109375, -0.564361572265625, -0.5330352783203125, -0.501708984375, -0.4703826904296875, -0.439056396484375, -0.4077301025390625, -0.37640380859375, -0.3450775146484375, -0.313751220703125, -0.2824249267578125, -0.2510986328125, -0.2197723388671875, -0.188446044921875, -0.1571197509765625, -0.12579345703125, -0.0944671630859375, -0.063140869140625, -0.0318145751953125, -0.00048828125, 0.0308380126953125, 0.062164306640625, 0.0934906005859375, 0.12481689453125, 0.1561431884765625, 0.187469482421875, 0.2187957763671875, 0.2501220703125, 0.2814483642578125, 0.312774658203125, 0.3441009521484375, 0.37542724609375, 0.4067535400390625, 0.438079833984375, 0.4694061279296875, 0.500732421875, 0.5320587158203125, 0.563385009765625, 0.5947113037109375, 0.62603759765625, 0.6573638916015625, 0.688690185546875, 0.7200164794921875, 0.7513427734375, 0.7826690673828125, 0.813995361328125, 0.8453216552734375, 0.87664794921875, 0.9079742431640625, 0.939300537109375, 0.9706268310546875, 1.001953125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 7.0, 5.0, 7.0, 8.0, 18.0, 20.0, 19.0, 26.0, 32.0, 30.0, 40.0, 55.0, 66.0, 95.0, 104.0, 121.0, 81.0, 52.0, 35.0, 35.0, 33.0, 26.0, 20.0, 15.0, 8.0, 9.0, 8.0, 5.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04522705078125, -0.043990135192871094, -0.04275321960449219, -0.04151630401611328, -0.040279388427734375, -0.03904247283935547, -0.03780555725097656, -0.036568641662597656, -0.03533172607421875, -0.034094810485839844, -0.03285789489746094, -0.03162097930908203, -0.030384063720703125, -0.02914714813232422, -0.027910232543945312, -0.026673316955566406, -0.0254364013671875, -0.024199485778808594, -0.022962570190429688, -0.02172565460205078, -0.020488739013671875, -0.01925182342529297, -0.018014907836914062, -0.016777992248535156, -0.01554107666015625, -0.014304161071777344, -0.013067245483398438, -0.011830329895019531, -0.010593414306640625, -0.009356498718261719, -0.008119583129882812, -0.006882667541503906, -0.005645751953125, -0.004408836364746094, -0.0031719207763671875, -0.0019350051879882812, -0.000698089599609375, 0.0005388259887695312, 0.0017757415771484375, 0.0030126571655273438, 0.00424957275390625, 0.005486488342285156, 0.0067234039306640625, 0.007960319519042969, 0.009197235107421875, 0.010434150695800781, 0.011671066284179688, 0.012907981872558594, 0.0141448974609375, 0.015381813049316406, 0.016618728637695312, 0.01785564422607422, 0.019092559814453125, 0.02032947540283203, 0.021566390991210938, 0.022803306579589844, 0.02404022216796875, 0.025277137756347656, 0.026514053344726562, 0.02775096893310547, 0.028987884521484375, 0.03022480010986328, 0.03146171569824219, 0.032698631286621094, 0.033935546875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 11.0, 11.0, 9.0, 13.0, 15.0, 12.0, 25.0, 30.0, 39.0, 72.0, 97.0, 132.0, 274.0, 647.0, 9911.0, 1032676.0, 3327.0, 549.0, 221.0, 127.0, 90.0, 68.0, 47.0, 41.0, 28.0, 22.0, 14.0, 9.0, 6.0, 5.0, 7.0, 6.0, 3.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.697265625, -0.67181396484375, -0.6463623046875, -0.62091064453125, -0.595458984375, -0.57000732421875, -0.5445556640625, -0.51910400390625, -0.49365234375, -0.46820068359375, -0.4427490234375, -0.41729736328125, -0.391845703125, -0.36639404296875, -0.3409423828125, -0.31549072265625, -0.2900390625, -0.26458740234375, -0.2391357421875, -0.21368408203125, -0.188232421875, -0.16278076171875, -0.1373291015625, -0.11187744140625, -0.08642578125, -0.06097412109375, -0.0355224609375, -0.01007080078125, 0.015380859375, 0.04083251953125, 0.0662841796875, 0.09173583984375, 0.1171875, 0.14263916015625, 0.1680908203125, 0.19354248046875, 0.218994140625, 0.24444580078125, 0.2698974609375, 0.29534912109375, 0.32080078125, 0.34625244140625, 0.3717041015625, 0.39715576171875, 0.422607421875, 0.44805908203125, 0.4735107421875, 0.49896240234375, 0.5244140625, 0.54986572265625, 0.5753173828125, 0.60076904296875, 0.626220703125, 0.65167236328125, 0.6771240234375, 0.70257568359375, 0.72802734375, 0.75347900390625, 0.7789306640625, 0.80438232421875, 0.829833984375, 0.85528564453125, 0.8807373046875, 0.90618896484375, 0.931640625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 27.0, 919.0, 65.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15368282794952393, -0.1356232464313507, -0.11756366491317749, -0.09950407594442368, -0.08144449442625046, -0.06338491290807724, -0.045325323939323425, -0.027265742421150208, -0.00920616090297699, 0.008853422477841377, 0.026913005858659744, 0.04497259110212326, 0.06303217262029648, 0.0810917541384697, 0.09915134310722351, 0.11721092462539673, 0.13527050614356995, 0.15333008766174316, 0.17138966917991638, 0.1894492506980896, 0.20750883221626282, 0.22556841373443604, 0.24362801015377045, 0.26168757677078247, 0.2797471880912781, 0.2978067696094513, 0.3158663511276245, 0.33392593264579773, 0.35198551416397095, 0.37004509568214417, 0.3881046772003174, 0.406164288520813, 0.4242238402366638, 0.44228342175483704, 0.46034300327301025, 0.47840258479118347, 0.4964621663093567, 0.5145217776298523, 0.5325813293457031, 0.5506409406661987, 0.5687004923820496, 0.5867601037025452, 0.604819655418396, 0.6228792667388916, 0.6409388184547424, 0.658998429775238, 0.6770579814910889, 0.6951175928115845, 0.7131772041320801, 0.7312368154525757, 0.7492963671684265, 0.7673559784889221, 0.785415530204773, 0.8034751415252686, 0.8215346932411194, 0.839594304561615, 0.8576538562774658, 0.8757134675979614, 0.8937730193138123, 0.9118326306343079, 0.9298921823501587, 0.9479517936706543, 0.9660113453865051, 0.9840709567070007, 1.0021305084228516]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 11.0, 10.0, 16.0, 13.0, 15.0, 15.0, 23.0, 23.0, 22.0, 45.0, 37.0, 34.0, 40.0, 37.0, 46.0, 49.0, 45.0, 45.0, 46.0, 51.0, 30.0, 40.0, 31.0, 52.0, 31.0, 31.0, 29.0, 25.0, 22.0, 18.0, 15.0, 16.0, 9.0, 10.0, 5.0, 3.0, 3.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05918377637863159, -0.05743154510855675, -0.0556793138384819, -0.05392708256840706, -0.052174851298332214, -0.05042262002825737, -0.048670388758182526, -0.04691815748810768, -0.04516592621803284, -0.04341369494795799, -0.04166146367788315, -0.039909232407808304, -0.03815700113773346, -0.036404769867658615, -0.03465253859758377, -0.032900307327508926, -0.031148076057434082, -0.029395844787359238, -0.027643613517284393, -0.02589138224720955, -0.024139150977134705, -0.02238691970705986, -0.020634688436985016, -0.01888245716691017, -0.017130225896835327, -0.015377994626760483, -0.013625763356685638, -0.011873532086610794, -0.01012130081653595, -0.008369069546461105, -0.006616838276386261, -0.004864607006311417, -0.0031123757362365723, -0.001360144466161728, 0.00039208680391311646, 0.002144318073987961, 0.003896549344062805, 0.0056487806141376495, 0.007401011884212494, 0.009153243154287338, 0.010905474424362183, 0.012657705694437027, 0.014409936964511871, 0.016162168234586716, 0.01791439950466156, 0.019666630774736404, 0.02141886204481125, 0.023171093314886093, 0.024923324584960938, 0.026675555855035782, 0.028427787125110626, 0.03018001839518547, 0.031932249665260315, 0.03368448093533516, 0.035436712205410004, 0.03718894347548485, 0.03894117474555969, 0.04069340601563454, 0.04244563728570938, 0.044197868555784225, 0.04595009982585907, 0.047702331095933914, 0.04945456236600876, 0.0512067936360836, 0.05295902490615845]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 10.0, 4.0, 11.0, 6.0, 15.0, 21.0, 16.0, 25.0, 28.0, 38.0, 34.0, 36.0, 39.0, 41.0, 56.0, 46.0, 48.0, 40.0, 56.0, 37.0, 35.0, 36.0, 29.0, 30.0, 33.0, 31.0, 33.0, 20.0, 24.0, 25.0, 18.0, 17.0, 14.0, 9.0, 8.0, 4.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.0, -16.428955078125, -15.85791015625, -15.286865234375, -14.7158203125, -14.144775390625, -13.57373046875, -13.002685546875, -12.431640625, -11.860595703125, -11.28955078125, -10.718505859375, -10.1474609375, -9.576416015625, -9.00537109375, -8.434326171875, -7.86328125, -7.292236328125, -6.72119140625, -6.150146484375, -5.5791015625, -5.008056640625, -4.43701171875, -3.865966796875, -3.294921875, -2.723876953125, -2.15283203125, -1.581787109375, -1.0107421875, -0.439697265625, 0.13134765625, 0.702392578125, 1.2734375, 1.844482421875, 2.41552734375, 2.986572265625, 3.5576171875, 4.128662109375, 4.69970703125, 5.270751953125, 5.841796875, 6.412841796875, 6.98388671875, 7.554931640625, 8.1259765625, 8.697021484375, 9.26806640625, 9.839111328125, 10.41015625, 10.981201171875, 11.55224609375, 12.123291015625, 12.6943359375, 13.265380859375, 13.83642578125, 14.407470703125, 14.978515625, 15.549560546875, 16.12060546875, 16.691650390625, 17.2626953125, 17.833740234375, 18.40478515625, 18.975830078125, 19.546875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 11.0, 11.0, 15.0, 32.0, 35.0, 44.0, 70.0, 62.0, 95.0, 148.0, 251.0, 395.0, 589.0, 953.0, 1624.0, 2853.0, 5709.0, 14598.0, 69026.0, 634492.0, 264938.0, 33080.0, 9590.0, 4166.0, 2164.0, 1310.0, 762.0, 508.0, 284.0, 204.0, 140.0, 113.0, 72.0, 69.0, 35.0, 23.0, 20.0, 17.0, 9.0, 10.0, 10.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.375, -22.563232421875, -21.75146484375, -20.939697265625, -20.1279296875, -19.316162109375, -18.50439453125, -17.692626953125, -16.880859375, -16.069091796875, -15.25732421875, -14.445556640625, -13.6337890625, -12.822021484375, -12.01025390625, -11.198486328125, -10.38671875, -9.574951171875, -8.76318359375, -7.951416015625, -7.1396484375, -6.327880859375, -5.51611328125, -4.704345703125, -3.892578125, -3.080810546875, -2.26904296875, -1.457275390625, -0.6455078125, 0.166259765625, 0.97802734375, 1.789794921875, 2.6015625, 3.413330078125, 4.22509765625, 5.036865234375, 5.8486328125, 6.660400390625, 7.47216796875, 8.283935546875, 9.095703125, 9.907470703125, 10.71923828125, 11.531005859375, 12.3427734375, 13.154541015625, 13.96630859375, 14.778076171875, 15.58984375, 16.401611328125, 17.21337890625, 18.025146484375, 18.8369140625, 19.648681640625, 20.46044921875, 21.272216796875, 22.083984375, 22.895751953125, 23.70751953125, 24.519287109375, 25.3310546875, 26.142822265625, 26.95458984375, 27.766357421875, 28.578125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 9.0, 10.0, 14.0, 13.0, 8.0, 16.0, 20.0, 25.0, 26.0, 18.0, 26.0, 44.0, 38.0, 41.0, 66.0, 70.0, 174.0, 1665.0, 231.0, 94.0, 62.0, 54.0, 36.0, 52.0, 37.0, 37.0, 28.0, 24.0, 24.0, 15.0, 17.0, 9.0, 11.0, 6.0, 3.0, 4.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-43.625, -42.24560546875, -40.8662109375, -39.48681640625, -38.107421875, -36.72802734375, -35.3486328125, -33.96923828125, -32.58984375, -31.21044921875, -29.8310546875, -28.45166015625, -27.072265625, -25.69287109375, -24.3134765625, -22.93408203125, -21.5546875, -20.17529296875, -18.7958984375, -17.41650390625, -16.037109375, -14.65771484375, -13.2783203125, -11.89892578125, -10.51953125, -9.14013671875, -7.7607421875, -6.38134765625, -5.001953125, -3.62255859375, -2.2431640625, -0.86376953125, 0.515625, 1.89501953125, 3.2744140625, 4.65380859375, 6.033203125, 7.41259765625, 8.7919921875, 10.17138671875, 11.55078125, 12.93017578125, 14.3095703125, 15.68896484375, 17.068359375, 18.44775390625, 19.8271484375, 21.20654296875, 22.5859375, 23.96533203125, 25.3447265625, 26.72412109375, 28.103515625, 29.48291015625, 30.8623046875, 32.24169921875, 33.62109375, 35.00048828125, 36.3798828125, 37.75927734375, 39.138671875, 40.51806640625, 41.8974609375, 43.27685546875, 44.65625]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 6.0, 9.0, 17.0, 13.0, 20.0, 32.0, 51.0, 85.0, 114.0, 191.0, 334.0, 873.0, 4387.0, 146614.0, 2975866.0, 14228.0, 1722.0, 467.0, 222.0, 141.0, 95.0, 61.0, 53.0, 34.0, 22.0, 17.0, 11.0, 6.0, 2.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.625, -66.1943359375, -63.763671875, -61.3330078125, -58.90234375, -56.4716796875, -54.041015625, -51.6103515625, -49.1796875, -46.7490234375, -44.318359375, -41.8876953125, -39.45703125, -37.0263671875, -34.595703125, -32.1650390625, -29.734375, -27.3037109375, -24.873046875, -22.4423828125, -20.01171875, -17.5810546875, -15.150390625, -12.7197265625, -10.2890625, -7.8583984375, -5.427734375, -2.9970703125, -0.56640625, 1.8642578125, 4.294921875, 6.7255859375, 9.15625, 11.5869140625, 14.017578125, 16.4482421875, 18.87890625, 21.3095703125, 23.740234375, 26.1708984375, 28.6015625, 31.0322265625, 33.462890625, 35.8935546875, 38.32421875, 40.7548828125, 43.185546875, 45.6162109375, 48.046875, 50.4775390625, 52.908203125, 55.3388671875, 57.76953125, 60.2001953125, 62.630859375, 65.0615234375, 67.4921875, 69.9228515625, 72.353515625, 74.7841796875, 77.21484375, 79.6455078125, 82.076171875, 84.5068359375, 86.9375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 338.0, 677.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.522544860839844, -45.73832702636719, -30.95410919189453, -16.169891357421875, -1.3856735229492188, 13.398544311523438, 28.182762145996094, 42.96697998046875, 57.751197814941406, 72.53541564941406, 87.31963348388672, 102.10385131835938, 116.88806915283203, 131.6722869873047, 146.45651245117188, 161.24072265625, 176.02493286132812, 190.80914306640625, 205.59336853027344, 220.37759399414062, 235.16180419921875, 249.94601440429688, 264.730224609375, 279.51446533203125, 294.2986755371094, 309.0828857421875, 323.86712646484375, 338.6513366699219, 353.435546875, 368.2197570800781, 383.00396728515625, 397.7882080078125, 412.57244873046875, 427.3566589355469, 442.140869140625, 456.92510986328125, 471.7093200683594, 486.4935302734375, 501.27777099609375, 516.0619506835938, 530.84619140625, 545.6304321289062, 560.4146118164062, 575.1988525390625, 589.9830322265625, 604.7672729492188, 619.551513671875, 634.335693359375, 649.1199340820312, 663.9041748046875, 678.6883544921875, 693.4725952148438, 708.2568359375, 723.041015625, 737.8252563476562, 752.6094360351562, 767.3936767578125, 782.1779174804688, 796.9620971679688, 811.746337890625, 826.530517578125, 841.3147583007812, 856.0989990234375, 870.8831787109375, 885.6674194335938]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 12.0, 5.0, 11.0, 15.0, 12.0, 26.0, 21.0, 17.0, 31.0, 31.0, 35.0, 31.0, 41.0, 37.0, 44.0, 41.0, 32.0, 43.0, 53.0, 43.0, 43.0, 35.0, 29.0, 34.0, 33.0, 38.0, 24.0, 32.0, 23.0, 20.0, 22.0, 14.0, 12.0, 11.0, 7.0, 6.0, 8.0, 5.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-98.87551879882812, -96.03118133544922, -93.18684387207031, -90.34249877929688, -87.49816131591797, -84.65382385253906, -81.80948638916016, -78.96514892578125, -76.12080383300781, -73.2764663696289, -70.43212890625, -67.58778381347656, -64.74344635009766, -61.89910888671875, -59.054771423339844, -56.21043395996094, -53.36609649658203, -50.521759033203125, -47.67741775512695, -44.83308029174805, -41.988739013671875, -39.14440155029297, -36.30006408691406, -33.455726623535156, -30.611385345458984, -27.767045974731445, -24.922706604003906, -22.078369140625, -19.23402976989746, -16.389690399169922, -13.545352935791016, -10.701013565063477, -7.8566741943359375, -5.012335300445557, -2.167996406555176, 0.6763420104980469, 3.520681381225586, 6.365020751953125, 9.209358215332031, 12.05369758605957, 14.89803695678711, 17.74237632751465, 20.586715698242188, 23.431053161621094, 26.275392532348633, 29.119731903076172, 31.964069366455078, 34.80841064453125, 37.652748107910156, 40.49708557128906, 43.341426849365234, 46.18576431274414, 49.03010559082031, 51.87444305419922, 54.718780517578125, 57.56311798095703, 60.4074592590332, 63.25179672241211, 66.09613800048828, 68.94047546386719, 71.7848129272461, 74.629150390625, 77.47349548339844, 80.31783294677734, 83.16217041015625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 11.0, 2.0, 12.0, 8.0, 14.0, 16.0, 14.0, 17.0, 22.0, 40.0, 28.0, 37.0, 30.0, 41.0, 48.0, 39.0, 42.0, 49.0, 34.0, 47.0, 36.0, 49.0, 41.0, 38.0, 21.0, 41.0, 32.0, 15.0, 33.0, 22.0, 19.0, 15.0, 19.0, 15.0, 12.0, 8.0, 10.0, 7.0, 2.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.5, -15.9482421875, -15.396484375, -14.8447265625, -14.29296875, -13.7412109375, -13.189453125, -12.6376953125, -12.0859375, -11.5341796875, -10.982421875, -10.4306640625, -9.87890625, -9.3271484375, -8.775390625, -8.2236328125, -7.671875, -7.1201171875, -6.568359375, -6.0166015625, -5.46484375, -4.9130859375, -4.361328125, -3.8095703125, -3.2578125, -2.7060546875, -2.154296875, -1.6025390625, -1.05078125, -0.4990234375, 0.052734375, 0.6044921875, 1.15625, 1.7080078125, 2.259765625, 2.8115234375, 3.36328125, 3.9150390625, 4.466796875, 5.0185546875, 5.5703125, 6.1220703125, 6.673828125, 7.2255859375, 7.77734375, 8.3291015625, 8.880859375, 9.4326171875, 9.984375, 10.5361328125, 11.087890625, 11.6396484375, 12.19140625, 12.7431640625, 13.294921875, 13.8466796875, 14.3984375, 14.9501953125, 15.501953125, 16.0537109375, 16.60546875, 17.1572265625, 17.708984375, 18.2607421875, 18.8125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 9.0, 8.0, 7.0, 18.0, 21.0, 45.0, 44.0, 73.0, 105.0, 160.0, 209.0, 356.0, 469.0, 679.0, 1018.0, 1522.0, 2263.0, 3494.0, 6048.0, 12584.0, 60364.0, 1718130.0, 2284184.0, 72465.0, 12715.0, 6125.0, 3715.0, 2447.0, 1598.0, 1102.0, 729.0, 497.0, 337.0, 221.0, 157.0, 103.0, 73.0, 59.0, 39.0, 21.0, 23.0, 14.0, 10.0, 11.0, 3.0, 0.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-43.75, -42.29345703125, -40.8369140625, -39.38037109375, -37.923828125, -36.46728515625, -35.0107421875, -33.55419921875, -32.09765625, -30.64111328125, -29.1845703125, -27.72802734375, -26.271484375, -24.81494140625, -23.3583984375, -21.90185546875, -20.4453125, -18.98876953125, -17.5322265625, -16.07568359375, -14.619140625, -13.16259765625, -11.7060546875, -10.24951171875, -8.79296875, -7.33642578125, -5.8798828125, -4.42333984375, -2.966796875, -1.51025390625, -0.0537109375, 1.40283203125, 2.859375, 4.31591796875, 5.7724609375, 7.22900390625, 8.685546875, 10.14208984375, 11.5986328125, 13.05517578125, 14.51171875, 15.96826171875, 17.4248046875, 18.88134765625, 20.337890625, 21.79443359375, 23.2509765625, 24.70751953125, 26.1640625, 27.62060546875, 29.0771484375, 30.53369140625, 31.990234375, 33.44677734375, 34.9033203125, 36.35986328125, 37.81640625, 39.27294921875, 40.7294921875, 42.18603515625, 43.642578125, 45.09912109375, 46.5556640625, 48.01220703125, 49.46875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 13.0, 9.0, 13.0, 24.0, 24.0, 48.0, 77.0, 140.0, 330.0, 861.0, 1323.0, 645.0, 272.0, 98.0, 49.0, 38.0, 26.0, 13.0, 16.0, 9.0, 10.0, 4.0, 4.0, 6.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.15625, -35.8896484375, -34.623046875, -33.3564453125, -32.08984375, -30.8232421875, -29.556640625, -28.2900390625, -27.0234375, -25.7568359375, -24.490234375, -23.2236328125, -21.95703125, -20.6904296875, -19.423828125, -18.1572265625, -16.890625, -15.6240234375, -14.357421875, -13.0908203125, -11.82421875, -10.5576171875, -9.291015625, -8.0244140625, -6.7578125, -5.4912109375, -4.224609375, -2.9580078125, -1.69140625, -0.4248046875, 0.841796875, 2.1083984375, 3.375, 4.6416015625, 5.908203125, 7.1748046875, 8.44140625, 9.7080078125, 10.974609375, 12.2412109375, 13.5078125, 14.7744140625, 16.041015625, 17.3076171875, 18.57421875, 19.8408203125, 21.107421875, 22.3740234375, 23.640625, 24.9072265625, 26.173828125, 27.4404296875, 28.70703125, 29.9736328125, 31.240234375, 32.5068359375, 33.7734375, 35.0400390625, 36.306640625, 37.5732421875, 38.83984375, 40.1064453125, 41.373046875, 42.6396484375, 43.90625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 9.0, 7.0, 14.0, 24.0, 27.0, 33.0, 53.0, 58.0, 95.0, 143.0, 209.0, 319.0, 506.0, 823.0, 1411.0, 2520.0, 4824.0, 9421.0, 21489.0, 66133.0, 1215697.0, 2733632.0, 88540.0, 25078.0, 10891.0, 5312.0, 2731.0, 1638.0, 935.0, 594.0, 388.0, 223.0, 150.0, 106.0, 62.0, 46.0, 40.0, 32.0, 18.0, 12.0, 13.0, 9.0, 8.0, 5.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0], "bins": [-54.34375, -52.794921875, -51.24609375, -49.697265625, -48.1484375, -46.599609375, -45.05078125, -43.501953125, -41.953125, -40.404296875, -38.85546875, -37.306640625, -35.7578125, -34.208984375, -32.66015625, -31.111328125, -29.5625, -28.013671875, -26.46484375, -24.916015625, -23.3671875, -21.818359375, -20.26953125, -18.720703125, -17.171875, -15.623046875, -14.07421875, -12.525390625, -10.9765625, -9.427734375, -7.87890625, -6.330078125, -4.78125, -3.232421875, -1.68359375, -0.134765625, 1.4140625, 2.962890625, 4.51171875, 6.060546875, 7.609375, 9.158203125, 10.70703125, 12.255859375, 13.8046875, 15.353515625, 16.90234375, 18.451171875, 20.0, 21.548828125, 23.09765625, 24.646484375, 26.1953125, 27.744140625, 29.29296875, 30.841796875, 32.390625, 33.939453125, 35.48828125, 37.037109375, 38.5859375, 40.134765625, 41.68359375, 43.232421875, 44.78125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 16.0, 32.0, 65.0, 162.0, 302.0, 212.0, 106.0, 45.0, 21.0, 17.0, 8.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-308.9152526855469, -302.4376525878906, -295.9600830078125, -289.48248291015625, -283.0048828125, -276.52728271484375, -270.0497131347656, -263.5721130371094, -257.0945129394531, -250.61692810058594, -244.1393280029297, -237.6617431640625, -231.18414306640625, -224.70655822753906, -218.2289581298828, -211.75137329101562, -205.27377319335938, -198.7961883544922, -192.31858825683594, -185.84100341796875, -179.3634033203125, -172.8858184814453, -166.40821838378906, -159.93063354492188, -153.4530487060547, -146.9754638671875, -140.49786376953125, -134.02027893066406, -127.54267883300781, -121.06509399414062, -114.58749389648438, -108.10990905761719, -101.63230895996094, -95.15471649169922, -88.6771240234375, -82.19953155517578, -75.72193908691406, -69.24435424804688, -62.76675796508789, -56.28916549682617, -49.81157302856445, -43.333980560302734, -36.856388092041016, -30.37879753112793, -23.90120506286621, -17.423614501953125, -10.946022033691406, -4.4684295654296875, 2.0091629028320312, 8.48675537109375, 14.964346885681152, 21.441938400268555, 27.919530868530273, 34.39712142944336, 40.87471389770508, 47.3523063659668, 53.829898834228516, 60.307491302490234, 66.78507995605469, 73.2626724243164, 79.74026489257812, 86.21785736083984, 92.69544982910156, 99.17304229736328, 105.650634765625]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 7.0, 9.0, 10.0, 12.0, 6.0, 19.0, 22.0, 18.0, 26.0, 37.0, 17.0, 38.0, 36.0, 28.0, 39.0, 46.0, 41.0, 47.0, 44.0, 46.0, 40.0, 53.0, 36.0, 42.0, 44.0, 35.0, 24.0, 17.0, 33.0, 26.0, 14.0, 11.0, 15.0, 10.0, 11.0, 11.0, 5.0, 2.0, 4.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-86.68189239501953, -84.02593994140625, -81.36998748779297, -78.71403503417969, -76.05807495117188, -73.4021224975586, -70.74617004394531, -68.09021759033203, -65.43426513671875, -62.77831268310547, -60.12236022949219, -57.46640396118164, -54.81045150756836, -52.15449905395508, -49.49854278564453, -46.84259033203125, -44.18663787841797, -41.53068542480469, -38.874732971191406, -36.21877670288086, -33.56282424926758, -30.906871795654297, -28.250917434692383, -25.59496307373047, -22.939010620117188, -20.283058166503906, -17.627103805541992, -14.971150398254395, -12.315196990966797, -9.6592435836792, -7.003290176391602, -4.3473358154296875, -1.6913909912109375, 0.9645624160766602, 3.620515823364258, 6.2764692306518555, 8.932422637939453, 11.58837604522705, 14.244329452514648, 16.900283813476562, 19.556236267089844, 22.212188720703125, 24.86814308166504, 27.524097442626953, 30.180049896240234, 32.836002349853516, 35.49195861816406, 38.147911071777344, 40.803863525390625, 43.459815979003906, 46.11576843261719, 48.771724700927734, 51.427677154541016, 54.0836296081543, 56.739585876464844, 59.395538330078125, 62.051490783691406, 64.70744323730469, 67.36339569091797, 70.01934814453125, 72.67530822753906, 75.33126068115234, 77.98721313476562, 80.6431655883789, 83.29911804199219]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 3.0, 4.0, 7.0, 6.0, 13.0, 17.0, 27.0, 16.0, 17.0, 27.0, 20.0, 30.0, 41.0, 51.0, 39.0, 36.0, 48.0, 48.0, 50.0, 42.0, 52.0, 46.0, 41.0, 45.0, 37.0, 41.0, 22.0, 29.0, 20.0, 31.0, 15.0, 20.0, 12.0, 15.0, 8.0, 11.0, 4.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-19.390625, -18.769287109375, -18.14794921875, -17.526611328125, -16.9052734375, -16.283935546875, -15.66259765625, -15.041259765625, -14.419921875, -13.798583984375, -13.17724609375, -12.555908203125, -11.9345703125, -11.313232421875, -10.69189453125, -10.070556640625, -9.44921875, -8.827880859375, -8.20654296875, -7.585205078125, -6.9638671875, -6.342529296875, -5.72119140625, -5.099853515625, -4.478515625, -3.857177734375, -3.23583984375, -2.614501953125, -1.9931640625, -1.371826171875, -0.75048828125, -0.129150390625, 0.4921875, 1.113525390625, 1.73486328125, 2.356201171875, 2.9775390625, 3.598876953125, 4.22021484375, 4.841552734375, 5.462890625, 6.084228515625, 6.70556640625, 7.326904296875, 7.9482421875, 8.569580078125, 9.19091796875, 9.812255859375, 10.43359375, 11.054931640625, 11.67626953125, 12.297607421875, 12.9189453125, 13.540283203125, 14.16162109375, 14.782958984375, 15.404296875, 16.025634765625, 16.64697265625, 17.268310546875, 17.8896484375, 18.510986328125, 19.13232421875, 19.753662109375, 20.375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 19.0, 24.0, 25.0, 32.0, 38.0, 60.0, 92.0, 128.0, 196.0, 286.0, 425.0, 646.0, 943.0, 1330.0, 1939.0, 2709.0, 4142.0, 6207.0, 9335.0, 14084.0, 22013.0, 34039.0, 55144.0, 93451.0, 157620.0, 215941.0, 166140.0, 98965.0, 58707.0, 36181.0, 23097.0, 14780.0, 9719.0, 6398.0, 4306.0, 2956.0, 2022.0, 1400.0, 965.0, 631.0, 408.0, 320.0, 227.0, 153.0, 109.0, 61.0, 41.0, 35.0, 16.0, 11.0, 12.0, 11.0, 5.0, 7.0, 6.0], "bins": [-1.5771484375, -1.5315093994140625, -1.485870361328125, -1.4402313232421875, -1.39459228515625, -1.3489532470703125, -1.303314208984375, -1.2576751708984375, -1.2120361328125, -1.1663970947265625, -1.120758056640625, -1.0751190185546875, -1.02947998046875, -0.9838409423828125, -0.938201904296875, -0.8925628662109375, -0.846923828125, -0.8012847900390625, -0.755645751953125, -0.7100067138671875, -0.66436767578125, -0.6187286376953125, -0.573089599609375, -0.5274505615234375, -0.4818115234375, -0.4361724853515625, -0.390533447265625, -0.3448944091796875, -0.29925537109375, -0.2536163330078125, -0.207977294921875, -0.1623382568359375, -0.11669921875, -0.0710601806640625, -0.025421142578125, 0.0202178955078125, 0.06585693359375, 0.1114959716796875, 0.157135009765625, 0.2027740478515625, 0.2484130859375, 0.2940521240234375, 0.339691162109375, 0.3853302001953125, 0.43096923828125, 0.4766082763671875, 0.522247314453125, 0.5678863525390625, 0.613525390625, 0.6591644287109375, 0.704803466796875, 0.7504425048828125, 0.79608154296875, 0.8417205810546875, 0.887359619140625, 0.9329986572265625, 0.9786376953125, 1.0242767333984375, 1.069915771484375, 1.1155548095703125, 1.16119384765625, 1.2068328857421875, 1.252471923828125, 1.2981109619140625, 1.34375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 2.0, 7.0, 6.0, 4.0, 6.0, 2.0, 10.0, 15.0, 11.0, 18.0, 19.0, 21.0, 24.0, 33.0, 36.0, 30.0, 26.0, 42.0, 48.0, 27.0, 55.0, 36.0, 1065.0, 35.0, 41.0, 38.0, 43.0, 37.0, 38.0, 29.0, 37.0, 23.0, 28.0, 25.0, 21.0, 19.0, 12.0, 7.0, 15.0, 6.0, 5.0, 6.0, 5.0, 8.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.78125, -11.4287109375, -11.076171875, -10.7236328125, -10.37109375, -10.0185546875, -9.666015625, -9.3134765625, -8.9609375, -8.6083984375, -8.255859375, -7.9033203125, -7.55078125, -7.1982421875, -6.845703125, -6.4931640625, -6.140625, -5.7880859375, -5.435546875, -5.0830078125, -4.73046875, -4.3779296875, -4.025390625, -3.6728515625, -3.3203125, -2.9677734375, -2.615234375, -2.2626953125, -1.91015625, -1.5576171875, -1.205078125, -0.8525390625, -0.5, -0.1474609375, 0.205078125, 0.5576171875, 0.91015625, 1.2626953125, 1.615234375, 1.9677734375, 2.3203125, 2.6728515625, 3.025390625, 3.3779296875, 3.73046875, 4.0830078125, 4.435546875, 4.7880859375, 5.140625, 5.4931640625, 5.845703125, 6.1982421875, 6.55078125, 6.9033203125, 7.255859375, 7.6083984375, 7.9609375, 8.3134765625, 8.666015625, 9.0185546875, 9.37109375, 9.7236328125, 10.076171875, 10.4287109375, 10.78125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 18.0, 27.0, 32.0, 52.0, 77.0, 114.0, 178.0, 231.0, 369.0, 581.0, 794.0, 1126.0, 1688.0, 2558.0, 3772.0, 5627.0, 8519.0, 13480.0, 21531.0, 35566.0, 59306.0, 101973.0, 173945.0, 1269289.0, 159732.0, 93371.0, 54483.0, 32078.0, 19914.0, 12514.0, 7935.0, 5312.0, 3533.0, 2400.0, 1531.0, 1113.0, 770.0, 484.0, 359.0, 252.0, 161.0, 110.0, 87.0, 46.0, 35.0, 18.0, 3.0, 7.0, 9.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 3.0], "bins": [-1.05078125, -1.017333984375, -0.98388671875, -0.950439453125, -0.9169921875, -0.883544921875, -0.85009765625, -0.816650390625, -0.783203125, -0.749755859375, -0.71630859375, -0.682861328125, -0.6494140625, -0.615966796875, -0.58251953125, -0.549072265625, -0.515625, -0.482177734375, -0.44873046875, -0.415283203125, -0.3818359375, -0.348388671875, -0.31494140625, -0.281494140625, -0.248046875, -0.214599609375, -0.18115234375, -0.147705078125, -0.1142578125, -0.080810546875, -0.04736328125, -0.013916015625, 0.01953125, 0.052978515625, 0.08642578125, 0.119873046875, 0.1533203125, 0.186767578125, 0.22021484375, 0.253662109375, 0.287109375, 0.320556640625, 0.35400390625, 0.387451171875, 0.4208984375, 0.454345703125, 0.48779296875, 0.521240234375, 0.5546875, 0.588134765625, 0.62158203125, 0.655029296875, 0.6884765625, 0.721923828125, 0.75537109375, 0.788818359375, 0.822265625, 0.855712890625, 0.88916015625, 0.922607421875, 0.9560546875, 0.989501953125, 1.02294921875, 1.056396484375, 1.08984375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 6.0, 5.0, 4.0, 5.0, 3.0, 11.0, 7.0, 10.0, 14.0, 32.0, 29.0, 38.0, 71.0, 73.0, 97.0, 122.0, 112.0, 86.0, 76.0, 49.0, 26.0, 17.0, 18.0, 10.0, 9.0, 11.0, 13.0, 7.0, 6.0, 5.0, 2.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0310516357421875, -0.030129194259643555, -0.02920675277709961, -0.028284311294555664, -0.02736186981201172, -0.026439428329467773, -0.025516986846923828, -0.024594545364379883, -0.023672103881835938, -0.022749662399291992, -0.021827220916748047, -0.0209047794342041, -0.019982337951660156, -0.01905989646911621, -0.018137454986572266, -0.01721501350402832, -0.016292572021484375, -0.01537013053894043, -0.014447689056396484, -0.013525247573852539, -0.012602806091308594, -0.011680364608764648, -0.010757923126220703, -0.009835481643676758, -0.008913040161132812, -0.007990598678588867, -0.007068157196044922, -0.0061457157135009766, -0.005223274230957031, -0.004300832748413086, -0.0033783912658691406, -0.0024559497833251953, -0.00153350830078125, -0.0006110668182373047, 0.0003113746643066406, 0.001233816146850586, 0.0021562576293945312, 0.0030786991119384766, 0.004001140594482422, 0.004923582077026367, 0.0058460235595703125, 0.006768465042114258, 0.007690906524658203, 0.008613348007202148, 0.009535789489746094, 0.010458230972290039, 0.011380672454833984, 0.01230311393737793, 0.013225555419921875, 0.01414799690246582, 0.015070438385009766, 0.01599287986755371, 0.016915321350097656, 0.0178377628326416, 0.018760204315185547, 0.019682645797729492, 0.020605087280273438, 0.021527528762817383, 0.022449970245361328, 0.023372411727905273, 0.02429485321044922, 0.025217294692993164, 0.02613973617553711, 0.027062177658081055, 0.027984619140625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 4.0, 4.0, 5.0, 11.0, 6.0, 12.0, 15.0, 27.0, 16.0, 31.0, 48.0, 49.0, 67.0, 92.0, 189.0, 368.0, 1567.0, 42559.0, 988117.0, 13636.0, 893.0, 265.0, 152.0, 109.0, 78.0, 51.0, 38.0, 28.0, 20.0, 22.0, 9.0, 5.0, 10.0, 6.0, 10.0, 2.0, 8.0, 3.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5244140625, -0.5059280395507812, -0.4874420166015625, -0.46895599365234375, -0.450469970703125, -0.43198394775390625, -0.4134979248046875, -0.39501190185546875, -0.37652587890625, -0.35803985595703125, -0.3395538330078125, -0.32106781005859375, -0.302581787109375, -0.28409576416015625, -0.2656097412109375, -0.24712371826171875, -0.2286376953125, -0.21015167236328125, -0.1916656494140625, -0.17317962646484375, -0.154693603515625, -0.13620758056640625, -0.1177215576171875, -0.09923553466796875, -0.08074951171875, -0.06226348876953125, -0.0437774658203125, -0.02529144287109375, -0.006805419921875, 0.01168060302734375, 0.0301666259765625, 0.04865264892578125, 0.067138671875, 0.08562469482421875, 0.1041107177734375, 0.12259674072265625, 0.141082763671875, 0.15956878662109375, 0.1780548095703125, 0.19654083251953125, 0.21502685546875, 0.23351287841796875, 0.2519989013671875, 0.27048492431640625, 0.288970947265625, 0.30745697021484375, 0.3259429931640625, 0.34442901611328125, 0.3629150390625, 0.38140106201171875, 0.3998870849609375, 0.41837310791015625, 0.436859130859375, 0.45534515380859375, 0.4738311767578125, 0.49231719970703125, 0.51080322265625, 0.5292892456054688, 0.5477752685546875, 0.5662612915039062, 0.584747314453125, 0.6032333374023438, 0.6217193603515625, 0.6402053833007812, 0.65869140625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 19.0, 82.0, 429.0, 376.0, 76.0, 18.0, 8.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09516280889511108, -0.08785489201545715, -0.08054696768522263, -0.0732390433549881, -0.06593112647533417, -0.05862320587038994, -0.05131528526544571, -0.04400736466050148, -0.03669944405555725, -0.029391523450613022, -0.022083602845668793, -0.014775682240724564, -0.0074677616357803345, -0.00015984103083610535, 0.007148079574108124, 0.014456000179052353, 0.021763920783996582, 0.02907184138894081, 0.03637976199388504, 0.04368768259882927, 0.0509956032037735, 0.05830352380871773, 0.06561144441366196, 0.07291936874389648, 0.08022728562355042, 0.08753520250320435, 0.09484312683343887, 0.1021510511636734, 0.10945896804332733, 0.11676688492298126, 0.12407480925321579, 0.13138273358345032, 0.13869065046310425, 0.14599856734275818, 0.1533064842224121, 0.16061441600322723, 0.16792233288288116, 0.1752302497625351, 0.18253818154335022, 0.18984609842300415, 0.19715401530265808, 0.204461932182312, 0.21176984906196594, 0.21907778084278107, 0.226385697722435, 0.23369361460208893, 0.24100154638290405, 0.24830946326255798, 0.2556173801422119, 0.26292529702186584, 0.2702332139015198, 0.2775411307811737, 0.28484904766082764, 0.29215699434280396, 0.2994649112224579, 0.3067728281021118, 0.31408074498176575, 0.3213886618614197, 0.3286965787410736, 0.33600449562072754, 0.34331244230270386, 0.3506203591823578, 0.3579282760620117, 0.36523619294166565, 0.3725441098213196]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 13.0, 17.0, 16.0, 14.0, 18.0, 18.0, 24.0, 22.0, 30.0, 28.0, 28.0, 35.0, 38.0, 39.0, 42.0, 41.0, 36.0, 54.0, 38.0, 44.0, 35.0, 38.0, 30.0, 25.0, 35.0, 32.0, 32.0, 24.0, 28.0, 23.0, 18.0, 14.0, 12.0, 13.0, 9.0, 5.0, 4.0, 8.0, 1.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.023150980472564697, -0.02247793599963188, -0.021804893389344215, -0.02113185077905655, -0.020458806306123734, -0.019785761833190918, -0.01911271922290325, -0.018439676612615585, -0.01776663213968277, -0.017093587666749954, -0.016420545056462288, -0.01574750244617462, -0.015074457973241806, -0.014401414431631565, -0.013728370890021324, -0.013055327348411083, -0.012382283806800842, -0.011709240265190601, -0.01103619672358036, -0.01036315318197012, -0.009690109640359879, -0.009017066098749638, -0.008344022557139397, -0.007670979015529156, -0.006997935473918915, -0.006324891932308674, -0.005651848390698433, -0.004978804849088192, -0.004305761307477951, -0.00363271776586771, -0.002959674224257469, -0.0022866306826472282, -0.0016135871410369873, -0.0009405435994267464, -0.00026750005781650543, 0.0004055434837937355, 0.0010785870254039764, 0.0017516305670142174, 0.0024246741086244583, 0.0030977176502346992, 0.00377076119184494, 0.004443804733455181, 0.005116848275065422, 0.005789891816675663, 0.006462935358285904, 0.007135978899896145, 0.007809022441506386, 0.008482065983116627, 0.009155109524726868, 0.009828153066337109, 0.01050119660794735, 0.01117424014955759, 0.011847283691167831, 0.012520327232778072, 0.013193370774388313, 0.013866414315998554, 0.014539457857608795, 0.015212501399219036, 0.015885544940829277, 0.016558587551116943, 0.01723163202404976, 0.017904676496982574, 0.01857771910727024, 0.019250761717557907, 0.019923806190490723]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 2.0, 9.0, 6.0, 13.0, 16.0, 27.0, 17.0, 17.0, 27.0, 20.0, 30.0, 40.0, 51.0, 39.0, 37.0, 47.0, 49.0, 50.0, 40.0, 54.0, 46.0, 41.0, 45.0, 36.0, 41.0, 22.0, 29.0, 21.0, 31.0, 15.0, 19.0, 13.0, 15.0, 8.0, 10.0, 5.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-19.40625, -18.78466796875, -18.1630859375, -17.54150390625, -16.919921875, -16.29833984375, -15.6767578125, -15.05517578125, -14.43359375, -13.81201171875, -13.1904296875, -12.56884765625, -11.947265625, -11.32568359375, -10.7041015625, -10.08251953125, -9.4609375, -8.83935546875, -8.2177734375, -7.59619140625, -6.974609375, -6.35302734375, -5.7314453125, -5.10986328125, -4.48828125, -3.86669921875, -3.2451171875, -2.62353515625, -2.001953125, -1.38037109375, -0.7587890625, -0.13720703125, 0.484375, 1.10595703125, 1.7275390625, 2.34912109375, 2.970703125, 3.59228515625, 4.2138671875, 4.83544921875, 5.45703125, 6.07861328125, 6.7001953125, 7.32177734375, 7.943359375, 8.56494140625, 9.1865234375, 9.80810546875, 10.4296875, 11.05126953125, 11.6728515625, 12.29443359375, 12.916015625, 13.53759765625, 14.1591796875, 14.78076171875, 15.40234375, 16.02392578125, 16.6455078125, 17.26708984375, 17.888671875, 18.51025390625, 19.1318359375, 19.75341796875, 20.375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 14.0, 13.0, 22.0, 44.0, 45.0, 75.0, 115.0, 153.0, 211.0, 318.0, 399.0, 644.0, 992.0, 1492.0, 2295.0, 3649.0, 6111.0, 10691.0, 22904.0, 81049.0, 553788.0, 278153.0, 46526.0, 16545.0, 8434.0, 4942.0, 3054.0, 1929.0, 1272.0, 869.0, 542.0, 379.0, 245.0, 172.0, 141.0, 92.0, 59.0, 49.0, 25.0, 29.0, 12.0, 15.0, 10.0, 4.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-24.71875, -23.91650390625, -23.1142578125, -22.31201171875, -21.509765625, -20.70751953125, -19.9052734375, -19.10302734375, -18.30078125, -17.49853515625, -16.6962890625, -15.89404296875, -15.091796875, -14.28955078125, -13.4873046875, -12.68505859375, -11.8828125, -11.08056640625, -10.2783203125, -9.47607421875, -8.673828125, -7.87158203125, -7.0693359375, -6.26708984375, -5.46484375, -4.66259765625, -3.8603515625, -3.05810546875, -2.255859375, -1.45361328125, -0.6513671875, 0.15087890625, 0.953125, 1.75537109375, 2.5576171875, 3.35986328125, 4.162109375, 4.96435546875, 5.7666015625, 6.56884765625, 7.37109375, 8.17333984375, 8.9755859375, 9.77783203125, 10.580078125, 11.38232421875, 12.1845703125, 12.98681640625, 13.7890625, 14.59130859375, 15.3935546875, 16.19580078125, 16.998046875, 17.80029296875, 18.6025390625, 19.40478515625, 20.20703125, 21.00927734375, 21.8115234375, 22.61376953125, 23.416015625, 24.21826171875, 25.0205078125, 25.82275390625, 26.625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 10.0, 10.0, 9.0, 14.0, 12.0, 11.0, 13.0, 15.0, 12.0, 25.0, 26.0, 26.0, 25.0, 31.0, 38.0, 32.0, 48.0, 69.0, 89.0, 220.0, 1584.0, 208.0, 99.0, 58.0, 44.0, 51.0, 25.0, 33.0, 34.0, 19.0, 16.0, 23.0, 15.0, 17.0, 15.0, 18.0, 11.0, 8.0, 10.0, 10.0, 4.0, 4.0, 2.0, 7.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.65625, -36.53076171875, -35.4052734375, -34.27978515625, -33.154296875, -32.02880859375, -30.9033203125, -29.77783203125, -28.65234375, -27.52685546875, -26.4013671875, -25.27587890625, -24.150390625, -23.02490234375, -21.8994140625, -20.77392578125, -19.6484375, -18.52294921875, -17.3974609375, -16.27197265625, -15.146484375, -14.02099609375, -12.8955078125, -11.77001953125, -10.64453125, -9.51904296875, -8.3935546875, -7.26806640625, -6.142578125, -5.01708984375, -3.8916015625, -2.76611328125, -1.640625, -0.51513671875, 0.6103515625, 1.73583984375, 2.861328125, 3.98681640625, 5.1123046875, 6.23779296875, 7.36328125, 8.48876953125, 9.6142578125, 10.73974609375, 11.865234375, 12.99072265625, 14.1162109375, 15.24169921875, 16.3671875, 17.49267578125, 18.6181640625, 19.74365234375, 20.869140625, 21.99462890625, 23.1201171875, 24.24560546875, 25.37109375, 26.49658203125, 27.6220703125, 28.74755859375, 29.873046875, 30.99853515625, 32.1240234375, 33.24951171875, 34.375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 6.0, 5.0, 11.0, 17.0, 26.0, 39.0, 55.0, 78.0, 146.0, 256.0, 631.0, 3047.0, 45225.0, 3072325.0, 20743.0, 1993.0, 480.0, 247.0, 126.0, 74.0, 47.0, 36.0, 20.0, 17.0, 10.0, 9.0, 6.0, 3.0, 0.0, 1.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.75, -88.400390625, -85.05078125, -81.701171875, -78.3515625, -75.001953125, -71.65234375, -68.302734375, -64.953125, -61.603515625, -58.25390625, -54.904296875, -51.5546875, -48.205078125, -44.85546875, -41.505859375, -38.15625, -34.806640625, -31.45703125, -28.107421875, -24.7578125, -21.408203125, -18.05859375, -14.708984375, -11.359375, -8.009765625, -4.66015625, -1.310546875, 2.0390625, 5.388671875, 8.73828125, 12.087890625, 15.4375, 18.787109375, 22.13671875, 25.486328125, 28.8359375, 32.185546875, 35.53515625, 38.884765625, 42.234375, 45.583984375, 48.93359375, 52.283203125, 55.6328125, 58.982421875, 62.33203125, 65.681640625, 69.03125, 72.380859375, 75.73046875, 79.080078125, 82.4296875, 85.779296875, 89.12890625, 92.478515625, 95.828125, 99.177734375, 102.52734375, 105.876953125, 109.2265625, 112.576171875, 115.92578125, 119.275390625, 122.625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 18.0, 142.0, 495.0, 294.0, 61.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.3460578918457, -46.34069061279297, -40.33531951904297, -34.32994842529297, -28.324581146240234, -22.319211959838867, -16.3138427734375, -10.308475494384766, -4.303104400634766, 1.7022647857666016, 7.707633972167969, 13.713003158569336, 19.718372344970703, 25.72374153137207, 31.729110717773438, 37.73447799682617, 43.73984909057617, 49.745216369628906, 55.750587463378906, 61.755958557128906, 67.76132202148438, 73.76669311523438, 79.77206420898438, 85.77743530273438, 91.78280639648438, 97.78817749023438, 103.79354858398438, 109.79891204833984, 115.80428314208984, 121.80965423583984, 127.81501770019531, 133.8203887939453, 139.82574462890625, 145.83111572265625, 151.83648681640625, 157.84185791015625, 163.84722900390625, 169.8525848388672, 175.8579559326172, 181.8633270263672, 187.8686981201172, 193.8740692138672, 199.8794403076172, 205.8848114013672, 211.89016723632812, 217.89553833007812, 223.90090942382812, 229.90628051757812, 235.91165161132812, 241.91702270507812, 247.92239379882812, 253.92776489257812, 259.9331359863281, 265.9385070800781, 271.9438781738281, 277.94921875, 283.95458984375, 289.9599609375, 295.96533203125, 301.970703125, 307.97607421875, 313.9814453125, 319.98681640625, 325.9921875, 331.99755859375]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 8.0, 8.0, 12.0, 8.0, 10.0, 8.0, 15.0, 19.0, 22.0, 23.0, 29.0, 25.0, 27.0, 32.0, 42.0, 27.0, 39.0, 36.0, 40.0, 51.0, 44.0, 35.0, 41.0, 39.0, 33.0, 34.0, 26.0, 33.0, 38.0, 31.0, 29.0, 15.0, 22.0, 12.0, 10.0, 17.0, 11.0, 9.0, 11.0, 8.0, 7.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-71.37543487548828, -68.8658447265625, -66.35624694824219, -63.84665298461914, -61.337059020996094, -58.82746887207031, -56.317874908447266, -53.80828094482422, -51.29868698120117, -48.789093017578125, -46.27949905395508, -43.76990509033203, -41.26031494140625, -38.75071716308594, -36.241127014160156, -33.73153305053711, -31.221939086914062, -28.712345123291016, -26.20275115966797, -23.693159103393555, -21.183565139770508, -18.67397117614746, -16.164379119873047, -13.65478515625, -11.145191192626953, -8.635597229003906, -6.126004219055176, -3.616410732269287, -1.1068172454833984, 1.4027767181396484, 3.912369728088379, 6.421962738037109, 8.931556701660156, 11.441150665283203, 13.950743675231934, 16.460336685180664, 18.96993064880371, 21.479524612426758, 23.989116668701172, 26.49871063232422, 29.008304595947266, 31.517898559570312, 34.02749252319336, 36.537086486816406, 39.04667663574219, 41.5562744140625, 44.06586456298828, 46.57545852661133, 49.085052490234375, 51.59464645385742, 54.10424041748047, 56.613834381103516, 59.12342834472656, 61.633018493652344, 64.14261627197266, 66.65220642089844, 69.16180419921875, 71.67139434814453, 74.18099212646484, 76.69058227539062, 79.20018005371094, 81.70977020263672, 84.21936798095703, 86.72895812988281, 89.2385482788086]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 1.0, 8.0, 13.0, 6.0, 12.0, 15.0, 21.0, 19.0, 21.0, 34.0, 20.0, 31.0, 37.0, 38.0, 37.0, 42.0, 46.0, 42.0, 47.0, 50.0, 55.0, 44.0, 43.0, 39.0, 44.0, 27.0, 27.0, 30.0, 19.0, 17.0, 23.0, 27.0, 14.0, 13.0, 8.0, 11.0, 4.0, 4.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.359375, -17.750244140625, -17.14111328125, -16.531982421875, -15.9228515625, -15.313720703125, -14.70458984375, -14.095458984375, -13.486328125, -12.877197265625, -12.26806640625, -11.658935546875, -11.0498046875, -10.440673828125, -9.83154296875, -9.222412109375, -8.61328125, -8.004150390625, -7.39501953125, -6.785888671875, -6.1767578125, -5.567626953125, -4.95849609375, -4.349365234375, -3.740234375, -3.131103515625, -2.52197265625, -1.912841796875, -1.3037109375, -0.694580078125, -0.08544921875, 0.523681640625, 1.1328125, 1.741943359375, 2.35107421875, 2.960205078125, 3.5693359375, 4.178466796875, 4.78759765625, 5.396728515625, 6.005859375, 6.614990234375, 7.22412109375, 7.833251953125, 8.4423828125, 9.051513671875, 9.66064453125, 10.269775390625, 10.87890625, 11.488037109375, 12.09716796875, 12.706298828125, 13.3154296875, 13.924560546875, 14.53369140625, 15.142822265625, 15.751953125, 16.361083984375, 16.97021484375, 17.579345703125, 18.1884765625, 18.797607421875, 19.40673828125, 20.015869140625, 20.625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 10.0, 7.0, 11.0, 9.0, 9.0, 24.0, 15.0, 21.0, 30.0, 26.0, 38.0, 47.0, 55.0, 97.0, 107.0, 158.0, 244.0, 363.0, 784.0, 2674.0, 29914.0, 4142420.0, 13330.0, 1981.0, 686.0, 365.0, 223.0, 149.0, 102.0, 87.0, 54.0, 40.0, 49.0, 28.0, 29.0, 16.0, 16.0, 14.0, 10.0, 13.0, 6.0, 7.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-186.5, -180.365234375, -174.23046875, -168.095703125, -161.9609375, -155.826171875, -149.69140625, -143.556640625, -137.421875, -131.287109375, -125.15234375, -119.017578125, -112.8828125, -106.748046875, -100.61328125, -94.478515625, -88.34375, -82.208984375, -76.07421875, -69.939453125, -63.8046875, -57.669921875, -51.53515625, -45.400390625, -39.265625, -33.130859375, -26.99609375, -20.861328125, -14.7265625, -8.591796875, -2.45703125, 3.677734375, 9.8125, 15.947265625, 22.08203125, 28.216796875, 34.3515625, 40.486328125, 46.62109375, 52.755859375, 58.890625, 65.025390625, 71.16015625, 77.294921875, 83.4296875, 89.564453125, 95.69921875, 101.833984375, 107.96875, 114.103515625, 120.23828125, 126.373046875, 132.5078125, 138.642578125, 144.77734375, 150.912109375, 157.046875, 163.181640625, 169.31640625, 175.451171875, 181.5859375, 187.720703125, 193.85546875, 199.990234375, 206.125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 9.0, 9.0, 10.0, 9.0, 11.0, 25.0, 23.0, 29.0, 47.0, 59.0, 92.0, 166.0, 342.0, 676.0, 1184.0, 643.0, 312.0, 165.0, 74.0, 45.0, 37.0, 21.0, 15.0, 15.0, 6.0, 6.0, 7.0, 6.0, 8.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.75, -37.65576171875, -36.5615234375, -35.46728515625, -34.373046875, -33.27880859375, -32.1845703125, -31.09033203125, -29.99609375, -28.90185546875, -27.8076171875, -26.71337890625, -25.619140625, -24.52490234375, -23.4306640625, -22.33642578125, -21.2421875, -20.14794921875, -19.0537109375, -17.95947265625, -16.865234375, -15.77099609375, -14.6767578125, -13.58251953125, -12.48828125, -11.39404296875, -10.2998046875, -9.20556640625, -8.111328125, -7.01708984375, -5.9228515625, -4.82861328125, -3.734375, -2.64013671875, -1.5458984375, -0.45166015625, 0.642578125, 1.73681640625, 2.8310546875, 3.92529296875, 5.01953125, 6.11376953125, 7.2080078125, 8.30224609375, 9.396484375, 10.49072265625, 11.5849609375, 12.67919921875, 13.7734375, 14.86767578125, 15.9619140625, 17.05615234375, 18.150390625, 19.24462890625, 20.3388671875, 21.43310546875, 22.52734375, 23.62158203125, 24.7158203125, 25.81005859375, 26.904296875, 27.99853515625, 29.0927734375, 30.18701171875, 31.28125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 0.0, 4.0, 8.0, 14.0, 13.0, 7.0, 10.0, 25.0, 34.0, 40.0, 67.0, 125.0, 290.0, 626.0, 1800.0, 5757.0, 28107.0, 1850415.0, 2269737.0, 28446.0, 5746.0, 1787.0, 617.0, 261.0, 126.0, 65.0, 38.0, 23.0, 34.0, 12.0, 8.0, 10.0, 9.0, 6.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.8125, -88.4130859375, -85.013671875, -81.6142578125, -78.21484375, -74.8154296875, -71.416015625, -68.0166015625, -64.6171875, -61.2177734375, -57.818359375, -54.4189453125, -51.01953125, -47.6201171875, -44.220703125, -40.8212890625, -37.421875, -34.0224609375, -30.623046875, -27.2236328125, -23.82421875, -20.4248046875, -17.025390625, -13.6259765625, -10.2265625, -6.8271484375, -3.427734375, -0.0283203125, 3.37109375, 6.7705078125, 10.169921875, 13.5693359375, 16.96875, 20.3681640625, 23.767578125, 27.1669921875, 30.56640625, 33.9658203125, 37.365234375, 40.7646484375, 44.1640625, 47.5634765625, 50.962890625, 54.3623046875, 57.76171875, 61.1611328125, 64.560546875, 67.9599609375, 71.359375, 74.7587890625, 78.158203125, 81.5576171875, 84.95703125, 88.3564453125, 91.755859375, 95.1552734375, 98.5546875, 101.9541015625, 105.353515625, 108.7529296875, 112.15234375, 115.5517578125, 118.951171875, 122.3505859375, 125.75]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 13.0, 27.0, 65.0, 212.0, 398.0, 191.0, 69.0, 22.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-278.3038330078125, -269.4793395996094, -260.6548156738281, -251.830322265625, -243.0058135986328, -234.18130493164062, -225.3568115234375, -216.5323028564453, -207.70779418945312, -198.88328552246094, -190.0587921142578, -181.23428344726562, -172.40977478027344, -163.58526611328125, -154.76077270507812, -145.93626403808594, -137.1117706298828, -128.28726196289062, -119.46276092529297, -110.63825988769531, -101.81375122070312, -92.98925018310547, -84.16474914550781, -75.34024047851562, -66.51573944091797, -57.69123458862305, -48.866729736328125, -40.04222869873047, -31.217723846435547, -22.393218994140625, -13.568717956542969, -4.744213104248047, 4.080291748046875, 12.90479564666748, 21.729299545288086, 30.553802490234375, 39.3783073425293, 48.20281219482422, 57.027313232421875, 65.85182189941406, 74.67632293701172, 83.50082397460938, 92.32533264160156, 101.14983367919922, 109.97433471679688, 118.79884338378906, 127.62334442138672, 136.44784545898438, 145.27235412597656, 154.09686279296875, 162.92135620117188, 171.74586486816406, 180.57037353515625, 189.39486694335938, 198.21937561035156, 207.04388427734375, 215.86837768554688, 224.69288635253906, 233.5173797607422, 242.34188842773438, 251.16639709472656, 259.99090576171875, 268.8153991699219, 277.639892578125, 286.46441650390625]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 9.0, 5.0, 10.0, 10.0, 13.0, 10.0, 15.0, 25.0, 22.0, 36.0, 19.0, 41.0, 35.0, 37.0, 43.0, 43.0, 50.0, 40.0, 38.0, 52.0, 39.0, 37.0, 39.0, 34.0, 42.0, 32.0, 36.0, 30.0, 30.0, 20.0, 14.0, 21.0, 16.0, 13.0, 5.0, 9.0, 5.0, 9.0, 3.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.40347290039062, -79.65919494628906, -76.9149169921875, -74.17063903808594, -71.4263687133789, -68.68209075927734, -65.93781280517578, -63.19353485107422, -60.44926071166992, -57.70498275756836, -54.96070861816406, -52.2164306640625, -49.47215270996094, -46.72787857055664, -43.98360061645508, -41.23932647705078, -38.49504852294922, -35.750770568847656, -33.00649642944336, -30.262218475341797, -27.517942428588867, -24.773666381835938, -22.029388427734375, -19.285112380981445, -16.540836334228516, -13.796560287475586, -11.05228328704834, -8.308006286621094, -5.563730239868164, -2.8194541931152344, -0.07517623901367188, 2.669099807739258, 5.4133758544921875, 8.157651901245117, 10.901928901672363, 13.64620590209961, 16.39048194885254, 19.13475799560547, 21.87903594970703, 24.62331199645996, 27.36758804321289, 30.11186408996582, 32.85614013671875, 35.60041809082031, 38.344696044921875, 41.08897018432617, 43.833248138427734, 46.57752227783203, 49.321800231933594, 52.066078186035156, 54.81035232543945, 57.554630279541016, 60.29890441894531, 63.043182373046875, 65.78746032714844, 68.53173828125, 71.27601623535156, 74.02029418945312, 76.76457214355469, 79.50885009765625, 82.25312042236328, 84.99739837646484, 87.7416763305664, 90.48595428466797, 93.230224609375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 6.0, 4.0, 8.0, 5.0, 13.0, 10.0, 18.0, 16.0, 23.0, 14.0, 32.0, 34.0, 18.0, 31.0, 32.0, 31.0, 42.0, 51.0, 44.0, 52.0, 49.0, 40.0, 44.0, 54.0, 33.0, 49.0, 30.0, 30.0, 32.0, 25.0, 21.0, 21.0, 18.0, 17.0, 11.0, 7.0, 12.0, 9.0, 10.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.4375, -18.8525390625, -18.267578125, -17.6826171875, -17.09765625, -16.5126953125, -15.927734375, -15.3427734375, -14.7578125, -14.1728515625, -13.587890625, -13.0029296875, -12.41796875, -11.8330078125, -11.248046875, -10.6630859375, -10.078125, -9.4931640625, -8.908203125, -8.3232421875, -7.73828125, -7.1533203125, -6.568359375, -5.9833984375, -5.3984375, -4.8134765625, -4.228515625, -3.6435546875, -3.05859375, -2.4736328125, -1.888671875, -1.3037109375, -0.71875, -0.1337890625, 0.451171875, 1.0361328125, 1.62109375, 2.2060546875, 2.791015625, 3.3759765625, 3.9609375, 4.5458984375, 5.130859375, 5.7158203125, 6.30078125, 6.8857421875, 7.470703125, 8.0556640625, 8.640625, 9.2255859375, 9.810546875, 10.3955078125, 10.98046875, 11.5654296875, 12.150390625, 12.7353515625, 13.3203125, 13.9052734375, 14.490234375, 15.0751953125, 15.66015625, 16.2451171875, 16.830078125, 17.4150390625, 18.0]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 4.0, 11.0, 12.0, 23.0, 47.0, 46.0, 73.0, 105.0, 154.0, 240.0, 300.0, 464.0, 716.0, 1100.0, 1648.0, 2436.0, 3658.0, 5589.0, 8692.0, 13253.0, 20918.0, 32707.0, 53066.0, 89208.0, 154854.0, 225520.0, 173058.0, 99829.0, 59173.0, 36252.0, 22969.0, 14702.0, 9523.0, 6118.0, 4036.0, 2607.0, 1808.0, 1191.0, 789.0, 513.0, 366.0, 253.0, 170.0, 100.0, 70.0, 56.0, 40.0, 34.0, 13.0, 15.0, 4.0, 4.0, 3.0, 4.0, 4.0, 3.0, 4.0], "bins": [-1.576171875, -1.52783203125, -1.4794921875, -1.43115234375, -1.3828125, -1.33447265625, -1.2861328125, -1.23779296875, -1.189453125, -1.14111328125, -1.0927734375, -1.04443359375, -0.99609375, -0.94775390625, -0.8994140625, -0.85107421875, -0.802734375, -0.75439453125, -0.7060546875, -0.65771484375, -0.609375, -0.56103515625, -0.5126953125, -0.46435546875, -0.416015625, -0.36767578125, -0.3193359375, -0.27099609375, -0.22265625, -0.17431640625, -0.1259765625, -0.07763671875, -0.029296875, 0.01904296875, 0.0673828125, 0.11572265625, 0.1640625, 0.21240234375, 0.2607421875, 0.30908203125, 0.357421875, 0.40576171875, 0.4541015625, 0.50244140625, 0.55078125, 0.59912109375, 0.6474609375, 0.69580078125, 0.744140625, 0.79248046875, 0.8408203125, 0.88916015625, 0.9375, 0.98583984375, 1.0341796875, 1.08251953125, 1.130859375, 1.17919921875, 1.2275390625, 1.27587890625, 1.32421875, 1.37255859375, 1.4208984375, 1.46923828125, 1.517578125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 2.0, 8.0, 7.0, 5.0, 7.0, 5.0, 19.0, 6.0, 16.0, 24.0, 14.0, 23.0, 22.0, 19.0, 32.0, 34.0, 25.0, 31.0, 40.0, 31.0, 39.0, 49.0, 1059.0, 38.0, 37.0, 39.0, 41.0, 32.0, 43.0, 33.0, 24.0, 26.0, 30.0, 20.0, 24.0, 21.0, 20.0, 18.0, 17.0, 11.0, 2.0, 7.0, 2.0, 8.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.9453125, -10.601318359375, -10.25732421875, -9.913330078125, -9.5693359375, -9.225341796875, -8.88134765625, -8.537353515625, -8.193359375, -7.849365234375, -7.50537109375, -7.161376953125, -6.8173828125, -6.473388671875, -6.12939453125, -5.785400390625, -5.44140625, -5.097412109375, -4.75341796875, -4.409423828125, -4.0654296875, -3.721435546875, -3.37744140625, -3.033447265625, -2.689453125, -2.345458984375, -2.00146484375, -1.657470703125, -1.3134765625, -0.969482421875, -0.62548828125, -0.281494140625, 0.0625, 0.406494140625, 0.75048828125, 1.094482421875, 1.4384765625, 1.782470703125, 2.12646484375, 2.470458984375, 2.814453125, 3.158447265625, 3.50244140625, 3.846435546875, 4.1904296875, 4.534423828125, 4.87841796875, 5.222412109375, 5.56640625, 5.910400390625, 6.25439453125, 6.598388671875, 6.9423828125, 7.286376953125, 7.63037109375, 7.974365234375, 8.318359375, 8.662353515625, 9.00634765625, 9.350341796875, 9.6943359375, 10.038330078125, 10.38232421875, 10.726318359375, 11.0703125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 6.0, 9.0, 25.0, 24.0, 48.0, 81.0, 123.0, 179.0, 252.0, 403.0, 644.0, 997.0, 1518.0, 2223.0, 3570.0, 5444.0, 8385.0, 12857.0, 19980.0, 32106.0, 52542.0, 90823.0, 157514.0, 1276082.0, 174760.0, 101002.0, 58478.0, 35340.0, 21875.0, 13921.0, 8896.0, 5931.0, 3876.0, 2470.0, 1655.0, 1127.0, 685.0, 446.0, 295.0, 186.0, 133.0, 82.0, 45.0, 31.0, 22.0, 13.0, 9.0, 8.0, 7.0, 5.0, 4.0, 1.0], "bins": [-1.2529296875, -1.2177352905273438, -1.1825408935546875, -1.1473464965820312, -1.112152099609375, -1.0769577026367188, -1.0417633056640625, -1.0065689086914062, -0.97137451171875, -0.9361801147460938, -0.9009857177734375, -0.8657913208007812, -0.830596923828125, -0.7954025268554688, -0.7602081298828125, -0.7250137329101562, -0.6898193359375, -0.6546249389648438, -0.6194305419921875, -0.5842361450195312, -0.549041748046875, -0.5138473510742188, -0.4786529541015625, -0.44345855712890625, -0.40826416015625, -0.37306976318359375, -0.3378753662109375, -0.30268096923828125, -0.267486572265625, -0.23229217529296875, -0.1970977783203125, -0.16190338134765625, -0.126708984375, -0.09151458740234375, -0.0563201904296875, -0.02112579345703125, 0.014068603515625, 0.04926300048828125, 0.0844573974609375, 0.11965179443359375, 0.15484619140625, 0.19004058837890625, 0.2252349853515625, 0.26042938232421875, 0.295623779296875, 0.33081817626953125, 0.3660125732421875, 0.40120697021484375, 0.4364013671875, 0.47159576416015625, 0.5067901611328125, 0.5419845581054688, 0.577178955078125, 0.6123733520507812, 0.6475677490234375, 0.6827621459960938, 0.71795654296875, 0.7531509399414062, 0.7883453369140625, 0.8235397338867188, 0.858734130859375, 0.8939285278320312, 0.9291229248046875, 0.9643173217773438, 0.99951171875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 4.0, 5.0, 2.0, 4.0, 7.0, 8.0, 3.0, 18.0, 14.0, 13.0, 14.0, 20.0, 22.0, 22.0, 34.0, 63.0, 71.0, 88.0, 96.0, 107.0, 80.0, 55.0, 47.0, 37.0, 23.0, 17.0, 27.0, 17.0, 9.0, 19.0, 12.0, 10.0, 4.0, 7.0, 2.0, 3.0, 4.0, 5.0, 0.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0250701904296875, -0.02422618865966797, -0.023382186889648438, -0.022538185119628906, -0.021694183349609375, -0.020850181579589844, -0.020006179809570312, -0.01916217803955078, -0.01831817626953125, -0.01747417449951172, -0.016630172729492188, -0.015786170959472656, -0.014942169189453125, -0.014098167419433594, -0.013254165649414062, -0.012410163879394531, -0.011566162109375, -0.010722160339355469, -0.009878158569335938, -0.009034156799316406, -0.008190155029296875, -0.007346153259277344, -0.0065021514892578125, -0.005658149719238281, -0.00481414794921875, -0.003970146179199219, -0.0031261444091796875, -0.0022821426391601562, -0.001438140869140625, -0.0005941390991210938, 0.0002498626708984375, 0.0010938644409179688, 0.0019378662109375, 0.0027818679809570312, 0.0036258697509765625, 0.004469871520996094, 0.005313873291015625, 0.006157875061035156, 0.0070018768310546875, 0.007845878601074219, 0.00868988037109375, 0.009533882141113281, 0.010377883911132812, 0.011221885681152344, 0.012065887451171875, 0.012909889221191406, 0.013753890991210938, 0.014597892761230469, 0.01544189453125, 0.01628589630126953, 0.017129898071289062, 0.017973899841308594, 0.018817901611328125, 0.019661903381347656, 0.020505905151367188, 0.02134990692138672, 0.02219390869140625, 0.02303791046142578, 0.023881912231445312, 0.024725914001464844, 0.025569915771484375, 0.026413917541503906, 0.027257919311523438, 0.02810192108154297, 0.0289459228515625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 4.0, 3.0, 7.0, 1.0, 5.0, 4.0, 6.0, 7.0, 8.0, 7.0, 15.0, 15.0, 16.0, 29.0, 27.0, 37.0, 50.0, 95.0, 91.0, 136.0, 277.0, 796.0, 5227.0, 147355.0, 876603.0, 15167.0, 1585.0, 405.0, 166.0, 92.0, 66.0, 55.0, 49.0, 31.0, 23.0, 19.0, 13.0, 9.0, 13.0, 2.0, 7.0, 7.0, 3.0, 8.0, 5.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.54150390625, -0.5251922607421875, -0.508880615234375, -0.4925689697265625, -0.47625732421875, -0.4599456787109375, -0.443634033203125, -0.4273223876953125, -0.4110107421875, -0.3946990966796875, -0.378387451171875, -0.3620758056640625, -0.34576416015625, -0.3294525146484375, -0.313140869140625, -0.2968292236328125, -0.280517578125, -0.2642059326171875, -0.247894287109375, -0.2315826416015625, -0.21527099609375, -0.1989593505859375, -0.182647705078125, -0.1663360595703125, -0.1500244140625, -0.1337127685546875, -0.117401123046875, -0.1010894775390625, -0.08477783203125, -0.0684661865234375, -0.052154541015625, -0.0358428955078125, -0.01953125, -0.0032196044921875, 0.013092041015625, 0.0294036865234375, 0.04571533203125, 0.0620269775390625, 0.078338623046875, 0.0946502685546875, 0.1109619140625, 0.1272735595703125, 0.143585205078125, 0.1598968505859375, 0.17620849609375, 0.1925201416015625, 0.208831787109375, 0.2251434326171875, 0.241455078125, 0.2577667236328125, 0.274078369140625, 0.2903900146484375, 0.30670166015625, 0.3230133056640625, 0.339324951171875, 0.3556365966796875, 0.3719482421875, 0.3882598876953125, 0.404571533203125, 0.4208831787109375, 0.43719482421875, 0.4535064697265625, 0.469818115234375, 0.4861297607421875, 0.50244140625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 14.0, 40.0, 127.0, 391.0, 297.0, 90.0, 32.0, 11.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07173629850149155, -0.06513958424329758, -0.058542877435684204, -0.051946163177490234, -0.04534945636987686, -0.03875274211168289, -0.03215603157877922, -0.02555932104587555, -0.018962610512971878, -0.012365899980068207, -0.005769188515841961, 0.000827522948384285, 0.007424233481287956, 0.014020945876836777, 0.020617656409740448, 0.02721436694264412, 0.03381107747554779, 0.04040778800845146, 0.04700449854135513, 0.0536012127995491, 0.060197919607162476, 0.06679463386535645, 0.07339134812355042, 0.07998805493116379, 0.08658476173877716, 0.09318147599697113, 0.0997781828045845, 0.10637489706277847, 0.11297160387039185, 0.11956831812858582, 0.12616503238677979, 0.13276174664497375, 0.13935844600200653, 0.1459551602602005, 0.15255187451839447, 0.15914857387542725, 0.16574528813362122, 0.17234200239181519, 0.17893871665000916, 0.18553543090820312, 0.1921321302652359, 0.19872884452342987, 0.20532555878162384, 0.21192225813865662, 0.21851897239685059, 0.22511568665504456, 0.23171240091323853, 0.2383091151714325, 0.24490582942962646, 0.25150254368782043, 0.2580992579460144, 0.2646959722042084, 0.27129268646240234, 0.2778893709182739, 0.2844860851764679, 0.29108279943466187, 0.29767951369285583, 0.3042762279510498, 0.3108729422092438, 0.31746965646743774, 0.3240663707256317, 0.3306630849838257, 0.33725976943969727, 0.34385648369789124, 0.3504531979560852]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 9.0, 7.0, 8.0, 19.0, 16.0, 24.0, 18.0, 33.0, 27.0, 37.0, 22.0, 41.0, 34.0, 42.0, 45.0, 56.0, 43.0, 49.0, 61.0, 34.0, 60.0, 41.0, 32.0, 47.0, 30.0, 20.0, 29.0, 33.0, 18.0, 12.0, 9.0, 12.0, 4.0, 6.0, 3.0, 7.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.020522117614746094, -0.019879672676324844, -0.019237225875258446, -0.018594779074192047, -0.017952334135770798, -0.01730988919734955, -0.01666744239628315, -0.01602499559521675, -0.015382550656795502, -0.014740104787051678, -0.014097658917307854, -0.01345521304756403, -0.012812767177820206, -0.012170321308076382, -0.011527875438332558, -0.010885429568588734, -0.01024298369884491, -0.009600537829101086, -0.008958091959357262, -0.008315646089613438, -0.007673200219869614, -0.00703075435012579, -0.006388308480381966, -0.005745862610638142, -0.005103416740894318, -0.004460970871150494, -0.0038185250014066696, -0.0031760791316628456, -0.0025336332619190216, -0.0018911873921751976, -0.0012487415224313736, -0.0006062956526875496, 3.6150217056274414e-05, 0.0006785960868000984, 0.0013210419565439224, 0.0019634878262877464, 0.0026059336960315704, 0.0032483795657753944, 0.0038908254355192184, 0.0045332713052630424, 0.0051757171750068665, 0.0058181630447506905, 0.0064606089144945145, 0.0071030547842383385, 0.0077455006539821625, 0.008387946523725986, 0.00903039239346981, 0.009672838263213634, 0.010315284132957458, 0.010957730002701283, 0.011600175872445107, 0.01224262174218893, 0.012885067611932755, 0.013527513481676579, 0.014169959351420403, 0.014812405221164227, 0.01545485109090805, 0.0160972960293293, 0.0167397428303957, 0.017382189631462097, 0.018024634569883347, 0.018667079508304596, 0.019309526309370995, 0.019951973110437393, 0.020594418048858643]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 6.0, 4.0, 8.0, 5.0, 13.0, 10.0, 18.0, 16.0, 23.0, 14.0, 32.0, 34.0, 18.0, 31.0, 32.0, 31.0, 42.0, 51.0, 44.0, 52.0, 49.0, 40.0, 44.0, 54.0, 33.0, 49.0, 30.0, 30.0, 32.0, 25.0, 21.0, 21.0, 18.0, 17.0, 11.0, 7.0, 12.0, 9.0, 10.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.4375, -18.8525390625, -18.267578125, -17.6826171875, -17.09765625, -16.5126953125, -15.927734375, -15.3427734375, -14.7578125, -14.1728515625, -13.587890625, -13.0029296875, -12.41796875, -11.8330078125, -11.248046875, -10.6630859375, -10.078125, -9.4931640625, -8.908203125, -8.3232421875, -7.73828125, -7.1533203125, -6.568359375, -5.9833984375, -5.3984375, -4.8134765625, -4.228515625, -3.6435546875, -3.05859375, -2.4736328125, -1.888671875, -1.3037109375, -0.71875, -0.1337890625, 0.451171875, 1.0361328125, 1.62109375, 2.2060546875, 2.791015625, 3.3759765625, 3.9609375, 4.5458984375, 5.130859375, 5.7158203125, 6.30078125, 6.8857421875, 7.470703125, 8.0556640625, 8.640625, 9.2255859375, 9.810546875, 10.3955078125, 10.98046875, 11.5654296875, 12.150390625, 12.7353515625, 13.3203125, 13.9052734375, 14.490234375, 15.0751953125, 15.66015625, 16.2451171875, 16.830078125, 17.4150390625, 18.0]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 4.0, 11.0, 9.0, 12.0, 20.0, 19.0, 37.0, 48.0, 57.0, 83.0, 127.0, 157.0, 220.0, 370.0, 473.0, 724.0, 1042.0, 1647.0, 2476.0, 4712.0, 10504.0, 37189.0, 272088.0, 608668.0, 75917.0, 16479.0, 6354.0, 3186.0, 1974.0, 1226.0, 821.0, 544.0, 392.0, 277.0, 199.0, 146.0, 80.0, 75.0, 48.0, 41.0, 30.0, 27.0, 14.0, 3.0, 4.0, 13.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-33.8125, -32.794189453125, -31.77587890625, -30.757568359375, -29.7392578125, -28.720947265625, -27.70263671875, -26.684326171875, -25.666015625, -24.647705078125, -23.62939453125, -22.611083984375, -21.5927734375, -20.574462890625, -19.55615234375, -18.537841796875, -17.51953125, -16.501220703125, -15.48291015625, -14.464599609375, -13.4462890625, -12.427978515625, -11.40966796875, -10.391357421875, -9.373046875, -8.354736328125, -7.33642578125, -6.318115234375, -5.2998046875, -4.281494140625, -3.26318359375, -2.244873046875, -1.2265625, -0.208251953125, 0.81005859375, 1.828369140625, 2.8466796875, 3.864990234375, 4.88330078125, 5.901611328125, 6.919921875, 7.938232421875, 8.95654296875, 9.974853515625, 10.9931640625, 12.011474609375, 13.02978515625, 14.048095703125, 15.06640625, 16.084716796875, 17.10302734375, 18.121337890625, 19.1396484375, 20.157958984375, 21.17626953125, 22.194580078125, 23.212890625, 24.231201171875, 25.24951171875, 26.267822265625, 27.2861328125, 28.304443359375, 29.32275390625, 30.341064453125, 31.359375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 4.0, 4.0, 6.0, 11.0, 15.0, 12.0, 10.0, 21.0, 29.0, 23.0, 43.0, 23.0, 33.0, 30.0, 48.0, 55.0, 77.0, 165.0, 1599.0, 252.0, 99.0, 68.0, 74.0, 48.0, 35.0, 41.0, 35.0, 34.0, 24.0, 21.0, 14.0, 19.0, 8.0, 11.0, 6.0, 15.0, 9.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-36.84375, -35.71484375, -34.5859375, -33.45703125, -32.328125, -31.19921875, -30.0703125, -28.94140625, -27.8125, -26.68359375, -25.5546875, -24.42578125, -23.296875, -22.16796875, -21.0390625, -19.91015625, -18.78125, -17.65234375, -16.5234375, -15.39453125, -14.265625, -13.13671875, -12.0078125, -10.87890625, -9.75, -8.62109375, -7.4921875, -6.36328125, -5.234375, -4.10546875, -2.9765625, -1.84765625, -0.71875, 0.41015625, 1.5390625, 2.66796875, 3.796875, 4.92578125, 6.0546875, 7.18359375, 8.3125, 9.44140625, 10.5703125, 11.69921875, 12.828125, 13.95703125, 15.0859375, 16.21484375, 17.34375, 18.47265625, 19.6015625, 20.73046875, 21.859375, 22.98828125, 24.1171875, 25.24609375, 26.375, 27.50390625, 28.6328125, 29.76171875, 30.890625, 32.01953125, 33.1484375, 34.27734375, 35.40625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 10.0, 11.0, 5.0, 17.0, 11.0, 16.0, 21.0, 33.0, 47.0, 61.0, 98.0, 157.0, 270.0, 564.0, 1626.0, 263323.0, 2875949.0, 2103.0, 603.0, 268.0, 166.0, 97.0, 62.0, 32.0, 29.0, 19.0, 15.0, 20.0, 9.0, 15.0, 14.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-144.125, -139.16796875, -134.2109375, -129.25390625, -124.296875, -119.33984375, -114.3828125, -109.42578125, -104.46875, -99.51171875, -94.5546875, -89.59765625, -84.640625, -79.68359375, -74.7265625, -69.76953125, -64.8125, -59.85546875, -54.8984375, -49.94140625, -44.984375, -40.02734375, -35.0703125, -30.11328125, -25.15625, -20.19921875, -15.2421875, -10.28515625, -5.328125, -0.37109375, 4.5859375, 9.54296875, 14.5, 19.45703125, 24.4140625, 29.37109375, 34.328125, 39.28515625, 44.2421875, 49.19921875, 54.15625, 59.11328125, 64.0703125, 69.02734375, 73.984375, 78.94140625, 83.8984375, 88.85546875, 93.8125, 98.76953125, 103.7265625, 108.68359375, 113.640625, 118.59765625, 123.5546875, 128.51171875, 133.46875, 138.42578125, 143.3828125, 148.33984375, 153.296875, 158.25390625, 163.2109375, 168.16796875, 173.125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 41.0, 250.0, 466.0, 196.0, 35.0, 14.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-224.83074951171875, -218.1095428466797, -211.38832092285156, -204.6671142578125, -197.94589233398438, -191.2246856689453, -184.50347900390625, -177.78225708007812, -171.06105041503906, -164.33984375, -157.61862182617188, -150.8974151611328, -144.17620849609375, -137.45498657226562, -130.73377990722656, -124.01256561279297, -117.29135131835938, -110.57013702392578, -103.84892272949219, -97.12771606445312, -90.40650177001953, -83.68528747558594, -76.96408081054688, -70.24286651611328, -63.52165222167969, -56.800437927246094, -50.079227447509766, -43.35801696777344, -36.636802673339844, -29.91558837890625, -23.194377899169922, -16.473167419433594, -9.751968383789062, -3.0307559967041016, 3.6904563903808594, 10.41166877746582, 17.13288116455078, 23.854095458984375, 30.575305938720703, 37.29651641845703, 44.017730712890625, 50.73894500732422, 57.46015548706055, 64.18136596679688, 70.90258026123047, 77.62379455566406, 84.34500122070312, 91.06621551513672, 97.78742980957031, 104.5086441040039, 111.2298583984375, 117.95106506347656, 124.67227935791016, 131.39349365234375, 138.1147003173828, 144.83590698242188, 151.55712890625, 158.27833557128906, 164.9995574951172, 171.72076416015625, 178.44198608398438, 185.16319274902344, 191.8843994140625, 198.60562133789062, 205.3268280029297]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 7.0, 7.0, 7.0, 6.0, 8.0, 8.0, 14.0, 8.0, 19.0, 17.0, 19.0, 16.0, 22.0, 28.0, 31.0, 37.0, 44.0, 38.0, 47.0, 43.0, 47.0, 46.0, 53.0, 40.0, 46.0, 36.0, 41.0, 27.0, 31.0, 31.0, 20.0, 27.0, 24.0, 18.0, 16.0, 20.0, 9.0, 12.0, 9.0, 6.0, 8.0, 4.0, 2.0, 0.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.90000915527344, -89.84323120117188, -86.78644561767578, -83.72966766357422, -80.67288208007812, -77.61610412597656, -74.55931854248047, -71.5025405883789, -68.44575500488281, -65.38897705078125, -62.332191467285156, -59.27540969848633, -56.2186279296875, -53.16184616088867, -50.105064392089844, -47.04828643798828, -43.99150466918945, -40.934722900390625, -37.8779411315918, -34.82115936279297, -31.76437759399414, -28.707595825195312, -25.650815963745117, -22.59403419494629, -19.53725242614746, -16.480470657348633, -13.423688888549805, -10.366908073425293, -7.310126304626465, -4.253344535827637, -1.196563720703125, 1.8602180480957031, 4.916999816894531, 7.973781585693359, 11.030563354492188, 14.0873441696167, 17.144126892089844, 20.200908660888672, 23.257688522338867, 26.314470291137695, 29.371252059936523, 32.42803192138672, 35.48481369018555, 38.541595458984375, 41.5983772277832, 44.65515899658203, 47.71194076538086, 50.76872253417969, 53.825504302978516, 56.882286071777344, 59.93906784057617, 62.995849609375, 66.05262756347656, 69.10941314697266, 72.16619110107422, 75.22297668457031, 78.27975463867188, 81.33653259277344, 84.39331817626953, 87.4500961303711, 90.50688171386719, 93.56365966796875, 96.62044525146484, 99.6772232055664, 102.7340087890625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 8.0, 9.0, 11.0, 13.0, 23.0, 25.0, 16.0, 23.0, 33.0, 30.0, 28.0, 25.0, 42.0, 38.0, 41.0, 52.0, 48.0, 41.0, 63.0, 36.0, 54.0, 41.0, 34.0, 38.0, 30.0, 23.0, 25.0, 24.0, 23.0, 10.0, 19.0, 13.0, 14.0, 11.0, 7.0, 5.0, 4.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.234375, -18.65576171875, -18.0771484375, -17.49853515625, -16.919921875, -16.34130859375, -15.7626953125, -15.18408203125, -14.60546875, -14.02685546875, -13.4482421875, -12.86962890625, -12.291015625, -11.71240234375, -11.1337890625, -10.55517578125, -9.9765625, -9.39794921875, -8.8193359375, -8.24072265625, -7.662109375, -7.08349609375, -6.5048828125, -5.92626953125, -5.34765625, -4.76904296875, -4.1904296875, -3.61181640625, -3.033203125, -2.45458984375, -1.8759765625, -1.29736328125, -0.71875, -0.14013671875, 0.4384765625, 1.01708984375, 1.595703125, 2.17431640625, 2.7529296875, 3.33154296875, 3.91015625, 4.48876953125, 5.0673828125, 5.64599609375, 6.224609375, 6.80322265625, 7.3818359375, 7.96044921875, 8.5390625, 9.11767578125, 9.6962890625, 10.27490234375, 10.853515625, 11.43212890625, 12.0107421875, 12.58935546875, 13.16796875, 13.74658203125, 14.3251953125, 14.90380859375, 15.482421875, 16.06103515625, 16.6396484375, 17.21826171875, 17.796875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 9.0, 13.0, 5.0, 15.0, 21.0, 21.0, 36.0, 53.0, 74.0, 106.0, 144.0, 162.0, 296.0, 418.0, 633.0, 1145.0, 2125.0, 5014.0, 15315.0, 165816.0, 3441290.0, 524654.0, 24264.0, 6603.0, 2576.0, 1335.0, 703.0, 410.0, 305.0, 238.0, 128.0, 104.0, 57.0, 55.0, 27.0, 23.0, 32.0, 17.0, 8.0, 13.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.40625, -57.529296875, -55.65234375, -53.775390625, -51.8984375, -50.021484375, -48.14453125, -46.267578125, -44.390625, -42.513671875, -40.63671875, -38.759765625, -36.8828125, -35.005859375, -33.12890625, -31.251953125, -29.375, -27.498046875, -25.62109375, -23.744140625, -21.8671875, -19.990234375, -18.11328125, -16.236328125, -14.359375, -12.482421875, -10.60546875, -8.728515625, -6.8515625, -4.974609375, -3.09765625, -1.220703125, 0.65625, 2.533203125, 4.41015625, 6.287109375, 8.1640625, 10.041015625, 11.91796875, 13.794921875, 15.671875, 17.548828125, 19.42578125, 21.302734375, 23.1796875, 25.056640625, 26.93359375, 28.810546875, 30.6875, 32.564453125, 34.44140625, 36.318359375, 38.1953125, 40.072265625, 41.94921875, 43.826171875, 45.703125, 47.580078125, 49.45703125, 51.333984375, 53.2109375, 55.087890625, 56.96484375, 58.841796875, 60.71875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 4.0, 6.0, 4.0, 10.0, 12.0, 7.0, 11.0, 27.0, 14.0, 16.0, 34.0, 38.0, 49.0, 65.0, 103.0, 121.0, 197.0, 294.0, 530.0, 742.0, 619.0, 375.0, 256.0, 151.0, 90.0, 79.0, 53.0, 44.0, 29.0, 22.0, 17.0, 14.0, 8.0, 7.0, 7.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.53125, -28.5673828125, -27.603515625, -26.6396484375, -25.67578125, -24.7119140625, -23.748046875, -22.7841796875, -21.8203125, -20.8564453125, -19.892578125, -18.9287109375, -17.96484375, -17.0009765625, -16.037109375, -15.0732421875, -14.109375, -13.1455078125, -12.181640625, -11.2177734375, -10.25390625, -9.2900390625, -8.326171875, -7.3623046875, -6.3984375, -5.4345703125, -4.470703125, -3.5068359375, -2.54296875, -1.5791015625, -0.615234375, 0.3486328125, 1.3125, 2.2763671875, 3.240234375, 4.2041015625, 5.16796875, 6.1318359375, 7.095703125, 8.0595703125, 9.0234375, 9.9873046875, 10.951171875, 11.9150390625, 12.87890625, 13.8427734375, 14.806640625, 15.7705078125, 16.734375, 17.6982421875, 18.662109375, 19.6259765625, 20.58984375, 21.5537109375, 22.517578125, 23.4814453125, 24.4453125, 25.4091796875, 26.373046875, 27.3369140625, 28.30078125, 29.2646484375, 30.228515625, 31.1923828125, 32.15625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 6.0, 7.0, 11.0, 16.0, 20.0, 34.0, 48.0, 73.0, 129.0, 204.0, 373.0, 763.0, 1420.0, 2985.0, 6859.0, 17269.0, 53578.0, 331777.0, 3439139.0, 264005.0, 47595.0, 15713.0, 6299.0, 2913.0, 1381.0, 715.0, 371.0, 208.0, 126.0, 70.0, 53.0, 34.0, 21.0, 21.0, 13.0, 8.0, 5.0, 1.0, 4.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-50.96875, -49.3984375, -47.828125, -46.2578125, -44.6875, -43.1171875, -41.546875, -39.9765625, -38.40625, -36.8359375, -35.265625, -33.6953125, -32.125, -30.5546875, -28.984375, -27.4140625, -25.84375, -24.2734375, -22.703125, -21.1328125, -19.5625, -17.9921875, -16.421875, -14.8515625, -13.28125, -11.7109375, -10.140625, -8.5703125, -7.0, -5.4296875, -3.859375, -2.2890625, -0.71875, 0.8515625, 2.421875, 3.9921875, 5.5625, 7.1328125, 8.703125, 10.2734375, 11.84375, 13.4140625, 14.984375, 16.5546875, 18.125, 19.6953125, 21.265625, 22.8359375, 24.40625, 25.9765625, 27.546875, 29.1171875, 30.6875, 32.2578125, 33.828125, 35.3984375, 36.96875, 38.5390625, 40.109375, 41.6796875, 43.25, 44.8203125, 46.390625, 47.9609375, 49.53125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [7.0, 11.0, 30.0, 154.0, 541.0, 228.0, 36.0, 10.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.45288848876953, -64.00987243652344, -46.56685256958008, -29.12383270263672, -11.680816650390625, 5.762199401855469, 23.205223083496094, 40.64823913574219, 58.09125518798828, 75.53427124023438, 92.977294921875, 110.4203109741211, 127.86332702636719, 145.30633544921875, 162.74935913085938, 180.1923828125, 197.63540649414062, 215.07843017578125, 232.5214385986328, 249.96446228027344, 267.407470703125, 284.8504943847656, 302.29351806640625, 319.7365417480469, 337.1795349121094, 354.62255859375, 372.0655822753906, 389.50860595703125, 406.95159912109375, 424.3946228027344, 441.837646484375, 459.2806701660156, 476.72369384765625, 494.1667175292969, 511.6097412109375, 529.052734375, 546.4957885742188, 563.9387817382812, 581.3818359375, 598.8248291015625, 616.267822265625, 633.7108154296875, 651.1538696289062, 668.5968627929688, 686.0399169921875, 703.48291015625, 720.9259033203125, 738.3689575195312, 755.81201171875, 773.2550048828125, 790.6980590820312, 808.1410522460938, 825.5841064453125, 843.027099609375, 860.4700927734375, 877.9131469726562, 895.3561401367188, 912.7991333007812, 930.2421875, 947.6851806640625, 965.1282348632812, 982.5712280273438, 1000.0142822265625, 1017.457275390625, 1034.9002685546875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 1.0, 4.0, 6.0, 8.0, 14.0, 9.0, 13.0, 17.0, 18.0, 12.0, 21.0, 19.0, 35.0, 24.0, 30.0, 47.0, 36.0, 39.0, 41.0, 38.0, 44.0, 42.0, 40.0, 37.0, 39.0, 28.0, 30.0, 31.0, 32.0, 30.0, 33.0, 28.0, 21.0, 23.0, 13.0, 18.0, 15.0, 12.0, 7.0, 11.0, 11.0, 6.0, 5.0, 2.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-104.64703369140625, -101.5959701538086, -98.54490661621094, -95.49384307861328, -92.44277954101562, -89.39170837402344, -86.34064483642578, -83.28958129882812, -80.23851776123047, -77.18745422363281, -74.13639068603516, -71.0853271484375, -68.03425598144531, -64.98319244384766, -61.93212890625, -58.881065368652344, -55.83000183105469, -52.77893829345703, -49.727874755859375, -46.67680740356445, -43.6257438659668, -40.57468032836914, -37.52361297607422, -34.47254943847656, -31.421485900878906, -28.37042236328125, -25.31935691833496, -22.268291473388672, -19.217227935791016, -16.16616439819336, -13.11509895324707, -10.064033508300781, -7.012977600097656, -3.9619131088256836, -0.9108486175537109, 2.1402158737182617, 5.191280364990234, 8.242344856262207, 11.29340934753418, 14.344474792480469, 17.395538330078125, 20.44660186767578, 23.49766731262207, 26.54873275756836, 29.599796295166016, 32.65085983276367, 35.701927185058594, 38.75299072265625, 41.804054260253906, 44.85511779785156, 47.90618133544922, 50.95724868774414, 54.0083122253418, 57.05937576293945, 60.110443115234375, 63.16150665283203, 66.21257019042969, 69.26363372802734, 72.314697265625, 75.36576080322266, 78.41682434082031, 81.4678955078125, 84.51895904541016, 87.57002258300781, 90.62108612060547]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 6.0, 7.0, 13.0, 7.0, 11.0, 16.0, 12.0, 21.0, 25.0, 27.0, 34.0, 27.0, 27.0, 29.0, 46.0, 47.0, 54.0, 34.0, 40.0, 43.0, 34.0, 42.0, 41.0, 45.0, 31.0, 27.0, 29.0, 35.0, 28.0, 14.0, 20.0, 18.0, 16.0, 22.0, 12.0, 13.0, 7.0, 11.0, 6.0, 5.0, 7.0, 1.0, 1.0, 6.0, 2.0, 2.0, 1.0], "bins": [-16.484375, -16.031982421875, -15.57958984375, -15.127197265625, -14.6748046875, -14.222412109375, -13.77001953125, -13.317626953125, -12.865234375, -12.412841796875, -11.96044921875, -11.508056640625, -11.0556640625, -10.603271484375, -10.15087890625, -9.698486328125, -9.24609375, -8.793701171875, -8.34130859375, -7.888916015625, -7.4365234375, -6.984130859375, -6.53173828125, -6.079345703125, -5.626953125, -5.174560546875, -4.72216796875, -4.269775390625, -3.8173828125, -3.364990234375, -2.91259765625, -2.460205078125, -2.0078125, -1.555419921875, -1.10302734375, -0.650634765625, -0.1982421875, 0.254150390625, 0.70654296875, 1.158935546875, 1.611328125, 2.063720703125, 2.51611328125, 2.968505859375, 3.4208984375, 3.873291015625, 4.32568359375, 4.778076171875, 5.23046875, 5.682861328125, 6.13525390625, 6.587646484375, 7.0400390625, 7.492431640625, 7.94482421875, 8.397216796875, 8.849609375, 9.302001953125, 9.75439453125, 10.206787109375, 10.6591796875, 11.111572265625, 11.56396484375, 12.016357421875, 12.46875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 6.0, 9.0, 9.0, 16.0, 23.0, 32.0, 43.0, 64.0, 69.0, 106.0, 158.0, 220.0, 336.0, 401.0, 636.0, 868.0, 1219.0, 1773.0, 2450.0, 3421.0, 4995.0, 7503.0, 10808.0, 16294.0, 25545.0, 40969.0, 68014.0, 115877.0, 190097.0, 208026.0, 135451.0, 79268.0, 47248.0, 28878.0, 18615.0, 12172.0, 8079.0, 5680.0, 3843.0, 2708.0, 1916.0, 1384.0, 975.0, 712.0, 462.0, 340.0, 242.0, 152.0, 115.0, 92.0, 74.0, 67.0, 31.0, 35.0, 18.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 3.0], "bins": [-1.1904296875, -1.1522064208984375, -1.113983154296875, -1.0757598876953125, -1.03753662109375, -0.9993133544921875, -0.961090087890625, -0.9228668212890625, -0.8846435546875, -0.8464202880859375, -0.808197021484375, -0.7699737548828125, -0.73175048828125, -0.6935272216796875, -0.655303955078125, -0.6170806884765625, -0.578857421875, -0.5406341552734375, -0.502410888671875, -0.4641876220703125, -0.42596435546875, -0.3877410888671875, -0.349517822265625, -0.3112945556640625, -0.2730712890625, -0.2348480224609375, -0.196624755859375, -0.1584014892578125, -0.12017822265625, -0.0819549560546875, -0.043731689453125, -0.0055084228515625, 0.03271484375, 0.0709381103515625, 0.109161376953125, 0.1473846435546875, 0.18560791015625, 0.2238311767578125, 0.262054443359375, 0.3002777099609375, 0.3385009765625, 0.3767242431640625, 0.414947509765625, 0.4531707763671875, 0.49139404296875, 0.5296173095703125, 0.567840576171875, 0.6060638427734375, 0.644287109375, 0.6825103759765625, 0.720733642578125, 0.7589569091796875, 0.79718017578125, 0.8354034423828125, 0.873626708984375, 0.9118499755859375, 0.9500732421875, 0.9882965087890625, 1.026519775390625, 1.0647430419921875, 1.10296630859375, 1.1411895751953125, 1.179412841796875, 1.2176361083984375, 1.255859375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 4.0, 3.0, 4.0, 2.0, 4.0, 5.0, 8.0, 7.0, 9.0, 15.0, 16.0, 16.0, 18.0, 25.0, 30.0, 19.0, 30.0, 20.0, 40.0, 29.0, 41.0, 44.0, 38.0, 35.0, 36.0, 1067.0, 32.0, 40.0, 38.0, 32.0, 35.0, 27.0, 28.0, 27.0, 31.0, 29.0, 26.0, 24.0, 18.0, 14.0, 20.0, 13.0, 6.0, 5.0, 8.0, 7.0, 4.0, 0.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.89453125, -7.61505126953125, -7.3355712890625, -7.05609130859375, -6.776611328125, -6.49713134765625, -6.2176513671875, -5.93817138671875, -5.65869140625, -5.37921142578125, -5.0997314453125, -4.82025146484375, -4.540771484375, -4.26129150390625, -3.9818115234375, -3.70233154296875, -3.4228515625, -3.14337158203125, -2.8638916015625, -2.58441162109375, -2.304931640625, -2.02545166015625, -1.7459716796875, -1.46649169921875, -1.18701171875, -0.90753173828125, -0.6280517578125, -0.34857177734375, -0.069091796875, 0.21038818359375, 0.4898681640625, 0.76934814453125, 1.048828125, 1.32830810546875, 1.6077880859375, 1.88726806640625, 2.166748046875, 2.44622802734375, 2.7257080078125, 3.00518798828125, 3.28466796875, 3.56414794921875, 3.8436279296875, 4.12310791015625, 4.402587890625, 4.68206787109375, 4.9615478515625, 5.24102783203125, 5.5205078125, 5.79998779296875, 6.0794677734375, 6.35894775390625, 6.638427734375, 6.91790771484375, 7.1973876953125, 7.47686767578125, 7.75634765625, 8.03582763671875, 8.3153076171875, 8.59478759765625, 8.874267578125, 9.15374755859375, 9.4332275390625, 9.71270751953125, 9.9921875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 10.0, 9.0, 12.0, 29.0, 43.0, 85.0, 86.0, 176.0, 237.0, 347.0, 554.0, 869.0, 1271.0, 1965.0, 2933.0, 4677.0, 7070.0, 11015.0, 17273.0, 27320.0, 44258.0, 75096.0, 128919.0, 991983.0, 463480.0, 125859.0, 73787.0, 43609.0, 26605.0, 16813.0, 10748.0, 6813.0, 4598.0, 3052.0, 1876.0, 1256.0, 806.0, 603.0, 323.0, 219.0, 158.0, 101.0, 59.0, 44.0, 31.0, 26.0, 7.0, 12.0, 4.0, 4.0, 3.0, 1.0, 3.0], "bins": [-1.029296875, -0.9998703002929688, -0.9704437255859375, -0.9410171508789062, -0.911590576171875, -0.8821640014648438, -0.8527374267578125, -0.8233108520507812, -0.79388427734375, -0.7644577026367188, -0.7350311279296875, -0.7056045532226562, -0.676177978515625, -0.6467514038085938, -0.6173248291015625, -0.5878982543945312, -0.5584716796875, -0.5290451049804688, -0.4996185302734375, -0.47019195556640625, -0.440765380859375, -0.41133880615234375, -0.3819122314453125, -0.35248565673828125, -0.32305908203125, -0.29363250732421875, -0.2642059326171875, -0.23477935791015625, -0.205352783203125, -0.17592620849609375, -0.1464996337890625, -0.11707305908203125, -0.087646484375, -0.05821990966796875, -0.0287933349609375, 0.00063323974609375, 0.030059814453125, 0.05948638916015625, 0.0889129638671875, 0.11833953857421875, 0.14776611328125, 0.17719268798828125, 0.2066192626953125, 0.23604583740234375, 0.265472412109375, 0.29489898681640625, 0.3243255615234375, 0.35375213623046875, 0.3831787109375, 0.41260528564453125, 0.4420318603515625, 0.47145843505859375, 0.500885009765625, 0.5303115844726562, 0.5597381591796875, 0.5891647338867188, 0.61859130859375, 0.6480178833007812, 0.6774444580078125, 0.7068710327148438, 0.736297607421875, 0.7657241821289062, 0.7951507568359375, 0.8245773315429688, 0.85400390625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 6.0, 7.0, 4.0, 10.0, 8.0, 9.0, 17.0, 16.0, 19.0, 29.0, 53.0, 67.0, 94.0, 121.0, 128.0, 99.0, 82.0, 65.0, 38.0, 33.0, 19.0, 13.0, 11.0, 3.0, 6.0, 3.0, 3.0, 3.0, 7.0, 3.0, 1.0, 3.0, 1.0, 6.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031494140625, -0.03055095672607422, -0.029607772827148438, -0.028664588928222656, -0.027721405029296875, -0.026778221130371094, -0.025835037231445312, -0.02489185333251953, -0.02394866943359375, -0.02300548553466797, -0.022062301635742188, -0.021119117736816406, -0.020175933837890625, -0.019232749938964844, -0.018289566040039062, -0.01734638214111328, -0.0164031982421875, -0.015460014343261719, -0.014516830444335938, -0.013573646545410156, -0.012630462646484375, -0.011687278747558594, -0.010744094848632812, -0.009800910949707031, -0.00885772705078125, -0.007914543151855469, -0.0069713592529296875, -0.006028175354003906, -0.005084991455078125, -0.004141807556152344, -0.0031986236572265625, -0.0022554397583007812, -0.001312255859375, -0.00036907196044921875, 0.0005741119384765625, 0.0015172958374023438, 0.002460479736328125, 0.0034036636352539062, 0.0043468475341796875, 0.005290031433105469, 0.00623321533203125, 0.007176399230957031, 0.008119583129882812, 0.009062767028808594, 0.010005950927734375, 0.010949134826660156, 0.011892318725585938, 0.012835502624511719, 0.0137786865234375, 0.014721870422363281, 0.015665054321289062, 0.016608238220214844, 0.017551422119140625, 0.018494606018066406, 0.019437789916992188, 0.02038097381591797, 0.02132415771484375, 0.02226734161376953, 0.023210525512695312, 0.024153709411621094, 0.025096893310546875, 0.026040077209472656, 0.026983261108398438, 0.02792644500732422, 0.02886962890625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 5.0, 5.0, 7.0, 8.0, 5.0, 11.0, 8.0, 11.0, 13.0, 21.0, 27.0, 40.0, 65.0, 120.0, 178.0, 361.0, 1271.0, 187414.0, 855840.0, 2070.0, 431.0, 218.0, 104.0, 63.0, 51.0, 48.0, 33.0, 21.0, 14.0, 17.0, 13.0, 8.0, 7.0, 7.0, 5.0, 2.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.591796875, -0.5727615356445312, -0.5537261962890625, -0.5346908569335938, -0.515655517578125, -0.49662017822265625, -0.4775848388671875, -0.45854949951171875, -0.43951416015625, -0.42047882080078125, -0.4014434814453125, -0.38240814208984375, -0.363372802734375, -0.34433746337890625, -0.3253021240234375, -0.30626678466796875, -0.2872314453125, -0.26819610595703125, -0.2491607666015625, -0.23012542724609375, -0.211090087890625, -0.19205474853515625, -0.1730194091796875, -0.15398406982421875, -0.13494873046875, -0.11591339111328125, -0.0968780517578125, -0.07784271240234375, -0.058807373046875, -0.03977203369140625, -0.0207366943359375, -0.00170135498046875, 0.017333984375, 0.03636932373046875, 0.0554046630859375, 0.07444000244140625, 0.093475341796875, 0.11251068115234375, 0.1315460205078125, 0.15058135986328125, 0.16961669921875, 0.18865203857421875, 0.2076873779296875, 0.22672271728515625, 0.245758056640625, 0.26479339599609375, 0.2838287353515625, 0.30286407470703125, 0.3218994140625, 0.34093475341796875, 0.3599700927734375, 0.37900543212890625, 0.398040771484375, 0.41707611083984375, 0.4361114501953125, 0.45514678955078125, 0.47418212890625, 0.49321746826171875, 0.5122528076171875, 0.5312881469726562, 0.550323486328125, 0.5693588256835938, 0.5883941650390625, 0.6074295043945312, 0.62646484375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 18.0, 88.0, 633.0, 237.0, 29.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15334580838680267, -0.14595602452754974, -0.138566255569458, -0.13117647171020508, -0.12378668785095215, -0.11639690399169922, -0.10900712758302689, -0.10161735117435455, -0.09422756731510162, -0.0868377834558487, -0.07944800704717636, -0.07205823063850403, -0.0646684467792511, -0.05727866664528847, -0.049888886511325836, -0.042499106377363205, -0.035109326243400574, -0.027719546109437943, -0.02032976597547531, -0.01293998584151268, -0.005550205707550049, 0.0018395744264125824, 0.009229354560375214, 0.016619134694337845, 0.024008914828300476, 0.03139869496226311, 0.03878847509622574, 0.04617825523018837, 0.053568035364151, 0.06095781549811363, 0.06834759563207626, 0.0757373720407486, 0.08312717080116272, 0.09051695466041565, 0.09790673106908798, 0.10529650747776031, 0.11268629133701324, 0.12007607519626617, 0.1274658441543579, 0.13485562801361084, 0.14224541187286377, 0.1496351957321167, 0.15702497959136963, 0.16441474854946136, 0.1718045324087143, 0.17919431626796722, 0.18658408522605896, 0.1939738690853119, 0.20136365294456482, 0.20875343680381775, 0.21614322066307068, 0.22353298962116241, 0.23092277348041534, 0.23831255733966827, 0.24570232629776, 0.25309211015701294, 0.26048189401626587, 0.2678716778755188, 0.27526146173477173, 0.28265124559402466, 0.2900410294532776, 0.29743078351020813, 0.30482056736946106, 0.312210351228714, 0.3196001350879669]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 5.0, 7.0, 5.0, 11.0, 5.0, 9.0, 11.0, 15.0, 20.0, 14.0, 17.0, 23.0, 25.0, 32.0, 30.0, 37.0, 40.0, 47.0, 53.0, 50.0, 32.0, 50.0, 36.0, 35.0, 45.0, 44.0, 38.0, 31.0, 28.0, 32.0, 34.0, 30.0, 19.0, 15.0, 15.0, 19.0, 13.0, 9.0, 4.0, 11.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.03445249795913696, -0.033480700105428696, -0.03250890225172043, -0.03153710812330246, -0.030565310269594193, -0.029593512415885925, -0.028621716424822807, -0.02764992043375969, -0.026678122580051422, -0.025706324726343155, -0.024734528735280037, -0.02376273274421692, -0.02279093489050865, -0.021819137036800385, -0.020847341045737267, -0.01987554505467415, -0.01890374720096588, -0.017931949347257614, -0.016960153356194496, -0.015988357365131378, -0.015016559511423111, -0.014044762589037418, -0.013072965666651726, -0.012101168744266033, -0.01112937182188034, -0.010157574899494648, -0.009185777977108955, -0.008213981054723263, -0.00724218413233757, -0.006270387209951878, -0.005298590287566185, -0.004326793365180492, -0.0033549964427948, -0.002383199520409107, -0.0014114025980234146, -0.000439605675637722, 0.0005321912467479706, 0.0015039881691336632, 0.0024757850915193558, 0.0034475820139050484, 0.004419378936290741, 0.0053911758586764336, 0.006362972781062126, 0.007334769703447819, 0.008306566625833511, 0.009278363548219204, 0.010250160470604897, 0.01122195739299059, 0.012193754315376282, 0.013165551237761974, 0.014137348160147667, 0.01510914508253336, 0.016080942004919052, 0.01705273985862732, 0.018024535849690437, 0.018996331840753555, 0.019968129694461823, 0.02093992754817009, 0.021911723539233208, 0.022883519530296326, 0.023855317384004593, 0.02482711523771286, 0.025798911228775978, 0.026770707219839096, 0.027742505073547363]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 6.0, 7.0, 13.0, 7.0, 11.0, 16.0, 12.0, 21.0, 25.0, 28.0, 35.0, 25.0, 29.0, 28.0, 46.0, 47.0, 54.0, 33.0, 40.0, 43.0, 34.0, 42.0, 41.0, 46.0, 30.0, 27.0, 29.0, 36.0, 27.0, 14.0, 20.0, 18.0, 16.0, 22.0, 12.0, 13.0, 7.0, 11.0, 6.0, 5.0, 7.0, 1.0, 1.0, 6.0, 2.0, 2.0, 1.0], "bins": [-16.46875, -16.0166015625, -15.564453125, -15.1123046875, -14.66015625, -14.2080078125, -13.755859375, -13.3037109375, -12.8515625, -12.3994140625, -11.947265625, -11.4951171875, -11.04296875, -10.5908203125, -10.138671875, -9.6865234375, -9.234375, -8.7822265625, -8.330078125, -7.8779296875, -7.42578125, -6.9736328125, -6.521484375, -6.0693359375, -5.6171875, -5.1650390625, -4.712890625, -4.2607421875, -3.80859375, -3.3564453125, -2.904296875, -2.4521484375, -2.0, -1.5478515625, -1.095703125, -0.6435546875, -0.19140625, 0.2607421875, 0.712890625, 1.1650390625, 1.6171875, 2.0693359375, 2.521484375, 2.9736328125, 3.42578125, 3.8779296875, 4.330078125, 4.7822265625, 5.234375, 5.6865234375, 6.138671875, 6.5908203125, 7.04296875, 7.4951171875, 7.947265625, 8.3994140625, 8.8515625, 9.3037109375, 9.755859375, 10.2080078125, 10.66015625, 11.1123046875, 11.564453125, 12.0166015625, 12.46875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 4.0, 4.0, 6.0, 4.0, 13.0, 17.0, 23.0, 19.0, 39.0, 44.0, 70.0, 106.0, 162.0, 163.0, 290.0, 403.0, 596.0, 922.0, 1416.0, 2101.0, 3629.0, 6746.0, 16619.0, 97672.0, 787589.0, 96610.0, 16574.0, 6632.0, 3565.0, 2215.0, 1434.0, 919.0, 602.0, 418.0, 264.0, 198.0, 136.0, 101.0, 66.0, 38.0, 33.0, 22.0, 29.0, 15.0, 9.0, 8.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.78125, -34.47998046875, -33.1787109375, -31.87744140625, -30.576171875, -29.27490234375, -27.9736328125, -26.67236328125, -25.37109375, -24.06982421875, -22.7685546875, -21.46728515625, -20.166015625, -18.86474609375, -17.5634765625, -16.26220703125, -14.9609375, -13.65966796875, -12.3583984375, -11.05712890625, -9.755859375, -8.45458984375, -7.1533203125, -5.85205078125, -4.55078125, -3.24951171875, -1.9482421875, -0.64697265625, 0.654296875, 1.95556640625, 3.2568359375, 4.55810546875, 5.859375, 7.16064453125, 8.4619140625, 9.76318359375, 11.064453125, 12.36572265625, 13.6669921875, 14.96826171875, 16.26953125, 17.57080078125, 18.8720703125, 20.17333984375, 21.474609375, 22.77587890625, 24.0771484375, 25.37841796875, 26.6796875, 27.98095703125, 29.2822265625, 30.58349609375, 31.884765625, 33.18603515625, 34.4873046875, 35.78857421875, 37.08984375, 38.39111328125, 39.6923828125, 40.99365234375, 42.294921875, 43.59619140625, 44.8974609375, 46.19873046875, 47.5]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 6.0, 10.0, 5.0, 19.0, 14.0, 19.0, 19.0, 29.0, 29.0, 34.0, 42.0, 54.0, 61.0, 63.0, 98.0, 142.0, 367.0, 1395.0, 132.0, 81.0, 59.0, 72.0, 46.0, 43.0, 40.0, 30.0, 17.0, 22.0, 22.0, 11.0, 11.0, 5.0, 8.0, 1.0, 5.0, 4.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.28125, -30.303955078125, -29.32666015625, -28.349365234375, -27.3720703125, -26.394775390625, -25.41748046875, -24.440185546875, -23.462890625, -22.485595703125, -21.50830078125, -20.531005859375, -19.5537109375, -18.576416015625, -17.59912109375, -16.621826171875, -15.64453125, -14.667236328125, -13.68994140625, -12.712646484375, -11.7353515625, -10.758056640625, -9.78076171875, -8.803466796875, -7.826171875, -6.848876953125, -5.87158203125, -4.894287109375, -3.9169921875, -2.939697265625, -1.96240234375, -0.985107421875, -0.0078125, 0.969482421875, 1.94677734375, 2.924072265625, 3.9013671875, 4.878662109375, 5.85595703125, 6.833251953125, 7.810546875, 8.787841796875, 9.76513671875, 10.742431640625, 11.7197265625, 12.697021484375, 13.67431640625, 14.651611328125, 15.62890625, 16.606201171875, 17.58349609375, 18.560791015625, 19.5380859375, 20.515380859375, 21.49267578125, 22.469970703125, 23.447265625, 24.424560546875, 25.40185546875, 26.379150390625, 27.3564453125, 28.333740234375, 29.31103515625, 30.288330078125, 31.265625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 7.0, 1.0, 2.0, 14.0, 5.0, 13.0, 20.0, 35.0, 58.0, 55.0, 90.0, 137.0, 300.0, 739.0, 3143.0, 3055820.0, 82441.0, 1569.0, 564.0, 261.0, 138.0, 85.0, 53.0, 44.0, 25.0, 21.0, 16.0, 9.0, 8.0, 4.0, 4.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.75, -128.943359375, -124.13671875, -119.330078125, -114.5234375, -109.716796875, -104.91015625, -100.103515625, -95.296875, -90.490234375, -85.68359375, -80.876953125, -76.0703125, -71.263671875, -66.45703125, -61.650390625, -56.84375, -52.037109375, -47.23046875, -42.423828125, -37.6171875, -32.810546875, -28.00390625, -23.197265625, -18.390625, -13.583984375, -8.77734375, -3.970703125, 0.8359375, 5.642578125, 10.44921875, 15.255859375, 20.0625, 24.869140625, 29.67578125, 34.482421875, 39.2890625, 44.095703125, 48.90234375, 53.708984375, 58.515625, 63.322265625, 68.12890625, 72.935546875, 77.7421875, 82.548828125, 87.35546875, 92.162109375, 96.96875, 101.775390625, 106.58203125, 111.388671875, 116.1953125, 121.001953125, 125.80859375, 130.615234375, 135.421875, 140.228515625, 145.03515625, 149.841796875, 154.6484375, 159.455078125, 164.26171875, 169.068359375, 173.875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 21.0, 32.0, 70.0, 208.0, 307.0, 224.0, 83.0, 37.0, 15.0, 4.0, 7.0], "bins": [-392.7497253417969, -385.93365478515625, -379.11761474609375, -372.3015441894531, -365.4854736328125, -358.66943359375, -351.8533630371094, -345.03729248046875, -338.22125244140625, -331.4051818847656, -324.5891418457031, -317.7730712890625, -310.9570007324219, -304.1409606933594, -297.32489013671875, -290.50885009765625, -283.6927795410156, -276.876708984375, -270.0606689453125, -263.2445983886719, -256.42852783203125, -249.61248779296875, -242.79641723632812, -235.98036193847656, -229.16429138183594, -222.34823608398438, -215.53216552734375, -208.7161102294922, -201.90005493164062, -195.083984375, -188.26792907714844, -181.45187377929688, -174.63580322265625, -167.8197479248047, -161.00367736816406, -154.1876220703125, -147.37156677246094, -140.55551147460938, -133.73944091796875, -126.92338562011719, -120.10733032226562, -113.29126739501953, -106.47521209716797, -99.65914916992188, -92.84309387207031, -86.02703094482422, -79.21096801757812, -72.39491271972656, -65.578857421875, -58.76279830932617, -51.946739196777344, -45.13067626953125, -38.31462097167969, -31.498558044433594, -24.682498931884766, -17.866439819335938, -11.050376892089844, -4.234317302703857, 2.581742286682129, 9.397802352905273, 16.2138614654541, 23.029922485351562, 29.84598159790039, 36.66204071044922, 43.47809982299805]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 8.0, 8.0, 11.0, 20.0, 17.0, 16.0, 13.0, 19.0, 24.0, 30.0, 29.0, 39.0, 32.0, 39.0, 43.0, 32.0, 46.0, 41.0, 42.0, 38.0, 49.0, 38.0, 43.0, 45.0, 37.0, 26.0, 31.0, 25.0, 17.0, 17.0, 25.0, 17.0, 11.0, 9.0, 10.0, 11.0, 9.0, 7.0, 3.0, 5.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.37979888916016, -83.68284606933594, -80.98590087890625, -78.28894805908203, -75.59200286865234, -72.89505004882812, -70.19810485839844, -67.50115203857422, -64.80419921875, -62.10725021362305, -59.410301208496094, -56.713348388671875, -54.01640319824219, -51.31945037841797, -48.622501373291016, -45.92555236816406, -43.228607177734375, -40.53165817260742, -37.83470916748047, -35.13775634765625, -32.44081115722656, -29.743860244750977, -27.04690933227539, -24.349960327148438, -21.653011322021484, -18.95606231689453, -16.259113311767578, -13.562162399291992, -10.865213394165039, -8.168264389038086, -5.4713134765625, -2.774364471435547, -0.077423095703125, 2.6195263862609863, 5.316475868225098, 8.013425827026367, 10.71037483215332, 13.407323837280273, 16.10427474975586, 18.801223754882812, 21.498172760009766, 24.19512176513672, 26.892070770263672, 29.589021682739258, 32.285972595214844, 34.98291778564453, 37.67987060546875, 40.3768196105957, 43.073768615722656, 45.77071762084961, 48.46766662597656, 51.16461944580078, 53.86156463623047, 56.55851745605469, 59.25546646118164, 61.952415466308594, 64.64936828613281, 67.34632110595703, 70.04326629638672, 72.74021911621094, 75.43716430664062, 78.13411712646484, 80.83106994628906, 83.52801513671875, 86.22496032714844]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 11.0, 15.0, 26.0, 19.0, 13.0, 22.0, 25.0, 29.0, 35.0, 43.0, 33.0, 31.0, 39.0, 42.0, 44.0, 35.0, 55.0, 37.0, 47.0, 51.0, 32.0, 33.0, 31.0, 30.0, 24.0, 28.0, 26.0, 27.0, 24.0, 19.0, 17.0, 5.0, 6.0, 8.0, 4.0, 8.0, 6.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.046875, -15.5501708984375, -15.053466796875, -14.5567626953125, -14.06005859375, -13.5633544921875, -13.066650390625, -12.5699462890625, -12.0732421875, -11.5765380859375, -11.079833984375, -10.5831298828125, -10.08642578125, -9.5897216796875, -9.093017578125, -8.5963134765625, -8.099609375, -7.6029052734375, -7.106201171875, -6.6094970703125, -6.11279296875, -5.6160888671875, -5.119384765625, -4.6226806640625, -4.1259765625, -3.6292724609375, -3.132568359375, -2.6358642578125, -2.13916015625, -1.6424560546875, -1.145751953125, -0.6490478515625, -0.15234375, 0.3443603515625, 0.841064453125, 1.3377685546875, 1.83447265625, 2.3311767578125, 2.827880859375, 3.3245849609375, 3.8212890625, 4.3179931640625, 4.814697265625, 5.3114013671875, 5.80810546875, 6.3048095703125, 6.801513671875, 7.2982177734375, 7.794921875, 8.2916259765625, 8.788330078125, 9.2850341796875, 9.78173828125, 10.2784423828125, 10.775146484375, 11.2718505859375, 11.7685546875, 12.2652587890625, 12.761962890625, 13.2586669921875, 13.75537109375, 14.2520751953125, 14.748779296875, 15.2454833984375, 15.7421875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 3.0, 4.0, 10.0, 8.0, 18.0, 20.0, 15.0, 33.0, 38.0, 31.0, 60.0, 64.0, 97.0, 113.0, 153.0, 192.0, 290.0, 424.0, 725.0, 1456.0, 4214.0, 35970.0, 3367529.0, 765848.0, 11419.0, 2571.0, 1054.0, 583.0, 354.0, 240.0, 178.0, 133.0, 92.0, 88.0, 43.0, 46.0, 36.0, 30.0, 30.0, 5.0, 13.0, 14.0, 6.0, 10.0, 6.0, 2.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-73.625, -71.380859375, -69.13671875, -66.892578125, -64.6484375, -62.404296875, -60.16015625, -57.916015625, -55.671875, -53.427734375, -51.18359375, -48.939453125, -46.6953125, -44.451171875, -42.20703125, -39.962890625, -37.71875, -35.474609375, -33.23046875, -30.986328125, -28.7421875, -26.498046875, -24.25390625, -22.009765625, -19.765625, -17.521484375, -15.27734375, -13.033203125, -10.7890625, -8.544921875, -6.30078125, -4.056640625, -1.8125, 0.431640625, 2.67578125, 4.919921875, 7.1640625, 9.408203125, 11.65234375, 13.896484375, 16.140625, 18.384765625, 20.62890625, 22.873046875, 25.1171875, 27.361328125, 29.60546875, 31.849609375, 34.09375, 36.337890625, 38.58203125, 40.826171875, 43.0703125, 45.314453125, 47.55859375, 49.802734375, 52.046875, 54.291015625, 56.53515625, 58.779296875, 61.0234375, 63.267578125, 65.51171875, 67.755859375, 70.0]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 6.0, 13.0, 24.0, 34.0, 66.0, 101.0, 182.0, 302.0, 579.0, 1024.0, 740.0, 417.0, 222.0, 122.0, 78.0, 51.0, 32.0, 23.0, 13.0, 9.0, 3.0, 9.0, 4.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.75, -40.54638671875, -39.3427734375, -38.13916015625, -36.935546875, -35.73193359375, -34.5283203125, -33.32470703125, -32.12109375, -30.91748046875, -29.7138671875, -28.51025390625, -27.306640625, -26.10302734375, -24.8994140625, -23.69580078125, -22.4921875, -21.28857421875, -20.0849609375, -18.88134765625, -17.677734375, -16.47412109375, -15.2705078125, -14.06689453125, -12.86328125, -11.65966796875, -10.4560546875, -9.25244140625, -8.048828125, -6.84521484375, -5.6416015625, -4.43798828125, -3.234375, -2.03076171875, -0.8271484375, 0.37646484375, 1.580078125, 2.78369140625, 3.9873046875, 5.19091796875, 6.39453125, 7.59814453125, 8.8017578125, 10.00537109375, 11.208984375, 12.41259765625, 13.6162109375, 14.81982421875, 16.0234375, 17.22705078125, 18.4306640625, 19.63427734375, 20.837890625, 22.04150390625, 23.2451171875, 24.44873046875, 25.65234375, 26.85595703125, 28.0595703125, 29.26318359375, 30.466796875, 31.67041015625, 32.8740234375, 34.07763671875, 35.28125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 5.0, 10.0, 8.0, 14.0, 21.0, 45.0, 69.0, 100.0, 224.0, 544.0, 1699.0, 8714.0, 174263.0, 3954268.0, 47831.0, 4588.0, 1149.0, 368.0, 164.0, 77.0, 51.0, 26.0, 13.0, 6.0, 9.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.5, -80.6533203125, -77.806640625, -74.9599609375, -72.11328125, -69.2666015625, -66.419921875, -63.5732421875, -60.7265625, -57.8798828125, -55.033203125, -52.1865234375, -49.33984375, -46.4931640625, -43.646484375, -40.7998046875, -37.953125, -35.1064453125, -32.259765625, -29.4130859375, -26.56640625, -23.7197265625, -20.873046875, -18.0263671875, -15.1796875, -12.3330078125, -9.486328125, -6.6396484375, -3.79296875, -0.9462890625, 1.900390625, 4.7470703125, 7.59375, 10.4404296875, 13.287109375, 16.1337890625, 18.98046875, 21.8271484375, 24.673828125, 27.5205078125, 30.3671875, 33.2138671875, 36.060546875, 38.9072265625, 41.75390625, 44.6005859375, 47.447265625, 50.2939453125, 53.140625, 55.9873046875, 58.833984375, 61.6806640625, 64.52734375, 67.3740234375, 70.220703125, 73.0673828125, 75.9140625, 78.7607421875, 81.607421875, 84.4541015625, 87.30078125, 90.1474609375, 92.994140625, 95.8408203125, 98.6875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 11.0, 266.0, 696.0, 35.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1320.40576171875, -1294.0941162109375, -1267.7823486328125, -1241.470703125, -1215.158935546875, -1188.8472900390625, -1162.5355224609375, -1136.223876953125, -1109.912109375, -1083.6004638671875, -1057.2886962890625, -1030.97705078125, -1004.665283203125, -978.3535766601562, -952.0418701171875, -925.7301635742188, -899.41845703125, -873.1067504882812, -846.7950439453125, -820.4833374023438, -794.171630859375, -767.8599243164062, -741.5482177734375, -715.2365112304688, -688.9248657226562, -662.6131591796875, -636.3014526367188, -609.98974609375, -583.6780395507812, -557.3663330078125, -531.0546264648438, -504.742919921875, -478.4312438964844, -452.1195373535156, -425.8078308105469, -399.4961242675781, -373.1844177246094, -346.87274169921875, -320.56103515625, -294.24932861328125, -267.9376220703125, -241.62591552734375, -215.314208984375, -189.00250244140625, -162.6907958984375, -136.3791046142578, -110.06739807128906, -83.75569152832031, -57.4439697265625, -31.132265090942383, -4.820560455322266, 21.49114227294922, 47.80284881591797, 74.11454772949219, 100.42625427246094, 126.73796081542969, 153.04966735839844, 179.3613739013672, 205.67308044433594, 231.98477172851562, 258.2964782714844, 284.6081848144531, 310.9198913574219, 337.2315979003906, 363.5433044433594]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 3.0, 6.0, 8.0, 8.0, 15.0, 16.0, 12.0, 29.0, 23.0, 24.0, 27.0, 25.0, 32.0, 40.0, 33.0, 43.0, 37.0, 44.0, 36.0, 41.0, 39.0, 48.0, 37.0, 49.0, 32.0, 43.0, 28.0, 21.0, 29.0, 26.0, 26.0, 13.0, 18.0, 16.0, 18.0, 11.0, 10.0, 6.0, 2.0, 6.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-85.37924194335938, -82.60194396972656, -79.82464599609375, -77.04734802246094, -74.27005004882812, -71.49275207519531, -68.7154541015625, -65.93815612792969, -63.160858154296875, -60.38356018066406, -57.60626220703125, -54.82896423339844, -52.051666259765625, -49.27436828613281, -46.4970703125, -43.71977233886719, -40.942474365234375, -38.16517639160156, -35.38787841796875, -32.61058044433594, -29.833282470703125, -27.055984497070312, -24.2786865234375, -21.501388549804688, -18.724090576171875, -15.946792602539062, -13.16949462890625, -10.392196655273438, -7.614898681640625, -4.8376007080078125, -2.060302734375, 0.7169952392578125, 3.4942855834960938, 6.271583557128906, 9.048881530761719, 11.826179504394531, 14.603477478027344, 17.380775451660156, 20.15807342529297, 22.93537139892578, 25.712669372558594, 28.489967346191406, 31.26726531982422, 34.04456329345703, 36.821861267089844, 39.599159240722656, 42.37645721435547, 45.15375518798828, 47.931053161621094, 50.708351135253906, 53.48564910888672, 56.26294708251953, 59.040245056152344, 61.817543029785156, 64.59484100341797, 67.37213897705078, 70.1494369506836, 72.9267349243164, 75.70403289794922, 78.48133087158203, 81.25862884521484, 84.03592681884766, 86.81322479248047, 89.59052276611328, 92.3678207397461]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 9.0, 7.0, 10.0, 6.0, 11.0, 12.0, 14.0, 12.0, 20.0, 18.0, 21.0, 22.0, 14.0, 21.0, 39.0, 38.0, 37.0, 29.0, 36.0, 39.0, 36.0, 46.0, 39.0, 33.0, 22.0, 36.0, 35.0, 30.0, 22.0, 30.0, 35.0, 31.0, 16.0, 24.0, 24.0, 15.0, 17.0, 19.0, 8.0, 10.0, 11.0, 9.0, 9.0, 5.0, 7.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.5, -11.15380859375, -10.8076171875, -10.46142578125, -10.115234375, -9.76904296875, -9.4228515625, -9.07666015625, -8.73046875, -8.38427734375, -8.0380859375, -7.69189453125, -7.345703125, -6.99951171875, -6.6533203125, -6.30712890625, -5.9609375, -5.61474609375, -5.2685546875, -4.92236328125, -4.576171875, -4.22998046875, -3.8837890625, -3.53759765625, -3.19140625, -2.84521484375, -2.4990234375, -2.15283203125, -1.806640625, -1.46044921875, -1.1142578125, -0.76806640625, -0.421875, -0.07568359375, 0.2705078125, 0.61669921875, 0.962890625, 1.30908203125, 1.6552734375, 2.00146484375, 2.34765625, 2.69384765625, 3.0400390625, 3.38623046875, 3.732421875, 4.07861328125, 4.4248046875, 4.77099609375, 5.1171875, 5.46337890625, 5.8095703125, 6.15576171875, 6.501953125, 6.84814453125, 7.1943359375, 7.54052734375, 7.88671875, 8.23291015625, 8.5791015625, 8.92529296875, 9.271484375, 9.61767578125, 9.9638671875, 10.31005859375, 10.65625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 6.0, 2.0, 5.0, 17.0, 19.0, 33.0, 37.0, 64.0, 59.0, 118.0, 162.0, 236.0, 345.0, 575.0, 768.0, 1061.0, 1571.0, 2426.0, 3478.0, 5184.0, 7708.0, 11616.0, 17659.0, 27557.0, 43728.0, 72365.0, 123112.0, 199415.0, 201466.0, 126433.0, 74051.0, 44815.0, 27941.0, 18318.0, 11786.0, 7727.0, 5460.0, 3555.0, 2446.0, 1709.0, 1075.0, 745.0, 520.0, 388.0, 227.0, 192.0, 139.0, 85.0, 54.0, 35.0, 21.0, 15.0, 13.0, 9.0, 6.0, 7.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9560546875, -0.9262008666992188, -0.8963470458984375, -0.8664932250976562, -0.836639404296875, -0.8067855834960938, -0.7769317626953125, -0.7470779418945312, -0.71722412109375, -0.6873703002929688, -0.6575164794921875, -0.6276626586914062, -0.597808837890625, -0.5679550170898438, -0.5381011962890625, -0.5082473754882812, -0.4783935546875, -0.44853973388671875, -0.4186859130859375, -0.38883209228515625, -0.358978271484375, -0.32912445068359375, -0.2992706298828125, -0.26941680908203125, -0.23956298828125, -0.20970916748046875, -0.1798553466796875, -0.15000152587890625, -0.120147705078125, -0.09029388427734375, -0.0604400634765625, -0.03058624267578125, -0.000732421875, 0.02912139892578125, 0.0589752197265625, 0.08882904052734375, 0.118682861328125, 0.14853668212890625, 0.1783905029296875, 0.20824432373046875, 0.23809814453125, 0.26795196533203125, 0.2978057861328125, 0.32765960693359375, 0.357513427734375, 0.38736724853515625, 0.4172210693359375, 0.44707489013671875, 0.4769287109375, 0.5067825317382812, 0.5366363525390625, 0.5664901733398438, 0.596343994140625, 0.6261978149414062, 0.6560516357421875, 0.6859054565429688, 0.71575927734375, 0.7456130981445312, 0.7754669189453125, 0.8053207397460938, 0.835174560546875, 0.8650283813476562, 0.8948822021484375, 0.9247360229492188, 0.95458984375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 11.0, 5.0, 6.0, 17.0, 12.0, 12.0, 17.0, 15.0, 30.0, 30.0, 37.0, 34.0, 35.0, 24.0, 26.0, 49.0, 37.0, 50.0, 40.0, 1063.0, 42.0, 50.0, 40.0, 20.0, 35.0, 36.0, 30.0, 23.0, 22.0, 29.0, 20.0, 18.0, 20.0, 17.0, 13.0, 10.0, 8.0, 9.0, 6.0, 3.0, 2.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.328125, -8.07720947265625, -7.8262939453125, -7.57537841796875, -7.324462890625, -7.07354736328125, -6.8226318359375, -6.57171630859375, -6.32080078125, -6.06988525390625, -5.8189697265625, -5.56805419921875, -5.317138671875, -5.06622314453125, -4.8153076171875, -4.56439208984375, -4.3134765625, -4.06256103515625, -3.8116455078125, -3.56072998046875, -3.309814453125, -3.05889892578125, -2.8079833984375, -2.55706787109375, -2.30615234375, -2.05523681640625, -1.8043212890625, -1.55340576171875, -1.302490234375, -1.05157470703125, -0.8006591796875, -0.54974365234375, -0.298828125, -0.04791259765625, 0.2030029296875, 0.45391845703125, 0.704833984375, 0.95574951171875, 1.2066650390625, 1.45758056640625, 1.70849609375, 1.95941162109375, 2.2103271484375, 2.46124267578125, 2.712158203125, 2.96307373046875, 3.2139892578125, 3.46490478515625, 3.7158203125, 3.96673583984375, 4.2176513671875, 4.46856689453125, 4.719482421875, 4.97039794921875, 5.2213134765625, 5.47222900390625, 5.72314453125, 5.97406005859375, 6.2249755859375, 6.47589111328125, 6.726806640625, 6.97772216796875, 7.2286376953125, 7.47955322265625, 7.73046875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 10.0, 17.0, 24.0, 38.0, 53.0, 86.0, 160.0, 204.0, 325.0, 407.0, 739.0, 1075.0, 1566.0, 2420.0, 3554.0, 5319.0, 8284.0, 12411.0, 18667.0, 29423.0, 47370.0, 80212.0, 137386.0, 1251425.0, 200020.0, 114381.0, 66735.0, 41130.0, 25567.0, 16204.0, 10771.0, 7063.0, 4578.0, 3190.0, 2105.0, 1461.0, 925.0, 615.0, 447.0, 276.0, 158.0, 119.0, 76.0, 44.0, 37.0, 18.0, 11.0, 8.0, 9.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.73876953125, -0.714813232421875, -0.69085693359375, -0.666900634765625, -0.6429443359375, -0.618988037109375, -0.59503173828125, -0.571075439453125, -0.547119140625, -0.523162841796875, -0.49920654296875, -0.475250244140625, -0.4512939453125, -0.427337646484375, -0.40338134765625, -0.379425048828125, -0.35546875, -0.331512451171875, -0.30755615234375, -0.283599853515625, -0.2596435546875, -0.235687255859375, -0.21173095703125, -0.187774658203125, -0.163818359375, -0.139862060546875, -0.11590576171875, -0.091949462890625, -0.0679931640625, -0.044036865234375, -0.02008056640625, 0.003875732421875, 0.02783203125, 0.051788330078125, 0.07574462890625, 0.099700927734375, 0.1236572265625, 0.147613525390625, 0.17156982421875, 0.195526123046875, 0.219482421875, 0.243438720703125, 0.26739501953125, 0.291351318359375, 0.3153076171875, 0.339263916015625, 0.36322021484375, 0.387176513671875, 0.4111328125, 0.435089111328125, 0.45904541015625, 0.483001708984375, 0.5069580078125, 0.530914306640625, 0.55487060546875, 0.578826904296875, 0.602783203125, 0.626739501953125, 0.65069580078125, 0.674652099609375, 0.6986083984375, 0.722564697265625, 0.74652099609375, 0.770477294921875, 0.79443359375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 14.0, 10.0, 23.0, 18.0, 55.0, 108.0, 206.0, 273.0, 111.0, 66.0, 32.0, 15.0, 13.0, 9.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033782958984375, -0.032663822174072266, -0.03154468536376953, -0.030425548553466797, -0.029306411743164062, -0.028187274932861328, -0.027068138122558594, -0.02594900131225586, -0.024829864501953125, -0.02371072769165039, -0.022591590881347656, -0.021472454071044922, -0.020353317260742188, -0.019234180450439453, -0.01811504364013672, -0.016995906829833984, -0.01587677001953125, -0.014757633209228516, -0.013638496398925781, -0.012519359588623047, -0.011400222778320312, -0.010281085968017578, -0.009161949157714844, -0.00804281234741211, -0.006923675537109375, -0.005804538726806641, -0.004685401916503906, -0.003566265106201172, -0.0024471282958984375, -0.0013279914855957031, -0.00020885467529296875, 0.0009102821350097656, 0.0020294189453125, 0.0031485557556152344, 0.004267692565917969, 0.005386829376220703, 0.0065059661865234375, 0.007625102996826172, 0.008744239807128906, 0.00986337661743164, 0.010982513427734375, 0.01210165023803711, 0.013220787048339844, 0.014339923858642578, 0.015459060668945312, 0.016578197479248047, 0.01769733428955078, 0.018816471099853516, 0.01993560791015625, 0.021054744720458984, 0.02217388153076172, 0.023293018341064453, 0.024412155151367188, 0.025531291961669922, 0.026650428771972656, 0.02776956558227539, 0.028888702392578125, 0.03000783920288086, 0.031126976013183594, 0.03224611282348633, 0.03336524963378906, 0.0344843864440918, 0.03560352325439453, 0.036722660064697266, 0.037841796875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 8.0, 3.0, 6.0, 14.0, 20.0, 21.0, 33.0, 55.0, 114.0, 267.0, 1041.0, 1030052.0, 15914.0, 497.0, 197.0, 90.0, 62.0, 41.0, 24.0, 20.0, 11.0, 6.0, 12.0, 7.0, 3.0, 7.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.744140625, -0.7221145629882812, -0.7000885009765625, -0.6780624389648438, -0.656036376953125, -0.6340103149414062, -0.6119842529296875, -0.5899581909179688, -0.56793212890625, -0.5459060668945312, -0.5238800048828125, -0.5018539428710938, -0.479827880859375, -0.45780181884765625, -0.4357757568359375, -0.41374969482421875, -0.3917236328125, -0.36969757080078125, -0.3476715087890625, -0.32564544677734375, -0.303619384765625, -0.28159332275390625, -0.2595672607421875, -0.23754119873046875, -0.21551513671875, -0.19348907470703125, -0.1714630126953125, -0.14943695068359375, -0.127410888671875, -0.10538482666015625, -0.0833587646484375, -0.06133270263671875, -0.039306640625, -0.01728057861328125, 0.0047454833984375, 0.02677154541015625, 0.048797607421875, 0.07082366943359375, 0.0928497314453125, 0.11487579345703125, 0.13690185546875, 0.15892791748046875, 0.1809539794921875, 0.20298004150390625, 0.225006103515625, 0.24703216552734375, 0.2690582275390625, 0.29108428955078125, 0.3131103515625, 0.33513641357421875, 0.3571624755859375, 0.37918853759765625, 0.401214599609375, 0.42324066162109375, 0.4452667236328125, 0.46729278564453125, 0.48931884765625, 0.5113449096679688, 0.5333709716796875, 0.5553970336914062, 0.577423095703125, 0.5994491577148438, 0.6214752197265625, 0.6435012817382812, 0.66552734375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 1000.0, 10.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177730530500412, -0.16547609865665436, -0.15322166681289673, -0.1409672349691391, -0.12871280312538147, -0.11645837128162384, -0.10420393943786621, -0.09194950759410858, -0.07969507575035095, -0.06744064390659332, -0.05518621206283569, -0.042931780219078064, -0.030677348375320435, -0.018422916531562805, -0.006168484687805176, 0.006085947155952454, 0.018340378999710083, 0.030594810843467712, 0.04284924268722534, 0.05510367453098297, 0.0673581063747406, 0.07961253821849823, 0.09186697006225586, 0.10412140190601349, 0.11637583374977112, 0.12863026559352875, 0.14088469743728638, 0.153139129281044, 0.16539356112480164, 0.17764799296855927, 0.1899024248123169, 0.20215685665607452, 0.21441125869750977, 0.2266656905412674, 0.23892012238502502, 0.25117456912994385, 0.2634289860725403, 0.2756834030151367, 0.28793784976005554, 0.30019229650497437, 0.3124467134475708, 0.32470113039016724, 0.33695557713508606, 0.3492100238800049, 0.3614644408226013, 0.37371885776519775, 0.3859733045101166, 0.3982277512550354, 0.41048216819763184, 0.42273658514022827, 0.4349910318851471, 0.4472454786300659, 0.45949989557266235, 0.4717543125152588, 0.4840087592601776, 0.49626320600509644, 0.5085176229476929, 0.5207720398902893, 0.5330264568328857, 0.545280933380127, 0.5575353503227234, 0.5697897672653198, 0.582044243812561, 0.5942986607551575, 0.6065530776977539]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 6.0, 5.0, 10.0, 11.0, 19.0, 31.0, 33.0, 59.0, 68.0, 67.0, 68.0, 71.0, 91.0, 64.0, 71.0, 75.0, 60.0, 41.0, 47.0, 32.0, 25.0, 21.0, 12.0, 10.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027426540851593018, -0.026311088353395462, -0.025195635855197906, -0.02408018335700035, -0.022964730858802795, -0.02184927836060524, -0.020733825862407684, -0.01961837336421013, -0.018502920866012573, -0.017387468367815018, -0.016272015869617462, -0.015156563371419907, -0.014041110873222351, -0.012925658375024796, -0.01181020587682724, -0.010694753378629684, -0.009579300880432129, -0.008463848382234573, -0.007348395884037018, -0.006232943385839462, -0.005117490887641907, -0.004002038389444351, -0.0028865858912467957, -0.0017711333930492401, -0.0006556808948516846, 0.00045977160334587097, 0.0015752241015434265, 0.002690676599740982, 0.0038061290979385376, 0.004921581596136093, 0.006037034094333649, 0.007152486592531204, 0.00826793909072876, 0.009383391588926315, 0.01049884408712387, 0.011614296585321426, 0.012729749083518982, 0.013845201581716537, 0.014960654079914093, 0.01607610657811165, 0.017191559076309204, 0.01830701157450676, 0.019422464072704315, 0.02053791657090187, 0.021653369069099426, 0.022768821567296982, 0.023884274065494537, 0.024999726563692093, 0.02611517906188965, 0.027230631560087204, 0.02834608405828476, 0.029461536556482315, 0.03057698905467987, 0.031692441552877426, 0.03280789405107498, 0.03392334654927254, 0.03503879904747009, 0.03615425154566765, 0.037269704043865204, 0.03838515654206276, 0.039500609040260315, 0.04061606153845787, 0.041731514036655426, 0.04284696653485298, 0.04396241903305054]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 9.0, 7.0, 10.0, 6.0, 11.0, 12.0, 14.0, 12.0, 20.0, 17.0, 22.0, 22.0, 14.0, 19.0, 41.0, 38.0, 36.0, 30.0, 35.0, 39.0, 36.0, 47.0, 38.0, 34.0, 22.0, 35.0, 36.0, 30.0, 22.0, 29.0, 36.0, 31.0, 15.0, 25.0, 24.0, 15.0, 17.0, 19.0, 8.0, 10.0, 11.0, 9.0, 9.0, 5.0, 7.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.5078125, -11.1614990234375, -10.815185546875, -10.4688720703125, -10.12255859375, -9.7762451171875, -9.429931640625, -9.0836181640625, -8.7373046875, -8.3909912109375, -8.044677734375, -7.6983642578125, -7.35205078125, -7.0057373046875, -6.659423828125, -6.3131103515625, -5.966796875, -5.6204833984375, -5.274169921875, -4.9278564453125, -4.58154296875, -4.2352294921875, -3.888916015625, -3.5426025390625, -3.1962890625, -2.8499755859375, -2.503662109375, -2.1573486328125, -1.81103515625, -1.4647216796875, -1.118408203125, -0.7720947265625, -0.42578125, -0.0794677734375, 0.266845703125, 0.6131591796875, 0.95947265625, 1.3057861328125, 1.652099609375, 1.9984130859375, 2.3447265625, 2.6910400390625, 3.037353515625, 3.3836669921875, 3.72998046875, 4.0762939453125, 4.422607421875, 4.7689208984375, 5.115234375, 5.4615478515625, 5.807861328125, 6.1541748046875, 6.50048828125, 6.8468017578125, 7.193115234375, 7.5394287109375, 7.8857421875, 8.2320556640625, 8.578369140625, 8.9246826171875, 9.27099609375, 9.6173095703125, 9.963623046875, 10.3099365234375, 10.65625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 5.0, 5.0, 8.0, 13.0, 13.0, 23.0, 30.0, 30.0, 42.0, 50.0, 75.0, 105.0, 123.0, 164.0, 205.0, 326.0, 389.0, 670.0, 944.0, 1500.0, 2559.0, 5138.0, 12417.0, 43865.0, 252024.0, 592589.0, 95843.0, 22281.0, 7774.0, 3511.0, 1981.0, 1140.0, 752.0, 534.0, 376.0, 262.0, 179.0, 140.0, 117.0, 101.0, 57.0, 45.0, 34.0, 37.0, 24.0, 19.0, 10.0, 9.0, 8.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-20.171875, -19.565185546875, -18.95849609375, -18.351806640625, -17.7451171875, -17.138427734375, -16.53173828125, -15.925048828125, -15.318359375, -14.711669921875, -14.10498046875, -13.498291015625, -12.8916015625, -12.284912109375, -11.67822265625, -11.071533203125, -10.46484375, -9.858154296875, -9.25146484375, -8.644775390625, -8.0380859375, -7.431396484375, -6.82470703125, -6.218017578125, -5.611328125, -5.004638671875, -4.39794921875, -3.791259765625, -3.1845703125, -2.577880859375, -1.97119140625, -1.364501953125, -0.7578125, -0.151123046875, 0.45556640625, 1.062255859375, 1.6689453125, 2.275634765625, 2.88232421875, 3.489013671875, 4.095703125, 4.702392578125, 5.30908203125, 5.915771484375, 6.5224609375, 7.129150390625, 7.73583984375, 8.342529296875, 8.94921875, 9.555908203125, 10.16259765625, 10.769287109375, 11.3759765625, 11.982666015625, 12.58935546875, 13.196044921875, 13.802734375, 14.409423828125, 15.01611328125, 15.622802734375, 16.2294921875, 16.836181640625, 17.44287109375, 18.049560546875, 18.65625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 6.0, 5.0, 9.0, 6.0, 8.0, 16.0, 7.0, 17.0, 20.0, 17.0, 14.0, 36.0, 24.0, 30.0, 60.0, 47.0, 72.0, 87.0, 138.0, 1438.0, 387.0, 135.0, 87.0, 68.0, 49.0, 47.0, 26.0, 39.0, 23.0, 22.0, 16.0, 18.0, 11.0, 16.0, 9.0, 8.0, 9.0, 2.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.34375, -24.468505859375, -23.59326171875, -22.718017578125, -21.8427734375, -20.967529296875, -20.09228515625, -19.217041015625, -18.341796875, -17.466552734375, -16.59130859375, -15.716064453125, -14.8408203125, -13.965576171875, -13.09033203125, -12.215087890625, -11.33984375, -10.464599609375, -9.58935546875, -8.714111328125, -7.8388671875, -6.963623046875, -6.08837890625, -5.213134765625, -4.337890625, -3.462646484375, -2.58740234375, -1.712158203125, -0.8369140625, 0.038330078125, 0.91357421875, 1.788818359375, 2.6640625, 3.539306640625, 4.41455078125, 5.289794921875, 6.1650390625, 7.040283203125, 7.91552734375, 8.790771484375, 9.666015625, 10.541259765625, 11.41650390625, 12.291748046875, 13.1669921875, 14.042236328125, 14.91748046875, 15.792724609375, 16.66796875, 17.543212890625, 18.41845703125, 19.293701171875, 20.1689453125, 21.044189453125, 21.91943359375, 22.794677734375, 23.669921875, 24.545166015625, 25.42041015625, 26.295654296875, 27.1708984375, 28.046142578125, 28.92138671875, 29.796630859375, 30.671875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 6.0, 9.0, 9.0, 16.0, 19.0, 18.0, 26.0, 35.0, 34.0, 55.0, 80.0, 94.0, 157.0, 213.0, 419.0, 817.0, 2068.0, 32692.0, 3084225.0, 20926.0, 1850.0, 699.0, 418.0, 225.0, 142.0, 115.0, 65.0, 55.0, 48.0, 41.0, 20.0, 23.0, 12.0, 14.0, 15.0, 9.0, 3.0, 7.0, 6.0, 3.0, 6.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-61.6875, -59.89697265625, -58.1064453125, -56.31591796875, -54.525390625, -52.73486328125, -50.9443359375, -49.15380859375, -47.36328125, -45.57275390625, -43.7822265625, -41.99169921875, -40.201171875, -38.41064453125, -36.6201171875, -34.82958984375, -33.0390625, -31.24853515625, -29.4580078125, -27.66748046875, -25.876953125, -24.08642578125, -22.2958984375, -20.50537109375, -18.71484375, -16.92431640625, -15.1337890625, -13.34326171875, -11.552734375, -9.76220703125, -7.9716796875, -6.18115234375, -4.390625, -2.60009765625, -0.8095703125, 0.98095703125, 2.771484375, 4.56201171875, 6.3525390625, 8.14306640625, 9.93359375, 11.72412109375, 13.5146484375, 15.30517578125, 17.095703125, 18.88623046875, 20.6767578125, 22.46728515625, 24.2578125, 26.04833984375, 27.8388671875, 29.62939453125, 31.419921875, 33.21044921875, 35.0009765625, 36.79150390625, 38.58203125, 40.37255859375, 42.1630859375, 43.95361328125, 45.744140625, 47.53466796875, 49.3251953125, 51.11572265625, 52.90625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 47.0, 697.0, 254.0, 11.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-653.3788452148438, -640.7673950195312, -628.1559448242188, -615.5444946289062, -602.9330444335938, -590.3215942382812, -577.7101440429688, -565.0986938476562, -552.4872436523438, -539.8757934570312, -527.2643432617188, -514.6528930664062, -502.04144287109375, -489.42999267578125, -476.81854248046875, -464.20709228515625, -451.59564208984375, -438.98419189453125, -426.37274169921875, -413.76129150390625, -401.14984130859375, -388.53839111328125, -375.92694091796875, -363.31549072265625, -350.70404052734375, -338.09259033203125, -325.48114013671875, -312.86968994140625, -300.25823974609375, -287.64678955078125, -275.03533935546875, -262.42388916015625, -249.81240844726562, -237.20095825195312, -224.58950805664062, -211.97805786132812, -199.36660766601562, -186.75515747070312, -174.14370727539062, -161.53225708007812, -148.92080688476562, -136.30935668945312, -123.69790649414062, -111.08645629882812, -98.47500610351562, -85.86355590820312, -73.25210571289062, -60.640655517578125, -48.029205322265625, -35.417755126953125, -22.806304931640625, -10.194854736328125, 2.416595458984375, 15.028045654296875, 27.639495849609375, 40.250946044921875, 52.862396240234375, 65.47384643554688, 78.08529663085938, 90.69674682617188, 103.30819702148438, 115.91964721679688, 128.53109741210938, 141.14254760742188, 153.75399780273438]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 8.0, 4.0, 5.0, 13.0, 8.0, 16.0, 10.0, 13.0, 21.0, 22.0, 20.0, 27.0, 22.0, 20.0, 23.0, 30.0, 35.0, 37.0, 32.0, 38.0, 35.0, 52.0, 38.0, 41.0, 32.0, 37.0, 32.0, 38.0, 27.0, 28.0, 21.0, 28.0, 30.0, 20.0, 22.0, 10.0, 18.0, 22.0, 13.0, 8.0, 9.0, 16.0, 9.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-68.07286071777344, -66.01931762695312, -63.96577835083008, -61.91223907470703, -59.85869598388672, -57.805152893066406, -55.75161361694336, -53.69807434082031, -51.64453125, -49.59098815917969, -47.53744888305664, -45.483909606933594, -43.43036651611328, -41.37682342529297, -39.32328414916992, -37.269744873046875, -35.21620178222656, -33.16265869140625, -31.109119415283203, -29.055578231811523, -27.002037048339844, -24.948495864868164, -22.894954681396484, -20.841413497924805, -18.787872314453125, -16.734331130981445, -14.680789947509766, -12.627248764038086, -10.573707580566406, -8.520166397094727, -6.466625213623047, -4.413084030151367, -2.3595352172851562, -0.30599403381347656, 1.7475471496582031, 3.801088333129883, 5.8546295166015625, 7.908170700073242, 9.961711883544922, 12.015253067016602, 14.068794250488281, 16.12233543395996, 18.17587661743164, 20.22941780090332, 22.282958984375, 24.33650016784668, 26.39004135131836, 28.44358253479004, 30.49712371826172, 32.55066680908203, 34.60420608520508, 36.657745361328125, 38.71128845214844, 40.76483154296875, 42.8183708190918, 44.871910095214844, 46.925453186035156, 48.97899627685547, 51.032535552978516, 53.08607482910156, 55.139617919921875, 57.19316101074219, 59.246700286865234, 61.30023956298828, 63.353782653808594]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 8.0, 8.0, 15.0, 11.0, 6.0, 13.0, 15.0, 18.0, 24.0, 20.0, 16.0, 27.0, 22.0, 38.0, 30.0, 33.0, 32.0, 41.0, 39.0, 32.0, 38.0, 46.0, 38.0, 30.0, 40.0, 39.0, 29.0, 33.0, 20.0, 36.0, 28.0, 25.0, 23.0, 17.0, 14.0, 11.0, 12.0, 6.0, 11.0, 7.0, 6.0, 11.0, 5.0, 5.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.0703125, -11.6793212890625, -11.288330078125, -10.8973388671875, -10.50634765625, -10.1153564453125, -9.724365234375, -9.3333740234375, -8.9423828125, -8.5513916015625, -8.160400390625, -7.7694091796875, -7.37841796875, -6.9874267578125, -6.596435546875, -6.2054443359375, -5.814453125, -5.4234619140625, -5.032470703125, -4.6414794921875, -4.25048828125, -3.8594970703125, -3.468505859375, -3.0775146484375, -2.6865234375, -2.2955322265625, -1.904541015625, -1.5135498046875, -1.12255859375, -0.7315673828125, -0.340576171875, 0.0504150390625, 0.44140625, 0.8323974609375, 1.223388671875, 1.6143798828125, 2.00537109375, 2.3963623046875, 2.787353515625, 3.1783447265625, 3.5693359375, 3.9603271484375, 4.351318359375, 4.7423095703125, 5.13330078125, 5.5242919921875, 5.915283203125, 6.3062744140625, 6.697265625, 7.0882568359375, 7.479248046875, 7.8702392578125, 8.26123046875, 8.6522216796875, 9.043212890625, 9.4342041015625, 9.8251953125, 10.2161865234375, 10.607177734375, 10.9981689453125, 11.38916015625, 11.7801513671875, 12.171142578125, 12.5621337890625, 12.953125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 7.0, 4.0, 3.0, 11.0, 15.0, 16.0, 13.0, 17.0, 25.0, 47.0, 63.0, 68.0, 119.0, 144.0, 225.0, 328.0, 508.0, 794.0, 1334.0, 2559.0, 5559.0, 14167.0, 106854.0, 3422785.0, 600437.0, 22613.0, 7833.0, 3291.0, 1732.0, 890.0, 571.0, 370.0, 241.0, 177.0, 130.0, 88.0, 62.0, 45.0, 32.0, 27.0, 19.0, 10.0, 15.0, 4.0, 6.0, 6.0, 10.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-63.0625, -61.072265625, -59.08203125, -57.091796875, -55.1015625, -53.111328125, -51.12109375, -49.130859375, -47.140625, -45.150390625, -43.16015625, -41.169921875, -39.1796875, -37.189453125, -35.19921875, -33.208984375, -31.21875, -29.228515625, -27.23828125, -25.248046875, -23.2578125, -21.267578125, -19.27734375, -17.287109375, -15.296875, -13.306640625, -11.31640625, -9.326171875, -7.3359375, -5.345703125, -3.35546875, -1.365234375, 0.625, 2.615234375, 4.60546875, 6.595703125, 8.5859375, 10.576171875, 12.56640625, 14.556640625, 16.546875, 18.537109375, 20.52734375, 22.517578125, 24.5078125, 26.498046875, 28.48828125, 30.478515625, 32.46875, 34.458984375, 36.44921875, 38.439453125, 40.4296875, 42.419921875, 44.41015625, 46.400390625, 48.390625, 50.380859375, 52.37109375, 54.361328125, 56.3515625, 58.341796875, 60.33203125, 62.322265625, 64.3125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 7.0, 4.0, 12.0, 9.0, 14.0, 22.0, 42.0, 42.0, 67.0, 107.0, 203.0, 428.0, 888.0, 967.0, 579.0, 264.0, 136.0, 82.0, 52.0, 32.0, 33.0, 24.0, 19.0, 8.0, 11.0, 9.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.71875, -36.37939453125, -35.0400390625, -33.70068359375, -32.361328125, -31.02197265625, -29.6826171875, -28.34326171875, -27.00390625, -25.66455078125, -24.3251953125, -22.98583984375, -21.646484375, -20.30712890625, -18.9677734375, -17.62841796875, -16.2890625, -14.94970703125, -13.6103515625, -12.27099609375, -10.931640625, -9.59228515625, -8.2529296875, -6.91357421875, -5.57421875, -4.23486328125, -2.8955078125, -1.55615234375, -0.216796875, 1.12255859375, 2.4619140625, 3.80126953125, 5.140625, 6.47998046875, 7.8193359375, 9.15869140625, 10.498046875, 11.83740234375, 13.1767578125, 14.51611328125, 15.85546875, 17.19482421875, 18.5341796875, 19.87353515625, 21.212890625, 22.55224609375, 23.8916015625, 25.23095703125, 26.5703125, 27.90966796875, 29.2490234375, 30.58837890625, 31.927734375, 33.26708984375, 34.6064453125, 35.94580078125, 37.28515625, 38.62451171875, 39.9638671875, 41.30322265625, 42.642578125, 43.98193359375, 45.3212890625, 46.66064453125, 48.0]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 9.0, 9.0, 10.0, 5.0, 17.0, 18.0, 42.0, 51.0, 92.0, 118.0, 189.0, 252.0, 447.0, 806.0, 1493.0, 2918.0, 6039.0, 13054.0, 32025.0, 104986.0, 1057356.0, 2712195.0, 182830.0, 45878.0, 17612.0, 7819.0, 3687.0, 1875.0, 1014.0, 523.0, 309.0, 204.0, 108.0, 66.0, 69.0, 37.0, 37.0, 30.0, 18.0, 9.0, 9.0, 9.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-32.84375, -31.853515625, -30.86328125, -29.873046875, -28.8828125, -27.892578125, -26.90234375, -25.912109375, -24.921875, -23.931640625, -22.94140625, -21.951171875, -20.9609375, -19.970703125, -18.98046875, -17.990234375, -17.0, -16.009765625, -15.01953125, -14.029296875, -13.0390625, -12.048828125, -11.05859375, -10.068359375, -9.078125, -8.087890625, -7.09765625, -6.107421875, -5.1171875, -4.126953125, -3.13671875, -2.146484375, -1.15625, -0.166015625, 0.82421875, 1.814453125, 2.8046875, 3.794921875, 4.78515625, 5.775390625, 6.765625, 7.755859375, 8.74609375, 9.736328125, 10.7265625, 11.716796875, 12.70703125, 13.697265625, 14.6875, 15.677734375, 16.66796875, 17.658203125, 18.6484375, 19.638671875, 20.62890625, 21.619140625, 22.609375, 23.599609375, 24.58984375, 25.580078125, 26.5703125, 27.560546875, 28.55078125, 29.541015625, 30.53125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 9.0, 13.0, 16.0, 15.0, 36.0, 35.0, 66.0, 74.0, 80.0, 112.0, 127.0, 103.0, 74.0, 70.0, 34.0, 29.0, 21.0, 20.0, 15.0, 12.0, 12.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-159.45872497558594, -152.8987579345703, -146.33877563476562, -139.77880859375, -133.21884155273438, -126.65885925292969, -120.09889221191406, -113.5389175415039, -106.97894287109375, -100.4189682006836, -93.85899353027344, -87.29902648925781, -80.73905181884766, -74.1790771484375, -67.61911010742188, -61.05913543701172, -54.49916076660156, -47.939186096191406, -41.379215240478516, -34.819244384765625, -28.25926971435547, -21.699295043945312, -15.139324188232422, -8.579353332519531, -2.019378662109375, 4.540594100952148, 11.100566864013672, 17.660539627075195, 24.22051239013672, 30.780487060546875, 37.340457916259766, 43.900428771972656, 50.460418701171875, 57.02039337158203, 63.58036422729492, 70.14033508300781, 76.70030975341797, 83.26028442382812, 89.82025146484375, 96.3802261352539, 102.94020080566406, 109.50017547607422, 116.06015014648438, 122.6201171875, 129.18008422851562, 135.7400665283203, 142.30003356933594, 148.86001586914062, 155.41998291015625, 161.97994995117188, 168.53993225097656, 175.0998992919922, 181.65988159179688, 188.2198486328125, 194.77981567382812, 201.33978271484375, 207.89976501464844, 214.45973205566406, 221.01971435546875, 227.57968139648438, 234.1396484375, 240.6996307373047, 247.2595977783203, 253.819580078125, 260.3795471191406]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 1.0, 3.0, 10.0, 7.0, 7.0, 16.0, 11.0, 15.0, 11.0, 14.0, 16.0, 24.0, 38.0, 24.0, 34.0, 39.0, 48.0, 34.0, 30.0, 42.0, 47.0, 39.0, 34.0, 34.0, 37.0, 34.0, 34.0, 32.0, 33.0, 32.0, 29.0, 30.0, 19.0, 22.0, 17.0, 22.0, 11.0, 15.0, 12.0, 7.0, 9.0, 8.0, 7.0, 7.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-123.80955505371094, -120.26142120361328, -116.71328735351562, -113.16515350341797, -109.61701965332031, -106.06888580322266, -102.520751953125, -98.97261810302734, -95.42448425292969, -91.87635040283203, -88.32821655273438, -84.78008270263672, -81.23194885253906, -77.6838150024414, -74.13568115234375, -70.5875473022461, -67.03941345214844, -63.49127960205078, -59.943145751953125, -56.39501190185547, -52.84687805175781, -49.298744201660156, -45.7506103515625, -42.202476501464844, -38.65434265136719, -35.10620880126953, -31.558074951171875, -28.00994110107422, -24.461807250976562, -20.913673400878906, -17.36553955078125, -13.817405700683594, -10.269271850585938, -6.721138000488281, -3.173004150390625, 0.37512969970703125, 3.9232635498046875, 7.471397399902344, 11.01953125, 14.567665100097656, 18.115798950195312, 21.66393280029297, 25.212066650390625, 28.76020050048828, 32.30833435058594, 35.856468200683594, 39.40460205078125, 42.952735900878906, 46.50086975097656, 50.04900360107422, 53.597137451171875, 57.14527130126953, 60.69340515136719, 64.24153900146484, 67.7896728515625, 71.33780670166016, 74.88594055175781, 78.43407440185547, 81.98220825195312, 85.53034210205078, 89.07847595214844, 92.6266098022461, 96.17474365234375, 99.7228775024414, 103.27101135253906]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 10.0, 6.0, 6.0, 8.0, 6.0, 16.0, 15.0, 16.0, 26.0, 13.0, 28.0, 29.0, 24.0, 38.0, 37.0, 44.0, 48.0, 43.0, 48.0, 41.0, 43.0, 41.0, 40.0, 45.0, 37.0, 33.0, 34.0, 29.0, 33.0, 20.0, 20.0, 27.0, 15.0, 16.0, 8.0, 14.0, 10.0, 9.0, 9.0, 10.0, 9.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-223.75, -217.376953125, -211.00390625, -204.630859375, -198.2578125, -191.884765625, -185.51171875, -179.138671875, -172.765625, -166.392578125, -160.01953125, -153.646484375, -147.2734375, -140.900390625, -134.52734375, -128.154296875, -121.78125, -115.408203125, -109.03515625, -102.662109375, -96.2890625, -89.916015625, -83.54296875, -77.169921875, -70.796875, -64.423828125, -58.05078125, -51.677734375, -45.3046875, -38.931640625, -32.55859375, -26.185546875, -19.8125, -13.439453125, -7.06640625, -0.693359375, 5.6796875, 12.052734375, 18.42578125, 24.798828125, 31.171875, 37.544921875, 43.91796875, 50.291015625, 56.6640625, 63.037109375, 69.41015625, 75.783203125, 82.15625, 88.529296875, 94.90234375, 101.275390625, 107.6484375, 114.021484375, 120.39453125, 126.767578125, 133.140625, 139.513671875, 145.88671875, 152.259765625, 158.6328125, 165.005859375, 171.37890625, 177.751953125, 184.125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 10.0, 13.0, 16.0, 25.0, 36.0, 40.0, 51.0, 106.0, 160.0, 207.0, 302.0, 477.0, 686.0, 986.0, 1346.0, 2002.0, 3098.0, 4438.0, 6575.0, 9885.0, 14992.0, 23254.0, 37012.0, 61449.0, 109662.0, 196985.0, 230691.0, 139597.0, 77254.0, 45613.0, 28054.0, 17712.0, 11649.0, 7761.0, 5209.0, 3585.0, 2421.0, 1615.0, 1195.0, 786.0, 486.0, 350.0, 255.0, 180.0, 119.0, 68.0, 51.0, 35.0, 23.0, 19.0, 6.0, 7.0, 4.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 2.0], "bins": [-12.015625, -11.6177978515625, -11.219970703125, -10.8221435546875, -10.42431640625, -10.0264892578125, -9.628662109375, -9.2308349609375, -8.8330078125, -8.4351806640625, -8.037353515625, -7.6395263671875, -7.24169921875, -6.8438720703125, -6.446044921875, -6.0482177734375, -5.650390625, -5.2525634765625, -4.854736328125, -4.4569091796875, -4.05908203125, -3.6612548828125, -3.263427734375, -2.8656005859375, -2.4677734375, -2.0699462890625, -1.672119140625, -1.2742919921875, -0.87646484375, -0.4786376953125, -0.080810546875, 0.3170166015625, 0.71484375, 1.1126708984375, 1.510498046875, 1.9083251953125, 2.30615234375, 2.7039794921875, 3.101806640625, 3.4996337890625, 3.8974609375, 4.2952880859375, 4.693115234375, 5.0909423828125, 5.48876953125, 5.8865966796875, 6.284423828125, 6.6822509765625, 7.080078125, 7.4779052734375, 7.875732421875, 8.2735595703125, 8.67138671875, 9.0692138671875, 9.467041015625, 9.8648681640625, 10.2626953125, 10.6605224609375, 11.058349609375, 11.4561767578125, 11.85400390625, 12.2518310546875, 12.649658203125, 13.0474853515625, 13.4453125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 1.0, 5.0, 3.0, 5.0, 10.0, 12.0, 11.0, 14.0, 18.0, 18.0, 13.0, 23.0, 24.0, 22.0, 33.0, 28.0, 35.0, 30.0, 32.0, 47.0, 30.0, 34.0, 36.0, 1056.0, 30.0, 33.0, 28.0, 41.0, 36.0, 36.0, 30.0, 21.0, 33.0, 17.0, 22.0, 22.0, 20.0, 19.0, 8.0, 13.0, 13.0, 12.0, 12.0, 8.0, 6.0, 3.0, 4.0, 5.0, 5.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-109.1875, -105.744140625, -102.30078125, -98.857421875, -95.4140625, -91.970703125, -88.52734375, -85.083984375, -81.640625, -78.197265625, -74.75390625, -71.310546875, -67.8671875, -64.423828125, -60.98046875, -57.537109375, -54.09375, -50.650390625, -47.20703125, -43.763671875, -40.3203125, -36.876953125, -33.43359375, -29.990234375, -26.546875, -23.103515625, -19.66015625, -16.216796875, -12.7734375, -9.330078125, -5.88671875, -2.443359375, 1.0, 4.443359375, 7.88671875, 11.330078125, 14.7734375, 18.216796875, 21.66015625, 25.103515625, 28.546875, 31.990234375, 35.43359375, 38.876953125, 42.3203125, 45.763671875, 49.20703125, 52.650390625, 56.09375, 59.537109375, 62.98046875, 66.423828125, 69.8671875, 73.310546875, 76.75390625, 80.197265625, 83.640625, 87.083984375, 90.52734375, 93.970703125, 97.4140625, 100.857421875, 104.30078125, 107.744140625, 111.1875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 10.0, 13.0, 15.0, 17.0, 36.0, 70.0, 111.0, 127.0, 197.0, 297.0, 459.0, 732.0, 1142.0, 1793.0, 2666.0, 3924.0, 6093.0, 9155.0, 14557.0, 23135.0, 37010.0, 62570.0, 110490.0, 206754.0, 1266801.0, 143441.0, 80766.0, 46151.0, 28147.0, 17691.0, 11460.0, 7217.0, 4746.0, 3294.0, 2039.0, 1388.0, 868.0, 621.0, 400.0, 258.0, 161.0, 116.0, 74.0, 40.0, 32.0, 18.0, 12.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.484375, -11.1043701171875, -10.724365234375, -10.3443603515625, -9.96435546875, -9.5843505859375, -9.204345703125, -8.8243408203125, -8.4443359375, -8.0643310546875, -7.684326171875, -7.3043212890625, -6.92431640625, -6.5443115234375, -6.164306640625, -5.7843017578125, -5.404296875, -5.0242919921875, -4.644287109375, -4.2642822265625, -3.88427734375, -3.5042724609375, -3.124267578125, -2.7442626953125, -2.3642578125, -1.9842529296875, -1.604248046875, -1.2242431640625, -0.84423828125, -0.4642333984375, -0.084228515625, 0.2957763671875, 0.67578125, 1.0557861328125, 1.435791015625, 1.8157958984375, 2.19580078125, 2.5758056640625, 2.955810546875, 3.3358154296875, 3.7158203125, 4.0958251953125, 4.475830078125, 4.8558349609375, 5.23583984375, 5.6158447265625, 5.995849609375, 6.3758544921875, 6.755859375, 7.1358642578125, 7.515869140625, 7.8958740234375, 8.27587890625, 8.6558837890625, 9.035888671875, 9.4158935546875, 9.7958984375, 10.1759033203125, 10.555908203125, 10.9359130859375, 11.31591796875, 11.6959228515625, 12.075927734375, 12.4559326171875, 12.8359375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 11.0, 3.0, 8.0, 7.0, 7.0, 14.0, 21.0, 15.0, 32.0, 20.0, 30.0, 39.0, 52.0, 73.0, 103.0, 77.0, 86.0, 59.0, 59.0, 43.0, 41.0, 30.0, 30.0, 21.0, 20.0, 18.0, 8.0, 18.0, 8.0, 6.0, 6.0, 2.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.10626220703125, -0.10278892517089844, -0.09931564331054688, -0.09584236145019531, -0.09236907958984375, -0.08889579772949219, -0.08542251586914062, -0.08194923400878906, -0.0784759521484375, -0.07500267028808594, -0.07152938842773438, -0.06805610656738281, -0.06458282470703125, -0.06110954284667969, -0.057636260986328125, -0.05416297912597656, -0.050689697265625, -0.04721641540527344, -0.043743133544921875, -0.04026985168457031, -0.03679656982421875, -0.03332328796386719, -0.029850006103515625, -0.026376724243164062, -0.0229034423828125, -0.019430160522460938, -0.015956878662109375, -0.012483596801757812, -0.00901031494140625, -0.0055370330810546875, -0.002063751220703125, 0.0014095306396484375, 0.0048828125, 0.008356094360351562, 0.011829376220703125, 0.015302658081054688, 0.01877593994140625, 0.022249221801757812, 0.025722503662109375, 0.029195785522460938, 0.0326690673828125, 0.03614234924316406, 0.039615631103515625, 0.04308891296386719, 0.04656219482421875, 0.05003547668457031, 0.053508758544921875, 0.05698204040527344, 0.060455322265625, 0.06392860412597656, 0.06740188598632812, 0.07087516784667969, 0.07434844970703125, 0.07782173156738281, 0.08129501342773438, 0.08476829528808594, 0.0882415771484375, 0.09171485900878906, 0.09518814086914062, 0.09866142272949219, 0.10213470458984375, 0.10560798645019531, 0.10908126831054688, 0.11255455017089844, 0.11602783203125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 6.0, 5.0, 9.0, 9.0, 12.0, 16.0, 21.0, 33.0, 37.0, 26.0, 62.0, 64.0, 81.0, 105.0, 188.0, 274.0, 449.0, 752.0, 1277.0, 2652.0, 5324.0, 12013.0, 30273.0, 90976.0, 393859.0, 371929.0, 86638.0, 28870.0, 11612.0, 5134.0, 2510.0, 1264.0, 761.0, 444.0, 263.0, 165.0, 108.0, 77.0, 64.0, 31.0, 38.0, 27.0, 26.0, 17.0, 14.0, 7.0, 8.0, 7.0, 3.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.60986328125, -0.59136962890625, -0.5728759765625, -0.55438232421875, -0.535888671875, -0.51739501953125, -0.4989013671875, -0.48040771484375, -0.4619140625, -0.44342041015625, -0.4249267578125, -0.40643310546875, -0.387939453125, -0.36944580078125, -0.3509521484375, -0.33245849609375, -0.31396484375, -0.29547119140625, -0.2769775390625, -0.25848388671875, -0.239990234375, -0.22149658203125, -0.2030029296875, -0.18450927734375, -0.166015625, -0.14752197265625, -0.1290283203125, -0.11053466796875, -0.092041015625, -0.07354736328125, -0.0550537109375, -0.03656005859375, -0.01806640625, 0.00042724609375, 0.0189208984375, 0.03741455078125, 0.055908203125, 0.07440185546875, 0.0928955078125, 0.11138916015625, 0.1298828125, 0.14837646484375, 0.1668701171875, 0.18536376953125, 0.203857421875, 0.22235107421875, 0.2408447265625, 0.25933837890625, 0.27783203125, 0.29632568359375, 0.3148193359375, 0.33331298828125, 0.351806640625, 0.37030029296875, 0.3887939453125, 0.40728759765625, 0.42578125, 0.44427490234375, 0.4627685546875, 0.48126220703125, 0.499755859375, 0.51824951171875, 0.5367431640625, 0.55523681640625, 0.57373046875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 9.0, 14.0, 41.0, 94.0, 205.0, 225.0, 155.0, 88.0, 52.0, 41.0, 22.0, 22.0, 7.0, 12.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11078447103500366, -0.09978906810283661, -0.08879366517066956, -0.0777982547879219, -0.06680285185575485, -0.0558074489235878, -0.04481203854084015, -0.033816635608673096, -0.022821232676506042, -0.01182582788169384, -0.0008304230868816376, 0.010164983570575714, 0.021160386502742767, 0.03215578943490982, 0.04315119981765747, 0.054146602749824524, 0.06514200568199158, 0.07613740861415863, 0.08713281154632568, 0.09812822192907333, 0.10912362486124039, 0.12011902779340744, 0.1311144381761551, 0.14210984110832214, 0.1531052440404892, 0.16410064697265625, 0.1750960499048233, 0.18609145283699036, 0.1970868706703186, 0.20808225870132446, 0.2190776765346527, 0.23007307946681976, 0.24106848239898682, 0.25206390023231506, 0.2630592882633209, 0.27405470609664917, 0.28505009412765503, 0.2960455119609833, 0.3070409297943115, 0.3180363178253174, 0.32903170585632324, 0.3400271236896515, 0.35102251172065735, 0.3620179295539856, 0.37301331758499146, 0.3840087354183197, 0.39500415325164795, 0.4059995412826538, 0.41699495911598206, 0.4279903769493103, 0.43898576498031616, 0.4499811828136444, 0.46097657084465027, 0.4719719886779785, 0.4829673767089844, 0.4939627945423126, 0.5049582123756409, 0.5159536004066467, 0.5269490480422974, 0.5379444360733032, 0.5489398241043091, 0.5599352121353149, 0.5709306597709656, 0.5819260478019714, 0.5929214358329773]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 4.0, 6.0, 7.0, 7.0, 8.0, 12.0, 13.0, 14.0, 14.0, 14.0, 18.0, 39.0, 28.0, 19.0, 18.0, 34.0, 34.0, 39.0, 33.0, 34.0, 39.0, 36.0, 29.0, 36.0, 45.0, 39.0, 38.0, 33.0, 21.0, 28.0, 24.0, 32.0, 24.0, 28.0, 20.0, 18.0, 15.0, 13.0, 12.0, 8.0, 19.0, 16.0, 11.0, 6.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.11677920818328857, -0.11341586709022522, -0.11005252599716187, -0.10668918490409851, -0.10332584381103516, -0.0999625027179718, -0.09659916907548904, -0.09323582798242569, -0.08987248688936234, -0.08650914579629898, -0.08314580470323563, -0.07978246361017227, -0.07641912996768951, -0.07305578887462616, -0.0696924477815628, -0.06632910668849945, -0.0629657655954361, -0.05960242450237274, -0.05623908340930939, -0.05287574604153633, -0.04951240494847298, -0.04614906385540962, -0.042785726487636566, -0.03942238539457321, -0.03605904430150986, -0.0326957032084465, -0.029332363978028297, -0.025969024747610092, -0.022605683654546738, -0.019242342561483383, -0.015879003331065178, -0.012515664100646973, -0.009152323007583618, -0.005788982845842838, -0.0024256426841020584, 0.0009376974776387215, 0.004301037639379501, 0.007664378732442856, 0.011027717962861061, 0.014391057193279266, 0.01775439828634262, 0.021117739379405975, 0.02448107860982418, 0.027844417840242386, 0.03120775893330574, 0.034571100026369095, 0.03793443739414215, 0.041297778487205505, 0.04466111958026886, 0.048024460673332214, 0.05138780176639557, 0.054751139134168625, 0.05811448022723198, 0.061477821320295334, 0.06484115868806839, 0.06820449978113174, 0.0715678408741951, 0.07493118196725845, 0.07829452306032181, 0.08165786415338516, 0.08502119779586792, 0.08838453888893127, 0.09174787998199463, 0.09511122107505798, 0.09847456216812134]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 10.0, 5.0, 7.0, 8.0, 6.0, 16.0, 15.0, 16.0, 25.0, 14.0, 30.0, 27.0, 24.0, 38.0, 36.0, 44.0, 50.0, 42.0, 49.0, 40.0, 43.0, 43.0, 37.0, 46.0, 37.0, 32.0, 36.0, 27.0, 33.0, 21.0, 21.0, 27.0, 14.0, 17.0, 7.0, 14.0, 10.0, 9.0, 9.0, 11.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-223.75, -217.376953125, -211.00390625, -204.630859375, -198.2578125, -191.884765625, -185.51171875, -179.138671875, -172.765625, -166.392578125, -160.01953125, -153.646484375, -147.2734375, -140.900390625, -134.52734375, -128.154296875, -121.78125, -115.408203125, -109.03515625, -102.662109375, -96.2890625, -89.916015625, -83.54296875, -77.169921875, -70.796875, -64.423828125, -58.05078125, -51.677734375, -45.3046875, -38.931640625, -32.55859375, -26.185546875, -19.8125, -13.439453125, -7.06640625, -0.693359375, 5.6796875, 12.052734375, 18.42578125, 24.798828125, 31.171875, 37.544921875, 43.91796875, 50.291015625, 56.6640625, 63.037109375, 69.41015625, 75.783203125, 82.15625, 88.529296875, 94.90234375, 101.275390625, 107.6484375, 114.021484375, 120.39453125, 126.767578125, 133.140625, 139.513671875, 145.88671875, 152.259765625, 158.6328125, 165.005859375, 171.37890625, 177.751953125, 184.125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 11.0, 11.0, 10.0, 17.0, 25.0, 16.0, 37.0, 28.0, 34.0, 44.0, 52.0, 80.0, 111.0, 176.0, 304.0, 570.0, 1349.0, 3523.0, 11027.0, 44139.0, 279682.0, 586974.0, 91421.0, 19160.0, 5717.0, 2010.0, 819.0, 431.0, 232.0, 136.0, 74.0, 67.0, 51.0, 41.0, 26.0, 29.0, 25.0, 19.0, 19.0, 11.0, 14.0, 13.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-41.71875, -40.49951171875, -39.2802734375, -38.06103515625, -36.841796875, -35.62255859375, -34.4033203125, -33.18408203125, -31.96484375, -30.74560546875, -29.5263671875, -28.30712890625, -27.087890625, -25.86865234375, -24.6494140625, -23.43017578125, -22.2109375, -20.99169921875, -19.7724609375, -18.55322265625, -17.333984375, -16.11474609375, -14.8955078125, -13.67626953125, -12.45703125, -11.23779296875, -10.0185546875, -8.79931640625, -7.580078125, -6.36083984375, -5.1416015625, -3.92236328125, -2.703125, -1.48388671875, -0.2646484375, 0.95458984375, 2.173828125, 3.39306640625, 4.6123046875, 5.83154296875, 7.05078125, 8.27001953125, 9.4892578125, 10.70849609375, 11.927734375, 13.14697265625, 14.3662109375, 15.58544921875, 16.8046875, 18.02392578125, 19.2431640625, 20.46240234375, 21.681640625, 22.90087890625, 24.1201171875, 25.33935546875, 26.55859375, 27.77783203125, 28.9970703125, 30.21630859375, 31.435546875, 32.65478515625, 33.8740234375, 35.09326171875, 36.3125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 8.0, 9.0, 14.0, 14.0, 20.0, 35.0, 49.0, 38.0, 43.0, 67.0, 75.0, 60.0, 2101.0, 96.0, 67.0, 75.0, 57.0, 50.0, 34.0, 37.0, 25.0, 21.0, 9.0, 14.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-328.0, -316.15625, -304.3125, -292.46875, -280.625, -268.78125, -256.9375, -245.09375, -233.25, -221.40625, -209.5625, -197.71875, -185.875, -174.03125, -162.1875, -150.34375, -138.5, -126.65625, -114.8125, -102.96875, -91.125, -79.28125, -67.4375, -55.59375, -43.75, -31.90625, -20.0625, -8.21875, 3.625, 15.46875, 27.3125, 39.15625, 51.0, 62.84375, 74.6875, 86.53125, 98.375, 110.21875, 122.0625, 133.90625, 145.75, 157.59375, 169.4375, 181.28125, 193.125, 204.96875, 216.8125, 228.65625, 240.5, 252.34375, 264.1875, 276.03125, 287.875, 299.71875, 311.5625, 323.40625, 335.25, 347.09375, 358.9375, 370.78125, 382.625, 394.46875, 406.3125, 418.15625, 430.0]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 12.0, 9.0, 15.0, 25.0, 29.0, 46.0, 79.0, 140.0, 236.0, 409.0, 1015.0, 2612.0, 17733.0, 2813542.0, 296379.0, 9680.0, 2055.0, 788.0, 389.0, 210.0, 90.0, 81.0, 40.0, 27.0, 22.0, 12.0, 12.0, 0.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-86.5, -84.154296875, -81.80859375, -79.462890625, -77.1171875, -74.771484375, -72.42578125, -70.080078125, -67.734375, -65.388671875, -63.04296875, -60.697265625, -58.3515625, -56.005859375, -53.66015625, -51.314453125, -48.96875, -46.623046875, -44.27734375, -41.931640625, -39.5859375, -37.240234375, -34.89453125, -32.548828125, -30.203125, -27.857421875, -25.51171875, -23.166015625, -20.8203125, -18.474609375, -16.12890625, -13.783203125, -11.4375, -9.091796875, -6.74609375, -4.400390625, -2.0546875, 0.291015625, 2.63671875, 4.982421875, 7.328125, 9.673828125, 12.01953125, 14.365234375, 16.7109375, 19.056640625, 21.40234375, 23.748046875, 26.09375, 28.439453125, 30.78515625, 33.130859375, 35.4765625, 37.822265625, 40.16796875, 42.513671875, 44.859375, 47.205078125, 49.55078125, 51.896484375, 54.2421875, 56.587890625, 58.93359375, 61.279296875, 63.625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 4.0, 6.0, 18.0, 16.0, 17.0, 67.0, 93.0, 184.0, 192.0, 174.0, 92.0, 49.0, 29.0, 15.0, 11.0, 7.0, 4.0, 4.0, 5.0, 2.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-541.301513671875, -526.8113403320312, -512.3211669921875, -497.83099365234375, -483.3407897949219, -468.8506164550781, -454.3604431152344, -439.8702697753906, -425.38006591796875, -410.889892578125, -396.39971923828125, -381.9095458984375, -367.4193420410156, -352.9291687011719, -338.4389953613281, -323.9488220214844, -309.4586486816406, -294.9684753417969, -280.4783020019531, -265.98809814453125, -251.4979248046875, -237.00775146484375, -222.517578125, -208.02740478515625, -193.53721618652344, -179.0470428466797, -164.55685424804688, -150.06668090820312, -135.57650756835938, -121.08631896972656, -106.59614562988281, -92.10596466064453, -77.61578369140625, -63.12560272216797, -48.63542556762695, -34.14524841308594, -19.655067443847656, -5.164886474609375, 9.325286865234375, 23.815467834472656, 38.30564880371094, 52.79582977294922, 67.2860107421875, 81.77618408203125, 96.26636505126953, 110.75654602050781, 125.24671936035156, 139.73690795898438, 154.22708129882812, 168.71725463867188, 183.2074432373047, 197.69761657714844, 212.18780517578125, 226.677978515625, 241.16815185546875, 255.6583251953125, 270.14849853515625, 284.638671875, 299.12884521484375, 313.6190185546875, 328.1092224121094, 342.5993957519531, 357.0895690917969, 371.5797424316406, 386.0699462890625]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 8.0, 6.0, 13.0, 8.0, 19.0, 24.0, 29.0, 32.0, 31.0, 30.0, 43.0, 44.0, 46.0, 39.0, 57.0, 57.0, 50.0, 43.0, 45.0, 57.0, 32.0, 41.0, 47.0, 26.0, 35.0, 23.0, 24.0, 19.0, 9.0, 13.0, 2.0, 8.0, 6.0, 5.0, 6.0, 3.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-411.3312072753906, -399.6236267089844, -387.9160461425781, -376.2084655761719, -364.5008850097656, -352.7933349609375, -341.08575439453125, -329.378173828125, -317.67059326171875, -305.9630126953125, -294.25543212890625, -282.5478515625, -270.84027099609375, -259.1326904296875, -247.4251251220703, -235.71755981445312, -224.0099639892578, -212.30238342285156, -200.5948028564453, -188.88723754882812, -177.17965698242188, -165.47207641601562, -153.76449584960938, -142.05691528320312, -130.34933471679688, -118.64175415039062, -106.9341812133789, -95.22660064697266, -83.51902770996094, -71.81144714355469, -60.10386657714844, -48.39629364013672, -36.688720703125, -24.981143951416016, -13.273565292358398, -1.5659866333007812, 10.141590118408203, 21.849166870117188, 33.55674743652344, 45.264320373535156, 56.971900939941406, 68.67948150634766, 80.38705444335938, 92.09463500976562, 103.80221557617188, 115.5097885131836, 127.21736907958984, 138.92494201660156, 150.6325225830078, 162.34010314941406, 174.0476837158203, 185.7552490234375, 197.46282958984375, 209.17041015625, 220.87799072265625, 232.5855712890625, 244.29315185546875, 256.000732421875, 267.70831298828125, 279.4158935546875, 291.12347412109375, 302.8310546875, 314.53863525390625, 326.2461853027344, 337.9537658691406]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 7.0, 3.0, 1.0, 8.0, 10.0, 12.0, 15.0, 9.0, 20.0, 24.0, 12.0, 28.0, 23.0, 34.0, 44.0, 55.0, 86.0, 153.0, 302.0, 612.0, 1125.0, 1041124.0, 2352.0, 1047.0, 616.0, 288.0, 151.0, 82.0, 49.0, 48.0, 35.0, 19.0, 26.0, 23.0, 20.0, 15.0, 17.0, 11.0, 8.0, 9.0, 10.0, 4.0, 8.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-183.59390258789062, -178.02786254882812, -172.46182250976562, -166.89578247070312, -161.32974243164062, -155.7637176513672, -150.1976776123047, -144.6316375732422, -139.0655975341797, -133.4995574951172, -127.93351745605469, -122.36748504638672, -116.80144500732422, -111.23540496826172, -105.66937255859375, -100.10333251953125, -94.53729248046875, -88.97125244140625, -83.40521240234375, -77.83917999267578, -72.27313995361328, -66.70709991455078, -61.14106369018555, -55.57502746582031, -50.00898742675781, -44.44294738769531, -38.87691116333008, -33.310874938964844, -27.744834899902344, -22.178796768188477, -16.61275863647461, -11.046722412109375, -5.4806976318359375, 0.08534049987792969, 5.651378631591797, 11.217416763305664, 16.78345489501953, 22.3494930267334, 27.915531158447266, 33.4815673828125, 39.047607421875, 44.6136474609375, 50.179683685302734, 55.74571990966797, 61.31175994873047, 66.87779998779297, 72.44383239746094, 78.00987243652344, 83.57591247558594, 89.14195251464844, 94.70799255371094, 100.2740249633789, 105.8400650024414, 111.4061050415039, 116.97213745117188, 122.53817749023438, 128.10421752929688, 133.67025756835938, 139.23629760742188, 144.80233764648438, 150.36837768554688, 155.9344024658203, 161.5004425048828, 167.0664825439453, 172.6325225830078]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 2.0, 4.0, 8.0, 6.0, 8.0, 14.0, 13.0, 15.0, 28.0, 35.0, 78.0, 349.0, 51441860.0, 20352.0, 273.0, 50.0, 29.0, 17.0, 7.0, 7.0, 6.0, 9.0, 1.0, 7.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2284.1474609375, -2216.785888671875, -2149.424072265625, -2082.0625, -2014.70068359375, -1947.339111328125, -1879.9774169921875, -1812.61572265625, -1745.2540283203125, -1677.892333984375, -1610.5306396484375, -1543.1689453125, -1475.807373046875, -1408.445556640625, -1341.083984375, -1273.7222900390625, -1206.360595703125, -1138.9989013671875, -1071.63720703125, -1004.2755737304688, -936.9138793945312, -869.5521850585938, -802.1905517578125, -734.828857421875, -667.4671630859375, -600.10546875, -532.7437744140625, -465.38214111328125, -398.02044677734375, -330.65875244140625, -263.2970886230469, -195.9354248046875, -128.57373046875, -61.21205139160156, 6.149627685546875, 73.51130676269531, 140.87298583984375, 208.23468017578125, 275.5963439941406, 342.9580078125, 410.3197021484375, 477.681396484375, 545.0430908203125, 612.4047241210938, 679.7664184570312, 747.1281127929688, 814.48974609375, 881.8514404296875, 949.213134765625, 1016.5748291015625, 1083.9365234375, 1151.2982177734375, 1218.659912109375, 1286.021484375, 1353.3831787109375, 1420.744873046875, 1488.1065673828125, 1555.46826171875, 1622.8299560546875, 1690.191650390625, 1757.55322265625, 1824.9150390625, 1892.276611328125, 1959.6383056640625, 2027.0]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 13.0, 29.0, 37.0, 47.0, 80.0, 153.0, 202.0, 307.0, 556.0, 870.0, 1315.0, 1966.0, 3094.0, 4846.0, 7423.0, 11045.0, 17809.0, 28319.0, 45431.0, 73579.0, 125278.0, 219306.0, 390510.0, 1635331.0, 2751805.0, 408674.0, 227935.0, 130027.0, 77588.0, 47348.0, 29040.0, 18273.0, 11620.0, 7698.0, 4893.0, 3057.0, 2082.0, 1341.0, 875.0, 560.0, 358.0, 258.0, 163.0, 105.0, 73.0, 39.0, 29.0, 19.0, 9.0, 9.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.525390625, -3.41180419921875, -3.2982177734375, -3.18463134765625, -3.071044921875, -2.95745849609375, -2.8438720703125, -2.73028564453125, -2.61669921875, -2.50311279296875, -2.3895263671875, -2.27593994140625, -2.162353515625, -2.04876708984375, -1.9351806640625, -1.82159423828125, -1.7080078125, -1.59442138671875, -1.4808349609375, -1.36724853515625, -1.253662109375, -1.14007568359375, -1.0264892578125, -0.91290283203125, -0.79931640625, -0.68572998046875, -0.5721435546875, -0.45855712890625, -0.344970703125, -0.23138427734375, -0.1177978515625, -0.00421142578125, 0.109375, 0.22296142578125, 0.3365478515625, 0.45013427734375, 0.563720703125, 0.67730712890625, 0.7908935546875, 0.90447998046875, 1.01806640625, 1.13165283203125, 1.2452392578125, 1.35882568359375, 1.472412109375, 1.58599853515625, 1.6995849609375, 1.81317138671875, 1.9267578125, 2.04034423828125, 2.1539306640625, 2.26751708984375, 2.381103515625, 2.49468994140625, 2.6082763671875, 2.72186279296875, 2.83544921875, 2.94903564453125, 3.0626220703125, 3.17620849609375, 3.289794921875, 3.40338134765625, 3.5169677734375, 3.63055419921875, 3.744140625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 6.0, 3.0, 6.0, 12.0, 10.0, 11.0, 10.0, 7.0, 11.0, 16.0, 17.0, 14.0, 22.0, 26.0, 30.0, 30.0, 36.0, 24.0, 35.0, 29.0, 41.0, 44.0, 120.0, 955.0, 83.0, 39.0, 28.0, 28.0, 33.0, 41.0, 31.0, 40.0, 29.0, 20.0, 17.0, 13.0, 23.0, 17.0, 13.0, 14.0, 15.0, 4.0, 5.0, 8.0, 4.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.0, -32.71533203125, -31.4306640625, -30.14599609375, -28.861328125, -27.57666015625, -26.2919921875, -25.00732421875, -23.72265625, -22.43798828125, -21.1533203125, -19.86865234375, -18.583984375, -17.29931640625, -16.0146484375, -14.72998046875, -13.4453125, -12.16064453125, -10.8759765625, -9.59130859375, -8.306640625, -7.02197265625, -5.7373046875, -4.45263671875, -3.16796875, -1.88330078125, -0.5986328125, 0.68603515625, 1.970703125, 3.25537109375, 4.5400390625, 5.82470703125, 7.109375, 8.39404296875, 9.6787109375, 10.96337890625, 12.248046875, 13.53271484375, 14.8173828125, 16.10205078125, 17.38671875, 18.67138671875, 19.9560546875, 21.24072265625, 22.525390625, 23.81005859375, 25.0947265625, 26.37939453125, 27.6640625, 28.94873046875, 30.2333984375, 31.51806640625, 32.802734375, 34.08740234375, 35.3720703125, 36.65673828125, 37.94140625, 39.22607421875, 40.5107421875, 41.79541015625, 43.080078125, 44.36474609375, 45.6494140625, 46.93408203125, 48.21875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 10.0, 20.0, 15.0, 30.0, 32.0, 64.0, 95.0, 170.0, 277.0, 479.0, 690.0, 1100.0, 1759.0, 2853.0, 4622.0, 7351.0, 11619.0, 18706.0, 30237.0, 48658.0, 79088.0, 131886.0, 218741.0, 340194.0, 506527.0, 3615205.0, 452069.0, 312398.0, 197273.0, 119950.0, 72053.0, 44687.0, 27303.0, 17087.0, 10303.0, 6690.0, 4244.0, 2609.0, 1678.0, 926.0, 654.0, 408.0, 220.0, 156.0, 109.0, 75.0, 39.0, 32.0, 12.0, 9.0, 8.0, 4.0, 3.0, 2.0, 3.0, 3.0, 3.0], "bins": [-2.775390625, -2.689727783203125, -2.60406494140625, -2.518402099609375, -2.4327392578125, -2.347076416015625, -2.26141357421875, -2.175750732421875, -2.090087890625, -2.004425048828125, -1.91876220703125, -1.833099365234375, -1.7474365234375, -1.661773681640625, -1.57611083984375, -1.490447998046875, -1.40478515625, -1.319122314453125, -1.23345947265625, -1.147796630859375, -1.0621337890625, -0.976470947265625, -0.89080810546875, -0.805145263671875, -0.719482421875, -0.633819580078125, -0.54815673828125, -0.462493896484375, -0.3768310546875, -0.291168212890625, -0.20550537109375, -0.119842529296875, -0.0341796875, 0.051483154296875, 0.13714599609375, 0.222808837890625, 0.3084716796875, 0.394134521484375, 0.47979736328125, 0.565460205078125, 0.651123046875, 0.736785888671875, 0.82244873046875, 0.908111572265625, 0.9937744140625, 1.079437255859375, 1.16510009765625, 1.250762939453125, 1.33642578125, 1.422088623046875, 1.50775146484375, 1.593414306640625, 1.6790771484375, 1.764739990234375, 1.85040283203125, 1.936065673828125, 2.021728515625, 2.107391357421875, 2.19305419921875, 2.278717041015625, 2.3643798828125, 2.450042724609375, 2.53570556640625, 2.621368408203125, 2.70703125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 9.0, 4.0, 5.0, 5.0, 12.0, 9.0, 13.0, 18.0, 22.0, 23.0, 21.0, 28.0, 29.0, 25.0, 34.0, 44.0, 28.0, 33.0, 40.0, 34.0, 125.0, 966.0, 49.0, 36.0, 37.0, 39.0, 41.0, 27.0, 36.0, 25.0, 25.0, 29.0, 23.0, 15.0, 17.0, 12.0, 15.0, 11.0, 13.0, 15.0, 7.0, 9.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-31.125, -30.165283203125, -29.20556640625, -28.245849609375, -27.2861328125, -26.326416015625, -25.36669921875, -24.406982421875, -23.447265625, -22.487548828125, -21.52783203125, -20.568115234375, -19.6083984375, -18.648681640625, -17.68896484375, -16.729248046875, -15.76953125, -14.809814453125, -13.85009765625, -12.890380859375, -11.9306640625, -10.970947265625, -10.01123046875, -9.051513671875, -8.091796875, -7.132080078125, -6.17236328125, -5.212646484375, -4.2529296875, -3.293212890625, -2.33349609375, -1.373779296875, -0.4140625, 0.545654296875, 1.50537109375, 2.465087890625, 3.4248046875, 4.384521484375, 5.34423828125, 6.303955078125, 7.263671875, 8.223388671875, 9.18310546875, 10.142822265625, 11.1025390625, 12.062255859375, 13.02197265625, 13.981689453125, 14.94140625, 15.901123046875, 16.86083984375, 17.820556640625, 18.7802734375, 19.739990234375, 20.69970703125, 21.659423828125, 22.619140625, 23.578857421875, 24.53857421875, 25.498291015625, 26.4580078125, 27.417724609375, 28.37744140625, 29.337158203125, 30.296875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 12.0, 9.0, 7.0, 12.0, 17.0, 25.0, 28.0, 28.0, 51.0, 93.0, 123.0, 188.0, 208.0, 270.0, 397.0, 577.0, 1012.0, 1630.0, 3041.0, 5997.0, 12029.0, 24706.0, 52903.0, 114482.0, 5659354.0, 243140.0, 88709.0, 41753.0, 19955.0, 9637.0, 4693.0, 2520.0, 1286.0, 774.0, 486.0, 364.0, 261.0, 164.0, 143.0, 98.0, 74.0, 52.0, 29.0, 25.0, 21.0, 13.0, 14.0, 14.0, 5.0, 4.0, 3.0, 4.0, 0.0, 3.0], "bins": [-10.3984375, -10.0999755859375, -9.801513671875, -9.5030517578125, -9.20458984375, -8.9061279296875, -8.607666015625, -8.3092041015625, -8.0107421875, -7.7122802734375, -7.413818359375, -7.1153564453125, -6.81689453125, -6.5184326171875, -6.219970703125, -5.9215087890625, -5.623046875, -5.3245849609375, -5.026123046875, -4.7276611328125, -4.42919921875, -4.1307373046875, -3.832275390625, -3.5338134765625, -3.2353515625, -2.9368896484375, -2.638427734375, -2.3399658203125, -2.04150390625, -1.7430419921875, -1.444580078125, -1.1461181640625, -0.84765625, -0.5491943359375, -0.250732421875, 0.0477294921875, 0.34619140625, 0.6446533203125, 0.943115234375, 1.2415771484375, 1.5400390625, 1.8385009765625, 2.136962890625, 2.4354248046875, 2.73388671875, 3.0323486328125, 3.330810546875, 3.6292724609375, 3.927734375, 4.2261962890625, 4.524658203125, 4.8231201171875, 5.12158203125, 5.4200439453125, 5.718505859375, 6.0169677734375, 6.3154296875, 6.6138916015625, 6.912353515625, 7.2108154296875, 7.50927734375, 7.8077392578125, 8.106201171875, 8.4046630859375, 8.703125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 4.0, 3.0, 8.0, 4.0, 8.0, 10.0, 13.0, 12.0, 11.0, 15.0, 13.0, 20.0, 26.0, 28.0, 35.0, 33.0, 28.0, 20.0, 29.0, 36.0, 44.0, 35.0, 566.0, 556.0, 38.0, 32.0, 42.0, 38.0, 29.0, 43.0, 31.0, 35.0, 32.0, 21.0, 20.0, 23.0, 14.0, 14.0, 20.0, 9.0, 7.0, 8.0, 5.0, 5.0, 3.0, 1.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.671875, -21.801513671875, -20.93115234375, -20.060791015625, -19.1904296875, -18.320068359375, -17.44970703125, -16.579345703125, -15.708984375, -14.838623046875, -13.96826171875, -13.097900390625, -12.2275390625, -11.357177734375, -10.48681640625, -9.616455078125, -8.74609375, -7.875732421875, -7.00537109375, -6.135009765625, -5.2646484375, -4.394287109375, -3.52392578125, -2.653564453125, -1.783203125, -0.912841796875, -0.04248046875, 0.827880859375, 1.6982421875, 2.568603515625, 3.43896484375, 4.309326171875, 5.1796875, 6.050048828125, 6.92041015625, 7.790771484375, 8.6611328125, 9.531494140625, 10.40185546875, 11.272216796875, 12.142578125, 13.012939453125, 13.88330078125, 14.753662109375, 15.6240234375, 16.494384765625, 17.36474609375, 18.235107421875, 19.10546875, 19.975830078125, 20.84619140625, 21.716552734375, 22.5869140625, 23.457275390625, 24.32763671875, 25.197998046875, 26.068359375, 26.938720703125, 27.80908203125, 28.679443359375, 29.5498046875, 30.420166015625, 31.29052734375, 32.160888671875, 33.03125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 18.0, 34.0, 78.0, 238.0, 380.0, 157.0, 55.0, 26.0, 9.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.63021850585938, -165.21250915527344, -160.79481506347656, -156.37710571289062, -151.9593963623047, -147.54168701171875, -143.12399291992188, -138.70628356933594, -134.28857421875, -129.87086486816406, -125.45316314697266, -121.03546142578125, -116.61775207519531, -112.2000503540039, -107.7823486328125, -103.36463928222656, -98.94693756103516, -94.52923583984375, -90.11152648925781, -85.6938247680664, -81.27611541748047, -76.85841369628906, -72.44070434570312, -68.02300262451172, -63.60529708862305, -59.187591552734375, -54.7698860168457, -50.35218048095703, -45.934478759765625, -41.51676940917969, -37.09906768798828, -32.68136215209961, -28.263656616210938, -23.845951080322266, -19.428245544433594, -15.010541915893555, -10.592836380004883, -6.175130844116211, -1.7574272155761719, 2.6602783203125, 7.077983856201172, 11.495689392089844, 15.9133939743042, 20.331098556518555, 24.748804092407227, 29.1665096282959, 33.58421325683594, 38.00191879272461, 42.41962432861328, 46.83732986450195, 51.255035400390625, 55.67273712158203, 60.09044647216797, 64.50814819335938, 68.92585754394531, 73.34355926513672, 77.76126098632812, 82.17896270751953, 86.59667205810547, 91.01437377929688, 95.43208312988281, 99.84978485107422, 104.26748657226562, 108.68519592285156, 113.1029052734375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 6.0, 7.0, 7.0, 11.0, 14.0, 14.0, 19.0, 27.0, 17.0, 29.0, 34.0, 39.0, 45.0, 52.0, 40.0, 57.0, 49.0, 55.0, 48.0, 47.0, 40.0, 45.0, 49.0, 29.0, 35.0, 40.0, 28.0, 21.0, 16.0, 11.0, 18.0, 9.0, 13.0, 6.0, 8.0, 7.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-73.93032836914062, -71.72845458984375, -69.5265884399414, -67.32471466064453, -65.12284851074219, -62.92097473144531, -60.71910095214844, -58.51723098754883, -56.31536102294922, -54.11349105834961, -51.91162109375, -49.709747314453125, -47.507877349853516, -45.306007385253906, -43.10413360595703, -40.90226364135742, -38.70039367675781, -36.4985237121582, -34.296653747558594, -32.09477996826172, -29.89291000366211, -27.6910400390625, -25.489168167114258, -23.287296295166016, -21.085426330566406, -18.883556365966797, -16.681684494018555, -14.479813575744629, -12.277942657470703, -10.076071739196777, -7.874200820922852, -5.672329902648926, -3.470458984375, -1.2685880661010742, 0.9332828521728516, 3.1351537704467773, 5.337024688720703, 7.538895606994629, 9.740766525268555, 11.94263744354248, 14.144508361816406, 16.346378326416016, 18.548250198364258, 20.7501220703125, 22.95199203491211, 25.15386199951172, 27.35573387145996, 29.557605743408203, 31.759475708007812, 33.96134567260742, 36.16321563720703, 38.365089416503906, 40.566959381103516, 42.768829345703125, 44.970703125, 47.17257308959961, 49.37444305419922, 51.57631301879883, 53.77818298339844, 55.98005676269531, 58.18192672729492, 60.38379669189453, 62.585670471191406, 64.78753662109375, 66.98941040039062]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 13.0, 11.0, 9.0, 24.0, 17.0, 17.0, 31.0, 54.0, 56.0, 94.0, 120.0, 153.0, 215.0, 302.0, 401.0, 614.0, 1117.0, 1989.0, 4024.0, 10613.0, 46441.0, 3963256.0, 131930.0, 18634.0, 6440.0, 2994.0, 1554.0, 956.0, 573.0, 434.0, 281.0, 196.0, 149.0, 101.0, 101.0, 78.0, 51.0, 56.0, 33.0, 27.0, 17.0, 25.0, 15.0, 10.0, 8.0, 8.0, 11.0, 9.0, 1.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.56640625, -0.5473403930664062, -0.5282745361328125, -0.5092086791992188, -0.490142822265625, -0.47107696533203125, -0.4520111083984375, -0.43294525146484375, -0.41387939453125, -0.39481353759765625, -0.3757476806640625, -0.35668182373046875, -0.337615966796875, -0.31855010986328125, -0.2994842529296875, -0.28041839599609375, -0.2613525390625, -0.24228668212890625, -0.2232208251953125, -0.20415496826171875, -0.185089111328125, -0.16602325439453125, -0.1469573974609375, -0.12789154052734375, -0.10882568359375, -0.08975982666015625, -0.0706939697265625, -0.05162811279296875, -0.032562255859375, -0.01349639892578125, 0.0055694580078125, 0.02463531494140625, 0.043701171875, 0.06276702880859375, 0.0818328857421875, 0.10089874267578125, 0.119964599609375, 0.13903045654296875, 0.1580963134765625, 0.17716217041015625, 0.19622802734375, 0.21529388427734375, 0.2343597412109375, 0.25342559814453125, 0.272491455078125, 0.29155731201171875, 0.3106231689453125, 0.32968902587890625, 0.3487548828125, 0.36782073974609375, 0.3868865966796875, 0.40595245361328125, 0.425018310546875, 0.44408416748046875, 0.4631500244140625, 0.48221588134765625, 0.50128173828125, 0.5203475952148438, 0.5394134521484375, 0.5584793090820312, 0.577545166015625, 0.5966110229492188, 0.6156768798828125, 0.6347427368164062, 0.65380859375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 4.0, 6.0, 2.0, 10.0, 5.0, 7.0, 13.0, 17.0, 14.0, 23.0, 759.0, 24.0, 15.0, 11.0, 12.0, 6.0, 7.0, 8.0, 5.0, 5.0, 7.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.261474609375, -0.25269317626953125, -0.2439117431640625, -0.23513031005859375, -0.226348876953125, -0.21756744384765625, -0.2087860107421875, -0.20000457763671875, -0.19122314453125, -0.18244171142578125, -0.1736602783203125, -0.16487884521484375, -0.156097412109375, -0.14731597900390625, -0.1385345458984375, -0.12975311279296875, -0.1209716796875, -0.11219024658203125, -0.1034088134765625, -0.09462738037109375, -0.085845947265625, -0.07706451416015625, -0.0682830810546875, -0.05950164794921875, -0.05072021484375, -0.04193878173828125, -0.0331573486328125, -0.02437591552734375, -0.015594482421875, -0.00681304931640625, 0.0019683837890625, 0.01074981689453125, 0.01953125, 0.02831268310546875, 0.0370941162109375, 0.04587554931640625, 0.054656982421875, 0.06343841552734375, 0.0722198486328125, 0.08100128173828125, 0.08978271484375, 0.09856414794921875, 0.1073455810546875, 0.11612701416015625, 0.124908447265625, 0.13368988037109375, 0.1424713134765625, 0.15125274658203125, 0.1600341796875, 0.16881561279296875, 0.1775970458984375, 0.18637847900390625, 0.195159912109375, 0.20394134521484375, 0.2127227783203125, 0.22150421142578125, 0.23028564453125, 0.23906707763671875, 0.2478485107421875, 0.25662994384765625, 0.265411376953125, 0.27419281005859375, 0.2829742431640625, 0.29175567626953125, 0.300537109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 2.0, 1.0, 5.0, 9.0, 17.0, 11.0, 16.0, 34.0, 36.0, 71.0, 100.0, 145.0, 228.0, 303.0, 549.0, 892.0, 1734.0, 3424.0, 8993.0, 32504.0, 379314.0, 3632159.0, 103446.0, 18123.0, 5969.0, 2522.0, 1382.0, 795.0, 498.0, 333.0, 221.0, 154.0, 81.0, 55.0, 43.0, 34.0, 19.0, 13.0, 10.0, 7.0, 10.0, 3.0, 3.0, 5.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.662109375, -0.6402511596679688, -0.6183929443359375, -0.5965347290039062, -0.574676513671875, -0.5528182983398438, -0.5309600830078125, -0.5091018676757812, -0.48724365234375, -0.46538543701171875, -0.4435272216796875, -0.42166900634765625, -0.399810791015625, -0.37795257568359375, -0.3560943603515625, -0.33423614501953125, -0.3123779296875, -0.29051971435546875, -0.2686614990234375, -0.24680328369140625, -0.224945068359375, -0.20308685302734375, -0.1812286376953125, -0.15937042236328125, -0.13751220703125, -0.11565399169921875, -0.0937957763671875, -0.07193756103515625, -0.050079345703125, -0.02822113037109375, -0.0063629150390625, 0.01549530029296875, 0.037353515625, 0.05921173095703125, 0.0810699462890625, 0.10292816162109375, 0.124786376953125, 0.14664459228515625, 0.1685028076171875, 0.19036102294921875, 0.21221923828125, 0.23407745361328125, 0.2559356689453125, 0.27779388427734375, 0.299652099609375, 0.32151031494140625, 0.3433685302734375, 0.36522674560546875, 0.3870849609375, 0.40894317626953125, 0.4308013916015625, 0.45265960693359375, 0.474517822265625, 0.49637603759765625, 0.5182342529296875, 0.5400924682617188, 0.56195068359375, 0.5838088989257812, 0.6056671142578125, 0.6275253295898438, 0.649383544921875, 0.6712417602539062, 0.6930999755859375, 0.7149581909179688, 0.73681640625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 9.0, 5.0, 13.0, 9.0, 22.0, 45.0, 62.0, 162.0, 797.0, 2140.0, 514.0, 130.0, 58.0, 37.0, 19.0, 12.0, 6.0, 8.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.4912109375, -0.4760284423828125, -0.460845947265625, -0.4456634521484375, -0.43048095703125, -0.4152984619140625, -0.400115966796875, -0.3849334716796875, -0.3697509765625, -0.3545684814453125, -0.339385986328125, -0.3242034912109375, -0.30902099609375, -0.2938385009765625, -0.278656005859375, -0.2634735107421875, -0.248291015625, -0.2331085205078125, -0.217926025390625, -0.2027435302734375, -0.18756103515625, -0.1723785400390625, -0.157196044921875, -0.1420135498046875, -0.1268310546875, -0.1116485595703125, -0.096466064453125, -0.0812835693359375, -0.06610107421875, -0.0509185791015625, -0.035736083984375, -0.0205535888671875, -0.00537109375, 0.0098114013671875, 0.024993896484375, 0.0401763916015625, 0.05535888671875, 0.0705413818359375, 0.085723876953125, 0.1009063720703125, 0.1160888671875, 0.1312713623046875, 0.146453857421875, 0.1616363525390625, 0.17681884765625, 0.1920013427734375, 0.207183837890625, 0.2223663330078125, 0.237548828125, 0.2527313232421875, 0.267913818359375, 0.2830963134765625, 0.29827880859375, 0.3134613037109375, 0.328643798828125, 0.3438262939453125, 0.3590087890625, 0.3741912841796875, 0.389373779296875, 0.4045562744140625, 0.41973876953125, 0.4349212646484375, 0.450103759765625, 0.4652862548828125, 0.48046875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 8.0, 14.0, 39.0, 115.0, 316.0, 324.0, 117.0, 39.0, 14.0, 6.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6542479991912842, -1.5881787538528442, -1.5221095085144043, -1.4560402631759644, -1.3899710178375244, -1.3239017724990845, -1.2578325271606445, -1.1917634010314941, -1.1256940364837646, -1.0596247911453247, -0.9935555458068848, -0.9274863004684448, -0.8614170551300049, -0.7953478097915649, -0.7292786240577698, -0.6632093787193298, -0.5971401929855347, -0.5310709476470947, -0.4650017023086548, -0.39893248677253723, -0.3328632414340973, -0.26679399609565735, -0.2007247805595398, -0.13465553522109985, -0.06858628988265991, -0.0025170519948005676, 0.06355218589305878, 0.12962141633033752, 0.19569066166877747, 0.2617599070072174, 0.32782912254333496, 0.3938983678817749, 0.45996761322021484, 0.5260368585586548, 0.5921061038970947, 0.6581753492355347, 0.7242445945739746, 0.7903138399124146, 0.8563830256462097, 0.9224522709846497, 0.9885215163230896, 1.0545907020568848, 1.1206599473953247, 1.1867291927337646, 1.2527984380722046, 1.3188676834106445, 1.3849369287490845, 1.4510061740875244, 1.5170754194259644, 1.5831446647644043, 1.6492139101028442, 1.7152831554412842, 1.7813524007797241, 1.847421646118164, 1.9134907722473145, 1.979560136795044, 2.0456292629241943, 2.1116983890533447, 2.177767753601074, 2.2438368797302246, 2.309906244277954, 2.3759753704071045, 2.442044734954834, 2.5081138610839844, 2.574183225631714]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 4.0, 6.0, 5.0, 6.0, 17.0, 7.0, 21.0, 22.0, 24.0, 38.0, 36.0, 48.0, 55.0, 79.0, 64.0, 59.0, 66.0, 77.0, 61.0, 49.0, 43.0, 40.0, 29.0, 18.0, 18.0, 20.0, 14.0, 10.0, 14.0, 13.0, 7.0, 3.0, 11.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0924677848815918, -1.0598351955413818, -1.0272026062011719, -0.9945700764656067, -0.9619375467300415, -0.9293049573898315, -0.8966723680496216, -0.8640397787094116, -0.8314072489738464, -0.7987746596336365, -0.7661421298980713, -0.7335095405578613, -0.7008769512176514, -0.6682444214820862, -0.6356118321418762, -0.602979302406311, -0.5703467130661011, -0.5377141237258911, -0.5050815939903259, -0.47244900465011597, -0.4398164451122284, -0.4071838855743408, -0.37455129623413086, -0.3419187366962433, -0.3092861771583557, -0.27665361762046814, -0.24402104318141937, -0.2113884687423706, -0.17875590920448303, -0.14612334966659546, -0.11349077522754669, -0.08085820078849792, -0.0482257604598999, -0.015593193471431732, 0.017039373517036438, 0.04967194050550461, 0.08230450749397278, 0.11493706703186035, 0.14756964147090912, 0.18020221590995789, 0.21283477544784546, 0.24546733498573303, 0.2780998945236206, 0.31073248386383057, 0.34336504340171814, 0.3759976029396057, 0.4086301922798157, 0.44126275181770325, 0.4738953113555908, 0.5065279006958008, 0.539160430431366, 0.5717930197715759, 0.6044255495071411, 0.6370581388473511, 0.669690728187561, 0.702323317527771, 0.7349558472633362, 0.7675884366035461, 0.8002209663391113, 0.8328535556793213, 0.8654861450195312, 0.8981186747550964, 0.9307512640953064, 0.9633837938308716, 0.9960163831710815]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 9.0, 1.0, 8.0, 11.0, 12.0, 19.0, 20.0, 45.0, 55.0, 94.0, 132.0, 225.0, 301.0, 412.0, 610.0, 884.0, 1380.0, 2053.0, 3015.0, 4951.0, 8374.0, 16038.0, 35675.0, 857250.0, 64900.0, 22650.0, 11574.0, 6562.0, 3926.0, 2469.0, 1567.0, 1032.0, 740.0, 499.0, 352.0, 236.0, 166.0, 87.0, 70.0, 53.0, 41.0, 25.0, 11.0, 14.0, 5.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3798828125, -1.337738037109375, -1.29559326171875, -1.253448486328125, -1.2113037109375, -1.169158935546875, -1.12701416015625, -1.084869384765625, -1.042724609375, -1.000579833984375, -0.95843505859375, -0.916290283203125, -0.8741455078125, -0.832000732421875, -0.78985595703125, -0.747711181640625, -0.70556640625, -0.663421630859375, -0.62127685546875, -0.579132080078125, -0.5369873046875, -0.494842529296875, -0.45269775390625, -0.410552978515625, -0.368408203125, -0.326263427734375, -0.28411865234375, -0.241973876953125, -0.1998291015625, -0.157684326171875, -0.11553955078125, -0.073394775390625, -0.03125, 0.010894775390625, 0.05303955078125, 0.095184326171875, 0.1373291015625, 0.179473876953125, 0.22161865234375, 0.263763427734375, 0.305908203125, 0.348052978515625, 0.39019775390625, 0.432342529296875, 0.4744873046875, 0.516632080078125, 0.55877685546875, 0.600921630859375, 0.64306640625, 0.685211181640625, 0.72735595703125, 0.769500732421875, 0.8116455078125, 0.853790283203125, 0.89593505859375, 0.938079833984375, 0.980224609375, 1.022369384765625, 1.06451416015625, 1.106658935546875, 1.1488037109375, 1.190948486328125, 1.23309326171875, 1.275238037109375, 1.3173828125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 0.0, 4.0, 2.0, 5.0, 9.0, 4.0, 5.0, 10.0, 13.0, 14.0, 20.0, 162.0, 616.0, 25.0, 16.0, 8.0, 14.0, 7.0, 3.0, 10.0, 4.0, 3.0, 6.0, 10.0, 1.0, 3.0, 6.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2418212890625, -0.2333087921142578, -0.22479629516601562, -0.21628379821777344, -0.20777130126953125, -0.19925880432128906, -0.19074630737304688, -0.1822338104248047, -0.1737213134765625, -0.1652088165283203, -0.15669631958007812, -0.14818382263183594, -0.13967132568359375, -0.13115882873535156, -0.12264633178710938, -0.11413383483886719, -0.105621337890625, -0.09710884094238281, -0.08859634399414062, -0.08008384704589844, -0.07157135009765625, -0.06305885314941406, -0.054546356201171875, -0.04603385925292969, -0.0375213623046875, -0.029008865356445312, -0.020496368408203125, -0.011983871459960938, -0.00347137451171875, 0.0050411224365234375, 0.013553619384765625, 0.022066116333007812, 0.03057861328125, 0.03909111022949219, 0.047603607177734375, 0.05611610412597656, 0.06462860107421875, 0.07314109802246094, 0.08165359497070312, 0.09016609191894531, 0.0986785888671875, 0.10719108581542969, 0.11570358276367188, 0.12421607971191406, 0.13272857666015625, 0.14124107360839844, 0.14975357055664062, 0.1582660675048828, 0.166778564453125, 0.1752910614013672, 0.18380355834960938, 0.19231605529785156, 0.20082855224609375, 0.20934104919433594, 0.21785354614257812, 0.2263660430908203, 0.2348785400390625, 0.2433910369873047, 0.2519035339355469, 0.26041603088378906, 0.26892852783203125, 0.27744102478027344, 0.2859535217285156, 0.2944660186767578, 0.302978515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 10.0, 14.0, 17.0, 25.0, 30.0, 33.0, 48.0, 63.0, 92.0, 127.0, 196.0, 260.0, 436.0, 636.0, 1249.0, 2555.0, 5588.0, 13293.0, 35240.0, 106623.0, 366738.0, 353034.0, 103668.0, 34334.0, 13083.0, 5448.0, 2427.0, 1256.0, 707.0, 434.0, 247.0, 156.0, 118.0, 95.0, 68.0, 67.0, 41.0, 26.0, 21.0, 14.0, 16.0, 8.0, 2.0, 8.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73779296875, -0.71234130859375, -0.6868896484375, -0.66143798828125, -0.635986328125, -0.61053466796875, -0.5850830078125, -0.55963134765625, -0.5341796875, -0.50872802734375, -0.4832763671875, -0.45782470703125, -0.432373046875, -0.40692138671875, -0.3814697265625, -0.35601806640625, -0.33056640625, -0.30511474609375, -0.2796630859375, -0.25421142578125, -0.228759765625, -0.20330810546875, -0.1778564453125, -0.15240478515625, -0.126953125, -0.10150146484375, -0.0760498046875, -0.05059814453125, -0.025146484375, 0.00030517578125, 0.0257568359375, 0.05120849609375, 0.07666015625, 0.10211181640625, 0.1275634765625, 0.15301513671875, 0.178466796875, 0.20391845703125, 0.2293701171875, 0.25482177734375, 0.2802734375, 0.30572509765625, 0.3311767578125, 0.35662841796875, 0.382080078125, 0.40753173828125, 0.4329833984375, 0.45843505859375, 0.48388671875, 0.50933837890625, 0.5347900390625, 0.56024169921875, 0.585693359375, 0.61114501953125, 0.6365966796875, 0.66204833984375, 0.6875, 0.71295166015625, 0.7384033203125, 0.76385498046875, 0.789306640625, 0.81475830078125, 0.8402099609375, 0.86566162109375, 0.89111328125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 8.0, 4.0, 4.0, 9.0, 9.0, 22.0, 15.0, 8.0, 16.0, 14.0, 20.0, 31.0, 26.0, 26.0, 31.0, 25.0, 33.0, 32.0, 31.0, 39.0, 29.0, 34.0, 37.0, 33.0, 38.0, 34.0, 35.0, 26.0, 34.0, 21.0, 33.0, 36.0, 30.0, 24.0, 20.0, 28.0, 18.0, 9.0, 14.0, 9.0, 11.0, 8.0, 6.0, 8.0, 6.0, 8.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.8662109375, -0.8380355834960938, -0.8098602294921875, -0.7816848754882812, -0.753509521484375, -0.7253341674804688, -0.6971588134765625, -0.6689834594726562, -0.64080810546875, -0.6126327514648438, -0.5844573974609375, -0.5562820434570312, -0.528106689453125, -0.49993133544921875, -0.4717559814453125, -0.44358062744140625, -0.4154052734375, -0.38722991943359375, -0.3590545654296875, -0.33087921142578125, -0.302703857421875, -0.27452850341796875, -0.2463531494140625, -0.21817779541015625, -0.19000244140625, -0.16182708740234375, -0.1336517333984375, -0.10547637939453125, -0.077301025390625, -0.04912567138671875, -0.0209503173828125, 0.00722503662109375, 0.035400390625, 0.06357574462890625, 0.0917510986328125, 0.11992645263671875, 0.148101806640625, 0.17627716064453125, 0.2044525146484375, 0.23262786865234375, 0.26080322265625, 0.28897857666015625, 0.3171539306640625, 0.34532928466796875, 0.373504638671875, 0.40167999267578125, 0.4298553466796875, 0.45803070068359375, 0.4862060546875, 0.5143814086914062, 0.5425567626953125, 0.5707321166992188, 0.598907470703125, 0.6270828247070312, 0.6552581787109375, 0.6834335327148438, 0.71160888671875, 0.7397842407226562, 0.7679595947265625, 0.7961349487304688, 0.824310302734375, 0.8524856567382812, 0.8806610107421875, 0.9088363647460938, 0.93701171875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 7.0, 2.0, 5.0, 4.0, 6.0, 13.0, 15.0, 18.0, 24.0, 39.0, 56.0, 52.0, 103.0, 138.0, 212.0, 374.0, 641.0, 1137.0, 2883.0, 8051.0, 41367.0, 814926.0, 154539.0, 15740.0, 4335.0, 1757.0, 826.0, 467.0, 286.0, 188.0, 95.0, 76.0, 42.0, 36.0, 22.0, 22.0, 13.0, 12.0, 6.0, 8.0, 4.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.99560546875, -0.9597091674804688, -0.9238128662109375, -0.8879165649414062, -0.852020263671875, -0.8161239624023438, -0.7802276611328125, -0.7443313598632812, -0.70843505859375, -0.6725387573242188, -0.6366424560546875, -0.6007461547851562, -0.564849853515625, -0.5289535522460938, -0.4930572509765625, -0.45716094970703125, -0.4212646484375, -0.38536834716796875, -0.3494720458984375, -0.31357574462890625, -0.277679443359375, -0.24178314208984375, -0.2058868408203125, -0.16999053955078125, -0.13409423828125, -0.09819793701171875, -0.0623016357421875, -0.02640533447265625, 0.009490966796875, 0.04538726806640625, 0.0812835693359375, 0.11717987060546875, 0.153076171875, 0.18897247314453125, 0.2248687744140625, 0.26076507568359375, 0.296661376953125, 0.33255767822265625, 0.3684539794921875, 0.40435028076171875, 0.44024658203125, 0.47614288330078125, 0.5120391845703125, 0.5479354858398438, 0.583831787109375, 0.6197280883789062, 0.6556243896484375, 0.6915206909179688, 0.7274169921875, 0.7633132934570312, 0.7992095947265625, 0.8351058959960938, 0.871002197265625, 0.9068984985351562, 0.9427947998046875, 0.9786911010742188, 1.01458740234375, 1.0504837036132812, 1.0863800048828125, 1.1222763061523438, 1.158172607421875, 1.1940689086914062, 1.2299652099609375, 1.2658615112304688, 1.3017578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 1.0, 5.0, 6.0, 10.0, 18.0, 15.0, 27.0, 33.0, 56.0, 66.0, 83.0, 93.0, 96.0, 120.0, 98.0, 85.0, 55.0, 33.0, 27.0, 23.0, 15.0, 6.0, 6.0, 8.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.765127182006836e-05, -6.594602018594742e-05, -6.424076855182648e-05, -6.253551691770554e-05, -6.0830265283584595e-05, -5.9125013649463654e-05, -5.741976201534271e-05, -5.571451038122177e-05, -5.400925874710083e-05, -5.230400711297989e-05, -5.059875547885895e-05, -4.8893503844738007e-05, -4.7188252210617065e-05, -4.5483000576496124e-05, -4.377774894237518e-05, -4.207249730825424e-05, -4.03672456741333e-05, -3.866199404001236e-05, -3.695674240589142e-05, -3.525149077177048e-05, -3.3546239137649536e-05, -3.1840987503528595e-05, -3.0135735869407654e-05, -2.8430484235286713e-05, -2.672523260116577e-05, -2.501998096704483e-05, -2.331472933292389e-05, -2.1609477698802948e-05, -1.9904226064682007e-05, -1.8198974430561066e-05, -1.6493722796440125e-05, -1.4788471162319183e-05, -1.3083219528198242e-05, -1.1377967894077301e-05, -9.67271625995636e-06, -7.967464625835419e-06, -6.2622129917144775e-06, -4.556961357593536e-06, -2.8517097234725952e-06, -1.146458089351654e-06, 5.587935447692871e-07, 2.2640451788902283e-06, 3.9692968130111694e-06, 5.674548447132111e-06, 7.379800081253052e-06, 9.085051715373993e-06, 1.0790303349494934e-05, 1.2495554983615875e-05, 1.4200806617736816e-05, 1.5906058251857758e-05, 1.76113098859787e-05, 1.931656152009964e-05, 2.102181315422058e-05, 2.2727064788341522e-05, 2.4432316422462463e-05, 2.6137568056583405e-05, 2.7842819690704346e-05, 2.9548071324825287e-05, 3.125332295894623e-05, 3.295857459306717e-05, 3.466382622718811e-05, 3.636907786130905e-05, 3.807432949542999e-05, 3.9779581129550934e-05, 4.1484832763671875e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 10.0, 6.0, 5.0, 18.0, 34.0, 19.0, 66.0, 83.0, 131.0, 216.0, 338.0, 667.0, 1204.0, 2546.0, 5680.0, 16447.0, 93561.0, 799687.0, 99189.0, 17108.0, 5954.0, 2554.0, 1338.0, 679.0, 359.0, 219.0, 149.0, 93.0, 61.0, 29.0, 20.0, 14.0, 19.0, 11.0, 13.0, 7.0, 8.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.158203125, -1.1161041259765625, -1.074005126953125, -1.0319061279296875, -0.98980712890625, -0.9477081298828125, -0.905609130859375, -0.8635101318359375, -0.8214111328125, -0.7793121337890625, -0.737213134765625, -0.6951141357421875, -0.65301513671875, -0.6109161376953125, -0.568817138671875, -0.5267181396484375, -0.484619140625, -0.4425201416015625, -0.400421142578125, -0.3583221435546875, -0.31622314453125, -0.2741241455078125, -0.232025146484375, -0.1899261474609375, -0.1478271484375, -0.1057281494140625, -0.063629150390625, -0.0215301513671875, 0.02056884765625, 0.0626678466796875, 0.104766845703125, 0.1468658447265625, 0.18896484375, 0.2310638427734375, 0.273162841796875, 0.3152618408203125, 0.35736083984375, 0.3994598388671875, 0.441558837890625, 0.4836578369140625, 0.5257568359375, 0.5678558349609375, 0.609954833984375, 0.6520538330078125, 0.69415283203125, 0.7362518310546875, 0.778350830078125, 0.8204498291015625, 0.862548828125, 0.9046478271484375, 0.946746826171875, 0.9888458251953125, 1.03094482421875, 1.0730438232421875, 1.115142822265625, 1.1572418212890625, 1.1993408203125, 1.2414398193359375, 1.283538818359375, 1.3256378173828125, 1.36773681640625, 1.4098358154296875, 1.451934814453125, 1.4940338134765625, 1.5361328125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 1.0, 7.0, 6.0, 8.0, 8.0, 7.0, 12.0, 26.0, 21.0, 44.0, 66.0, 63.0, 102.0, 115.0, 104.0, 114.0, 60.0, 49.0, 39.0, 39.0, 16.0, 17.0, 19.0, 5.0, 11.0, 8.0, 4.0, 4.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.4140625, -1.3710784912109375, -1.328094482421875, -1.2851104736328125, -1.24212646484375, -1.1991424560546875, -1.156158447265625, -1.1131744384765625, -1.0701904296875, -1.0272064208984375, -0.984222412109375, -0.9412384033203125, -0.89825439453125, -0.8552703857421875, -0.812286376953125, -0.7693023681640625, -0.726318359375, -0.6833343505859375, -0.640350341796875, -0.5973663330078125, -0.55438232421875, -0.5113983154296875, -0.468414306640625, -0.4254302978515625, -0.3824462890625, -0.3394622802734375, -0.296478271484375, -0.2534942626953125, -0.21051025390625, -0.1675262451171875, -0.124542236328125, -0.0815582275390625, -0.03857421875, 0.0044097900390625, 0.047393798828125, 0.0903778076171875, 0.13336181640625, 0.1763458251953125, 0.219329833984375, 0.2623138427734375, 0.3052978515625, 0.3482818603515625, 0.391265869140625, 0.4342498779296875, 0.47723388671875, 0.5202178955078125, 0.563201904296875, 0.6061859130859375, 0.649169921875, 0.6921539306640625, 0.735137939453125, 0.7781219482421875, 0.82110595703125, 0.8640899658203125, 0.907073974609375, 0.9500579833984375, 0.9930419921875, 1.0360260009765625, 1.079010009765625, 1.1219940185546875, 1.16497802734375, 1.2079620361328125, 1.250946044921875, 1.2939300537109375, 1.3369140625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 16.0, 28.0, 144.0, 483.0, 228.0, 59.0, 20.0, 9.0, 7.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.70941925048828, -16.927597045898438, -16.145774841308594, -15.363953590393066, -14.582131385803223, -13.800310134887695, -13.018487930297852, -12.236665725708008, -11.454843521118164, -10.67302131652832, -9.891200065612793, -9.10937786102295, -8.327555656433105, -7.54573392868042, -6.763912200927734, -5.982089996337891, -5.200268745422363, -4.418447017669678, -3.636624813079834, -2.8548030853271484, -2.072981119155884, -1.2911591529846191, -0.5093374252319336, 0.27248477935791016, 1.0543065071105957, 1.8361284732818604, 2.617950439453125, 3.3997721672058105, 4.181593894958496, 4.96341609954834, 5.745237827301025, 6.527060031890869, 7.308881759643555, 8.090703964233398, 8.872525215148926, 9.65434741973877, 10.436169624328613, 11.21799087524414, 11.999813079833984, 12.781635284423828, 13.563457489013672, 14.345279693603516, 15.127100944519043, 15.908923149108887, 16.690744400024414, 17.472566604614258, 18.2543888092041, 19.036211013793945, 19.818031311035156, 20.599853515625, 21.381675720214844, 22.163497924804688, 22.9453182220459, 23.727140426635742, 24.508962631225586, 25.29078483581543, 26.072607040405273, 26.854429244995117, 27.63625144958496, 28.418071746826172, 29.199893951416016, 29.98171615600586, 30.763538360595703, 31.545360565185547, 32.32718276977539]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 6.0, 9.0, 10.0, 6.0, 6.0, 12.0, 17.0, 24.0, 43.0, 71.0, 73.0, 121.0, 111.0, 95.0, 97.0, 73.0, 61.0, 39.0, 15.0, 25.0, 11.0, 10.0, 6.0, 4.0, 6.0, 7.0, 2.0, 4.0, 3.0, 2.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-15.543840408325195, -15.022405624389648, -14.500970840454102, -13.979536056518555, -13.458101272583008, -12.936666488647461, -12.415230751037598, -11.89379596710205, -11.372361183166504, -10.850926399230957, -10.32949161529541, -9.808056831359863, -9.28662109375, -8.765186309814453, -8.243751525878906, -7.722316741943359, -7.2008819580078125, -6.679447174072266, -6.158012390136719, -5.636577129364014, -5.115142345428467, -4.59370756149292, -4.072272300720215, -3.550837516784668, -3.029402732849121, -2.507967948913574, -1.9865329265594482, -1.4650980234146118, -0.9436631202697754, -0.4222283363342285, 0.09920668601989746, 0.6206417083740234, 1.1420783996582031, 1.6635133028030396, 2.184948205947876, 2.706383228302002, 3.227818012237549, 3.7492527961730957, 4.270688056945801, 4.792122840881348, 5.3135576248168945, 5.834992408752441, 6.356427192687988, 6.877862453460693, 7.39929723739624, 7.920732021331787, 8.442167282104492, 8.963602066040039, 9.485036849975586, 10.006471633911133, 10.52790641784668, 11.049341201782227, 11.570775985717773, 12.09221076965332, 12.613646507263184, 13.13508129119873, 13.656516075134277, 14.177950859069824, 14.699385643005371, 15.220820426940918, 15.742256164550781, 16.263690948486328, 16.785125732421875, 17.306560516357422, 17.82799530029297]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 5.0, 10.0, 14.0, 21.0, 20.0, 40.0, 54.0, 86.0, 98.0, 172.0, 278.0, 393.0, 718.0, 1172.0, 2013.0, 3684.0, 7468.0, 18054.0, 66999.0, 3765508.0, 261350.0, 36599.0, 13686.0, 6860.0, 3580.0, 2055.0, 1211.0, 821.0, 450.0, 281.0, 198.0, 120.0, 93.0, 47.0, 42.0, 25.0, 23.0, 12.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.9609375, -1.9028778076171875, -1.844818115234375, -1.7867584228515625, -1.72869873046875, -1.6706390380859375, -1.612579345703125, -1.5545196533203125, -1.4964599609375, -1.4384002685546875, -1.380340576171875, -1.3222808837890625, -1.26422119140625, -1.2061614990234375, -1.148101806640625, -1.0900421142578125, -1.031982421875, -0.9739227294921875, -0.915863037109375, -0.8578033447265625, -0.79974365234375, -0.7416839599609375, -0.683624267578125, -0.6255645751953125, -0.5675048828125, -0.5094451904296875, -0.451385498046875, -0.3933258056640625, -0.33526611328125, -0.2772064208984375, -0.219146728515625, -0.1610870361328125, -0.10302734375, -0.0449676513671875, 0.013092041015625, 0.0711517333984375, 0.12921142578125, 0.1872711181640625, 0.245330810546875, 0.3033905029296875, 0.3614501953125, 0.4195098876953125, 0.477569580078125, 0.5356292724609375, 0.59368896484375, 0.6517486572265625, 0.709808349609375, 0.7678680419921875, 0.825927734375, 0.8839874267578125, 0.942047119140625, 1.0001068115234375, 1.05816650390625, 1.1162261962890625, 1.174285888671875, 1.2323455810546875, 1.2904052734375, 1.3484649658203125, 1.406524658203125, 1.4645843505859375, 1.52264404296875, 1.5807037353515625, 1.638763427734375, 1.6968231201171875, 1.7548828125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 7.0, 4.0, 0.0, 4.0, 9.0, 10.0, 9.0, 9.0, 12.0, 28.0, 51.0, 145.0, 270.0, 214.0, 77.0, 37.0, 20.0, 10.0, 7.0, 11.0, 7.0, 7.0, 5.0, 5.0, 4.0, 5.0, 5.0, 4.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.2041015625, -0.1980915069580078, -0.19208145141601562, -0.18607139587402344, -0.18006134033203125, -0.17405128479003906, -0.16804122924804688, -0.1620311737060547, -0.1560211181640625, -0.1500110626220703, -0.14400100708007812, -0.13799095153808594, -0.13198089599609375, -0.12597084045410156, -0.11996078491210938, -0.11395072937011719, -0.107940673828125, -0.10193061828613281, -0.09592056274414062, -0.08991050720214844, -0.08390045166015625, -0.07789039611816406, -0.07188034057617188, -0.06587028503417969, -0.0598602294921875, -0.05385017395019531, -0.047840118408203125, -0.04183006286621094, -0.03582000732421875, -0.029809951782226562, -0.023799896240234375, -0.017789840698242188, -0.01177978515625, -0.0057697296142578125, 0.000240325927734375, 0.0062503814697265625, 0.01226043701171875, 0.018270492553710938, 0.024280548095703125, 0.030290603637695312, 0.0363006591796875, 0.04231071472167969, 0.048320770263671875, 0.05433082580566406, 0.06034088134765625, 0.06635093688964844, 0.07236099243164062, 0.07837104797363281, 0.084381103515625, 0.09039115905761719, 0.09640121459960938, 0.10241127014160156, 0.10842132568359375, 0.11443138122558594, 0.12044143676757812, 0.1264514923095703, 0.1324615478515625, 0.1384716033935547, 0.14448165893554688, 0.15049171447753906, 0.15650177001953125, 0.16251182556152344, 0.16852188110351562, 0.1745319366455078, 0.1805419921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 5.0, 4.0, 7.0, 8.0, 13.0, 12.0, 24.0, 33.0, 45.0, 55.0, 96.0, 132.0, 185.0, 340.0, 601.0, 1042.0, 2229.0, 5329.0, 15178.0, 57765.0, 580572.0, 3356868.0, 131879.0, 26991.0, 8156.0, 3301.0, 1484.0, 788.0, 404.0, 235.0, 161.0, 108.0, 60.0, 45.0, 33.0, 30.0, 17.0, 11.0, 10.0, 11.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.091796875, -1.0531158447265625, -1.014434814453125, -0.9757537841796875, -0.93707275390625, -0.8983917236328125, -0.859710693359375, -0.8210296630859375, -0.7823486328125, -0.7436676025390625, -0.704986572265625, -0.6663055419921875, -0.62762451171875, -0.5889434814453125, -0.550262451171875, -0.5115814208984375, -0.472900390625, -0.4342193603515625, -0.395538330078125, -0.3568572998046875, -0.31817626953125, -0.2794952392578125, -0.240814208984375, -0.2021331787109375, -0.1634521484375, -0.1247711181640625, -0.086090087890625, -0.0474090576171875, -0.00872802734375, 0.0299530029296875, 0.068634033203125, 0.1073150634765625, 0.14599609375, 0.1846771240234375, 0.223358154296875, 0.2620391845703125, 0.30072021484375, 0.3394012451171875, 0.378082275390625, 0.4167633056640625, 0.4554443359375, 0.4941253662109375, 0.532806396484375, 0.5714874267578125, 0.61016845703125, 0.6488494873046875, 0.687530517578125, 0.7262115478515625, 0.764892578125, 0.8035736083984375, 0.842254638671875, 0.8809356689453125, 0.91961669921875, 0.9582977294921875, 0.996978759765625, 1.0356597900390625, 1.0743408203125, 1.1130218505859375, 1.151702880859375, 1.1903839111328125, 1.22906494140625, 1.2677459716796875, 1.306427001953125, 1.3451080322265625, 1.3837890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 11.0, 7.0, 11.0, 14.0, 15.0, 31.0, 28.0, 41.0, 56.0, 92.0, 150.0, 462.0, 1523.0, 806.0, 331.0, 161.0, 85.0, 56.0, 36.0, 41.0, 23.0, 21.0, 10.0, 15.0, 10.0, 4.0, 3.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.275146484375, -0.2669963836669922, -0.2588462829589844, -0.25069618225097656, -0.24254608154296875, -0.23439598083496094, -0.22624588012695312, -0.2180957794189453, -0.2099456787109375, -0.2017955780029297, -0.19364547729492188, -0.18549537658691406, -0.17734527587890625, -0.16919517517089844, -0.16104507446289062, -0.1528949737548828, -0.144744873046875, -0.1365947723388672, -0.12844467163085938, -0.12029457092285156, -0.11214447021484375, -0.10399436950683594, -0.09584426879882812, -0.08769416809082031, -0.0795440673828125, -0.07139396667480469, -0.06324386596679688, -0.05509376525878906, -0.04694366455078125, -0.03879356384277344, -0.030643463134765625, -0.022493362426757812, -0.01434326171875, -0.0061931610107421875, 0.001956939697265625, 0.010107040405273438, 0.01825714111328125, 0.026407241821289062, 0.034557342529296875, 0.04270744323730469, 0.0508575439453125, 0.05900764465332031, 0.06715774536132812, 0.07530784606933594, 0.08345794677734375, 0.09160804748535156, 0.09975814819335938, 0.10790824890136719, 0.116058349609375, 0.12420845031738281, 0.13235855102539062, 0.14050865173339844, 0.14865875244140625, 0.15680885314941406, 0.16495895385742188, 0.1731090545654297, 0.1812591552734375, 0.1894092559814453, 0.19755935668945312, 0.20570945739746094, 0.21385955810546875, 0.22200965881347656, 0.23015975952148438, 0.2383098602294922, 0.2464599609375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 32.0, 344.0, 486.0, 92.0, 14.0, 9.0, 8.0, 4.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.371602535247803, -5.226481914520264, -5.081361293792725, -4.936240196228027, -4.791119575500488, -4.645998954772949, -4.50087833404541, -4.355757713317871, -4.210637092590332, -4.065516471862793, -3.920395612716675, -3.7752749919891357, -3.6301541328430176, -3.4850335121154785, -3.3399128913879395, -3.1947922706604004, -3.049671173095703, -2.904550552368164, -2.759429693222046, -2.614309072494507, -2.4691882133483887, -2.3240675926208496, -2.1789469718933105, -2.0338263511657715, -1.8887054920196533, -1.7435847520828247, -1.598464012145996, -1.453343391418457, -1.3082226514816284, -1.1631019115447998, -1.0179812908172607, -0.8728605508804321, -0.7277393341064453, -0.5826185941696167, -0.43749791383743286, -0.29237720370292664, -0.1472564935684204, -0.002135753631591797, 0.14298492670059204, 0.2881056070327759, 0.4332263469696045, 0.5783470869064331, 0.7234677672386169, 0.8685884475708008, 1.0137091875076294, 1.158829927444458, 1.303950548171997, 1.4490712881088257, 1.5941920280456543, 1.739312767982483, 1.8844335079193115, 2.0295541286468506, 2.1746749877929688, 2.319795608520508, 2.464916229248047, 2.610036849975586, 2.755157709121704, 2.900278329849243, 3.0453991889953613, 3.1905198097229004, 3.3356404304504395, 3.4807612895965576, 3.6258819103240967, 3.771002769470215, 3.916123390197754]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 13.0, 9.0, 8.0, 25.0, 17.0, 28.0, 30.0, 43.0, 60.0, 63.0, 69.0, 66.0, 79.0, 75.0, 64.0, 56.0, 60.0, 39.0, 49.0, 31.0, 28.0, 22.0, 13.0, 14.0, 9.0, 5.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4345269203186035, -1.3878427743911743, -1.3411585092544556, -1.2944743633270264, -1.2477902173995972, -1.201106071472168, -1.1544218063354492, -1.10773766040802, -1.0610535144805908, -1.0143693685531616, -0.9676851630210876, -0.9210009574890137, -0.8743168115615845, -0.8276326060295105, -0.7809484004974365, -0.7342642545700073, -0.6875800490379333, -0.6408958435058594, -0.5942116975784302, -0.5475274920463562, -0.500843346118927, -0.454159140586853, -0.40747496485710144, -0.36079078912734985, -0.31410661339759827, -0.2674224376678467, -0.2207382619380951, -0.1740540713071823, -0.12736989557743073, -0.08068571984767914, -0.03400152921676636, 0.01268264651298523, 0.059366822242736816, 0.1060509979724884, 0.15273517370224, 0.19941936433315277, 0.24610354006290436, 0.29278773069381714, 0.3394719064235687, 0.3861560821533203, 0.4328402578830719, 0.4795244336128235, 0.5262086391448975, 0.5728927850723267, 0.6195769906044006, 0.6662611365318298, 0.7129453420639038, 0.759629487991333, 0.806313693523407, 0.852997899055481, 0.8996820449829102, 0.9463662505149841, 0.9930503964424133, 1.0397346019744873, 1.0864187479019165, 1.1331028938293457, 1.1797871589660645, 1.2264713048934937, 1.2731555700302124, 1.3198397159576416, 1.3665238618850708, 1.4132080078125, 1.4598922729492188, 1.506576418876648, 1.5532605648040771]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 4.0, 6.0, 7.0, 11.0, 22.0, 36.0, 47.0, 65.0, 91.0, 149.0, 205.0, 339.0, 487.0, 662.0, 1020.0, 1659.0, 2344.0, 3585.0, 5686.0, 9206.0, 17101.0, 41404.0, 332349.0, 528745.0, 55804.0, 19354.0, 10292.0, 6136.0, 3869.0, 2615.0, 1760.0, 1158.0, 736.0, 497.0, 373.0, 220.0, 176.0, 112.0, 70.0, 47.0, 39.0, 18.0, 12.0, 6.0, 9.0, 6.0, 5.0, 7.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.0556640625, -1.0227813720703125, -0.989898681640625, -0.9570159912109375, -0.92413330078125, -0.8912506103515625, -0.858367919921875, -0.8254852294921875, -0.7926025390625, -0.7597198486328125, -0.726837158203125, -0.6939544677734375, -0.66107177734375, -0.6281890869140625, -0.595306396484375, -0.5624237060546875, -0.529541015625, -0.4966583251953125, -0.463775634765625, -0.4308929443359375, -0.39801025390625, -0.3651275634765625, -0.332244873046875, -0.2993621826171875, -0.2664794921875, -0.2335968017578125, -0.200714111328125, -0.1678314208984375, -0.13494873046875, -0.1020660400390625, -0.069183349609375, -0.0363006591796875, -0.00341796875, 0.0294647216796875, 0.062347412109375, 0.0952301025390625, 0.12811279296875, 0.1609954833984375, 0.193878173828125, 0.2267608642578125, 0.2596435546875, 0.2925262451171875, 0.325408935546875, 0.3582916259765625, 0.39117431640625, 0.4240570068359375, 0.456939697265625, 0.4898223876953125, 0.522705078125, 0.5555877685546875, 0.588470458984375, 0.6213531494140625, 0.65423583984375, 0.6871185302734375, 0.720001220703125, 0.7528839111328125, 0.7857666015625, 0.8186492919921875, 0.851531982421875, 0.8844146728515625, 0.91729736328125, 0.9501800537109375, 0.983062744140625, 1.0159454345703125, 1.048828125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 2.0, 3.0, 7.0, 13.0, 3.0, 12.0, 17.0, 19.0, 49.0, 132.0, 192.0, 188.0, 140.0, 77.0, 36.0, 16.0, 17.0, 6.0, 8.0, 3.0, 9.0, 3.0, 4.0, 3.0, 4.0, 2.0, 5.0, 2.0, 4.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.1898193359375, -0.18430709838867188, -0.17879486083984375, -0.17328262329101562, -0.1677703857421875, -0.16225814819335938, -0.15674591064453125, -0.15123367309570312, -0.145721435546875, -0.14020919799804688, -0.13469696044921875, -0.12918472290039062, -0.1236724853515625, -0.11816024780273438, -0.11264801025390625, -0.10713577270507812, -0.10162353515625, -0.09611129760742188, -0.09059906005859375, -0.08508682250976562, -0.0795745849609375, -0.07406234741210938, -0.06855010986328125, -0.06303787231445312, -0.057525634765625, -0.052013397216796875, -0.04650115966796875, -0.040988922119140625, -0.0354766845703125, -0.029964447021484375, -0.02445220947265625, -0.018939971923828125, -0.013427734375, -0.007915496826171875, -0.00240325927734375, 0.003108978271484375, 0.0086212158203125, 0.014133453369140625, 0.01964569091796875, 0.025157928466796875, 0.030670166015625, 0.036182403564453125, 0.04169464111328125, 0.047206878662109375, 0.0527191162109375, 0.058231353759765625, 0.06374359130859375, 0.06925582885742188, 0.07476806640625, 0.08028030395507812, 0.08579254150390625, 0.09130477905273438, 0.0968170166015625, 0.10232925415039062, 0.10784149169921875, 0.11335372924804688, 0.118865966796875, 0.12437820434570312, 0.12989044189453125, 0.13540267944335938, 0.1409149169921875, 0.14642715454101562, 0.15193939208984375, 0.15745162963867188, 0.1629638671875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 6.0, 19.0, 41.0, 92.0, 402.0, 1458.0, 15261.0, 596680.0, 422476.0, 10426.0, 1197.0, 319.0, 106.0, 30.0, 19.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.876953125, -2.789642333984375, -2.70233154296875, -2.615020751953125, -2.5277099609375, -2.440399169921875, -2.35308837890625, -2.265777587890625, -2.178466796875, -2.091156005859375, -2.00384521484375, -1.916534423828125, -1.8292236328125, -1.741912841796875, -1.65460205078125, -1.567291259765625, -1.47998046875, -1.392669677734375, -1.30535888671875, -1.218048095703125, -1.1307373046875, -1.043426513671875, -0.95611572265625, -0.868804931640625, -0.781494140625, -0.694183349609375, -0.60687255859375, -0.519561767578125, -0.4322509765625, -0.344940185546875, -0.25762939453125, -0.170318603515625, -0.0830078125, 0.004302978515625, 0.09161376953125, 0.178924560546875, 0.2662353515625, 0.353546142578125, 0.44085693359375, 0.528167724609375, 0.615478515625, 0.702789306640625, 0.79010009765625, 0.877410888671875, 0.9647216796875, 1.052032470703125, 1.13934326171875, 1.226654052734375, 1.31396484375, 1.401275634765625, 1.48858642578125, 1.575897216796875, 1.6632080078125, 1.750518798828125, 1.83782958984375, 1.925140380859375, 2.012451171875, 2.099761962890625, 2.18707275390625, 2.274383544921875, 2.3616943359375, 2.449005126953125, 2.53631591796875, 2.623626708984375, 2.7109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 5.0, 5.0, 8.0, 8.0, 9.0, 14.0, 12.0, 15.0, 13.0, 26.0, 20.0, 24.0, 31.0, 25.0, 22.0, 32.0, 37.0, 35.0, 31.0, 48.0, 36.0, 48.0, 38.0, 53.0, 35.0, 51.0, 31.0, 40.0, 27.0, 45.0, 25.0, 22.0, 19.0, 15.0, 17.0, 17.0, 9.0, 10.0, 14.0, 11.0, 7.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60693359375, -0.5877609252929688, -0.5685882568359375, -0.5494155883789062, -0.530242919921875, -0.5110702514648438, -0.4918975830078125, -0.47272491455078125, -0.45355224609375, -0.43437957763671875, -0.4152069091796875, -0.39603424072265625, -0.376861572265625, -0.35768890380859375, -0.3385162353515625, -0.31934356689453125, -0.3001708984375, -0.28099822998046875, -0.2618255615234375, -0.24265289306640625, -0.223480224609375, -0.20430755615234375, -0.1851348876953125, -0.16596221923828125, -0.14678955078125, -0.12761688232421875, -0.1084442138671875, -0.08927154541015625, -0.070098876953125, -0.05092620849609375, -0.0317535400390625, -0.01258087158203125, 0.006591796875, 0.02576446533203125, 0.0449371337890625, 0.06410980224609375, 0.083282470703125, 0.10245513916015625, 0.1216278076171875, 0.14080047607421875, 0.15997314453125, 0.17914581298828125, 0.1983184814453125, 0.21749114990234375, 0.236663818359375, 0.25583648681640625, 0.2750091552734375, 0.29418182373046875, 0.3133544921875, 0.33252716064453125, 0.3516998291015625, 0.37087249755859375, 0.390045166015625, 0.40921783447265625, 0.4283905029296875, 0.44756317138671875, 0.46673583984375, 0.48590850830078125, 0.5050811767578125, 0.5242538452148438, 0.543426513671875, 0.5625991821289062, 0.5817718505859375, 0.6009445190429688, 0.6201171875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 2.0, 3.0, 3.0, 5.0, 3.0, 7.0, 16.0, 18.0, 23.0, 38.0, 50.0, 53.0, 109.0, 215.0, 418.0, 949.0, 2604.0, 12306.0, 383541.0, 627735.0, 15453.0, 2916.0, 996.0, 449.0, 237.0, 136.0, 84.0, 59.0, 28.0, 27.0, 16.0, 12.0, 12.0, 7.0, 3.0, 8.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.146484375, -2.0834503173828125, -2.020416259765625, -1.9573822021484375, -1.89434814453125, -1.8313140869140625, -1.768280029296875, -1.7052459716796875, -1.6422119140625, -1.5791778564453125, -1.516143798828125, -1.4531097412109375, -1.39007568359375, -1.3270416259765625, -1.264007568359375, -1.2009735107421875, -1.137939453125, -1.0749053955078125, -1.011871337890625, -0.9488372802734375, -0.88580322265625, -0.8227691650390625, -0.759735107421875, -0.6967010498046875, -0.6336669921875, -0.5706329345703125, -0.507598876953125, -0.4445648193359375, -0.38153076171875, -0.3184967041015625, -0.255462646484375, -0.1924285888671875, -0.12939453125, -0.0663604736328125, -0.003326416015625, 0.0597076416015625, 0.12274169921875, 0.1857757568359375, 0.248809814453125, 0.3118438720703125, 0.3748779296875, 0.4379119873046875, 0.500946044921875, 0.5639801025390625, 0.62701416015625, 0.6900482177734375, 0.753082275390625, 0.8161163330078125, 0.879150390625, 0.9421844482421875, 1.005218505859375, 1.0682525634765625, 1.13128662109375, 1.1943206787109375, 1.257354736328125, 1.3203887939453125, 1.3834228515625, 1.4464569091796875, 1.509490966796875, 1.5725250244140625, 1.63555908203125, 1.6985931396484375, 1.761627197265625, 1.8246612548828125, 1.8876953125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 14.0, 11.0, 16.0, 23.0, 36.0, 49.0, 81.0, 134.0, 159.0, 147.0, 112.0, 67.0, 46.0, 37.0, 16.0, 20.0, 7.0, 5.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.791685104370117e-05, -8.463207632303238e-05, -8.134730160236359e-05, -7.80625268816948e-05, -7.4777752161026e-05, -7.149297744035721e-05, -6.820820271968842e-05, -6.492342799901962e-05, -6.163865327835083e-05, -5.835387855768204e-05, -5.5069103837013245e-05, -5.178432911634445e-05, -4.849955439567566e-05, -4.5214779675006866e-05, -4.1930004954338074e-05, -3.864523023366928e-05, -3.536045551300049e-05, -3.2075680792331696e-05, -2.8790906071662903e-05, -2.550613135099411e-05, -2.2221356630325317e-05, -1.8936581909656525e-05, -1.5651807188987732e-05, -1.236703246831894e-05, -9.082257747650146e-06, -5.797483026981354e-06, -2.512708306312561e-06, 7.720664143562317e-07, 4.056841135025024e-06, 7.341615855693817e-06, 1.062639057636261e-05, 1.3911165297031403e-05, 1.7195940017700195e-05, 2.0480714738368988e-05, 2.376548945903778e-05, 2.7050264179706573e-05, 3.0335038900375366e-05, 3.361981362104416e-05, 3.690458834171295e-05, 4.0189363062381744e-05, 4.347413778305054e-05, 4.675891250371933e-05, 5.004368722438812e-05, 5.3328461945056915e-05, 5.661323666572571e-05, 5.98980113863945e-05, 6.31827861070633e-05, 6.646756082773209e-05, 6.975233554840088e-05, 7.303711026906967e-05, 7.632188498973846e-05, 7.960665971040726e-05, 8.289143443107605e-05, 8.617620915174484e-05, 8.946098387241364e-05, 9.274575859308243e-05, 9.603053331375122e-05, 9.931530803442001e-05, 0.0001026000827550888, 0.0001058848574757576, 0.00010916963219642639, 0.00011245440691709518, 0.00011573918163776398, 0.00011902395635843277, 0.00012230873107910156]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 10.0, 15.0, 26.0, 18.0, 50.0, 74.0, 108.0, 178.0, 281.0, 569.0, 1318.0, 3701.0, 13090.0, 87029.0, 793038.0, 125490.0, 16202.0, 4440.0, 1517.0, 640.0, 321.0, 153.0, 105.0, 58.0, 46.0, 17.0, 20.0, 11.0, 8.0, 3.0, 5.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.44140625, -1.40087890625, -1.3603515625, -1.31982421875, -1.279296875, -1.23876953125, -1.1982421875, -1.15771484375, -1.1171875, -1.07666015625, -1.0361328125, -0.99560546875, -0.955078125, -0.91455078125, -0.8740234375, -0.83349609375, -0.79296875, -0.75244140625, -0.7119140625, -0.67138671875, -0.630859375, -0.59033203125, -0.5498046875, -0.50927734375, -0.46875, -0.42822265625, -0.3876953125, -0.34716796875, -0.306640625, -0.26611328125, -0.2255859375, -0.18505859375, -0.14453125, -0.10400390625, -0.0634765625, -0.02294921875, 0.017578125, 0.05810546875, 0.0986328125, 0.13916015625, 0.1796875, 0.22021484375, 0.2607421875, 0.30126953125, 0.341796875, 0.38232421875, 0.4228515625, 0.46337890625, 0.50390625, 0.54443359375, 0.5849609375, 0.62548828125, 0.666015625, 0.70654296875, 0.7470703125, 0.78759765625, 0.828125, 0.86865234375, 0.9091796875, 0.94970703125, 0.990234375, 1.03076171875, 1.0712890625, 1.11181640625, 1.15234375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 3.0, 4.0, 9.0, 9.0, 6.0, 17.0, 18.0, 24.0, 50.0, 70.0, 118.0, 120.0, 135.0, 114.0, 90.0, 69.0, 47.0, 30.0, 17.0, 18.0, 6.0, 8.0, 10.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2626953125, -1.2306365966796875, -1.198577880859375, -1.1665191650390625, -1.13446044921875, -1.1024017333984375, -1.070343017578125, -1.0382843017578125, -1.0062255859375, -0.9741668701171875, -0.942108154296875, -0.9100494384765625, -0.87799072265625, -0.8459320068359375, -0.813873291015625, -0.7818145751953125, -0.749755859375, -0.7176971435546875, -0.685638427734375, -0.6535797119140625, -0.62152099609375, -0.5894622802734375, -0.557403564453125, -0.5253448486328125, -0.4932861328125, -0.4612274169921875, -0.429168701171875, -0.3971099853515625, -0.36505126953125, -0.3329925537109375, -0.300933837890625, -0.2688751220703125, -0.23681640625, -0.2047576904296875, -0.172698974609375, -0.1406402587890625, -0.10858154296875, -0.0765228271484375, -0.044464111328125, -0.0124053955078125, 0.0196533203125, 0.0517120361328125, 0.083770751953125, 0.1158294677734375, 0.14788818359375, 0.1799468994140625, 0.212005615234375, 0.2440643310546875, 0.276123046875, 0.3081817626953125, 0.340240478515625, 0.3722991943359375, 0.40435791015625, 0.4364166259765625, 0.468475341796875, 0.5005340576171875, 0.5325927734375, 0.5646514892578125, 0.596710205078125, 0.6287689208984375, 0.66082763671875, 0.6928863525390625, 0.724945068359375, 0.7570037841796875, 0.7890625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 7.0, 12.0, 59.0, 433.0, 399.0, 59.0, 15.0, 5.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.027870178222656, -20.369081497192383, -19.71029281616211, -19.051504135131836, -18.392715454101562, -17.73392677307129, -17.075138092041016, -16.416349411010742, -15.757560729980469, -15.098772048950195, -14.439983367919922, -13.781194686889648, -13.122406005859375, -12.463617324829102, -11.804828643798828, -11.146039962768555, -10.487252235412598, -9.828463554382324, -9.16967487335205, -8.510886192321777, -7.852097511291504, -7.1933088302612305, -6.534520626068115, -5.875731945037842, -5.216943264007568, -4.558154582977295, -3.8993659019470215, -3.240577459335327, -2.5817887783050537, -1.9230000972747803, -1.264211654663086, -0.6054229736328125, 0.05336570739746094, 0.7121543288230896, 1.3709429502487183, 2.029731512069702, 2.6885201930999756, 3.347308874130249, 4.006097316741943, 4.664885997772217, 5.32367467880249, 5.982463359832764, 6.641252040863037, 7.300040245056152, 7.958828926086426, 8.6176176071167, 9.276406288146973, 9.935194969177246, 10.59398365020752, 11.252772331237793, 11.911561012268066, 12.57034969329834, 13.229138374328613, 13.887927055358887, 14.546714782714844, 15.205503463745117, 15.86429214477539, 16.523080825805664, 17.181869506835938, 17.84065818786621, 18.499446868896484, 19.158235549926758, 19.81702423095703, 20.475812911987305, 21.134601593017578]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 5.0, 3.0, 5.0, 9.0, 4.0, 2.0, 5.0, 8.0, 8.0, 20.0, 19.0, 41.0, 61.0, 61.0, 92.0, 96.0, 109.0, 98.0, 68.0, 65.0, 59.0, 46.0, 32.0, 17.0, 14.0, 19.0, 8.0, 5.0, 12.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-9.805558204650879, -9.537004470825195, -9.268450736999512, -8.999897003173828, -8.731342315673828, -8.462788581848145, -8.194234848022461, -7.925681114196777, -7.657127380371094, -7.38857364654541, -7.120019912719727, -6.851465702056885, -6.582911968231201, -6.314358234405518, -6.045804023742676, -5.777250289916992, -5.508696556091309, -5.240142822265625, -4.971589088439941, -4.7030348777771, -4.434481143951416, -4.165927410125732, -3.8973734378814697, -3.628819465637207, -3.3602657318115234, -3.09171199798584, -2.823158025741577, -2.5546040534973145, -2.286050319671631, -2.0174965858459473, -1.7489426136016846, -1.4803887605667114, -1.2118349075317383, -0.9432810544967651, -0.674727201461792, -0.40617334842681885, -0.1376194953918457, 0.13093435764312744, 0.3994882106781006, 0.6680420637130737, 0.9365959167480469, 1.20514976978302, 1.4737036228179932, 1.7422574758529663, 2.0108113288879395, 2.279365062713623, 2.5479190349578857, 2.8164730072021484, 3.085026741027832, 3.3535804748535156, 3.6221344470977783, 3.890688419342041, 4.159242153167725, 4.427795886993408, 4.69635009765625, 4.964903831481934, 5.233457565307617, 5.502011299133301, 5.770565032958984, 6.039119243621826, 6.30767297744751, 6.576226711273193, 6.844780921936035, 7.113334655761719, 7.381888389587402]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 8.0, 4.0, 12.0, 14.0, 14.0, 17.0, 32.0, 32.0, 38.0, 64.0, 72.0, 120.0, 165.0, 247.0, 459.0, 792.0, 1626.0, 4307.0, 21349.0, 4037364.0, 112071.0, 9387.0, 3026.0, 1250.0, 688.0, 393.0, 231.0, 172.0, 99.0, 54.0, 60.0, 37.0, 20.0, 19.0, 11.0, 7.0, 8.0, 1.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.42578125, -5.26971435546875, -5.1136474609375, -4.95758056640625, -4.801513671875, -4.64544677734375, -4.4893798828125, -4.33331298828125, -4.17724609375, -4.02117919921875, -3.8651123046875, -3.70904541015625, -3.552978515625, -3.39691162109375, -3.2408447265625, -3.08477783203125, -2.9287109375, -2.77264404296875, -2.6165771484375, -2.46051025390625, -2.304443359375, -2.14837646484375, -1.9923095703125, -1.83624267578125, -1.68017578125, -1.52410888671875, -1.3680419921875, -1.21197509765625, -1.055908203125, -0.89984130859375, -0.7437744140625, -0.58770751953125, -0.431640625, -0.27557373046875, -0.1195068359375, 0.03656005859375, 0.192626953125, 0.34869384765625, 0.5047607421875, 0.66082763671875, 0.81689453125, 0.97296142578125, 1.1290283203125, 1.28509521484375, 1.441162109375, 1.59722900390625, 1.7532958984375, 1.90936279296875, 2.0654296875, 2.22149658203125, 2.3775634765625, 2.53363037109375, 2.689697265625, 2.84576416015625, 3.0018310546875, 3.15789794921875, 3.31396484375, 3.47003173828125, 3.6260986328125, 3.78216552734375, 3.938232421875, 4.09429931640625, 4.2503662109375, 4.40643310546875, 4.5625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 8.0, 6.0, 6.0, 14.0, 17.0, 26.0, 69.0, 125.0, 178.0, 187.0, 144.0, 79.0, 44.0, 19.0, 17.0, 19.0, 5.0, 5.0, 6.0, 6.0, 7.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2322998046875, -0.22590065002441406, -0.21950149536132812, -0.2131023406982422, -0.20670318603515625, -0.2003040313720703, -0.19390487670898438, -0.18750572204589844, -0.1811065673828125, -0.17470741271972656, -0.16830825805664062, -0.1619091033935547, -0.15550994873046875, -0.1491107940673828, -0.14271163940429688, -0.13631248474121094, -0.129913330078125, -0.12351417541503906, -0.11711502075195312, -0.11071586608886719, -0.10431671142578125, -0.09791755676269531, -0.09151840209960938, -0.08511924743652344, -0.0787200927734375, -0.07232093811035156, -0.06592178344726562, -0.05952262878417969, -0.05312347412109375, -0.04672431945800781, -0.040325164794921875, -0.03392601013183594, -0.02752685546875, -0.021127700805664062, -0.014728546142578125, -0.008329391479492188, -0.00193023681640625, 0.0044689178466796875, 0.010868072509765625, 0.017267227172851562, 0.0236663818359375, 0.030065536499023438, 0.036464691162109375, 0.04286384582519531, 0.04926300048828125, 0.05566215515136719, 0.062061309814453125, 0.06846046447753906, 0.074859619140625, 0.08125877380371094, 0.08765792846679688, 0.09405708312988281, 0.10045623779296875, 0.10685539245605469, 0.11325454711914062, 0.11965370178222656, 0.1260528564453125, 0.13245201110839844, 0.13885116577148438, 0.1452503204345703, 0.15164947509765625, 0.1580486297607422, 0.16444778442382812, 0.17084693908691406, 0.17724609375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 6.0, 5.0, 6.0, 10.0, 14.0, 18.0, 24.0, 32.0, 67.0, 116.0, 442.0, 2888.0, 136169.0, 4044204.0, 8973.0, 853.0, 177.0, 101.0, 51.0, 29.0, 19.0, 9.0, 16.0, 9.0, 10.0, 6.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.07421875, -5.8912353515625, -5.708251953125, -5.5252685546875, -5.34228515625, -5.1593017578125, -4.976318359375, -4.7933349609375, -4.6103515625, -4.4273681640625, -4.244384765625, -4.0614013671875, -3.87841796875, -3.6954345703125, -3.512451171875, -3.3294677734375, -3.146484375, -2.9635009765625, -2.780517578125, -2.5975341796875, -2.41455078125, -2.2315673828125, -2.048583984375, -1.8656005859375, -1.6826171875, -1.4996337890625, -1.316650390625, -1.1336669921875, -0.95068359375, -0.7677001953125, -0.584716796875, -0.4017333984375, -0.21875, -0.0357666015625, 0.147216796875, 0.3302001953125, 0.51318359375, 0.6961669921875, 0.879150390625, 1.0621337890625, 1.2451171875, 1.4281005859375, 1.611083984375, 1.7940673828125, 1.97705078125, 2.1600341796875, 2.343017578125, 2.5260009765625, 2.708984375, 2.8919677734375, 3.074951171875, 3.2579345703125, 3.44091796875, 3.6239013671875, 3.806884765625, 3.9898681640625, 4.1728515625, 4.3558349609375, 4.538818359375, 4.7218017578125, 4.90478515625, 5.0877685546875, 5.270751953125, 5.4537353515625, 5.63671875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 7.0, 4.0, 9.0, 13.0, 11.0, 16.0, 22.0, 39.0, 60.0, 90.0, 167.0, 368.0, 964.0, 1480.0, 360.0, 152.0, 92.0, 59.0, 35.0, 21.0, 14.0, 22.0, 11.0, 13.0, 6.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.2315673828125, -0.22388267517089844, -0.21619796752929688, -0.2085132598876953, -0.20082855224609375, -0.1931438446044922, -0.18545913696289062, -0.17777442932128906, -0.1700897216796875, -0.16240501403808594, -0.15472030639648438, -0.1470355987548828, -0.13935089111328125, -0.1316661834716797, -0.12398147583007812, -0.11629676818847656, -0.108612060546875, -0.10092735290527344, -0.09324264526367188, -0.08555793762207031, -0.07787322998046875, -0.07018852233886719, -0.06250381469726562, -0.05481910705566406, -0.0471343994140625, -0.03944969177246094, -0.031764984130859375, -0.024080276489257812, -0.01639556884765625, -0.008710861206054688, -0.001026153564453125, 0.0066585540771484375, 0.01434326171875, 0.022027969360351562, 0.029712677001953125, 0.03739738464355469, 0.04508209228515625, 0.05276679992675781, 0.060451507568359375, 0.06813621520996094, 0.0758209228515625, 0.08350563049316406, 0.09119033813476562, 0.09887504577636719, 0.10655975341796875, 0.11424446105957031, 0.12192916870117188, 0.12961387634277344, 0.137298583984375, 0.14498329162597656, 0.15266799926757812, 0.1603527069091797, 0.16803741455078125, 0.1757221221923828, 0.18340682983398438, 0.19109153747558594, 0.1987762451171875, 0.20646095275878906, 0.21414566040039062, 0.2218303680419922, 0.22951507568359375, 0.2371997833251953, 0.24488449096679688, 0.25256919860839844, 0.26025390625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 4.0, 2.0, 9.0, 11.0, 29.0, 175.0, 540.0, 195.0, 31.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.672968864440918, -3.5300850868225098, -3.3872010707855225, -3.2443172931671143, -3.101433277130127, -2.9585494995117188, -2.8156657218933105, -2.6727819442749023, -2.529897928237915, -2.387014150619507, -2.2441301345825195, -2.1012463569641113, -1.9583624601364136, -1.8154785633087158, -1.6725947856903076, -1.5297108888626099, -1.386826992034912, -1.2439430952072144, -1.1010591983795166, -0.9581754207611084, -0.8152915239334106, -0.6724076271057129, -0.5295237898826599, -0.38663995265960693, -0.24375605583190918, -0.10087218880653381, 0.04201167821884155, 0.18489554524421692, 0.3277794122695923, 0.47066330909729004, 0.613547146320343, 0.756430983543396, 0.899315357208252, 1.0421992540359497, 1.1850831508636475, 1.3279669284820557, 1.4708508253097534, 1.6137347221374512, 1.7566184997558594, 1.8995023965835571, 2.042386293411255, 2.185270071029663, 2.3281540870666504, 2.4710378646850586, 2.613921642303467, 2.756805658340454, 2.8996894359588623, 3.0425734519958496, 3.185457229614258, 3.328341007232666, 3.4712250232696533, 3.6141088008880615, 3.756992816925049, 3.899876594543457, 4.042760372161865, 4.185644149780273, 4.32852840423584, 4.471412181854248, 4.614295959472656, 4.757180213928223, 4.900063991546631, 5.042947769165039, 5.185831546783447, 5.3287153244018555, 5.471599102020264]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 9.0, 10.0, 9.0, 25.0, 28.0, 31.0, 49.0, 59.0, 60.0, 70.0, 83.0, 102.0, 96.0, 71.0, 59.0, 58.0, 52.0, 29.0, 29.0, 17.0, 15.0, 11.0, 7.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.363701343536377, -1.3197206258773804, -1.2757399082183838, -1.2317591905593872, -1.1877784729003906, -1.143797755241394, -1.0998170375823975, -1.0558363199234009, -1.0118556022644043, -0.9678748846054077, -0.9238941669464111, -0.8799134492874146, -0.835932731628418, -0.7919520139694214, -0.7479712963104248, -0.7039905786514282, -0.6600098609924316, -0.6160291433334351, -0.5720484256744385, -0.5280677080154419, -0.4840869903564453, -0.44010627269744873, -0.39612555503845215, -0.35214483737945557, -0.308164119720459, -0.2641834020614624, -0.22020268440246582, -0.17622196674346924, -0.13224124908447266, -0.08826053142547607, -0.04427981376647949, -0.00029909610748291016, 0.04368162155151367, 0.08766233921051025, 0.13164305686950684, 0.17562377452850342, 0.2196044921875, 0.2635852098464966, 0.30756592750549316, 0.35154664516448975, 0.39552736282348633, 0.4395080804824829, 0.4834887981414795, 0.5274695158004761, 0.5714502334594727, 0.6154309511184692, 0.6594116687774658, 0.7033923864364624, 0.747373104095459, 0.7913538217544556, 0.8353345394134521, 0.8793152570724487, 0.9232959747314453, 0.9672766923904419, 1.0112574100494385, 1.055238127708435, 1.0992188453674316, 1.1431995630264282, 1.1871802806854248, 1.2311609983444214, 1.275141716003418, 1.3191224336624146, 1.3631031513214111, 1.4070838689804077, 1.4510645866394043]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 3.0, 4.0, 6.0, 7.0, 15.0, 31.0, 27.0, 40.0, 60.0, 119.0, 228.0, 398.0, 957.0, 2472.0, 11183.0, 380327.0, 634140.0, 13606.0, 2883.0, 996.0, 459.0, 231.0, 125.0, 72.0, 52.0, 37.0, 13.0, 12.0, 16.0, 5.0, 6.0, 6.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.380859375, -3.275390625, -3.169921875, -3.064453125, -2.958984375, -2.853515625, -2.748046875, -2.642578125, -2.537109375, -2.431640625, -2.326171875, -2.220703125, -2.115234375, -2.009765625, -1.904296875, -1.798828125, -1.693359375, -1.587890625, -1.482421875, -1.376953125, -1.271484375, -1.166015625, -1.060546875, -0.955078125, -0.849609375, -0.744140625, -0.638671875, -0.533203125, -0.427734375, -0.322265625, -0.216796875, -0.111328125, -0.005859375, 0.099609375, 0.205078125, 0.310546875, 0.416015625, 0.521484375, 0.626953125, 0.732421875, 0.837890625, 0.943359375, 1.048828125, 1.154296875, 1.259765625, 1.365234375, 1.470703125, 1.576171875, 1.681640625, 1.787109375, 1.892578125, 1.998046875, 2.103515625, 2.208984375, 2.314453125, 2.419921875, 2.525390625, 2.630859375, 2.736328125, 2.841796875, 2.947265625, 3.052734375, 3.158203125, 3.263671875, 3.369140625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 10.0, 8.0, 10.0, 25.0, 66.0, 162.0, 227.0, 234.0, 130.0, 56.0, 34.0, 16.0, 4.0, 7.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2188720703125, -0.2107715606689453, -0.20267105102539062, -0.19457054138183594, -0.18647003173828125, -0.17836952209472656, -0.17026901245117188, -0.1621685028076172, -0.1540679931640625, -0.1459674835205078, -0.13786697387695312, -0.12976646423339844, -0.12166595458984375, -0.11356544494628906, -0.10546493530273438, -0.09736442565917969, -0.089263916015625, -0.08116340637207031, -0.07306289672851562, -0.06496238708496094, -0.05686187744140625, -0.04876136779785156, -0.040660858154296875, -0.03256034851074219, -0.0244598388671875, -0.016359329223632812, -0.008258819580078125, -0.0001583099365234375, 0.00794219970703125, 0.016042709350585938, 0.024143218994140625, 0.03224372863769531, 0.04034423828125, 0.04844474792480469, 0.056545257568359375, 0.06464576721191406, 0.07274627685546875, 0.08084678649902344, 0.08894729614257812, 0.09704780578613281, 0.1051483154296875, 0.11324882507324219, 0.12134933471679688, 0.12944984436035156, 0.13755035400390625, 0.14565086364746094, 0.15375137329101562, 0.1618518829345703, 0.169952392578125, 0.1780529022216797, 0.18615341186523438, 0.19425392150878906, 0.20235443115234375, 0.21045494079589844, 0.21855545043945312, 0.2266559600830078, 0.2347564697265625, 0.2428569793701172, 0.2509574890136719, 0.25905799865722656, 0.26715850830078125, 0.27525901794433594, 0.2833595275878906, 0.2914600372314453, 0.299560546875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 5.0, 6.0, 11.0, 13.0, 20.0, 14.0, 24.0, 23.0, 48.0, 55.0, 70.0, 97.0, 152.0, 209.0, 331.0, 617.0, 1320.0, 3335.0, 10852.0, 44925.0, 242481.0, 550616.0, 151407.0, 29387.0, 7594.0, 2496.0, 992.0, 494.0, 284.0, 187.0, 134.0, 84.0, 71.0, 47.0, 37.0, 36.0, 19.0, 24.0, 18.0, 10.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.345703125, -1.30279541015625, -1.2598876953125, -1.21697998046875, -1.174072265625, -1.13116455078125, -1.0882568359375, -1.04534912109375, -1.00244140625, -0.95953369140625, -0.9166259765625, -0.87371826171875, -0.830810546875, -0.78790283203125, -0.7449951171875, -0.70208740234375, -0.6591796875, -0.61627197265625, -0.5733642578125, -0.53045654296875, -0.487548828125, -0.44464111328125, -0.4017333984375, -0.35882568359375, -0.31591796875, -0.27301025390625, -0.2301025390625, -0.18719482421875, -0.144287109375, -0.10137939453125, -0.0584716796875, -0.01556396484375, 0.02734375, 0.07025146484375, 0.1131591796875, 0.15606689453125, 0.198974609375, 0.24188232421875, 0.2847900390625, 0.32769775390625, 0.37060546875, 0.41351318359375, 0.4564208984375, 0.49932861328125, 0.542236328125, 0.58514404296875, 0.6280517578125, 0.67095947265625, 0.7138671875, 0.75677490234375, 0.7996826171875, 0.84259033203125, 0.885498046875, 0.92840576171875, 0.9713134765625, 1.01422119140625, 1.05712890625, 1.10003662109375, 1.1429443359375, 1.18585205078125, 1.228759765625, 1.27166748046875, 1.3145751953125, 1.35748291015625, 1.400390625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 12.0, 4.0, 9.0, 14.0, 17.0, 19.0, 23.0, 16.0, 33.0, 38.0, 35.0, 46.0, 48.0, 51.0, 51.0, 46.0, 54.0, 55.0, 56.0, 51.0, 41.0, 47.0, 37.0, 45.0, 26.0, 21.0, 22.0, 18.0, 14.0, 11.0, 9.0, 7.0, 4.0, 4.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64599609375, -0.6233596801757812, -0.6007232666015625, -0.5780868530273438, -0.555450439453125, -0.5328140258789062, -0.5101776123046875, -0.48754119873046875, -0.46490478515625, -0.44226837158203125, -0.4196319580078125, -0.39699554443359375, -0.374359130859375, -0.35172271728515625, -0.3290863037109375, -0.30644989013671875, -0.2838134765625, -0.26117706298828125, -0.2385406494140625, -0.21590423583984375, -0.193267822265625, -0.17063140869140625, -0.1479949951171875, -0.12535858154296875, -0.10272216796875, -0.08008575439453125, -0.0574493408203125, -0.03481292724609375, -0.012176513671875, 0.01045989990234375, 0.0330963134765625, 0.05573272705078125, 0.078369140625, 0.10100555419921875, 0.1236419677734375, 0.14627838134765625, 0.168914794921875, 0.19155120849609375, 0.2141876220703125, 0.23682403564453125, 0.25946044921875, 0.28209686279296875, 0.3047332763671875, 0.32736968994140625, 0.350006103515625, 0.37264251708984375, 0.3952789306640625, 0.41791534423828125, 0.4405517578125, 0.46318817138671875, 0.4858245849609375, 0.5084609985351562, 0.531097412109375, 0.5537338256835938, 0.5763702392578125, 0.5990066528320312, 0.62164306640625, 0.6442794799804688, 0.6669158935546875, 0.6895523071289062, 0.712188720703125, 0.7348251342773438, 0.7574615478515625, 0.7800979614257812, 0.802734375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 6.0, 4.0, 5.0, 5.0, 12.0, 11.0, 30.0, 35.0, 57.0, 109.0, 208.0, 509.0, 1594.0, 6596.0, 56877.0, 893023.0, 78706.0, 7720.0, 1923.0, 612.0, 242.0, 105.0, 67.0, 30.0, 20.0, 19.0, 12.0, 6.0, 2.0, 3.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3203125, -2.26446533203125, -2.2086181640625, -2.15277099609375, -2.096923828125, -2.04107666015625, -1.9852294921875, -1.92938232421875, -1.87353515625, -1.81768798828125, -1.7618408203125, -1.70599365234375, -1.650146484375, -1.59429931640625, -1.5384521484375, -1.48260498046875, -1.4267578125, -1.37091064453125, -1.3150634765625, -1.25921630859375, -1.203369140625, -1.14752197265625, -1.0916748046875, -1.03582763671875, -0.97998046875, -0.92413330078125, -0.8682861328125, -0.81243896484375, -0.756591796875, -0.70074462890625, -0.6448974609375, -0.58905029296875, -0.533203125, -0.47735595703125, -0.4215087890625, -0.36566162109375, -0.309814453125, -0.25396728515625, -0.1981201171875, -0.14227294921875, -0.08642578125, -0.03057861328125, 0.0252685546875, 0.08111572265625, 0.136962890625, 0.19281005859375, 0.2486572265625, 0.30450439453125, 0.3603515625, 0.41619873046875, 0.4720458984375, 0.52789306640625, 0.583740234375, 0.63958740234375, 0.6954345703125, 0.75128173828125, 0.80712890625, 0.86297607421875, 0.9188232421875, 0.97467041015625, 1.030517578125, 1.08636474609375, 1.1422119140625, 1.19805908203125, 1.25390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 8.0, 7.0, 15.0, 20.0, 15.0, 41.0, 53.0, 92.0, 154.0, 157.0, 131.0, 99.0, 70.0, 46.0, 28.0, 15.0, 11.0, 12.0, 4.0, 3.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0001633167266845703, -0.00015886686742305756, -0.0001544170081615448, -0.00014996714890003204, -0.0001455172896385193, -0.00014106743037700653, -0.00013661757111549377, -0.00013216771185398102, -0.00012771785259246826, -0.0001232679933309555, -0.00011881813406944275, -0.00011436827480792999, -0.00010991841554641724, -0.00010546855628490448, -0.00010101869702339172, -9.656883776187897e-05, -9.211897850036621e-05, -8.766911923885345e-05, -8.32192599773407e-05, -7.876940071582794e-05, -7.431954145431519e-05, -6.986968219280243e-05, -6.541982293128967e-05, -6.0969963669776917e-05, -5.652010440826416e-05, -5.2070245146751404e-05, -4.762038588523865e-05, -4.317052662372589e-05, -3.8720667362213135e-05, -3.427080810070038e-05, -2.9820948839187622e-05, -2.5371089577674866e-05, -2.092123031616211e-05, -1.6471371054649353e-05, -1.2021511793136597e-05, -7.57165253162384e-06, -3.121793270111084e-06, 1.3280659914016724e-06, 5.777925252914429e-06, 1.0227784514427185e-05, 1.4677643775939941e-05, 1.9127503037452698e-05, 2.3577362298965454e-05, 2.802722156047821e-05, 3.247708082199097e-05, 3.692694008350372e-05, 4.137679934501648e-05, 4.5826658606529236e-05, 5.027651786804199e-05, 5.472637712955475e-05, 5.9176236391067505e-05, 6.362609565258026e-05, 6.807595491409302e-05, 7.252581417560577e-05, 7.697567343711853e-05, 8.142553269863129e-05, 8.587539196014404e-05, 9.03252512216568e-05, 9.477511048316956e-05, 9.922496974468231e-05, 0.00010367482900619507, 0.00010812468826770782, 0.00011257454752922058, 0.00011702440679073334, 0.0001214742660522461]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 9.0, 3.0, 11.0, 21.0, 19.0, 28.0, 55.0, 80.0, 142.0, 287.0, 550.0, 1240.0, 3328.0, 10246.0, 69096.0, 842185.0, 102637.0, 12274.0, 3658.0, 1414.0, 587.0, 282.0, 164.0, 76.0, 51.0, 36.0, 21.0, 15.0, 7.0, 12.0, 1.0, 5.0, 4.0, 1.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.826171875, -1.7762298583984375, -1.726287841796875, -1.6763458251953125, -1.62640380859375, -1.5764617919921875, -1.526519775390625, -1.4765777587890625, -1.4266357421875, -1.3766937255859375, -1.326751708984375, -1.2768096923828125, -1.22686767578125, -1.1769256591796875, -1.126983642578125, -1.0770416259765625, -1.027099609375, -0.9771575927734375, -0.927215576171875, -0.8772735595703125, -0.82733154296875, -0.7773895263671875, -0.727447509765625, -0.6775054931640625, -0.6275634765625, -0.5776214599609375, -0.527679443359375, -0.4777374267578125, -0.42779541015625, -0.3778533935546875, -0.327911376953125, -0.2779693603515625, -0.22802734375, -0.1780853271484375, -0.128143310546875, -0.0782012939453125, -0.02825927734375, 0.0216827392578125, 0.071624755859375, 0.1215667724609375, 0.1715087890625, 0.2214508056640625, 0.271392822265625, 0.3213348388671875, 0.37127685546875, 0.4212188720703125, 0.471160888671875, 0.5211029052734375, 0.571044921875, 0.6209869384765625, 0.670928955078125, 0.7208709716796875, 0.77081298828125, 0.8207550048828125, 0.870697021484375, 0.9206390380859375, 0.9705810546875, 1.0205230712890625, 1.070465087890625, 1.1204071044921875, 1.17034912109375, 1.2202911376953125, 1.270233154296875, 1.3201751708984375, 1.3701171875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 1.0, 6.0, 13.0, 11.0, 14.0, 16.0, 21.0, 30.0, 49.0, 48.0, 73.0, 85.0, 106.0, 89.0, 82.0, 78.0, 68.0, 58.0, 33.0, 28.0, 23.0, 11.0, 13.0, 8.0, 3.0, 3.0, 2.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.443359375, -0.428192138671875, -0.41302490234375, -0.397857666015625, -0.3826904296875, -0.367523193359375, -0.35235595703125, -0.337188720703125, -0.322021484375, -0.306854248046875, -0.29168701171875, -0.276519775390625, -0.2613525390625, -0.246185302734375, -0.23101806640625, -0.215850830078125, -0.20068359375, -0.185516357421875, -0.17034912109375, -0.155181884765625, -0.1400146484375, -0.124847412109375, -0.10968017578125, -0.094512939453125, -0.079345703125, -0.064178466796875, -0.04901123046875, -0.033843994140625, -0.0186767578125, -0.003509521484375, 0.01165771484375, 0.026824951171875, 0.0419921875, 0.057159423828125, 0.07232666015625, 0.087493896484375, 0.1026611328125, 0.117828369140625, 0.13299560546875, 0.148162841796875, 0.163330078125, 0.178497314453125, 0.19366455078125, 0.208831787109375, 0.2239990234375, 0.239166259765625, 0.25433349609375, 0.269500732421875, 0.28466796875, 0.299835205078125, 0.31500244140625, 0.330169677734375, 0.3453369140625, 0.360504150390625, 0.37567138671875, 0.390838623046875, 0.406005859375, 0.421173095703125, 0.43634033203125, 0.451507568359375, 0.4666748046875, 0.481842041015625, 0.49700927734375, 0.512176513671875, 0.52734375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 12.0, 41.0, 159.0, 469.0, 232.0, 67.0, 13.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.33147621154785, -15.641979217529297, -14.952482223510742, -14.262985229492188, -13.573487281799316, -12.883990287780762, -12.194493293762207, -11.504995346069336, -10.815498352050781, -10.126001358032227, -9.436504364013672, -8.747007369995117, -8.057509422302246, -7.368012428283691, -6.678515434265137, -5.989017963409424, -5.299521446228027, -4.610024452209473, -3.9205269813537598, -3.231029987335205, -2.5415327548980713, -1.8520355224609375, -1.1625385284423828, -0.4730410575866699, 0.21645593643188477, 0.9059531092643738, 1.5954502820968628, 2.284947395324707, 2.974444627761841, 3.6639418601989746, 4.353438854217529, 5.042936325073242, 5.732433319091797, 6.421930313110352, 7.1114277839660645, 7.800924777984619, 8.490422248840332, 9.179919242858887, 9.869416236877441, 10.558914184570312, 11.248411178588867, 11.937908172607422, 12.627405166625977, 13.316902160644531, 14.006400108337402, 14.695897102355957, 15.385394096374512, 16.074892044067383, 16.764389038085938, 17.453886032104492, 18.143383026123047, 18.8328800201416, 19.522377014160156, 20.211875915527344, 20.901371002197266, 21.590869903564453, 22.280364990234375, 22.96986198425293, 23.659358978271484, 24.34885597229004, 25.038352966308594, 25.72785186767578, 26.417346954345703, 27.10684585571289, 27.796342849731445]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 9.0, 9.0, 12.0, 18.0, 24.0, 36.0, 40.0, 46.0, 37.0, 60.0, 61.0, 78.0, 58.0, 59.0, 64.0, 66.0, 57.0, 46.0, 34.0, 40.0, 38.0, 26.0, 17.0, 9.0, 11.0, 11.0, 6.0, 11.0, 5.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.256053924560547, -5.034274101257324, -4.812494277954102, -4.590714454650879, -4.3689351081848145, -4.147155284881592, -3.925375461578369, -3.7035956382751465, -3.481815814971924, -3.260035991668701, -3.0382564067840576, -2.816476583480835, -2.5946967601776123, -2.3729171752929688, -2.151137351989746, -1.9293575286865234, -1.7075779438018799, -1.4857982397079468, -1.2640184164047241, -1.042238712310791, -0.8204589486122131, -0.5986791849136353, -0.37689948081970215, -0.1551196575164795, 0.06666004657745361, 0.2884398102760315, 0.5102195739746094, 0.7319992780685425, 0.9537790417671204, 1.1755588054656982, 1.3973385095596313, 1.619118332862854, 1.840898036956787, 2.0626778602600098, 2.2844574451446533, 2.506237268447876, 2.7280170917510986, 2.949796676635742, 3.171576499938965, 3.3933563232421875, 3.61513614654541, 3.836915969848633, 4.0586957931518555, 4.280475616455078, 4.502254962921143, 4.724034786224365, 4.945814609527588, 5.1675944328308105, 5.389373779296875, 5.611153602600098, 5.83293342590332, 6.054713249206543, 6.276492595672607, 6.49827241897583, 6.720052242279053, 6.941832065582275, 7.163611888885498, 7.385391712188721, 7.607171535491943, 7.828950881958008, 8.05073070526123, 8.272510528564453, 8.494290351867676, 8.716070175170898, 8.937849998474121]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 9.0, 20.0, 31.0, 93.0, 201.0, 563.0, 4911.0, 4160226.0, 26140.0, 1261.0, 393.0, 177.0, 100.0, 59.0, 30.0, 16.0, 11.0, 9.0, 4.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.890625, -11.4901123046875, -11.089599609375, -10.6890869140625, -10.28857421875, -9.8880615234375, -9.487548828125, -9.0870361328125, -8.6865234375, -8.2860107421875, -7.885498046875, -7.4849853515625, -7.08447265625, -6.6839599609375, -6.283447265625, -5.8829345703125, -5.482421875, -5.0819091796875, -4.681396484375, -4.2808837890625, -3.88037109375, -3.4798583984375, -3.079345703125, -2.6788330078125, -2.2783203125, -1.8778076171875, -1.477294921875, -1.0767822265625, -0.67626953125, -0.2757568359375, 0.124755859375, 0.5252685546875, 0.92578125, 1.3262939453125, 1.726806640625, 2.1273193359375, 2.52783203125, 2.9283447265625, 3.328857421875, 3.7293701171875, 4.1298828125, 4.5303955078125, 4.930908203125, 5.3314208984375, 5.73193359375, 6.1324462890625, 6.532958984375, 6.9334716796875, 7.333984375, 7.7344970703125, 8.135009765625, 8.5355224609375, 8.93603515625, 9.3365478515625, 9.737060546875, 10.1375732421875, 10.5380859375, 10.9385986328125, 11.339111328125, 11.7396240234375, 12.14013671875, 12.5406494140625, 12.941162109375, 13.3416748046875, 13.7421875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 12.0, 14.0, 39.0, 62.0, 114.0, 143.0, 155.0, 160.0, 102.0, 80.0, 37.0, 29.0, 14.0, 12.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26171875, -0.252593994140625, -0.24346923828125, -0.234344482421875, -0.2252197265625, -0.216094970703125, -0.20697021484375, -0.197845458984375, -0.188720703125, -0.179595947265625, -0.17047119140625, -0.161346435546875, -0.1522216796875, -0.143096923828125, -0.13397216796875, -0.124847412109375, -0.11572265625, -0.106597900390625, -0.09747314453125, -0.088348388671875, -0.0792236328125, -0.070098876953125, -0.06097412109375, -0.051849365234375, -0.042724609375, -0.033599853515625, -0.02447509765625, -0.015350341796875, -0.0062255859375, 0.002899169921875, 0.01202392578125, 0.021148681640625, 0.0302734375, 0.039398193359375, 0.04852294921875, 0.057647705078125, 0.0667724609375, 0.075897216796875, 0.08502197265625, 0.094146728515625, 0.103271484375, 0.112396240234375, 0.12152099609375, 0.130645751953125, 0.1397705078125, 0.148895263671875, 0.15802001953125, 0.167144775390625, 0.17626953125, 0.185394287109375, 0.19451904296875, 0.203643798828125, 0.2127685546875, 0.221893310546875, 0.23101806640625, 0.240142822265625, 0.249267578125, 0.258392333984375, 0.26751708984375, 0.276641845703125, 0.2857666015625, 0.294891357421875, 0.30401611328125, 0.313140869140625, 0.322265625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 10.0, 14.0, 15.0, 30.0, 37.0, 34.0, 44.0, 73.0, 87.0, 109.0, 119.0, 163.0, 1075.0, 463141.0, 3726703.0, 1601.0, 267.0, 142.0, 107.0, 85.0, 70.0, 76.0, 52.0, 57.0, 39.0, 35.0, 26.0, 21.0, 15.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.6953125, -12.3331298828125, -11.970947265625, -11.6087646484375, -11.24658203125, -10.8843994140625, -10.522216796875, -10.1600341796875, -9.7978515625, -9.4356689453125, -9.073486328125, -8.7113037109375, -8.34912109375, -7.9869384765625, -7.624755859375, -7.2625732421875, -6.900390625, -6.5382080078125, -6.176025390625, -5.8138427734375, -5.45166015625, -5.0894775390625, -4.727294921875, -4.3651123046875, -4.0029296875, -3.6407470703125, -3.278564453125, -2.9163818359375, -2.55419921875, -2.1920166015625, -1.829833984375, -1.4676513671875, -1.10546875, -0.7432861328125, -0.381103515625, -0.0189208984375, 0.34326171875, 0.7054443359375, 1.067626953125, 1.4298095703125, 1.7919921875, 2.1541748046875, 2.516357421875, 2.8785400390625, 3.24072265625, 3.6029052734375, 3.965087890625, 4.3272705078125, 4.689453125, 5.0516357421875, 5.413818359375, 5.7760009765625, 6.13818359375, 6.5003662109375, 6.862548828125, 7.2247314453125, 7.5869140625, 7.9490966796875, 8.311279296875, 8.6734619140625, 9.03564453125, 9.3978271484375, 9.760009765625, 10.1221923828125, 10.484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 8.0, 8.0, 10.0, 34.0, 78.0, 319.0, 2847.0, 609.0, 113.0, 35.0, 11.0, 10.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3486328125, -0.3125762939453125, -0.276519775390625, -0.2404632568359375, -0.20440673828125, -0.1683502197265625, -0.132293701171875, -0.0962371826171875, -0.0601806640625, -0.0241241455078125, 0.011932373046875, 0.0479888916015625, 0.08404541015625, 0.1201019287109375, 0.156158447265625, 0.1922149658203125, 0.228271484375, 0.2643280029296875, 0.300384521484375, 0.3364410400390625, 0.37249755859375, 0.4085540771484375, 0.444610595703125, 0.4806671142578125, 0.5167236328125, 0.5527801513671875, 0.588836669921875, 0.6248931884765625, 0.66094970703125, 0.6970062255859375, 0.733062744140625, 0.7691192626953125, 0.80517578125, 0.8412322998046875, 0.877288818359375, 0.9133453369140625, 0.94940185546875, 0.9854583740234375, 1.021514892578125, 1.0575714111328125, 1.0936279296875, 1.1296844482421875, 1.165740966796875, 1.2017974853515625, 1.23785400390625, 1.2739105224609375, 1.309967041015625, 1.3460235595703125, 1.382080078125, 1.4181365966796875, 1.454193115234375, 1.4902496337890625, 1.52630615234375, 1.5623626708984375, 1.598419189453125, 1.6344757080078125, 1.6705322265625, 1.7065887451171875, 1.742645263671875, 1.7787017822265625, 1.81475830078125, 1.8508148193359375, 1.886871337890625, 1.9229278564453125, 1.958984375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 13.0, 35.0, 88.0, 542.0, 248.0, 53.0, 15.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.062538146972656, -11.574601173400879, -11.086664199829102, -10.598726272583008, -10.11078929901123, -9.622852325439453, -9.134915351867676, -8.646978378295898, -8.159040451049805, -7.671103477478027, -7.183166027069092, -6.6952290534973145, -6.207291603088379, -5.719354629516602, -5.231417655944824, -4.743480682373047, -4.2555437088012695, -3.767606496810913, -3.2796692848205566, -2.7917323112487793, -2.303795099258423, -1.8158578872680664, -1.327920913696289, -0.8399837017059326, -0.35204648971557617, 0.1358906626701355, 0.6238278150558472, 1.111764907836914, 1.5997021198272705, 2.087639331817627, 2.5755763053894043, 3.0635135173797607, 3.551450729370117, 4.0393877029418945, 4.52732515335083, 5.015262126922607, 5.503199577331543, 5.99113655090332, 6.479073524475098, 6.967010498046875, 7.4549479484558105, 7.942884922027588, 8.430822372436523, 8.9187593460083, 9.406696319580078, 9.894634246826172, 10.382570266723633, 10.870508193969727, 11.358445167541504, 11.846382141113281, 12.334319114685059, 12.822256088256836, 13.31019401550293, 13.798130989074707, 14.286067962646484, 14.774004936218262, 15.261941909790039, 15.749878883361816, 16.237815856933594, 16.725753784179688, 17.21368980407715, 17.701627731323242, 18.189563751220703, 18.677501678466797, 19.16543960571289]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 14.0, 25.0, 53.0, 88.0, 75.0, 117.0, 128.0, 134.0, 126.0, 94.0, 59.0, 37.0, 22.0, 14.0, 8.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.903992652893066, -5.729015827178955, -5.554039001464844, -5.379061698913574, -5.204084873199463, -5.029108047485352, -4.85413122177124, -4.679154396057129, -4.504177570343018, -4.329200744628906, -4.154223918914795, -3.9792468547821045, -3.804270029067993, -3.6292929649353027, -3.4543161392211914, -3.27933931350708, -3.1043622493743896, -2.9293854236602783, -2.754408359527588, -2.5794315338134766, -2.4044547080993652, -2.229477882385254, -2.0545008182525635, -1.8795239925384521, -1.7045470476150513, -1.5295701026916504, -1.354593276977539, -1.1796163320541382, -1.0046393871307373, -0.829662561416626, -0.6546856164932251, -0.47970879077911377, -0.3047318458557129, -0.1297549456357956, 0.045221954584121704, 0.2201988697052002, 0.3951757550239563, 0.5701526403427124, 0.7451295852661133, 0.9201064109802246, 1.0950833559036255, 1.2700603008270264, 1.4450371265411377, 1.6200140714645386, 1.7949910163879395, 1.9699678421020508, 2.144944667816162, 2.3199214935302734, 2.494898557662964, 2.669875383377075, 2.8448524475097656, 3.019829273223877, 3.1948060989379883, 3.3697829246520996, 3.54475998878479, 3.7197368144989014, 3.894713878631592, 4.069690704345703, 4.2446675300598145, 4.419644355773926, 4.594621658325195, 4.769598484039307, 4.944575309753418, 5.119552135467529, 5.294528961181641]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 11.0, 3.0, 9.0, 5.0, 10.0, 15.0, 10.0, 33.0, 49.0, 71.0, 92.0, 199.0, 413.0, 938.0, 2667.0, 11728.0, 134652.0, 818723.0, 67396.0, 7918.0, 2032.0, 752.0, 337.0, 184.0, 103.0, 61.0, 34.0, 31.0, 19.0, 16.0, 12.0, 8.0, 8.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.62890625, -4.505096435546875, -4.38128662109375, -4.257476806640625, -4.1336669921875, -4.009857177734375, -3.88604736328125, -3.762237548828125, -3.638427734375, -3.514617919921875, -3.39080810546875, -3.266998291015625, -3.1431884765625, -3.019378662109375, -2.89556884765625, -2.771759033203125, -2.64794921875, -2.524139404296875, -2.40032958984375, -2.276519775390625, -2.1527099609375, -2.028900146484375, -1.90509033203125, -1.781280517578125, -1.657470703125, -1.533660888671875, -1.40985107421875, -1.286041259765625, -1.1622314453125, -1.038421630859375, -0.91461181640625, -0.790802001953125, -0.6669921875, -0.543182373046875, -0.41937255859375, -0.295562744140625, -0.1717529296875, -0.047943115234375, 0.07586669921875, 0.199676513671875, 0.323486328125, 0.447296142578125, 0.57110595703125, 0.694915771484375, 0.8187255859375, 0.942535400390625, 1.06634521484375, 1.190155029296875, 1.31396484375, 1.437774658203125, 1.56158447265625, 1.685394287109375, 1.8092041015625, 1.933013916015625, 2.05682373046875, 2.180633544921875, 2.304443359375, 2.428253173828125, 2.55206298828125, 2.675872802734375, 2.7996826171875, 2.923492431640625, 3.04730224609375, 3.171112060546875, 3.294921875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 8.0, 13.0, 21.0, 42.0, 64.0, 107.0, 119.0, 161.0, 120.0, 108.0, 87.0, 66.0, 35.0, 17.0, 13.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.290771484375, -0.27957916259765625, -0.2683868408203125, -0.25719451904296875, -0.246002197265625, -0.23480987548828125, -0.2236175537109375, -0.21242523193359375, -0.20123291015625, -0.19004058837890625, -0.1788482666015625, -0.16765594482421875, -0.156463623046875, -0.14527130126953125, -0.1340789794921875, -0.12288665771484375, -0.1116943359375, -0.10050201416015625, -0.0893096923828125, -0.07811737060546875, -0.066925048828125, -0.05573272705078125, -0.0445404052734375, -0.03334808349609375, -0.02215576171875, -0.01096343994140625, 0.0002288818359375, 0.01142120361328125, 0.022613525390625, 0.03380584716796875, 0.0449981689453125, 0.05619049072265625, 0.0673828125, 0.07857513427734375, 0.0897674560546875, 0.10095977783203125, 0.112152099609375, 0.12334442138671875, 0.1345367431640625, 0.14572906494140625, 0.15692138671875, 0.16811370849609375, 0.1793060302734375, 0.19049835205078125, 0.201690673828125, 0.21288299560546875, 0.2240753173828125, 0.23526763916015625, 0.2464599609375, 0.25765228271484375, 0.2688446044921875, 0.28003692626953125, 0.291229248046875, 0.30242156982421875, 0.3136138916015625, 0.32480621337890625, 0.33599853515625, 0.34719085693359375, 0.3583831787109375, 0.36957550048828125, 0.380767822265625, 0.39196014404296875, 0.4031524658203125, 0.41434478759765625, 0.425537109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 5.0, 6.0, 4.0, 18.0, 22.0, 23.0, 39.0, 48.0, 81.0, 88.0, 158.0, 217.0, 360.0, 650.0, 1258.0, 3017.0, 8533.0, 31487.0, 142713.0, 500468.0, 277310.0, 59049.0, 14721.0, 4582.0, 1654.0, 763.0, 478.0, 250.0, 161.0, 126.0, 75.0, 61.0, 41.0, 32.0, 13.0, 13.0, 7.0, 11.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.7490234375, -1.698638916015625, -1.64825439453125, -1.597869873046875, -1.5474853515625, -1.497100830078125, -1.44671630859375, -1.396331787109375, -1.345947265625, -1.295562744140625, -1.24517822265625, -1.194793701171875, -1.1444091796875, -1.094024658203125, -1.04364013671875, -0.993255615234375, -0.94287109375, -0.892486572265625, -0.84210205078125, -0.791717529296875, -0.7413330078125, -0.690948486328125, -0.64056396484375, -0.590179443359375, -0.539794921875, -0.489410400390625, -0.43902587890625, -0.388641357421875, -0.3382568359375, -0.287872314453125, -0.23748779296875, -0.187103271484375, -0.13671875, -0.086334228515625, -0.03594970703125, 0.014434814453125, 0.0648193359375, 0.115203857421875, 0.16558837890625, 0.215972900390625, 0.266357421875, 0.316741943359375, 0.36712646484375, 0.417510986328125, 0.4678955078125, 0.518280029296875, 0.56866455078125, 0.619049072265625, 0.66943359375, 0.719818115234375, 0.77020263671875, 0.820587158203125, 0.8709716796875, 0.921356201171875, 0.97174072265625, 1.022125244140625, 1.072509765625, 1.122894287109375, 1.17327880859375, 1.223663330078125, 1.2740478515625, 1.324432373046875, 1.37481689453125, 1.425201416015625, 1.4755859375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 5.0, 8.0, 9.0, 11.0, 11.0, 20.0, 20.0, 31.0, 34.0, 36.0, 48.0, 50.0, 56.0, 63.0, 76.0, 63.0, 67.0, 48.0, 66.0, 47.0, 40.0, 42.0, 25.0, 37.0, 20.0, 21.0, 17.0, 7.0, 13.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9716796875, -0.9374847412109375, -0.903289794921875, -0.8690948486328125, -0.83489990234375, -0.8007049560546875, -0.766510009765625, -0.7323150634765625, -0.6981201171875, -0.6639251708984375, -0.629730224609375, -0.5955352783203125, -0.56134033203125, -0.5271453857421875, -0.492950439453125, -0.4587554931640625, -0.424560546875, -0.3903656005859375, -0.356170654296875, -0.3219757080078125, -0.28778076171875, -0.2535858154296875, -0.219390869140625, -0.1851959228515625, -0.1510009765625, -0.1168060302734375, -0.082611083984375, -0.0484161376953125, -0.01422119140625, 0.0199737548828125, 0.054168701171875, 0.0883636474609375, 0.12255859375, 0.1567535400390625, 0.190948486328125, 0.2251434326171875, 0.25933837890625, 0.2935333251953125, 0.327728271484375, 0.3619232177734375, 0.3961181640625, 0.4303131103515625, 0.464508056640625, 0.4987030029296875, 0.53289794921875, 0.5670928955078125, 0.601287841796875, 0.6354827880859375, 0.669677734375, 0.7038726806640625, 0.738067626953125, 0.7722625732421875, 0.80645751953125, 0.8406524658203125, 0.874847412109375, 0.9090423583984375, 0.9432373046875, 0.9774322509765625, 1.011627197265625, 1.0458221435546875, 1.08001708984375, 1.1142120361328125, 1.148406982421875, 1.1826019287109375, 1.216796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 5.0, 4.0, 8.0, 10.0, 17.0, 29.0, 18.0, 49.0, 53.0, 89.0, 117.0, 228.0, 457.0, 945.0, 2823.0, 12164.0, 172265.0, 815859.0, 34933.0, 5300.0, 1639.0, 720.0, 299.0, 178.0, 103.0, 71.0, 48.0, 26.0, 24.0, 15.0, 13.0, 9.0, 7.0, 3.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-1.87890625, -1.814666748046875, -1.75042724609375, -1.686187744140625, -1.6219482421875, -1.557708740234375, -1.49346923828125, -1.429229736328125, -1.364990234375, -1.300750732421875, -1.23651123046875, -1.172271728515625, -1.1080322265625, -1.043792724609375, -0.97955322265625, -0.915313720703125, -0.85107421875, -0.786834716796875, -0.72259521484375, -0.658355712890625, -0.5941162109375, -0.529876708984375, -0.46563720703125, -0.401397705078125, -0.337158203125, -0.272918701171875, -0.20867919921875, -0.144439697265625, -0.0802001953125, -0.015960693359375, 0.04827880859375, 0.112518310546875, 0.1767578125, 0.240997314453125, 0.30523681640625, 0.369476318359375, 0.4337158203125, 0.497955322265625, 0.56219482421875, 0.626434326171875, 0.690673828125, 0.754913330078125, 0.81915283203125, 0.883392333984375, 0.9476318359375, 1.011871337890625, 1.07611083984375, 1.140350341796875, 1.20458984375, 1.268829345703125, 1.33306884765625, 1.397308349609375, 1.4615478515625, 1.525787353515625, 1.59002685546875, 1.654266357421875, 1.718505859375, 1.782745361328125, 1.84698486328125, 1.911224365234375, 1.9754638671875, 2.039703369140625, 2.10394287109375, 2.168182373046875, 2.232421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 6.0, 10.0, 18.0, 22.0, 37.0, 47.0, 82.0, 143.0, 198.0, 171.0, 91.0, 60.0, 37.0, 22.0, 17.0, 9.0, 8.0, 5.0, 3.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00024247169494628906, -0.0002358369529247284, -0.00022920221090316772, -0.00022256746888160706, -0.0002159327268600464, -0.00020929798483848572, -0.00020266324281692505, -0.00019602850079536438, -0.0001893937587738037, -0.00018275901675224304, -0.00017612427473068237, -0.0001694895327091217, -0.00016285479068756104, -0.00015622004866600037, -0.0001495853066444397, -0.00014295056462287903, -0.00013631582260131836, -0.0001296810805797577, -0.00012304633855819702, -0.00011641159653663635, -0.00010977685451507568, -0.00010314211249351501, -9.650737047195435e-05, -8.987262845039368e-05, -8.323788642883301e-05, -7.660314440727234e-05, -6.996840238571167e-05, -6.3333660364151e-05, -5.669891834259033e-05, -5.006417632102966e-05, -4.3429434299468994e-05, -3.6794692277908325e-05, -3.0159950256347656e-05, -2.3525208234786987e-05, -1.689046621322632e-05, -1.025572419166565e-05, -3.6209821701049805e-06, 3.0137598514556885e-06, 9.648501873016357e-06, 1.6283243894577026e-05, 2.2917985916137695e-05, 2.9552727937698364e-05, 3.618746995925903e-05, 4.28222119808197e-05, 4.945695400238037e-05, 5.609169602394104e-05, 6.272643804550171e-05, 6.936118006706238e-05, 7.599592208862305e-05, 8.263066411018372e-05, 8.926540613174438e-05, 9.590014815330505e-05, 0.00010253489017486572, 0.00010916963219642639, 0.00011580437421798706, 0.00012243911623954773, 0.0001290738582611084, 0.00013570860028266907, 0.00014234334230422974, 0.0001489780843257904, 0.00015561282634735107, 0.00016224756836891174, 0.0001688823103904724, 0.00017551705241203308, 0.00018215179443359375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 7.0, 9.0, 13.0, 19.0, 30.0, 65.0, 96.0, 162.0, 320.0, 745.0, 2156.0, 7774.0, 50880.0, 844427.0, 124782.0, 12118.0, 3052.0, 1042.0, 384.0, 209.0, 100.0, 61.0, 34.0, 14.0, 19.0, 10.0, 8.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.341796875, -2.2812042236328125, -2.220611572265625, -2.1600189208984375, -2.09942626953125, -2.0388336181640625, -1.978240966796875, -1.9176483154296875, -1.8570556640625, -1.7964630126953125, -1.735870361328125, -1.6752777099609375, -1.61468505859375, -1.5540924072265625, -1.493499755859375, -1.4329071044921875, -1.372314453125, -1.3117218017578125, -1.251129150390625, -1.1905364990234375, -1.12994384765625, -1.0693511962890625, -1.008758544921875, -0.9481658935546875, -0.8875732421875, -0.8269805908203125, -0.766387939453125, -0.7057952880859375, -0.64520263671875, -0.5846099853515625, -0.524017333984375, -0.4634246826171875, -0.40283203125, -0.3422393798828125, -0.281646728515625, -0.2210540771484375, -0.16046142578125, -0.0998687744140625, -0.039276123046875, 0.0213165283203125, 0.0819091796875, 0.1425018310546875, 0.203094482421875, 0.2636871337890625, 0.32427978515625, 0.3848724365234375, 0.445465087890625, 0.5060577392578125, 0.566650390625, 0.6272430419921875, 0.687835693359375, 0.7484283447265625, 0.80902099609375, 0.8696136474609375, 0.930206298828125, 0.9907989501953125, 1.0513916015625, 1.1119842529296875, 1.172576904296875, 1.2331695556640625, 1.29376220703125, 1.3543548583984375, 1.414947509765625, 1.4755401611328125, 1.5361328125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 9.0, 4.0, 9.0, 15.0, 20.0, 36.0, 46.0, 47.0, 76.0, 129.0, 105.0, 121.0, 95.0, 82.0, 51.0, 40.0, 27.0, 27.0, 9.0, 10.0, 8.0, 5.0, 4.0, 5.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.73974609375, -0.718505859375, -0.697265625, -0.676025390625, -0.65478515625, -0.633544921875, -0.6123046875, -0.591064453125, -0.56982421875, -0.548583984375, -0.52734375, -0.506103515625, -0.48486328125, -0.463623046875, -0.4423828125, -0.421142578125, -0.39990234375, -0.378662109375, -0.357421875, -0.336181640625, -0.31494140625, -0.293701171875, -0.2724609375, -0.251220703125, -0.22998046875, -0.208740234375, -0.1875, -0.166259765625, -0.14501953125, -0.123779296875, -0.1025390625, -0.081298828125, -0.06005859375, -0.038818359375, -0.017578125, 0.003662109375, 0.02490234375, 0.046142578125, 0.0673828125, 0.088623046875, 0.10986328125, 0.131103515625, 0.15234375, 0.173583984375, 0.19482421875, 0.216064453125, 0.2373046875, 0.258544921875, 0.27978515625, 0.301025390625, 0.322265625, 0.343505859375, 0.36474609375, 0.385986328125, 0.4072265625, 0.428466796875, 0.44970703125, 0.470947265625, 0.4921875, 0.513427734375, 0.53466796875, 0.555908203125, 0.5771484375, 0.598388671875, 0.61962890625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 9.0, 17.0, 33.0, 63.0, 144.0, 199.0, 242.0, 146.0, 73.0, 38.0, 21.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.205010414123535, -9.782374382019043, -9.359739303588867, -8.937103271484375, -8.5144681930542, -8.091832160949707, -7.669196605682373, -7.246561050415039, -6.823925495147705, -6.401289939880371, -5.978654384613037, -5.556018829345703, -5.133382797241211, -4.710747718811035, -4.288111686706543, -3.865476131439209, -3.442840576171875, -3.020205020904541, -2.597569465637207, -2.174933671951294, -1.75229811668396, -1.329662561416626, -0.9070267677307129, -0.4843912124633789, -0.06175565719604492, 0.36087995767593384, 0.7835155725479126, 1.2061512470245361, 1.6287868022918701, 2.051422357559204, 2.474058151245117, 2.896693706512451, 3.3193283081054688, 3.7419638633728027, 4.164599418640137, 4.587235450744629, 5.009870529174805, 5.432506561279297, 5.855142116546631, 6.277777671813965, 6.700413227081299, 7.123048782348633, 7.545684337615967, 7.968319892883301, 8.390955924987793, 8.813591003417969, 9.236227035522461, 9.658863067626953, 10.081498146057129, 10.504134178161621, 10.926769256591797, 11.349405288696289, 11.772040367126465, 12.194676399230957, 12.617311477661133, 13.039947509765625, 13.462583541870117, 13.88521957397461, 14.307854652404785, 14.730490684509277, 15.153125762939453, 15.575761795043945, 15.998397827148438, 16.421031951904297, 16.84366798400879]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 10.0, 7.0, 11.0, 11.0, 19.0, 18.0, 31.0, 29.0, 39.0, 42.0, 41.0, 51.0, 44.0, 51.0, 61.0, 58.0, 51.0, 47.0, 59.0, 47.0, 44.0, 32.0, 39.0, 33.0, 23.0, 24.0, 21.0, 9.0, 12.0, 7.0, 7.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.999790191650391, -5.7956647872924805, -5.591538906097412, -5.387413501739502, -5.183288097381592, -4.979162216186523, -4.775036811828613, -4.570911407470703, -4.366786003112793, -4.162660598754883, -3.9585349559783936, -3.7544093132019043, -3.550283908843994, -3.346158266067505, -3.1420326232910156, -2.9379072189331055, -2.733781337738037, -2.529655694961548, -2.3255302906036377, -2.1214046478271484, -1.9172791242599487, -1.713153600692749, -1.5090279579162598, -1.30490243434906, -1.1007769107818604, -0.8966513872146606, -0.6925258040428162, -0.4884002208709717, -0.284274697303772, -0.08014917373657227, 0.12397646903991699, 0.3281019926071167, 0.5322275161743164, 0.7363530397415161, 0.9404786229133606, 1.144604206085205, 1.3487297296524048, 1.5528552532196045, 1.7569808959960938, 1.9611064195632935, 2.165231943130493, 2.3693575859069824, 2.5734829902648926, 2.777608633041382, 2.981734275817871, 3.1858596801757812, 3.3899853229522705, 3.5941109657287598, 3.79823637008667, 4.00236177444458, 4.206487655639648, 4.410613059997559, 4.614738464355469, 4.818863868713379, 5.022989749908447, 5.227115154266357, 5.431241035461426, 5.635366439819336, 5.839492321014404, 6.0436177253723145, 6.247743129730225, 6.451869010925293, 6.655994415283203, 6.860119819641113, 7.064245223999023]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 9.0, 8.0, 12.0, 37.0, 47.0, 82.0, 168.0, 346.0, 969.0, 2938.0, 12042.0, 124431.0, 4002103.0, 40983.0, 6583.0, 1827.0, 662.0, 363.0, 183.0, 113.0, 97.0, 69.0, 42.0, 33.0, 35.0, 12.0, 11.0, 17.0, 10.0, 7.0, 9.0, 3.0, 4.0, 2.0, 5.0, 4.0, 8.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-4.5234375, -4.35784912109375, -4.1922607421875, -4.02667236328125, -3.861083984375, -3.69549560546875, -3.5299072265625, -3.36431884765625, -3.19873046875, -3.03314208984375, -2.8675537109375, -2.70196533203125, -2.536376953125, -2.37078857421875, -2.2052001953125, -2.03961181640625, -1.8740234375, -1.70843505859375, -1.5428466796875, -1.37725830078125, -1.211669921875, -1.04608154296875, -0.8804931640625, -0.71490478515625, -0.54931640625, -0.38372802734375, -0.2181396484375, -0.05255126953125, 0.113037109375, 0.27862548828125, 0.4442138671875, 0.60980224609375, 0.775390625, 0.94097900390625, 1.1065673828125, 1.27215576171875, 1.437744140625, 1.60333251953125, 1.7689208984375, 1.93450927734375, 2.10009765625, 2.26568603515625, 2.4312744140625, 2.59686279296875, 2.762451171875, 2.92803955078125, 3.0936279296875, 3.25921630859375, 3.4248046875, 3.59039306640625, 3.7559814453125, 3.92156982421875, 4.087158203125, 4.25274658203125, 4.4183349609375, 4.58392333984375, 4.74951171875, 4.91510009765625, 5.0806884765625, 5.24627685546875, 5.411865234375, 5.57745361328125, 5.7430419921875, 5.90863037109375, 6.07421875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 12.0, 7.0, 5.0, 26.0, 44.0, 62.0, 85.0, 113.0, 136.0, 132.0, 98.0, 91.0, 58.0, 54.0, 31.0, 20.0, 11.0, 7.0, 5.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.328857421875, -0.31723785400390625, -0.3056182861328125, -0.29399871826171875, -0.282379150390625, -0.27075958251953125, -0.2591400146484375, -0.24752044677734375, -0.23590087890625, -0.22428131103515625, -0.2126617431640625, -0.20104217529296875, -0.189422607421875, -0.17780303955078125, -0.1661834716796875, -0.15456390380859375, -0.1429443359375, -0.13132476806640625, -0.1197052001953125, -0.10808563232421875, -0.096466064453125, -0.08484649658203125, -0.0732269287109375, -0.06160736083984375, -0.04998779296875, -0.03836822509765625, -0.0267486572265625, -0.01512908935546875, -0.003509521484375, 0.00811004638671875, 0.0197296142578125, 0.03134918212890625, 0.04296875, 0.05458831787109375, 0.0662078857421875, 0.07782745361328125, 0.089447021484375, 0.10106658935546875, 0.1126861572265625, 0.12430572509765625, 0.13592529296875, 0.14754486083984375, 0.1591644287109375, 0.17078399658203125, 0.182403564453125, 0.19402313232421875, 0.2056427001953125, 0.21726226806640625, 0.2288818359375, 0.24050140380859375, 0.2521209716796875, 0.26374053955078125, 0.275360107421875, 0.28697967529296875, 0.2985992431640625, 0.31021881103515625, 0.32183837890625, 0.33345794677734375, 0.3450775146484375, 0.35669708251953125, 0.368316650390625, 0.37993621826171875, 0.3915557861328125, 0.40317535400390625, 0.414794921875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 9.0, 13.0, 22.0, 33.0, 63.0, 108.0, 227.0, 423.0, 1206.0, 4852.0, 48228.0, 4069008.0, 62549.0, 5106.0, 1167.0, 478.0, 290.0, 170.0, 115.0, 61.0, 49.0, 36.0, 19.0, 19.0, 10.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.1328125, -5.9443359375, -5.755859375, -5.5673828125, -5.37890625, -5.1904296875, -5.001953125, -4.8134765625, -4.625, -4.4365234375, -4.248046875, -4.0595703125, -3.87109375, -3.6826171875, -3.494140625, -3.3056640625, -3.1171875, -2.9287109375, -2.740234375, -2.5517578125, -2.36328125, -2.1748046875, -1.986328125, -1.7978515625, -1.609375, -1.4208984375, -1.232421875, -1.0439453125, -0.85546875, -0.6669921875, -0.478515625, -0.2900390625, -0.1015625, 0.0869140625, 0.275390625, 0.4638671875, 0.65234375, 0.8408203125, 1.029296875, 1.2177734375, 1.40625, 1.5947265625, 1.783203125, 1.9716796875, 2.16015625, 2.3486328125, 2.537109375, 2.7255859375, 2.9140625, 3.1025390625, 3.291015625, 3.4794921875, 3.66796875, 3.8564453125, 4.044921875, 4.2333984375, 4.421875, 4.6103515625, 4.798828125, 4.9873046875, 5.17578125, 5.3642578125, 5.552734375, 5.7412109375, 5.9296875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 8.0, 6.0, 17.0, 18.0, 25.0, 33.0, 60.0, 121.0, 311.0, 1954.0, 1023.0, 232.0, 93.0, 48.0, 35.0, 31.0, 17.0, 9.0, 14.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.421142578125, -0.3999290466308594, -0.37871551513671875, -0.3575019836425781, -0.3362884521484375, -0.3150749206542969, -0.29386138916015625, -0.2726478576660156, -0.251434326171875, -0.23022079467773438, -0.20900726318359375, -0.18779373168945312, -0.1665802001953125, -0.14536666870117188, -0.12415313720703125, -0.10293960571289062, -0.08172607421875, -0.060512542724609375, -0.03929901123046875, -0.018085479736328125, 0.0031280517578125, 0.024341583251953125, 0.04555511474609375, 0.06676864624023438, 0.087982177734375, 0.10919570922851562, 0.13040924072265625, 0.15162277221679688, 0.1728363037109375, 0.19404983520507812, 0.21526336669921875, 0.23647689819335938, 0.2576904296875, 0.2789039611816406, 0.30011749267578125, 0.3213310241699219, 0.3425445556640625, 0.3637580871582031, 0.38497161865234375, 0.4061851501464844, 0.427398681640625, 0.4486122131347656, 0.46982574462890625, 0.4910392761230469, 0.5122528076171875, 0.5334663391113281, 0.5546798706054688, 0.5758934020996094, 0.59710693359375, 0.6183204650878906, 0.6395339965820312, 0.6607475280761719, 0.6819610595703125, 0.7031745910644531, 0.7243881225585938, 0.7456016540527344, 0.766815185546875, 0.7880287170410156, 0.8092422485351562, 0.8304557800292969, 0.8516693115234375, 0.8728828430175781, 0.8940963745117188, 0.9153099060058594, 0.9365234375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 17.0, 35.0, 88.0, 233.0, 335.0, 180.0, 59.0, 13.0, 9.0, 9.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5915632247924805, -4.385827541351318, -4.180091381072998, -3.974355697631836, -3.7686197757720947, -3.5628838539123535, -3.3571481704711914, -3.15141224861145, -2.945676326751709, -2.7399404048919678, -2.5342044830322266, -2.3284687995910645, -2.1227328777313232, -1.916996955871582, -1.7112611532211304, -1.5055253505706787, -1.2997894287109375, -1.0940535068511963, -0.8883177042007446, -0.6825818419456482, -0.47684597969055176, -0.27111005783081055, -0.06537425518035889, 0.14036154747009277, 0.346097469329834, 0.5518333315849304, 0.7575691938400269, 0.9633050560951233, 1.1690409183502197, 1.374776840209961, 1.5805126428604126, 1.7862484455108643, 1.9919843673706055, 2.1977202892303467, 2.403456211090088, 2.60919189453125, 2.814927816390991, 3.0206637382507324, 3.2263994216918945, 3.4321353435516357, 3.637871265411377, 3.843607187271118, 4.049343109130859, 4.2550787925720215, 4.460814476013184, 4.666550636291504, 4.872286319732666, 5.078022003173828, 5.283758163452148, 5.4894938468933105, 5.695230007171631, 5.900965690612793, 6.106701850891113, 6.312437534332275, 6.5181732177734375, 6.723909378051758, 6.92964506149292, 7.135380744934082, 7.341116905212402, 7.5468525886535645, 7.752588272094727, 7.958324432373047, 8.164060592651367, 8.369795799255371, 8.575531959533691]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 8.0, 17.0, 20.0, 33.0, 41.0, 54.0, 59.0, 69.0, 93.0, 102.0, 106.0, 85.0, 56.0, 59.0, 45.0, 41.0, 29.0, 20.0, 15.0, 13.0, 9.0, 8.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8537631034851074, -2.7675726413726807, -2.681381940841675, -2.595191478729248, -2.5090010166168213, -2.4228103160858154, -2.3366198539733887, -2.250429153442383, -2.164238691329956, -2.0780482292175293, -1.991857647895813, -1.9056670665740967, -1.8194764852523804, -1.733285903930664, -1.6470954418182373, -1.560904860496521, -1.4747143983840942, -1.388523817062378, -1.3023333549499512, -1.2161427736282349, -1.1299521923065186, -1.0437617301940918, -0.9575711488723755, -0.8713805675506592, -0.7851900458335876, -0.6989995241165161, -0.6128089427947998, -0.5266184210777283, -0.44042786955833435, -0.35423731803894043, -0.2680467963218689, -0.1818562150001526, -0.09566569328308105, -0.00947514921426773, 0.0767153948545456, 0.16290593147277832, 0.24909648299217224, 0.33528703451156616, 0.4214775562286377, 0.507668137550354, 0.5938586592674255, 0.6800491809844971, 0.7662397623062134, 0.8524302840232849, 0.9386208057403564, 1.0248113870620728, 1.111001968383789, 1.1971924304962158, 1.2833830118179321, 1.3695735931396484, 1.4557640552520752, 1.5419546365737915, 1.6281452178955078, 1.7143356800079346, 1.8005262613296509, 1.8867168426513672, 1.972907304763794, 2.0590977668762207, 2.1452884674072266, 2.2314789295196533, 2.31766939163208, 2.403860092163086, 2.4900505542755127, 2.5762410163879395, 2.6624317169189453]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 7.0, 9.0, 6.0, 15.0, 13.0, 31.0, 34.0, 56.0, 82.0, 116.0, 182.0, 327.0, 615.0, 1376.0, 3610.0, 13287.0, 94959.0, 711062.0, 193081.0, 21152.0, 5044.0, 1715.0, 742.0, 394.0, 212.0, 134.0, 94.0, 56.0, 40.0, 25.0, 21.0, 12.0, 11.0, 13.0, 4.0, 5.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.076171875, -2.98736572265625, -2.8985595703125, -2.80975341796875, -2.720947265625, -2.63214111328125, -2.5433349609375, -2.45452880859375, -2.36572265625, -2.27691650390625, -2.1881103515625, -2.09930419921875, -2.010498046875, -1.92169189453125, -1.8328857421875, -1.74407958984375, -1.6552734375, -1.56646728515625, -1.4776611328125, -1.38885498046875, -1.300048828125, -1.21124267578125, -1.1224365234375, -1.03363037109375, -0.94482421875, -0.85601806640625, -0.7672119140625, -0.67840576171875, -0.589599609375, -0.50079345703125, -0.4119873046875, -0.32318115234375, -0.234375, -0.14556884765625, -0.0567626953125, 0.03204345703125, 0.120849609375, 0.20965576171875, 0.2984619140625, 0.38726806640625, 0.47607421875, 0.56488037109375, 0.6536865234375, 0.74249267578125, 0.831298828125, 0.92010498046875, 1.0089111328125, 1.09771728515625, 1.1865234375, 1.27532958984375, 1.3641357421875, 1.45294189453125, 1.541748046875, 1.63055419921875, 1.7193603515625, 1.80816650390625, 1.89697265625, 1.98577880859375, 2.0745849609375, 2.16339111328125, 2.252197265625, 2.34100341796875, 2.4298095703125, 2.51861572265625, 2.607421875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 8.0, 16.0, 23.0, 40.0, 54.0, 79.0, 108.0, 115.0, 113.0, 106.0, 103.0, 70.0, 60.0, 36.0, 21.0, 16.0, 6.0, 5.0, 6.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.322998046875, -0.3112945556640625, -0.299591064453125, -0.2878875732421875, -0.27618408203125, -0.2644805908203125, -0.252777099609375, -0.2410736083984375, -0.2293701171875, -0.2176666259765625, -0.205963134765625, -0.1942596435546875, -0.18255615234375, -0.1708526611328125, -0.159149169921875, -0.1474456787109375, -0.1357421875, -0.1240386962890625, -0.112335205078125, -0.1006317138671875, -0.08892822265625, -0.0772247314453125, -0.065521240234375, -0.0538177490234375, -0.0421142578125, -0.0304107666015625, -0.018707275390625, -0.0070037841796875, 0.00469970703125, 0.0164031982421875, 0.028106689453125, 0.0398101806640625, 0.051513671875, 0.0632171630859375, 0.074920654296875, 0.0866241455078125, 0.09832763671875, 0.1100311279296875, 0.121734619140625, 0.1334381103515625, 0.1451416015625, 0.1568450927734375, 0.168548583984375, 0.1802520751953125, 0.19195556640625, 0.2036590576171875, 0.215362548828125, 0.2270660400390625, 0.23876953125, 0.2504730224609375, 0.262176513671875, 0.2738800048828125, 0.28558349609375, 0.2972869873046875, 0.308990478515625, 0.3206939697265625, 0.3323974609375, 0.3441009521484375, 0.355804443359375, 0.3675079345703125, 0.37921142578125, 0.3909149169921875, 0.402618408203125, 0.4143218994140625, 0.426025390625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 8.0, 6.0, 6.0, 12.0, 12.0, 19.0, 34.0, 41.0, 58.0, 69.0, 102.0, 199.0, 241.0, 486.0, 758.0, 1419.0, 3092.0, 7192.0, 19880.0, 60874.0, 199670.0, 416620.0, 230112.0, 70265.0, 22114.0, 8270.0, 3334.0, 1582.0, 790.0, 431.0, 287.0, 171.0, 112.0, 91.0, 59.0, 32.0, 27.0, 22.0, 19.0, 13.0, 6.0, 7.0, 6.0, 7.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.3056640625, -1.26556396484375, -1.2254638671875, -1.18536376953125, -1.145263671875, -1.10516357421875, -1.0650634765625, -1.02496337890625, -0.98486328125, -0.94476318359375, -0.9046630859375, -0.86456298828125, -0.824462890625, -0.78436279296875, -0.7442626953125, -0.70416259765625, -0.6640625, -0.62396240234375, -0.5838623046875, -0.54376220703125, -0.503662109375, -0.46356201171875, -0.4234619140625, -0.38336181640625, -0.34326171875, -0.30316162109375, -0.2630615234375, -0.22296142578125, -0.182861328125, -0.14276123046875, -0.1026611328125, -0.06256103515625, -0.0224609375, 0.01763916015625, 0.0577392578125, 0.09783935546875, 0.137939453125, 0.17803955078125, 0.2181396484375, 0.25823974609375, 0.29833984375, 0.33843994140625, 0.3785400390625, 0.41864013671875, 0.458740234375, 0.49884033203125, 0.5389404296875, 0.57904052734375, 0.619140625, 0.65924072265625, 0.6993408203125, 0.73944091796875, 0.779541015625, 0.81964111328125, 0.8597412109375, 0.89984130859375, 0.93994140625, 0.98004150390625, 1.0201416015625, 1.06024169921875, 1.100341796875, 1.14044189453125, 1.1805419921875, 1.22064208984375, 1.2607421875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 4.0, 3.0, 6.0, 11.0, 10.0, 8.0, 12.0, 21.0, 25.0, 16.0, 23.0, 31.0, 27.0, 31.0, 33.0, 32.0, 42.0, 48.0, 51.0, 46.0, 37.0, 46.0, 43.0, 42.0, 31.0, 44.0, 33.0, 30.0, 25.0, 39.0, 24.0, 20.0, 22.0, 16.0, 12.0, 15.0, 6.0, 11.0, 5.0, 8.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8994140625, -0.8723068237304688, -0.8451995849609375, -0.8180923461914062, -0.790985107421875, -0.7638778686523438, -0.7367706298828125, -0.7096633911132812, -0.68255615234375, -0.6554489135742188, -0.6283416748046875, -0.6012344360351562, -0.574127197265625, -0.5470199584960938, -0.5199127197265625, -0.49280548095703125, -0.4656982421875, -0.43859100341796875, -0.4114837646484375, -0.38437652587890625, -0.357269287109375, -0.33016204833984375, -0.3030548095703125, -0.27594757080078125, -0.24884033203125, -0.22173309326171875, -0.1946258544921875, -0.16751861572265625, -0.140411376953125, -0.11330413818359375, -0.0861968994140625, -0.05908966064453125, -0.031982421875, -0.00487518310546875, 0.0222320556640625, 0.04933929443359375, 0.076446533203125, 0.10355377197265625, 0.1306610107421875, 0.15776824951171875, 0.18487548828125, 0.21198272705078125, 0.2390899658203125, 0.26619720458984375, 0.293304443359375, 0.32041168212890625, 0.3475189208984375, 0.37462615966796875, 0.4017333984375, 0.42884063720703125, 0.4559478759765625, 0.48305511474609375, 0.510162353515625, 0.5372695922851562, 0.5643768310546875, 0.5914840698242188, 0.61859130859375, 0.6456985473632812, 0.6728057861328125, 0.6999130249023438, 0.727020263671875, 0.7541275024414062, 0.7812347412109375, 0.8083419799804688, 0.83544921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 7.0, 9.0, 22.0, 21.0, 21.0, 34.0, 44.0, 68.0, 116.0, 188.0, 394.0, 860.0, 2171.0, 6244.0, 23669.0, 172745.0, 728892.0, 89522.0, 15862.0, 4548.0, 1624.0, 691.0, 345.0, 168.0, 79.0, 50.0, 31.0, 27.0, 23.0, 21.0, 14.0, 7.0, 6.0, 3.0, 2.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.998046875, -0.9672088623046875, -0.936370849609375, -0.9055328369140625, -0.87469482421875, -0.8438568115234375, -0.813018798828125, -0.7821807861328125, -0.7513427734375, -0.7205047607421875, -0.689666748046875, -0.6588287353515625, -0.62799072265625, -0.5971527099609375, -0.566314697265625, -0.5354766845703125, -0.504638671875, -0.4738006591796875, -0.442962646484375, -0.4121246337890625, -0.38128662109375, -0.3504486083984375, -0.319610595703125, -0.2887725830078125, -0.2579345703125, -0.2270965576171875, -0.196258544921875, -0.1654205322265625, -0.13458251953125, -0.1037445068359375, -0.072906494140625, -0.0420684814453125, -0.01123046875, 0.0196075439453125, 0.050445556640625, 0.0812835693359375, 0.11212158203125, 0.1429595947265625, 0.173797607421875, 0.2046356201171875, 0.2354736328125, 0.2663116455078125, 0.297149658203125, 0.3279876708984375, 0.35882568359375, 0.3896636962890625, 0.420501708984375, 0.4513397216796875, 0.482177734375, 0.5130157470703125, 0.543853759765625, 0.5746917724609375, 0.60552978515625, 0.6363677978515625, 0.667205810546875, 0.6980438232421875, 0.7288818359375, 0.7597198486328125, 0.790557861328125, 0.8213958740234375, 0.85223388671875, 0.8830718994140625, 0.913909912109375, 0.9447479248046875, 0.9755859375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 8.0, 14.0, 22.0, 31.0, 36.0, 62.0, 107.0, 175.0, 186.0, 141.0, 76.0, 44.0, 22.0, 23.0, 19.0, 9.0, 6.0, 1.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020837783813476562, -0.00020262226462364197, -0.0001968666911125183, -0.00019111111760139465, -0.000185355544090271, -0.00017959997057914734, -0.00017384439706802368, -0.00016808882355690002, -0.00016233325004577637, -0.0001565776765346527, -0.00015082210302352905, -0.0001450665295124054, -0.00013931095600128174, -0.00013355538249015808, -0.00012779980897903442, -0.00012204423546791077, -0.00011628866195678711, -0.00011053308844566345, -0.0001047775149345398, -9.902194142341614e-05, -9.326636791229248e-05, -8.751079440116882e-05, -8.175522089004517e-05, -7.599964737892151e-05, -7.024407386779785e-05, -6.44885003566742e-05, -5.873292684555054e-05, -5.297735333442688e-05, -4.722177982330322e-05, -4.1466206312179565e-05, -3.571063280105591e-05, -2.995505928993225e-05, -2.4199485778808594e-05, -1.8443912267684937e-05, -1.268833875656128e-05, -6.932765245437622e-06, -1.1771917343139648e-06, 4.578381776809692e-06, 1.033395528793335e-05, 1.6089528799057007e-05, 2.1845102310180664e-05, 2.760067582130432e-05, 3.335624933242798e-05, 3.9111822843551636e-05, 4.486739635467529e-05, 5.062296986579895e-05, 5.637854337692261e-05, 6.213411688804626e-05, 6.788969039916992e-05, 7.364526391029358e-05, 7.940083742141724e-05, 8.51564109325409e-05, 9.091198444366455e-05, 9.666755795478821e-05, 0.00010242313146591187, 0.00010817870497703552, 0.00011393427848815918, 0.00011968985199928284, 0.0001254454255104065, 0.00013120099902153015, 0.0001369565725326538, 0.00014271214604377747, 0.00014846771955490112, 0.00015422329306602478, 0.00015997886657714844]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 6.0, 9.0, 6.0, 12.0, 17.0, 26.0, 37.0, 44.0, 89.0, 121.0, 223.0, 392.0, 829.0, 1992.0, 5598.0, 21805.0, 151649.0, 742135.0, 98770.0, 16798.0, 4795.0, 1667.0, 707.0, 330.0, 182.0, 121.0, 50.0, 50.0, 30.0, 21.0, 12.0, 10.0, 4.0, 7.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72216796875, -0.6913223266601562, -0.6604766845703125, -0.6296310424804688, -0.598785400390625, -0.5679397583007812, -0.5370941162109375, -0.5062484741210938, -0.47540283203125, -0.44455718994140625, -0.4137115478515625, -0.38286590576171875, -0.352020263671875, -0.32117462158203125, -0.2903289794921875, -0.25948333740234375, -0.2286376953125, -0.19779205322265625, -0.1669464111328125, -0.13610076904296875, -0.105255126953125, -0.07440948486328125, -0.0435638427734375, -0.01271820068359375, 0.01812744140625, 0.04897308349609375, 0.0798187255859375, 0.11066436767578125, 0.141510009765625, 0.17235565185546875, 0.2032012939453125, 0.23404693603515625, 0.264892578125, 0.29573822021484375, 0.3265838623046875, 0.35742950439453125, 0.388275146484375, 0.41912078857421875, 0.4499664306640625, 0.48081207275390625, 0.51165771484375, 0.5425033569335938, 0.5733489990234375, 0.6041946411132812, 0.635040283203125, 0.6658859252929688, 0.6967315673828125, 0.7275772094726562, 0.7584228515625, 0.7892684936523438, 0.8201141357421875, 0.8509597778320312, 0.881805419921875, 0.9126510620117188, 0.9434967041015625, 0.9743423461914062, 1.00518798828125, 1.0360336303710938, 1.0668792724609375, 1.0977249145507812, 1.128570556640625, 1.1594161987304688, 1.1902618408203125, 1.2211074829101562, 1.251953125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 8.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 20.0, 12.0, 26.0, 31.0, 55.0, 74.0, 115.0, 122.0, 135.0, 125.0, 77.0, 47.0, 40.0, 30.0, 21.0, 12.0, 15.0, 10.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.662109375, -0.64190673828125, -0.6217041015625, -0.60150146484375, -0.581298828125, -0.56109619140625, -0.5408935546875, -0.52069091796875, -0.50048828125, -0.48028564453125, -0.4600830078125, -0.43988037109375, -0.419677734375, -0.39947509765625, -0.3792724609375, -0.35906982421875, -0.3388671875, -0.31866455078125, -0.2984619140625, -0.27825927734375, -0.258056640625, -0.23785400390625, -0.2176513671875, -0.19744873046875, -0.17724609375, -0.15704345703125, -0.1368408203125, -0.11663818359375, -0.096435546875, -0.07623291015625, -0.0560302734375, -0.03582763671875, -0.015625, 0.00457763671875, 0.0247802734375, 0.04498291015625, 0.065185546875, 0.08538818359375, 0.1055908203125, 0.12579345703125, 0.14599609375, 0.16619873046875, 0.1864013671875, 0.20660400390625, 0.226806640625, 0.24700927734375, 0.2672119140625, 0.28741455078125, 0.3076171875, 0.32781982421875, 0.3480224609375, 0.36822509765625, 0.388427734375, 0.40863037109375, 0.4288330078125, 0.44903564453125, 0.46923828125, 0.48944091796875, 0.5096435546875, 0.52984619140625, 0.550048828125, 0.57025146484375, 0.5904541015625, 0.61065673828125, 0.630859375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 9.0, 22.0, 35.0, 87.0, 229.0, 309.0, 189.0, 71.0, 32.0, 15.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.56186294555664, -23.955339431762695, -23.34881591796875, -22.742292404174805, -22.13576889038086, -21.529247283935547, -20.9227237701416, -20.316200256347656, -19.70967674255371, -19.103153228759766, -18.49662971496582, -17.890106201171875, -17.283584594726562, -16.677061080932617, -16.070537567138672, -15.464014053344727, -14.857490539550781, -14.250967025756836, -13.64444351196289, -13.037920951843262, -12.431397438049316, -11.824873924255371, -11.218351364135742, -10.611827850341797, -10.005304336547852, -9.398780822753906, -8.792257308959961, -8.185734748840332, -7.579211235046387, -6.972687721252441, -6.366164684295654, -5.759641647338867, -5.1531171798706055, -4.54659366607666, -3.940070629119873, -3.333547353744507, -2.7270240783691406, -2.1205008029937744, -1.5139775276184082, -0.9074544906616211, -0.3009309768676758, 0.30559229850769043, 0.9121155738830566, 1.5186388492584229, 2.125162124633789, 2.7316854000091553, 3.3382086753845215, 3.9447317123413086, 4.551255226135254, 5.157778739929199, 5.764301776885986, 6.370824813842773, 6.977348327636719, 7.583871841430664, 8.19039535522461, 8.796917915344238, 9.403441429138184, 10.009964942932129, 10.616487503051758, 11.223011016845703, 11.829534530639648, 12.436058044433594, 13.042581558227539, 13.649104118347168, 14.255627632141113]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 4.0, 6.0, 16.0, 15.0, 10.0, 16.0, 21.0, 32.0, 47.0, 42.0, 38.0, 44.0, 53.0, 54.0, 47.0, 63.0, 60.0, 60.0, 60.0, 53.0, 48.0, 31.0, 23.0, 36.0, 19.0, 20.0, 14.0, 18.0, 11.0, 7.0, 10.0, 11.0, 5.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-8.05985164642334, -7.851208209991455, -7.64256477355957, -7.433920860290527, -7.225277423858643, -7.016633987426758, -6.807990074157715, -6.59934663772583, -6.390703201293945, -6.1820597648620605, -5.973416328430176, -5.764772415161133, -5.556128978729248, -5.347485542297363, -5.13884162902832, -4.9301981925964355, -4.721554756164551, -4.512911319732666, -4.304267883300781, -4.095623970031738, -3.8869805335998535, -3.6783370971679688, -3.469693422317505, -3.261049747467041, -3.0524063110351562, -2.8437628746032715, -2.6351191997528076, -2.4264755249023438, -2.217832088470459, -2.009188652038574, -1.8005449771881104, -1.591901421546936, -1.3832578659057617, -1.1746143102645874, -0.9659707546234131, -0.7573271989822388, -0.5486836433410645, -0.34004008769989014, -0.13139653205871582, 0.0772470235824585, 0.2858905792236328, 0.49453413486480713, 0.7031776905059814, 0.9118212461471558, 1.12046480178833, 1.3291083574295044, 1.5377519130706787, 1.746395468711853, 1.9550390243530273, 2.163682460784912, 2.372326135635376, 2.58096981048584, 2.7896132469177246, 2.9982566833496094, 3.2069003582000732, 3.415544033050537, 3.624187469482422, 3.8328309059143066, 4.041474342346191, 4.250118255615234, 4.458761692047119, 4.667405128479004, 4.876049041748047, 5.084692478179932, 5.293335914611816]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 7.0, 12.0, 15.0, 22.0, 42.0, 60.0, 73.0, 132.0, 234.0, 475.0, 1028.0, 2776.0, 9995.0, 59699.0, 4037014.0, 67162.0, 10291.0, 2792.0, 1031.0, 468.0, 297.0, 154.0, 109.0, 99.0, 49.0, 43.0, 54.0, 28.0, 22.0, 11.0, 14.0, 23.0, 8.0, 8.0, 7.0, 3.0, 6.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.927734375, -2.797760009765625, -2.66778564453125, -2.537811279296875, -2.4078369140625, -2.277862548828125, -2.14788818359375, -2.017913818359375, -1.887939453125, -1.757965087890625, -1.62799072265625, -1.498016357421875, -1.3680419921875, -1.238067626953125, -1.10809326171875, -0.978118896484375, -0.84814453125, -0.718170166015625, -0.58819580078125, -0.458221435546875, -0.3282470703125, -0.198272705078125, -0.06829833984375, 0.061676025390625, 0.191650390625, 0.321624755859375, 0.45159912109375, 0.581573486328125, 0.7115478515625, 0.841522216796875, 0.97149658203125, 1.101470947265625, 1.2314453125, 1.361419677734375, 1.49139404296875, 1.621368408203125, 1.7513427734375, 1.881317138671875, 2.01129150390625, 2.141265869140625, 2.271240234375, 2.401214599609375, 2.53118896484375, 2.661163330078125, 2.7911376953125, 2.921112060546875, 3.05108642578125, 3.181060791015625, 3.31103515625, 3.441009521484375, 3.57098388671875, 3.700958251953125, 3.8309326171875, 3.960906982421875, 4.09088134765625, 4.220855712890625, 4.350830078125, 4.480804443359375, 4.61077880859375, 4.740753173828125, 4.8707275390625, 5.000701904296875, 5.13067626953125, 5.260650634765625, 5.390625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 8.0, 6.0, 8.0, 15.0, 25.0, 47.0, 71.0, 90.0, 93.0, 119.0, 115.0, 91.0, 92.0, 69.0, 49.0, 36.0, 23.0, 14.0, 10.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31640625, -0.3047943115234375, -0.293182373046875, -0.2815704345703125, -0.26995849609375, -0.2583465576171875, -0.246734619140625, -0.2351226806640625, -0.2235107421875, -0.2118988037109375, -0.200286865234375, -0.1886749267578125, -0.17706298828125, -0.1654510498046875, -0.153839111328125, -0.1422271728515625, -0.130615234375, -0.1190032958984375, -0.107391357421875, -0.0957794189453125, -0.08416748046875, -0.0725555419921875, -0.060943603515625, -0.0493316650390625, -0.0377197265625, -0.0261077880859375, -0.014495849609375, -0.0028839111328125, 0.00872802734375, 0.0203399658203125, 0.031951904296875, 0.0435638427734375, 0.05517578125, 0.0667877197265625, 0.078399658203125, 0.0900115966796875, 0.10162353515625, 0.1132354736328125, 0.124847412109375, 0.1364593505859375, 0.1480712890625, 0.1596832275390625, 0.171295166015625, 0.1829071044921875, 0.19451904296875, 0.2061309814453125, 0.217742919921875, 0.2293548583984375, 0.240966796875, 0.2525787353515625, 0.264190673828125, 0.2758026123046875, 0.28741455078125, 0.2990264892578125, 0.310638427734375, 0.3222503662109375, 0.3338623046875, 0.3454742431640625, 0.357086181640625, 0.3686981201171875, 0.38031005859375, 0.3919219970703125, 0.403533935546875, 0.4151458740234375, 0.4267578125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 9.0, 6.0, 10.0, 13.0, 40.0, 49.0, 100.0, 149.0, 341.0, 633.0, 1595.0, 4766.0, 21390.0, 432061.0, 3691061.0, 31908.0, 6374.0, 1964.0, 805.0, 401.0, 230.0, 128.0, 89.0, 50.0, 32.0, 30.0, 18.0, 11.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.2265625, -5.099456787109375, -4.97235107421875, -4.845245361328125, -4.7181396484375, -4.591033935546875, -4.46392822265625, -4.336822509765625, -4.209716796875, -4.082611083984375, -3.95550537109375, -3.828399658203125, -3.7012939453125, -3.574188232421875, -3.44708251953125, -3.319976806640625, -3.19287109375, -3.065765380859375, -2.93865966796875, -2.811553955078125, -2.6844482421875, -2.557342529296875, -2.43023681640625, -2.303131103515625, -2.176025390625, -2.048919677734375, -1.92181396484375, -1.794708251953125, -1.6676025390625, -1.540496826171875, -1.41339111328125, -1.286285400390625, -1.1591796875, -1.032073974609375, -0.90496826171875, -0.777862548828125, -0.6507568359375, -0.523651123046875, -0.39654541015625, -0.269439697265625, -0.142333984375, -0.015228271484375, 0.11187744140625, 0.238983154296875, 0.3660888671875, 0.493194580078125, 0.62030029296875, 0.747406005859375, 0.87451171875, 1.001617431640625, 1.12872314453125, 1.255828857421875, 1.3829345703125, 1.510040283203125, 1.63714599609375, 1.764251708984375, 1.891357421875, 2.018463134765625, 2.14556884765625, 2.272674560546875, 2.3997802734375, 2.526885986328125, 2.65399169921875, 2.781097412109375, 2.908203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 6.0, 11.0, 17.0, 16.0, 22.0, 38.0, 63.0, 119.0, 388.0, 2373.0, 670.0, 168.0, 71.0, 33.0, 20.0, 16.0, 11.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51025390625, -0.48667144775390625, -0.4630889892578125, -0.43950653076171875, -0.415924072265625, -0.39234161376953125, -0.3687591552734375, -0.34517669677734375, -0.32159423828125, -0.29801177978515625, -0.2744293212890625, -0.25084686279296875, -0.227264404296875, -0.20368194580078125, -0.1800994873046875, -0.15651702880859375, -0.1329345703125, -0.10935211181640625, -0.0857696533203125, -0.06218719482421875, -0.038604736328125, -0.01502227783203125, 0.0085601806640625, 0.03214263916015625, 0.05572509765625, 0.07930755615234375, 0.1028900146484375, 0.12647247314453125, 0.150054931640625, 0.17363739013671875, 0.1972198486328125, 0.22080230712890625, 0.244384765625, 0.26796722412109375, 0.2915496826171875, 0.31513214111328125, 0.338714599609375, 0.36229705810546875, 0.3858795166015625, 0.40946197509765625, 0.43304443359375, 0.45662689208984375, 0.4802093505859375, 0.5037918090820312, 0.527374267578125, 0.5509567260742188, 0.5745391845703125, 0.5981216430664062, 0.6217041015625, 0.6452865600585938, 0.6688690185546875, 0.6924514770507812, 0.716033935546875, 0.7396163940429688, 0.7631988525390625, 0.7867813110351562, 0.81036376953125, 0.8339462280273438, 0.8575286865234375, 0.8811111450195312, 0.904693603515625, 0.9282760620117188, 0.9518585205078125, 0.9754409790039062, 0.9990234375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 13.0, 43.0, 96.0, 249.0, 325.0, 174.0, 62.0, 23.0, 10.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.948447227478027, -6.703046798706055, -6.457646369934082, -6.212245941162109, -5.966845512390137, -5.721445083618164, -5.476044654846191, -5.230644226074219, -4.985243797302246, -4.739843368530273, -4.494442939758301, -4.249042510986328, -4.0036420822143555, -3.758241653442383, -3.512840986251831, -3.2674405574798584, -3.0220398902893066, -2.776639461517334, -2.5312390327453613, -2.2858386039733887, -2.040438175201416, -1.7950376272201538, -1.5496370792388916, -1.304236650466919, -1.0588362216949463, -0.8134357929229736, -0.5680353045463562, -0.32263481616973877, -0.07723438739776611, 0.16816604137420654, 0.41356658935546875, 0.6589670181274414, 0.9043674468994141, 1.1497678756713867, 1.3951683044433594, 1.6405688524246216, 1.8859692811965942, 2.1313695907592773, 2.376770257949829, 2.6221706867218018, 2.8675711154937744, 3.112971544265747, 3.3583719730377197, 3.6037726402282715, 3.849173069000244, 4.094573497772217, 4.3399739265441895, 4.585374355316162, 4.830774784088135, 5.076175212860107, 5.32157564163208, 5.566976070404053, 5.812376499176025, 6.057776927947998, 6.303177833557129, 6.548578262329102, 6.793978691101074, 7.039379119873047, 7.2847795486450195, 7.530179977416992, 7.775580406188965, 8.020980834960938, 8.26638126373291, 8.511781692504883, 8.757182121276855]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 10.0, 5.0, 10.0, 13.0, 16.0, 14.0, 22.0, 28.0, 24.0, 21.0, 36.0, 43.0, 48.0, 52.0, 45.0, 44.0, 45.0, 54.0, 57.0, 33.0, 39.0, 49.0, 35.0, 26.0, 32.0, 27.0, 32.0, 23.0, 22.0, 21.0, 10.0, 17.0, 6.0, 10.0, 9.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4789817333221436, -1.424920916557312, -1.3708600997924805, -1.316799283027649, -1.2627384662628174, -1.2086775302886963, -1.1546168327331543, -1.1005558967590332, -1.0464950799942017, -0.9924342632293701, -0.9383734464645386, -0.884312629699707, -0.8302517533302307, -0.7761909365653992, -0.7221301198005676, -0.6680692434310913, -0.6140084862709045, -0.559947669506073, -0.5058868527412415, -0.4518260061740875, -0.3977651596069336, -0.34370434284210205, -0.2896435260772705, -0.23558267951011658, -0.18152186274528503, -0.1274610310792923, -0.07340020686388016, -0.019339382648468018, 0.03472144901752472, 0.08878228068351746, 0.142843097448349, 0.19690394401550293, 0.2509647607803345, 0.305025577545166, 0.35908642411231995, 0.4131472408771515, 0.4672080874443054, 0.521268904209137, 0.5753297209739685, 0.6293905973434448, 0.6834514141082764, 0.7375122308731079, 0.7915730476379395, 0.845633864402771, 0.8996947407722473, 0.9537555575370789, 1.0078163146972656, 1.0618772506713867, 1.1159379482269287, 1.1699987649917603, 1.2240595817565918, 1.2781203985214233, 1.3321812152862549, 1.386242151260376, 1.440302848815918, 1.494363784790039, 1.5484246015548706, 1.6024854183197021, 1.6565462350845337, 1.7106070518493652, 1.7646678686141968, 1.8187286853790283, 1.8727896213531494, 1.926850438117981, 1.9809112548828125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 11.0, 13.0, 11.0, 24.0, 33.0, 43.0, 66.0, 119.0, 200.0, 366.0, 598.0, 1482.0, 3640.0, 13257.0, 81294.0, 628492.0, 276388.0, 31248.0, 6819.0, 2339.0, 975.0, 459.0, 238.0, 150.0, 81.0, 61.0, 37.0, 34.0, 19.0, 20.0, 11.0, 7.0, 5.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3671875, -2.275299072265625, -2.18341064453125, -2.091522216796875, -1.9996337890625, -1.907745361328125, -1.81585693359375, -1.723968505859375, -1.632080078125, -1.540191650390625, -1.44830322265625, -1.356414794921875, -1.2645263671875, -1.172637939453125, -1.08074951171875, -0.988861083984375, -0.89697265625, -0.805084228515625, -0.71319580078125, -0.621307373046875, -0.5294189453125, -0.437530517578125, -0.34564208984375, -0.253753662109375, -0.161865234375, -0.069976806640625, 0.02191162109375, 0.113800048828125, 0.2056884765625, 0.297576904296875, 0.38946533203125, 0.481353759765625, 0.5732421875, 0.665130615234375, 0.75701904296875, 0.848907470703125, 0.9407958984375, 1.032684326171875, 1.12457275390625, 1.216461181640625, 1.308349609375, 1.400238037109375, 1.49212646484375, 1.584014892578125, 1.6759033203125, 1.767791748046875, 1.85968017578125, 1.951568603515625, 2.04345703125, 2.135345458984375, 2.22723388671875, 2.319122314453125, 2.4110107421875, 2.502899169921875, 2.59478759765625, 2.686676025390625, 2.778564453125, 2.870452880859375, 2.96234130859375, 3.054229736328125, 3.1461181640625, 3.238006591796875, 3.32989501953125, 3.421783447265625, 3.513671875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 7.0, 8.0, 7.0, 23.0, 34.0, 46.0, 73.0, 68.0, 96.0, 108.0, 111.0, 100.0, 87.0, 58.0, 59.0, 34.0, 18.0, 19.0, 10.0, 11.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3203125, -0.3080902099609375, -0.295867919921875, -0.2836456298828125, -0.27142333984375, -0.2592010498046875, -0.246978759765625, -0.2347564697265625, -0.2225341796875, -0.2103118896484375, -0.198089599609375, -0.1858673095703125, -0.17364501953125, -0.1614227294921875, -0.149200439453125, -0.1369781494140625, -0.124755859375, -0.1125335693359375, -0.100311279296875, -0.0880889892578125, -0.07586669921875, -0.0636444091796875, -0.051422119140625, -0.0391998291015625, -0.0269775390625, -0.0147552490234375, -0.002532958984375, 0.0096893310546875, 0.02191162109375, 0.0341339111328125, 0.046356201171875, 0.0585784912109375, 0.07080078125, 0.0830230712890625, 0.095245361328125, 0.1074676513671875, 0.11968994140625, 0.1319122314453125, 0.144134521484375, 0.1563568115234375, 0.1685791015625, 0.1808013916015625, 0.193023681640625, 0.2052459716796875, 0.21746826171875, 0.2296905517578125, 0.241912841796875, 0.2541351318359375, 0.266357421875, 0.2785797119140625, 0.290802001953125, 0.3030242919921875, 0.31524658203125, 0.3274688720703125, 0.339691162109375, 0.3519134521484375, 0.3641357421875, 0.3763580322265625, 0.388580322265625, 0.4008026123046875, 0.41302490234375, 0.4252471923828125, 0.437469482421875, 0.4496917724609375, 0.4619140625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 6.0, 9.0, 21.0, 18.0, 29.0, 61.0, 109.0, 196.0, 329.0, 614.0, 1503.0, 3931.0, 15120.0, 81796.0, 490465.0, 379661.0, 57515.0, 11380.0, 3378.0, 1196.0, 579.0, 273.0, 143.0, 88.0, 44.0, 32.0, 20.0, 9.0, 4.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.49609375, -2.42657470703125, -2.3570556640625, -2.28753662109375, -2.218017578125, -2.14849853515625, -2.0789794921875, -2.00946044921875, -1.93994140625, -1.87042236328125, -1.8009033203125, -1.73138427734375, -1.661865234375, -1.59234619140625, -1.5228271484375, -1.45330810546875, -1.3837890625, -1.31427001953125, -1.2447509765625, -1.17523193359375, -1.105712890625, -1.03619384765625, -0.9666748046875, -0.89715576171875, -0.82763671875, -0.75811767578125, -0.6885986328125, -0.61907958984375, -0.549560546875, -0.48004150390625, -0.4105224609375, -0.34100341796875, -0.271484375, -0.20196533203125, -0.1324462890625, -0.06292724609375, 0.006591796875, 0.07611083984375, 0.1456298828125, 0.21514892578125, 0.28466796875, 0.35418701171875, 0.4237060546875, 0.49322509765625, 0.562744140625, 0.63226318359375, 0.7017822265625, 0.77130126953125, 0.8408203125, 0.91033935546875, 0.9798583984375, 1.04937744140625, 1.118896484375, 1.18841552734375, 1.2579345703125, 1.32745361328125, 1.39697265625, 1.46649169921875, 1.5360107421875, 1.60552978515625, 1.675048828125, 1.74456787109375, 1.8140869140625, 1.88360595703125, 1.953125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 1.0, 4.0, 6.0, 4.0, 2.0, 11.0, 11.0, 21.0, 13.0, 18.0, 20.0, 29.0, 34.0, 37.0, 38.0, 44.0, 59.0, 50.0, 53.0, 47.0, 46.0, 54.0, 48.0, 37.0, 47.0, 46.0, 29.0, 29.0, 26.0, 22.0, 22.0, 26.0, 12.0, 11.0, 7.0, 10.0, 10.0, 8.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93408203125, -0.8997726440429688, -0.8654632568359375, -0.8311538696289062, -0.796844482421875, -0.7625350952148438, -0.7282257080078125, -0.6939163208007812, -0.65960693359375, -0.6252975463867188, -0.5909881591796875, -0.5566787719726562, -0.522369384765625, -0.48805999755859375, -0.4537506103515625, -0.41944122314453125, -0.3851318359375, -0.35082244873046875, -0.3165130615234375, -0.28220367431640625, -0.247894287109375, -0.21358489990234375, -0.1792755126953125, -0.14496612548828125, -0.11065673828125, -0.07634735107421875, -0.0420379638671875, -0.00772857666015625, 0.026580810546875, 0.06089019775390625, 0.0951995849609375, 0.12950897216796875, 0.163818359375, 0.19812774658203125, 0.2324371337890625, 0.26674652099609375, 0.301055908203125, 0.33536529541015625, 0.3696746826171875, 0.40398406982421875, 0.43829345703125, 0.47260284423828125, 0.5069122314453125, 0.5412216186523438, 0.575531005859375, 0.6098403930664062, 0.6441497802734375, 0.6784591674804688, 0.7127685546875, 0.7470779418945312, 0.7813873291015625, 0.8156967163085938, 0.850006103515625, 0.8843154907226562, 0.9186248779296875, 0.9529342651367188, 0.98724365234375, 1.0215530395507812, 1.0558624267578125, 1.0901718139648438, 1.124481201171875, 1.1587905883789062, 1.1930999755859375, 1.2274093627929688, 1.26171875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 10.0, 13.0, 6.0, 15.0, 28.0, 43.0, 54.0, 130.0, 187.0, 366.0, 985.0, 2796.0, 12259.0, 105854.0, 849691.0, 63280.0, 8988.0, 2275.0, 770.0, 337.0, 186.0, 79.0, 57.0, 38.0, 34.0, 14.0, 10.0, 14.0, 10.0, 2.0, 7.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.626953125, -1.576751708984375, -1.52655029296875, -1.476348876953125, -1.4261474609375, -1.375946044921875, -1.32574462890625, -1.275543212890625, -1.225341796875, -1.175140380859375, -1.12493896484375, -1.074737548828125, -1.0245361328125, -0.974334716796875, -0.92413330078125, -0.873931884765625, -0.82373046875, -0.773529052734375, -0.72332763671875, -0.673126220703125, -0.6229248046875, -0.572723388671875, -0.52252197265625, -0.472320556640625, -0.422119140625, -0.371917724609375, -0.32171630859375, -0.271514892578125, -0.2213134765625, -0.171112060546875, -0.12091064453125, -0.070709228515625, -0.0205078125, 0.029693603515625, 0.07989501953125, 0.130096435546875, 0.1802978515625, 0.230499267578125, 0.28070068359375, 0.330902099609375, 0.381103515625, 0.431304931640625, 0.48150634765625, 0.531707763671875, 0.5819091796875, 0.632110595703125, 0.68231201171875, 0.732513427734375, 0.78271484375, 0.832916259765625, 0.88311767578125, 0.933319091796875, 0.9835205078125, 1.033721923828125, 1.08392333984375, 1.134124755859375, 1.184326171875, 1.234527587890625, 1.28472900390625, 1.334930419921875, 1.3851318359375, 1.435333251953125, 1.48553466796875, 1.535736083984375, 1.5859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 7.0, 5.0, 5.0, 14.0, 14.0, 28.0, 39.0, 58.0, 88.0, 146.0, 148.0, 124.0, 94.0, 68.0, 32.0, 34.0, 17.0, 9.0, 10.0, 7.0, 7.0, 5.0, 7.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.00021529197692871094, -0.00020903348922729492, -0.0002027750015258789, -0.0001965165138244629, -0.00019025802612304688, -0.00018399953842163086, -0.00017774105072021484, -0.00017148256301879883, -0.0001652240753173828, -0.0001589655876159668, -0.00015270709991455078, -0.00014644861221313477, -0.00014019012451171875, -0.00013393163681030273, -0.00012767314910888672, -0.0001214146614074707, -0.00011515617370605469, -0.00010889768600463867, -0.00010263919830322266, -9.638071060180664e-05, -9.012222290039062e-05, -8.386373519897461e-05, -7.76052474975586e-05, -7.134675979614258e-05, -6.508827209472656e-05, -5.882978439331055e-05, -5.257129669189453e-05, -4.6312808990478516e-05, -4.00543212890625e-05, -3.3795833587646484e-05, -2.753734588623047e-05, -2.1278858184814453e-05, -1.5020370483398438e-05, -8.761882781982422e-06, -2.5033950805664062e-06, 3.7550926208496094e-06, 1.0013580322265625e-05, 1.627206802368164e-05, 2.2530555725097656e-05, 2.8789043426513672e-05, 3.504753112792969e-05, 4.13060188293457e-05, 4.756450653076172e-05, 5.3822994232177734e-05, 6.008148193359375e-05, 6.633996963500977e-05, 7.259845733642578e-05, 7.88569450378418e-05, 8.511543273925781e-05, 9.137392044067383e-05, 9.763240814208984e-05, 0.00010389089584350586, 0.00011014938354492188, 0.00011640787124633789, 0.0001226663589477539, 0.00012892484664916992, 0.00013518333435058594, 0.00014144182205200195, 0.00014770030975341797, 0.00015395879745483398, 0.00016021728515625, 0.00016647577285766602, 0.00017273426055908203, 0.00017899274826049805, 0.00018525123596191406]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 10.0, 6.0, 7.0, 10.0, 12.0, 18.0, 25.0, 54.0, 88.0, 156.0, 268.0, 562.0, 1268.0, 4178.0, 25605.0, 810881.0, 188945.0, 11994.0, 2566.0, 926.0, 440.0, 238.0, 124.0, 56.0, 35.0, 31.0, 22.0, 13.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8056640625, -1.7383270263671875, -1.670989990234375, -1.6036529541015625, -1.53631591796875, -1.4689788818359375, -1.401641845703125, -1.3343048095703125, -1.2669677734375, -1.1996307373046875, -1.132293701171875, -1.0649566650390625, -0.99761962890625, -0.9302825927734375, -0.862945556640625, -0.7956085205078125, -0.728271484375, -0.6609344482421875, -0.593597412109375, -0.5262603759765625, -0.45892333984375, -0.3915863037109375, -0.324249267578125, -0.2569122314453125, -0.1895751953125, -0.1222381591796875, -0.054901123046875, 0.0124359130859375, 0.07977294921875, 0.1471099853515625, 0.214447021484375, 0.2817840576171875, 0.34912109375, 0.4164581298828125, 0.483795166015625, 0.5511322021484375, 0.61846923828125, 0.6858062744140625, 0.753143310546875, 0.8204803466796875, 0.8878173828125, 0.9551544189453125, 1.022491455078125, 1.0898284912109375, 1.15716552734375, 1.2245025634765625, 1.291839599609375, 1.3591766357421875, 1.426513671875, 1.4938507080078125, 1.561187744140625, 1.6285247802734375, 1.69586181640625, 1.7631988525390625, 1.830535888671875, 1.8978729248046875, 1.9652099609375, 2.0325469970703125, 2.099884033203125, 2.1672210693359375, 2.23455810546875, 2.3018951416015625, 2.369232177734375, 2.4365692138671875, 2.50390625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 12.0, 19.0, 22.0, 34.0, 54.0, 73.0, 110.0, 180.0, 169.0, 128.0, 65.0, 36.0, 31.0, 19.0, 8.0, 10.0, 9.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0556640625, -1.0254898071289062, -0.9953155517578125, -0.9651412963867188, -0.934967041015625, -0.9047927856445312, -0.8746185302734375, -0.8444442749023438, -0.81427001953125, -0.7840957641601562, -0.7539215087890625, -0.7237472534179688, -0.693572998046875, -0.6633987426757812, -0.6332244873046875, -0.6030502319335938, -0.5728759765625, -0.5427017211914062, -0.5125274658203125, -0.48235321044921875, -0.452178955078125, -0.42200469970703125, -0.3918304443359375, -0.36165618896484375, -0.33148193359375, -0.30130767822265625, -0.2711334228515625, -0.24095916748046875, -0.210784912109375, -0.18061065673828125, -0.1504364013671875, -0.12026214599609375, -0.090087890625, -0.05991363525390625, -0.0297393798828125, 0.00043487548828125, 0.030609130859375, 0.06078338623046875, 0.0909576416015625, 0.12113189697265625, 0.15130615234375, 0.18148040771484375, 0.2116546630859375, 0.24182891845703125, 0.272003173828125, 0.30217742919921875, 0.3323516845703125, 0.36252593994140625, 0.3927001953125, 0.42287445068359375, 0.4530487060546875, 0.48322296142578125, 0.513397216796875, 0.5435714721679688, 0.5737457275390625, 0.6039199829101562, 0.63409423828125, 0.6642684936523438, 0.6944427490234375, 0.7246170043945312, 0.754791259765625, 0.7849655151367188, 0.8151397705078125, 0.8453140258789062, 0.87548828125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 11.0, 14.0, 30.0, 51.0, 115.0, 183.0, 218.0, 175.0, 100.0, 44.0, 25.0, 22.0, 4.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.00187873840332, -7.482860565185547, -6.963841915130615, -6.444823265075684, -5.92580509185791, -5.406786918640137, -4.887768268585205, -4.368749618530273, -3.8497314453125, -3.3307130336761475, -2.811694622039795, -2.2926762104034424, -1.7736577987670898, -1.2546393871307373, -0.7356209754943848, -0.21660256385803223, 0.3024158477783203, 0.8214342594146729, 1.3404526710510254, 1.859471082687378, 2.3784894943237305, 2.897507905960083, 3.4165263175964355, 3.935544729232788, 4.454563140869141, 4.973581314086914, 5.492599964141846, 6.011618614196777, 6.530636787414551, 7.049654960632324, 7.568673610687256, 8.087692260742188, 8.606710433959961, 9.125728607177734, 9.644746780395508, 10.163765907287598, 10.682784080505371, 11.201802253723145, 11.720821380615234, 12.239839553833008, 12.758857727050781, 13.277875900268555, 13.796894073486328, 14.315913200378418, 14.834931373596191, 15.353949546813965, 15.872968673706055, 16.391986846923828, 16.9110050201416, 17.430023193359375, 17.94904136657715, 18.468059539794922, 18.987079620361328, 19.5060977935791, 20.025115966796875, 20.54413414001465, 21.063152313232422, 21.582170486450195, 22.10118865966797, 22.620206832885742, 23.139225006103516, 23.658245086669922, 24.177263259887695, 24.69628143310547, 25.215299606323242]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 4.0, 7.0, 14.0, 10.0, 14.0, 14.0, 20.0, 20.0, 25.0, 28.0, 34.0, 52.0, 50.0, 54.0, 52.0, 66.0, 48.0, 57.0, 63.0, 43.0, 55.0, 48.0, 37.0, 35.0, 27.0, 27.0, 21.0, 18.0, 14.0, 16.0, 11.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.04636287689209, -5.812415599822998, -5.578468322753906, -5.344521522521973, -5.110574245452881, -4.876626968383789, -4.642679691314697, -4.4087324142456055, -4.174785137176514, -3.940837860107422, -3.706890821456909, -3.4729435443878174, -3.2389962673187256, -3.005049228668213, -2.771101951599121, -2.5371546745300293, -2.3032076358795166, -2.069260358810425, -1.8353132009506226, -1.6013660430908203, -1.3674187660217285, -1.1334716081619263, -0.899524450302124, -0.6655771732330322, -0.43163001537323, -0.19768281280994415, 0.036264389753341675, 0.2702115774154663, 0.5041587948799133, 0.7381060123443604, 0.9720531702041626, 1.2060004472732544, 1.4399476051330566, 1.6738947629928589, 1.9078420400619507, 2.141789197921753, 2.3757364749908447, 2.6096835136413574, 2.843630790710449, 3.077578067779541, 3.311525344848633, 3.5454726219177246, 3.7794196605682373, 4.01336669921875, 4.247313976287842, 4.481261253356934, 4.715208530426025, 4.949155807495117, 5.183102607727051, 5.417049884796143, 5.650997161865234, 5.884943962097168, 6.11889123916626, 6.352838516235352, 6.586785793304443, 6.820733070373535, 7.054680347442627, 7.288627624511719, 7.5225749015808105, 7.756522178649902, 7.990468978881836, 8.224416732788086, 8.45836353302002, 8.692310333251953, 8.926258087158203]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 19.0, 30.0, 48.0, 98.0, 186.0, 409.0, 896.0, 2451.0, 9659.0, 66338.0, 3995051.0, 101035.0, 12961.0, 2810.0, 973.0, 439.0, 276.0, 179.0, 113.0, 71.0, 68.0, 38.0, 43.0, 23.0, 16.0, 15.0, 13.0, 4.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.419921875, -3.268463134765625, -3.11700439453125, -2.965545654296875, -2.8140869140625, -2.662628173828125, -2.51116943359375, -2.359710693359375, -2.208251953125, -2.056793212890625, -1.90533447265625, -1.753875732421875, -1.6024169921875, -1.450958251953125, -1.29949951171875, -1.148040771484375, -0.99658203125, -0.845123291015625, -0.69366455078125, -0.542205810546875, -0.3907470703125, -0.239288330078125, -0.08782958984375, 0.063629150390625, 0.215087890625, 0.366546630859375, 0.51800537109375, 0.669464111328125, 0.8209228515625, 0.972381591796875, 1.12384033203125, 1.275299072265625, 1.4267578125, 1.578216552734375, 1.72967529296875, 1.881134033203125, 2.0325927734375, 2.184051513671875, 2.33551025390625, 2.486968994140625, 2.638427734375, 2.789886474609375, 2.94134521484375, 3.092803955078125, 3.2442626953125, 3.395721435546875, 3.54718017578125, 3.698638916015625, 3.85009765625, 4.001556396484375, 4.15301513671875, 4.304473876953125, 4.4559326171875, 4.607391357421875, 4.75885009765625, 4.910308837890625, 5.061767578125, 5.213226318359375, 5.36468505859375, 5.516143798828125, 5.6676025390625, 5.819061279296875, 5.97052001953125, 6.121978759765625, 6.2734375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 5.0, 4.0, 7.0, 4.0, 7.0, 12.0, 30.0, 42.0, 49.0, 59.0, 84.0, 95.0, 94.0, 95.0, 90.0, 78.0, 61.0, 55.0, 37.0, 18.0, 27.0, 13.0, 9.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.285888671875, -0.2740287780761719, -0.26216888427734375, -0.2503089904785156, -0.2384490966796875, -0.22658920288085938, -0.21472930908203125, -0.20286941528320312, -0.191009521484375, -0.17914962768554688, -0.16728973388671875, -0.15542984008789062, -0.1435699462890625, -0.13171005249023438, -0.11985015869140625, -0.10799026489257812, -0.09613037109375, -0.08427047729492188, -0.07241058349609375, -0.060550689697265625, -0.0486907958984375, -0.036830902099609375, -0.02497100830078125, -0.013111114501953125, -0.001251220703125, 0.010608673095703125, 0.02246856689453125, 0.034328460693359375, 0.0461883544921875, 0.058048248291015625, 0.06990814208984375, 0.08176803588867188, 0.0936279296875, 0.10548782348632812, 0.11734771728515625, 0.12920761108398438, 0.1410675048828125, 0.15292739868164062, 0.16478729248046875, 0.17664718627929688, 0.188507080078125, 0.20036697387695312, 0.21222686767578125, 0.22408676147460938, 0.2359466552734375, 0.24780654907226562, 0.25966644287109375, 0.2715263366699219, 0.28338623046875, 0.2952461242675781, 0.30710601806640625, 0.3189659118652344, 0.3308258056640625, 0.3426856994628906, 0.35454559326171875, 0.3664054870605469, 0.378265380859375, 0.3901252746582031, 0.40198516845703125, 0.4138450622558594, 0.4257049560546875, 0.4375648498535156, 0.44942474365234375, 0.4612846374511719, 0.47314453125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 6.0, 4.0, 8.0, 11.0, 15.0, 14.0, 36.0, 73.0, 107.0, 153.0, 288.0, 558.0, 1192.0, 2903.0, 9605.0, 49739.0, 3809965.0, 287198.0, 22373.0, 5702.0, 2110.0, 985.0, 499.0, 274.0, 168.0, 95.0, 53.0, 49.0, 22.0, 24.0, 17.0, 5.0, 9.0, 4.0, 4.0, 5.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.609375, -5.464752197265625, -5.32012939453125, -5.175506591796875, -5.0308837890625, -4.886260986328125, -4.74163818359375, -4.597015380859375, -4.452392578125, -4.307769775390625, -4.16314697265625, -4.018524169921875, -3.8739013671875, -3.729278564453125, -3.58465576171875, -3.440032958984375, -3.29541015625, -3.150787353515625, -3.00616455078125, -2.861541748046875, -2.7169189453125, -2.572296142578125, -2.42767333984375, -2.283050537109375, -2.138427734375, -1.993804931640625, -1.84918212890625, -1.704559326171875, -1.5599365234375, -1.415313720703125, -1.27069091796875, -1.126068115234375, -0.9814453125, -0.836822509765625, -0.69219970703125, -0.547576904296875, -0.4029541015625, -0.258331298828125, -0.11370849609375, 0.030914306640625, 0.175537109375, 0.320159912109375, 0.46478271484375, 0.609405517578125, 0.7540283203125, 0.898651123046875, 1.04327392578125, 1.187896728515625, 1.33251953125, 1.477142333984375, 1.62176513671875, 1.766387939453125, 1.9110107421875, 2.055633544921875, 2.20025634765625, 2.344879150390625, 2.489501953125, 2.634124755859375, 2.77874755859375, 2.923370361328125, 3.0679931640625, 3.212615966796875, 3.35723876953125, 3.501861572265625, 3.646484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 11.0, 18.0, 14.0, 24.0, 23.0, 49.0, 89.0, 180.0, 540.0, 2022.0, 665.0, 171.0, 72.0, 52.0, 34.0, 26.0, 25.0, 7.0, 9.0, 6.0, 7.0, 2.0, 2.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.994140625, -0.9593353271484375, -0.924530029296875, -0.8897247314453125, -0.85491943359375, -0.8201141357421875, -0.785308837890625, -0.7505035400390625, -0.7156982421875, -0.6808929443359375, -0.646087646484375, -0.6112823486328125, -0.57647705078125, -0.5416717529296875, -0.506866455078125, -0.4720611572265625, -0.437255859375, -0.4024505615234375, -0.367645263671875, -0.3328399658203125, -0.29803466796875, -0.2632293701171875, -0.228424072265625, -0.1936187744140625, -0.1588134765625, -0.1240081787109375, -0.089202880859375, -0.0543975830078125, -0.01959228515625, 0.0152130126953125, 0.050018310546875, 0.0848236083984375, 0.11962890625, 0.1544342041015625, 0.189239501953125, 0.2240447998046875, 0.25885009765625, 0.2936553955078125, 0.328460693359375, 0.3632659912109375, 0.3980712890625, 0.4328765869140625, 0.467681884765625, 0.5024871826171875, 0.53729248046875, 0.5720977783203125, 0.606903076171875, 0.6417083740234375, 0.676513671875, 0.7113189697265625, 0.746124267578125, 0.7809295654296875, 0.81573486328125, 0.8505401611328125, 0.885345458984375, 0.9201507568359375, 0.9549560546875, 0.9897613525390625, 1.024566650390625, 1.0593719482421875, 1.09417724609375, 1.1289825439453125, 1.163787841796875, 1.1985931396484375, 1.2333984375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 12.0, 18.0, 74.0, 229.0, 434.0, 180.0, 43.0, 9.0, 3.0, 5.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.375373363494873, -6.826822280883789, -6.278271675109863, -5.729720592498779, -5.181169509887695, -4.6326189041137695, -4.0840678215026855, -3.5355169773101807, -2.986966133117676, -2.438415288925171, -1.8898643255233765, -1.341313362121582, -0.7927625179290771, -0.24421167373657227, 0.3043394088745117, 0.8528902530670166, 1.4014410972595215, 1.9499919414520264, 2.4985427856445312, 3.0470938682556152, 3.59564471244812, 4.144195556640625, 4.692746639251709, 5.241297721862793, 5.789848327636719, 6.338399410247803, 6.8869500160217285, 7.4355010986328125, 7.984051704406738, 8.532602310180664, 9.081153869628906, 9.629704475402832, 10.17825698852539, 10.726807594299316, 11.275359153747559, 11.823909759521484, 12.37246036529541, 12.921010971069336, 13.469562530517578, 14.018113136291504, 14.56666374206543, 15.115214347839355, 15.663765907287598, 16.212316513061523, 16.760868072509766, 17.309417724609375, 17.857969284057617, 18.40652084350586, 18.95507049560547, 19.50362205505371, 20.05217170715332, 20.600723266601562, 21.149274826049805, 21.697824478149414, 22.246376037597656, 22.7949275970459, 23.34347915649414, 23.892030715942383, 24.440580368041992, 24.989131927490234, 25.537683486938477, 26.086233139038086, 26.634784698486328, 27.18333625793457, 27.73188591003418]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 2.0, 11.0, 12.0, 10.0, 15.0, 48.0, 60.0, 72.0, 82.0, 106.0, 90.0, 105.0, 88.0, 76.0, 53.0, 50.0, 31.0, 40.0, 29.0, 14.0, 4.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.436782360076904, -6.256065845489502, -6.0753493309021, -5.8946332931518555, -5.713916778564453, -5.533200263977051, -5.352483749389648, -5.171767234802246, -4.991050720214844, -4.810334205627441, -4.629617691040039, -4.448901176452637, -4.268185138702393, -4.08746862411499, -3.906752109527588, -3.7260355949401855, -3.5453195571899414, -3.364603042602539, -3.183886766433716, -3.0031702518463135, -2.8224539756774902, -2.641737461090088, -2.4610209465026855, -2.280304431915283, -2.09958815574646, -1.9188717603683472, -1.7381553649902344, -1.557438850402832, -1.3767224550247192, -1.1960060596466064, -1.015289545059204, -0.8345731496810913, -0.6538572311401367, -0.47314080595970154, -0.29242438077926636, -0.11170792579650879, 0.069008469581604, 0.2497248649597168, 0.43044137954711914, 0.6111577749252319, 0.7918741703033447, 0.9725905656814575, 1.1533069610595703, 1.3340234756469727, 1.5147398710250854, 1.6954562664031982, 1.8761727809906006, 2.056889057159424, 2.237605571746826, 2.4183220863342285, 2.5990383625030518, 2.779754877090454, 2.9604711532592773, 3.1411876678466797, 3.321904182434082, 3.5026206970214844, 3.6833369731903076, 3.86405348777771, 4.044769763946533, 4.2254862785339355, 4.406202793121338, 4.586918830871582, 4.767635345458984, 4.948351860046387, 5.129068374633789]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 6.0, 1.0, 6.0, 13.0, 15.0, 12.0, 16.0, 27.0, 46.0, 53.0, 99.0, 124.0, 187.0, 306.0, 526.0, 1057.0, 2356.0, 6631.0, 29248.0, 271570.0, 640698.0, 76078.0, 12449.0, 3698.0, 1515.0, 735.0, 365.0, 241.0, 144.0, 117.0, 63.0, 46.0, 28.0, 24.0, 13.0, 17.0, 8.0, 6.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.189453125, -3.09051513671875, -2.9915771484375, -2.89263916015625, -2.793701171875, -2.69476318359375, -2.5958251953125, -2.49688720703125, -2.39794921875, -2.29901123046875, -2.2000732421875, -2.10113525390625, -2.002197265625, -1.90325927734375, -1.8043212890625, -1.70538330078125, -1.6064453125, -1.50750732421875, -1.4085693359375, -1.30963134765625, -1.210693359375, -1.11175537109375, -1.0128173828125, -0.91387939453125, -0.81494140625, -0.71600341796875, -0.6170654296875, -0.51812744140625, -0.419189453125, -0.32025146484375, -0.2213134765625, -0.12237548828125, -0.0234375, 0.07550048828125, 0.1744384765625, 0.27337646484375, 0.372314453125, 0.47125244140625, 0.5701904296875, 0.66912841796875, 0.76806640625, 0.86700439453125, 0.9659423828125, 1.06488037109375, 1.163818359375, 1.26275634765625, 1.3616943359375, 1.46063232421875, 1.5595703125, 1.65850830078125, 1.7574462890625, 1.85638427734375, 1.955322265625, 2.05426025390625, 2.1531982421875, 2.25213623046875, 2.35107421875, 2.45001220703125, 2.5489501953125, 2.64788818359375, 2.746826171875, 2.84576416015625, 2.9447021484375, 3.04364013671875, 3.142578125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 14.0, 14.0, 21.0, 35.0, 47.0, 95.0, 116.0, 122.0, 122.0, 100.0, 95.0, 82.0, 36.0, 32.0, 27.0, 14.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47998046875, -0.463623046875, -0.447265625, -0.430908203125, -0.41455078125, -0.398193359375, -0.3818359375, -0.365478515625, -0.34912109375, -0.332763671875, -0.31640625, -0.300048828125, -0.28369140625, -0.267333984375, -0.2509765625, -0.234619140625, -0.21826171875, -0.201904296875, -0.185546875, -0.169189453125, -0.15283203125, -0.136474609375, -0.1201171875, -0.103759765625, -0.08740234375, -0.071044921875, -0.0546875, -0.038330078125, -0.02197265625, -0.005615234375, 0.0107421875, 0.027099609375, 0.04345703125, 0.059814453125, 0.076171875, 0.092529296875, 0.10888671875, 0.125244140625, 0.1416015625, 0.157958984375, 0.17431640625, 0.190673828125, 0.20703125, 0.223388671875, 0.23974609375, 0.256103515625, 0.2724609375, 0.288818359375, 0.30517578125, 0.321533203125, 0.337890625, 0.354248046875, 0.37060546875, 0.386962890625, 0.4033203125, 0.419677734375, 0.43603515625, 0.452392578125, 0.46875, 0.485107421875, 0.50146484375, 0.517822265625, 0.5341796875, 0.550537109375, 0.56689453125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 13.0, 12.0, 19.0, 21.0, 36.0, 36.0, 74.0, 85.0, 139.0, 185.0, 292.0, 519.0, 862.0, 1605.0, 3193.0, 6824.0, 16420.0, 42460.0, 117174.0, 295449.0, 332344.0, 143017.0, 51696.0, 19660.0, 8194.0, 3741.0, 1745.0, 1041.0, 552.0, 358.0, 231.0, 162.0, 110.0, 80.0, 54.0, 40.0, 22.0, 25.0, 11.0, 11.0, 11.0, 6.0, 7.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0888671875, -1.0526885986328125, -1.016510009765625, -0.9803314208984375, -0.94415283203125, -0.9079742431640625, -0.871795654296875, -0.8356170654296875, -0.7994384765625, -0.7632598876953125, -0.727081298828125, -0.6909027099609375, -0.65472412109375, -0.6185455322265625, -0.582366943359375, -0.5461883544921875, -0.510009765625, -0.4738311767578125, -0.437652587890625, -0.4014739990234375, -0.36529541015625, -0.3291168212890625, -0.292938232421875, -0.2567596435546875, -0.2205810546875, -0.1844024658203125, -0.148223876953125, -0.1120452880859375, -0.07586669921875, -0.0396881103515625, -0.003509521484375, 0.0326690673828125, 0.06884765625, 0.1050262451171875, 0.141204833984375, 0.1773834228515625, 0.21356201171875, 0.2497406005859375, 0.285919189453125, 0.3220977783203125, 0.3582763671875, 0.3944549560546875, 0.430633544921875, 0.4668121337890625, 0.50299072265625, 0.5391693115234375, 0.575347900390625, 0.6115264892578125, 0.647705078125, 0.6838836669921875, 0.720062255859375, 0.7562408447265625, 0.79241943359375, 0.8285980224609375, 0.864776611328125, 0.9009552001953125, 0.9371337890625, 0.9733123779296875, 1.009490966796875, 1.0456695556640625, 1.08184814453125, 1.1180267333984375, 1.154205322265625, 1.1903839111328125, 1.2265625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 9.0, 9.0, 7.0, 14.0, 16.0, 9.0, 22.0, 20.0, 30.0, 34.0, 29.0, 49.0, 37.0, 43.0, 39.0, 40.0, 50.0, 55.0, 61.0, 40.0, 38.0, 41.0, 45.0, 17.0, 34.0, 33.0, 28.0, 24.0, 17.0, 15.0, 22.0, 15.0, 7.0, 5.0, 7.0, 4.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.1015625, -1.0679168701171875, -1.034271240234375, -1.0006256103515625, -0.96697998046875, -0.9333343505859375, -0.899688720703125, -0.8660430908203125, -0.8323974609375, -0.7987518310546875, -0.765106201171875, -0.7314605712890625, -0.69781494140625, -0.6641693115234375, -0.630523681640625, -0.5968780517578125, -0.563232421875, -0.5295867919921875, -0.495941162109375, -0.4622955322265625, -0.42864990234375, -0.3950042724609375, -0.361358642578125, -0.3277130126953125, -0.2940673828125, -0.2604217529296875, -0.226776123046875, -0.1931304931640625, -0.15948486328125, -0.1258392333984375, -0.092193603515625, -0.0585479736328125, -0.02490234375, 0.0087432861328125, 0.042388916015625, 0.0760345458984375, 0.10968017578125, 0.1433258056640625, 0.176971435546875, 0.2106170654296875, 0.2442626953125, 0.2779083251953125, 0.311553955078125, 0.3451995849609375, 0.37884521484375, 0.4124908447265625, 0.446136474609375, 0.4797821044921875, 0.513427734375, 0.5470733642578125, 0.580718994140625, 0.6143646240234375, 0.64801025390625, 0.6816558837890625, 0.715301513671875, 0.7489471435546875, 0.7825927734375, 0.8162384033203125, 0.849884033203125, 0.8835296630859375, 0.91717529296875, 0.9508209228515625, 0.984466552734375, 1.0181121826171875, 1.0517578125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 7.0, 4.0, 10.0, 12.0, 14.0, 40.0, 47.0, 70.0, 119.0, 180.0, 338.0, 627.0, 1230.0, 2664.0, 6608.0, 20800.0, 102768.0, 661638.0, 203922.0, 31487.0, 9148.0, 3544.0, 1503.0, 741.0, 392.0, 239.0, 156.0, 78.0, 47.0, 27.0, 39.0, 15.0, 7.0, 11.0, 11.0, 6.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0693359375, -1.036590576171875, -1.00384521484375, -0.971099853515625, -0.9383544921875, -0.905609130859375, -0.87286376953125, -0.840118408203125, -0.807373046875, -0.774627685546875, -0.74188232421875, -0.709136962890625, -0.6763916015625, -0.643646240234375, -0.61090087890625, -0.578155517578125, -0.54541015625, -0.512664794921875, -0.47991943359375, -0.447174072265625, -0.4144287109375, -0.381683349609375, -0.34893798828125, -0.316192626953125, -0.283447265625, -0.250701904296875, -0.21795654296875, -0.185211181640625, -0.1524658203125, -0.119720458984375, -0.08697509765625, -0.054229736328125, -0.021484375, 0.011260986328125, 0.04400634765625, 0.076751708984375, 0.1094970703125, 0.142242431640625, 0.17498779296875, 0.207733154296875, 0.240478515625, 0.273223876953125, 0.30596923828125, 0.338714599609375, 0.3714599609375, 0.404205322265625, 0.43695068359375, 0.469696044921875, 0.50244140625, 0.535186767578125, 0.56793212890625, 0.600677490234375, 0.6334228515625, 0.666168212890625, 0.69891357421875, 0.731658935546875, 0.764404296875, 0.797149658203125, 0.82989501953125, 0.862640380859375, 0.8953857421875, 0.928131103515625, 0.96087646484375, 0.993621826171875, 1.0263671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 5.0, 6.0, 7.0, 9.0, 12.0, 11.0, 21.0, 21.0, 31.0, 49.0, 69.0, 77.0, 127.0, 142.0, 101.0, 80.0, 49.0, 54.0, 25.0, 25.0, 13.0, 12.0, 14.0, 10.0, 10.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0001386404037475586, -0.00013392791152000427, -0.00012921541929244995, -0.00012450292706489563, -0.00011979043483734131, -0.00011507794260978699, -0.00011036545038223267, -0.00010565295815467834, -0.00010094046592712402, -9.62279736995697e-05, -9.151548147201538e-05, -8.680298924446106e-05, -8.209049701690674e-05, -7.737800478935242e-05, -7.26655125617981e-05, -6.795302033424377e-05, -6.324052810668945e-05, -5.852803587913513e-05, -5.381554365158081e-05, -4.910305142402649e-05, -4.439055919647217e-05, -3.967806696891785e-05, -3.4965574741363525e-05, -3.0253082513809204e-05, -2.5540590286254883e-05, -2.082809805870056e-05, -1.611560583114624e-05, -1.1403113603591919e-05, -6.690621376037598e-06, -1.9781291484832764e-06, 2.734363079071045e-06, 7.446855306625366e-06, 1.2159347534179688e-05, 1.687183976173401e-05, 2.158433198928833e-05, 2.629682421684265e-05, 3.100931644439697e-05, 3.5721808671951294e-05, 4.0434300899505615e-05, 4.5146793127059937e-05, 4.985928535461426e-05, 5.457177758216858e-05, 5.92842698097229e-05, 6.399676203727722e-05, 6.870925426483154e-05, 7.342174649238586e-05, 7.813423871994019e-05, 8.284673094749451e-05, 8.755922317504883e-05, 9.227171540260315e-05, 9.698420763015747e-05, 0.00010169669985771179, 0.00010640919208526611, 0.00011112168431282043, 0.00011583417654037476, 0.00012054666876792908, 0.0001252591609954834, 0.00012997165322303772, 0.00013468414545059204, 0.00013939663767814636, 0.00014410912990570068, 0.000148821622133255, 0.00015353411436080933, 0.00015824660658836365, 0.00016295909881591797]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 15.0, 8.0, 21.0, 39.0, 68.0, 126.0, 258.0, 570.0, 1640.0, 5671.0, 30867.0, 754638.0, 233066.0, 16004.0, 3560.0, 1085.0, 457.0, 192.0, 109.0, 44.0, 43.0, 23.0, 10.0, 9.0, 11.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.26171875, -2.19677734375, -2.1318359375, -2.06689453125, -2.001953125, -1.93701171875, -1.8720703125, -1.80712890625, -1.7421875, -1.67724609375, -1.6123046875, -1.54736328125, -1.482421875, -1.41748046875, -1.3525390625, -1.28759765625, -1.22265625, -1.15771484375, -1.0927734375, -1.02783203125, -0.962890625, -0.89794921875, -0.8330078125, -0.76806640625, -0.703125, -0.63818359375, -0.5732421875, -0.50830078125, -0.443359375, -0.37841796875, -0.3134765625, -0.24853515625, -0.18359375, -0.11865234375, -0.0537109375, 0.01123046875, 0.076171875, 0.14111328125, 0.2060546875, 0.27099609375, 0.3359375, 0.40087890625, 0.4658203125, 0.53076171875, 0.595703125, 0.66064453125, 0.7255859375, 0.79052734375, 0.85546875, 0.92041015625, 0.9853515625, 1.05029296875, 1.115234375, 1.18017578125, 1.2451171875, 1.31005859375, 1.375, 1.43994140625, 1.5048828125, 1.56982421875, 1.634765625, 1.69970703125, 1.7646484375, 1.82958984375, 1.89453125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 4.0, 12.0, 7.0, 10.0, 15.0, 14.0, 12.0, 14.0, 29.0, 55.0, 76.0, 100.0, 127.0, 143.0, 125.0, 78.0, 47.0, 40.0, 26.0, 17.0, 16.0, 6.0, 4.0, 7.0, 2.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91162109375, -0.8832244873046875, -0.854827880859375, -0.8264312744140625, -0.79803466796875, -0.7696380615234375, -0.741241455078125, -0.7128448486328125, -0.6844482421875, -0.6560516357421875, -0.627655029296875, -0.5992584228515625, -0.57086181640625, -0.5424652099609375, -0.514068603515625, -0.4856719970703125, -0.457275390625, -0.4288787841796875, -0.400482177734375, -0.3720855712890625, -0.34368896484375, -0.3152923583984375, -0.286895751953125, -0.2584991455078125, -0.2301025390625, -0.2017059326171875, -0.173309326171875, -0.1449127197265625, -0.11651611328125, -0.0881195068359375, -0.059722900390625, -0.0313262939453125, -0.0029296875, 0.0254669189453125, 0.053863525390625, 0.0822601318359375, 0.11065673828125, 0.1390533447265625, 0.167449951171875, 0.1958465576171875, 0.2242431640625, 0.2526397705078125, 0.281036376953125, 0.3094329833984375, 0.33782958984375, 0.3662261962890625, 0.394622802734375, 0.4230194091796875, 0.451416015625, 0.4798126220703125, 0.508209228515625, 0.5366058349609375, 0.56500244140625, 0.5933990478515625, 0.621795654296875, 0.6501922607421875, 0.6785888671875, 0.7069854736328125, 0.735382080078125, 0.7637786865234375, 0.79217529296875, 0.8205718994140625, 0.848968505859375, 0.8773651123046875, 0.90576171875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 9.0, 10.0, 23.0, 32.0, 40.0, 59.0, 113.0, 111.0, 144.0, 141.0, 117.0, 79.0, 38.0, 36.0, 20.0, 7.0, 11.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.018125534057617, -12.676589012145996, -12.335051536560059, -11.993515014648438, -11.651978492736816, -11.310441970825195, -10.968904495239258, -10.627367973327637, -10.285831451416016, -9.944294929504395, -9.602757453918457, -9.261220932006836, -8.919684410095215, -8.578147888183594, -8.236610412597656, -7.895073890686035, -7.553536415100098, -7.211999416351318, -6.870462894439697, -6.528925895690918, -6.187389373779297, -5.845852375030518, -5.504315376281738, -5.162778854370117, -4.821241855621338, -4.479704856872559, -4.1381683349609375, -3.796631336212158, -3.455094575881958, -3.113557815551758, -2.7720208168029785, -2.4304840564727783, -2.0889463424682617, -1.7474095821380615, -1.4058727025985718, -1.064335823059082, -0.7227990627288818, -0.38126230239868164, -0.039725303649902344, 0.30181145668029785, 0.643348217010498, 0.984885036945343, 1.326421856880188, 1.6679587364196777, 2.009495496749878, 2.351032257080078, 2.6925692558288574, 3.0341060161590576, 3.375642776489258, 3.717179536819458, 4.058716297149658, 4.4002532958984375, 4.741789817810059, 5.083326816558838, 5.424863815307617, 5.766400337219238, 6.107937335968018, 6.449474334716797, 6.791010856628418, 7.132547855377197, 7.474084854125977, 7.815621376037598, 8.157157897949219, 8.498695373535156, 8.840231895446777]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 5.0, 11.0, 13.0, 12.0, 12.0, 22.0, 17.0, 28.0, 15.0, 24.0, 16.0, 23.0, 27.0, 32.0, 31.0, 31.0, 43.0, 31.0, 35.0, 46.0, 36.0, 29.0, 48.0, 34.0, 38.0, 33.0, 40.0, 27.0, 33.0, 24.0, 32.0, 21.0, 22.0, 21.0, 13.0, 8.0, 11.0, 10.0, 7.0, 3.0, 5.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.346571445465088, -5.179823875427246, -5.013076305389404, -4.8463287353515625, -4.679581165313721, -4.512833595275879, -4.346086025238037, -4.179338455200195, -4.0125908851623535, -3.8458433151245117, -3.67909574508667, -3.512348175048828, -3.3456006050109863, -3.1788530349731445, -3.0121054649353027, -2.845357894897461, -2.678610324859619, -2.5118627548217773, -2.3451151847839355, -2.1783676147460938, -2.011620044708252, -1.8448724746704102, -1.6781249046325684, -1.5113773345947266, -1.3446297645568848, -1.177882194519043, -1.0111346244812012, -0.8443870544433594, -0.6776394844055176, -0.5108919143676758, -0.344144344329834, -0.1773967742919922, -0.010649681091308594, 0.1560978889465332, 0.322845458984375, 0.4895930290222168, 0.6563405990600586, 0.8230881690979004, 0.9898357391357422, 1.156583309173584, 1.3233308792114258, 1.4900784492492676, 1.6568260192871094, 1.8235735893249512, 1.990321159362793, 2.1570687294006348, 2.3238162994384766, 2.4905638694763184, 2.65731143951416, 2.824059009552002, 2.9908065795898438, 3.1575541496276855, 3.3243017196655273, 3.491049289703369, 3.657796859741211, 3.8245444297790527, 3.9912919998168945, 4.158039569854736, 4.324787139892578, 4.49153470993042, 4.658282279968262, 4.8250298500061035, 4.991777420043945, 5.158524990081787, 5.325272560119629]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 7.0, 7.0, 8.0, 6.0, 10.0, 8.0, 22.0, 22.0, 34.0, 82.0, 138.0, 338.0, 925.0, 3384.0, 19195.0, 3827233.0, 326171.0, 12301.0, 2553.0, 831.0, 365.0, 197.0, 122.0, 83.0, 61.0, 37.0, 35.0, 26.0, 22.0, 21.0, 13.0, 7.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.37109375, -5.212646484375, -5.05419921875, -4.895751953125, -4.7373046875, -4.578857421875, -4.42041015625, -4.261962890625, -4.103515625, -3.945068359375, -3.78662109375, -3.628173828125, -3.4697265625, -3.311279296875, -3.15283203125, -2.994384765625, -2.8359375, -2.677490234375, -2.51904296875, -2.360595703125, -2.2021484375, -2.043701171875, -1.88525390625, -1.726806640625, -1.568359375, -1.409912109375, -1.25146484375, -1.093017578125, -0.9345703125, -0.776123046875, -0.61767578125, -0.459228515625, -0.30078125, -0.142333984375, 0.01611328125, 0.174560546875, 0.3330078125, 0.491455078125, 0.64990234375, 0.808349609375, 0.966796875, 1.125244140625, 1.28369140625, 1.442138671875, 1.6005859375, 1.759033203125, 1.91748046875, 2.075927734375, 2.234375, 2.392822265625, 2.55126953125, 2.709716796875, 2.8681640625, 3.026611328125, 3.18505859375, 3.343505859375, 3.501953125, 3.660400390625, 3.81884765625, 3.977294921875, 4.1357421875, 4.294189453125, 4.45263671875, 4.611083984375, 4.76953125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 5.0, 11.0, 29.0, 33.0, 56.0, 68.0, 89.0, 103.0, 108.0, 84.0, 112.0, 76.0, 77.0, 42.0, 37.0, 23.0, 11.0, 11.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.448486328125, -0.4330406188964844, -0.41759490966796875, -0.4021492004394531, -0.3867034912109375, -0.3712577819824219, -0.35581207275390625, -0.3403663635253906, -0.324920654296875, -0.3094749450683594, -0.29402923583984375, -0.2785835266113281, -0.2631378173828125, -0.24769210815429688, -0.23224639892578125, -0.21680068969726562, -0.20135498046875, -0.18590927124023438, -0.17046356201171875, -0.15501785278320312, -0.1395721435546875, -0.12412643432617188, -0.10868072509765625, -0.09323501586914062, -0.077789306640625, -0.062343597412109375, -0.04689788818359375, -0.031452178955078125, -0.0160064697265625, -0.000560760498046875, 0.01488494873046875, 0.030330657958984375, 0.0457763671875, 0.061222076416015625, 0.07666778564453125, 0.09211349487304688, 0.1075592041015625, 0.12300491333007812, 0.13845062255859375, 0.15389633178710938, 0.169342041015625, 0.18478775024414062, 0.20023345947265625, 0.21567916870117188, 0.2311248779296875, 0.24657058715820312, 0.26201629638671875, 0.2774620056152344, 0.29290771484375, 0.3083534240722656, 0.32379913330078125, 0.3392448425292969, 0.3546905517578125, 0.3701362609863281, 0.38558197021484375, 0.4010276794433594, 0.416473388671875, 0.4319190979003906, 0.44736480712890625, 0.4628105163574219, 0.4782562255859375, 0.4937019348144531, 0.5091476440429688, 0.5245933532714844, 0.5400390625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 8.0, 13.0, 27.0, 44.0, 59.0, 124.0, 236.0, 410.0, 772.0, 1561.0, 3212.0, 7509.0, 21593.0, 123156.0, 3807792.0, 186433.0, 25979.0, 8326.0, 3542.0, 1641.0, 801.0, 424.0, 258.0, 137.0, 71.0, 47.0, 32.0, 28.0, 7.0, 12.0, 7.0, 1.0, 6.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.4921875, -2.42010498046875, -2.3480224609375, -2.27593994140625, -2.203857421875, -2.13177490234375, -2.0596923828125, -1.98760986328125, -1.91552734375, -1.84344482421875, -1.7713623046875, -1.69927978515625, -1.627197265625, -1.55511474609375, -1.4830322265625, -1.41094970703125, -1.3388671875, -1.26678466796875, -1.1947021484375, -1.12261962890625, -1.050537109375, -0.97845458984375, -0.9063720703125, -0.83428955078125, -0.76220703125, -0.69012451171875, -0.6180419921875, -0.54595947265625, -0.473876953125, -0.40179443359375, -0.3297119140625, -0.25762939453125, -0.185546875, -0.11346435546875, -0.0413818359375, 0.03070068359375, 0.102783203125, 0.17486572265625, 0.2469482421875, 0.31903076171875, 0.39111328125, 0.46319580078125, 0.5352783203125, 0.60736083984375, 0.679443359375, 0.75152587890625, 0.8236083984375, 0.89569091796875, 0.9677734375, 1.03985595703125, 1.1119384765625, 1.18402099609375, 1.256103515625, 1.32818603515625, 1.4002685546875, 1.47235107421875, 1.54443359375, 1.61651611328125, 1.6885986328125, 1.76068115234375, 1.832763671875, 1.90484619140625, 1.9769287109375, 2.04901123046875, 2.12109375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 2.0, 3.0, 5.0, 7.0, 5.0, 5.0, 12.0, 10.0, 19.0, 18.0, 24.0, 46.0, 77.0, 135.0, 290.0, 1064.0, 1585.0, 337.0, 168.0, 92.0, 47.0, 23.0, 22.0, 14.0, 8.0, 8.0, 7.0, 8.0, 4.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.57568359375, -0.5565567016601562, -0.5374298095703125, -0.5183029174804688, -0.499176025390625, -0.48004913330078125, -0.4609222412109375, -0.44179534912109375, -0.42266845703125, -0.40354156494140625, -0.3844146728515625, -0.36528778076171875, -0.346160888671875, -0.32703399658203125, -0.3079071044921875, -0.28878021240234375, -0.2696533203125, -0.25052642822265625, -0.2313995361328125, -0.21227264404296875, -0.193145751953125, -0.17401885986328125, -0.1548919677734375, -0.13576507568359375, -0.11663818359375, -0.09751129150390625, -0.0783843994140625, -0.05925750732421875, -0.040130615234375, -0.02100372314453125, -0.0018768310546875, 0.01725006103515625, 0.036376953125, 0.05550384521484375, 0.0746307373046875, 0.09375762939453125, 0.112884521484375, 0.13201141357421875, 0.1511383056640625, 0.17026519775390625, 0.18939208984375, 0.20851898193359375, 0.2276458740234375, 0.24677276611328125, 0.265899658203125, 0.28502655029296875, 0.3041534423828125, 0.32328033447265625, 0.3424072265625, 0.36153411865234375, 0.3806610107421875, 0.39978790283203125, 0.418914794921875, 0.43804168701171875, 0.4571685791015625, 0.47629547119140625, 0.49542236328125, 0.5145492553710938, 0.5336761474609375, 0.5528030395507812, 0.571929931640625, 0.5910568237304688, 0.6101837158203125, 0.6293106079101562, 0.6484375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 7.0, 9.0, 13.0, 36.0, 50.0, 95.0, 179.0, 203.0, 186.0, 102.0, 52.0, 35.0, 12.0, 8.0, 10.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.484475612640381, -6.312633991241455, -6.140791893005371, -5.968950271606445, -5.7971086502075195, -5.6252665519714355, -5.45342493057251, -5.281582832336426, -5.1097412109375, -4.937899589538574, -4.76605749130249, -4.5942158699035645, -4.4223737716674805, -4.250532150268555, -4.078690528869629, -3.906848669052124, -3.735006809234619, -3.5631649494171143, -3.3913230895996094, -3.2194814682006836, -3.0476396083831787, -2.875797748565674, -2.703956127166748, -2.532114267349243, -2.3602724075317383, -2.1884305477142334, -2.0165886878967285, -1.8447470664978027, -1.6729052066802979, -1.501063346862793, -1.3292216062545776, -1.1573798656463623, -0.9855375289916992, -0.8136957287788391, -0.641853928565979, -0.4700121283531189, -0.2981703281402588, -0.12632852792739868, 0.045513272285461426, 0.21735501289367676, 0.38919687271118164, 0.5610386729240417, 0.7328804731369019, 0.904722273349762, 1.076564073562622, 1.248405933380127, 1.4202476739883423, 1.5920894145965576, 1.7639312744140625, 1.9357731342315674, 2.1076149940490723, 2.279456615447998, 2.451298475265503, 2.623140335083008, 2.7949819564819336, 2.9668238162994385, 3.1386656761169434, 3.3105075359344482, 3.482349395751953, 3.654191017150879, 3.826032876968384, 3.9978747367858887, 4.1697163581848145, 4.341558456420898, 4.513400077819824]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 9.0, 10.0, 13.0, 9.0, 16.0, 20.0, 25.0, 27.0, 38.0, 33.0, 48.0, 40.0, 40.0, 51.0, 45.0, 42.0, 54.0, 56.0, 49.0, 57.0, 52.0, 53.0, 40.0, 20.0, 27.0, 20.0, 20.0, 13.0, 14.0, 14.0, 15.0, 14.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.7820212841033936, -2.7063207626342773, -2.6306204795837402, -2.554919958114624, -2.479219675064087, -2.4035191535949707, -2.3278188705444336, -2.2521183490753174, -2.176417827606201, -2.100717306137085, -2.025017023086548, -1.9493165016174316, -1.873616099357605, -1.7979156970977783, -1.7222152948379517, -1.646514892578125, -1.5708144903182983, -1.4951140880584717, -1.419413685798645, -1.3437132835388184, -1.2680127620697021, -1.1923123598098755, -1.1166119575500488, -1.0409114360809326, -0.9652110934257507, -0.8895106911659241, -0.8138102293014526, -0.738109827041626, -0.6624094247817993, -0.5867089629173279, -0.5110085606575012, -0.4353080987930298, -0.3596076965332031, -0.2839072644710541, -0.20820684731006622, -0.13250643014907837, -0.05680599808692932, 0.018894433975219727, 0.09459483623504639, 0.17029529809951782, 0.24599570035934448, 0.32169613242149353, 0.3973965644836426, 0.47309696674346924, 0.5487973690032959, 0.6244978308677673, 0.700198233127594, 0.7758986949920654, 0.8515990972518921, 0.9272994995117188, 1.0029999017715454, 1.078700304031372, 1.1544008255004883, 1.230101227760315, 1.3058016300201416, 1.3815021514892578, 1.457202434539795, 1.5329028367996216, 1.6086032390594482, 1.6843037605285645, 1.7600041627883911, 1.8357045650482178, 1.9114049673080444, 1.987105369567871, 2.0628058910369873]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 7.0, 9.0, 18.0, 20.0, 18.0, 25.0, 43.0, 68.0, 122.0, 159.0, 283.0, 485.0, 1002.0, 2080.0, 5410.0, 18791.0, 119398.0, 629306.0, 227381.0, 31164.0, 7452.0, 2675.0, 1209.0, 552.0, 316.0, 176.0, 106.0, 89.0, 53.0, 27.0, 32.0, 15.0, 18.0, 8.0, 8.0, 7.0, 5.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.771484375, -2.681060791015625, -2.59063720703125, -2.500213623046875, -2.4097900390625, -2.319366455078125, -2.22894287109375, -2.138519287109375, -2.048095703125, -1.957672119140625, -1.86724853515625, -1.776824951171875, -1.6864013671875, -1.595977783203125, -1.50555419921875, -1.415130615234375, -1.32470703125, -1.234283447265625, -1.14385986328125, -1.053436279296875, -0.9630126953125, -0.872589111328125, -0.78216552734375, -0.691741943359375, -0.601318359375, -0.510894775390625, -0.42047119140625, -0.330047607421875, -0.2396240234375, -0.149200439453125, -0.05877685546875, 0.031646728515625, 0.1220703125, 0.212493896484375, 0.30291748046875, 0.393341064453125, 0.4837646484375, 0.574188232421875, 0.66461181640625, 0.755035400390625, 0.845458984375, 0.935882568359375, 1.02630615234375, 1.116729736328125, 1.2071533203125, 1.297576904296875, 1.38800048828125, 1.478424072265625, 1.56884765625, 1.659271240234375, 1.74969482421875, 1.840118408203125, 1.9305419921875, 2.020965576171875, 2.11138916015625, 2.201812744140625, 2.292236328125, 2.382659912109375, 2.47308349609375, 2.563507080078125, 2.6539306640625, 2.744354248046875, 2.83477783203125, 2.925201416015625, 3.015625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 10.0, 15.0, 13.0, 32.0, 34.0, 53.0, 73.0, 82.0, 90.0, 101.0, 98.0, 105.0, 79.0, 67.0, 57.0, 35.0, 21.0, 5.0, 9.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.458251953125, -0.4423789978027344, -0.42650604248046875, -0.4106330871582031, -0.3947601318359375, -0.3788871765136719, -0.36301422119140625, -0.3471412658691406, -0.331268310546875, -0.3153953552246094, -0.29952239990234375, -0.2836494445800781, -0.2677764892578125, -0.2519035339355469, -0.23603057861328125, -0.22015762329101562, -0.20428466796875, -0.18841171264648438, -0.17253875732421875, -0.15666580200195312, -0.1407928466796875, -0.12491989135742188, -0.10904693603515625, -0.09317398071289062, -0.077301025390625, -0.061428070068359375, -0.04555511474609375, -0.029682159423828125, -0.0138092041015625, 0.002063751220703125, 0.01793670654296875, 0.033809661865234375, 0.0496826171875, 0.06555557250976562, 0.08142852783203125, 0.09730148315429688, 0.1131744384765625, 0.12904739379882812, 0.14492034912109375, 0.16079330444335938, 0.176666259765625, 0.19253921508789062, 0.20841217041015625, 0.22428512573242188, 0.2401580810546875, 0.2560310363769531, 0.27190399169921875, 0.2877769470214844, 0.30364990234375, 0.3195228576660156, 0.33539581298828125, 0.3512687683105469, 0.3671417236328125, 0.3830146789550781, 0.39888763427734375, 0.4147605895996094, 0.430633544921875, 0.4465065002441406, 0.46237945556640625, 0.4782524108886719, 0.4941253662109375, 0.5099983215332031, 0.5258712768554688, 0.5417442321777344, 0.5576171875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 11.0, 17.0, 16.0, 17.0, 27.0, 42.0, 50.0, 63.0, 109.0, 161.0, 256.0, 459.0, 713.0, 1310.0, 2663.0, 5906.0, 14786.0, 40392.0, 120400.0, 317846.0, 336441.0, 133286.0, 44544.0, 16207.0, 6586.0, 2943.0, 1338.0, 739.0, 403.0, 259.0, 167.0, 97.0, 90.0, 54.0, 35.0, 36.0, 17.0, 21.0, 11.0, 6.0, 6.0, 5.0, 3.0, 6.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2236328125, -1.1842193603515625, -1.144805908203125, -1.1053924560546875, -1.06597900390625, -1.0265655517578125, -0.987152099609375, -0.9477386474609375, -0.9083251953125, -0.8689117431640625, -0.829498291015625, -0.7900848388671875, -0.75067138671875, -0.7112579345703125, -0.671844482421875, -0.6324310302734375, -0.593017578125, -0.5536041259765625, -0.514190673828125, -0.4747772216796875, -0.43536376953125, -0.3959503173828125, -0.356536865234375, -0.3171234130859375, -0.2777099609375, -0.2382965087890625, -0.198883056640625, -0.1594696044921875, -0.12005615234375, -0.0806427001953125, -0.041229248046875, -0.0018157958984375, 0.03759765625, 0.0770111083984375, 0.116424560546875, 0.1558380126953125, 0.19525146484375, 0.2346649169921875, 0.274078369140625, 0.3134918212890625, 0.3529052734375, 0.3923187255859375, 0.431732177734375, 0.4711456298828125, 0.51055908203125, 0.5499725341796875, 0.589385986328125, 0.6287994384765625, 0.668212890625, 0.7076263427734375, 0.747039794921875, 0.7864532470703125, 0.82586669921875, 0.8652801513671875, 0.904693603515625, 0.9441070556640625, 0.9835205078125, 1.0229339599609375, 1.062347412109375, 1.1017608642578125, 1.14117431640625, 1.1805877685546875, 1.220001220703125, 1.2594146728515625, 1.298828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 9.0, 10.0, 8.0, 12.0, 14.0, 15.0, 20.0, 26.0, 33.0, 40.0, 37.0, 34.0, 36.0, 46.0, 48.0, 46.0, 51.0, 37.0, 52.0, 41.0, 45.0, 46.0, 44.0, 47.0, 22.0, 29.0, 30.0, 27.0, 18.0, 18.0, 8.0, 7.0, 12.0, 9.0, 6.0, 5.0, 9.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2548828125, -1.2169036865234375, -1.178924560546875, -1.1409454345703125, -1.10296630859375, -1.0649871826171875, -1.027008056640625, -0.9890289306640625, -0.9510498046875, -0.9130706787109375, -0.875091552734375, -0.8371124267578125, -0.79913330078125, -0.7611541748046875, -0.723175048828125, -0.6851959228515625, -0.647216796875, -0.6092376708984375, -0.571258544921875, -0.5332794189453125, -0.49530029296875, -0.4573211669921875, -0.419342041015625, -0.3813629150390625, -0.3433837890625, -0.3054046630859375, -0.267425537109375, -0.2294464111328125, -0.19146728515625, -0.1534881591796875, -0.115509033203125, -0.0775299072265625, -0.03955078125, -0.0015716552734375, 0.036407470703125, 0.0743865966796875, 0.11236572265625, 0.1503448486328125, 0.188323974609375, 0.2263031005859375, 0.2642822265625, 0.3022613525390625, 0.340240478515625, 0.3782196044921875, 0.41619873046875, 0.4541778564453125, 0.492156982421875, 0.5301361083984375, 0.568115234375, 0.6060943603515625, 0.644073486328125, 0.6820526123046875, 0.72003173828125, 0.7580108642578125, 0.795989990234375, 0.8339691162109375, 0.8719482421875, 0.9099273681640625, 0.947906494140625, 0.9858856201171875, 1.02386474609375, 1.0618438720703125, 1.099822998046875, 1.1378021240234375, 1.17578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 9.0, 17.0, 37.0, 47.0, 88.0, 181.0, 313.0, 857.0, 3091.0, 20045.0, 341728.0, 640843.0, 34733.0, 4606.0, 1085.0, 396.0, 197.0, 101.0, 73.0, 40.0, 22.0, 10.0, 9.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.85546875, -1.80548095703125, -1.7554931640625, -1.70550537109375, -1.655517578125, -1.60552978515625, -1.5555419921875, -1.50555419921875, -1.45556640625, -1.40557861328125, -1.3555908203125, -1.30560302734375, -1.255615234375, -1.20562744140625, -1.1556396484375, -1.10565185546875, -1.0556640625, -1.00567626953125, -0.9556884765625, -0.90570068359375, -0.855712890625, -0.80572509765625, -0.7557373046875, -0.70574951171875, -0.65576171875, -0.60577392578125, -0.5557861328125, -0.50579833984375, -0.455810546875, -0.40582275390625, -0.3558349609375, -0.30584716796875, -0.255859375, -0.20587158203125, -0.1558837890625, -0.10589599609375, -0.055908203125, -0.00592041015625, 0.0440673828125, 0.09405517578125, 0.14404296875, 0.19403076171875, 0.2440185546875, 0.29400634765625, 0.343994140625, 0.39398193359375, 0.4439697265625, 0.49395751953125, 0.5439453125, 0.59393310546875, 0.6439208984375, 0.69390869140625, 0.743896484375, 0.79388427734375, 0.8438720703125, 0.89385986328125, 0.94384765625, 0.99383544921875, 1.0438232421875, 1.09381103515625, 1.143798828125, 1.19378662109375, 1.2437744140625, 1.29376220703125, 1.34375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 3.0, 6.0, 7.0, 12.0, 16.0, 31.0, 47.0, 76.0, 96.0, 131.0, 160.0, 136.0, 93.0, 60.0, 41.0, 24.0, 12.0, 9.0, 7.0, 5.0, 7.0, 3.0, 7.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019216537475585938, -0.00018562376499176025, -0.00017908215522766113, -0.000172540545463562, -0.0001659989356994629, -0.00015945732593536377, -0.00015291571617126465, -0.00014637410640716553, -0.0001398324966430664, -0.00013329088687896729, -0.00012674927711486816, -0.00012020766735076904, -0.00011366605758666992, -0.0001071244478225708, -0.00010058283805847168, -9.404122829437256e-05, -8.749961853027344e-05, -8.095800876617432e-05, -7.44163990020752e-05, -6.787478923797607e-05, -6.133317947387695e-05, -5.479156970977783e-05, -4.824995994567871e-05, -4.170835018157959e-05, -3.516674041748047e-05, -2.8625130653381348e-05, -2.2083520889282227e-05, -1.5541911125183105e-05, -9.000301361083984e-06, -2.4586915969848633e-06, 4.082918167114258e-06, 1.0624527931213379e-05, 1.71661376953125e-05, 2.370774745941162e-05, 3.0249357223510742e-05, 3.679096698760986e-05, 4.3332576751708984e-05, 4.9874186515808105e-05, 5.6415796279907227e-05, 6.295740604400635e-05, 6.949901580810547e-05, 7.604062557220459e-05, 8.258223533630371e-05, 8.912384510040283e-05, 9.566545486450195e-05, 0.00010220706462860107, 0.0001087486743927002, 0.00011529028415679932, 0.00012183189392089844, 0.00012837350368499756, 0.00013491511344909668, 0.0001414567232131958, 0.00014799833297729492, 0.00015453994274139404, 0.00016108155250549316, 0.00016762316226959229, 0.0001741647720336914, 0.00018070638179779053, 0.00018724799156188965, 0.00019378960132598877, 0.0002003312110900879, 0.000206872820854187, 0.00021341443061828613, 0.00021995604038238525, 0.00022649765014648438]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 8.0, 10.0, 9.0, 24.0, 46.0, 48.0, 98.0, 175.0, 471.0, 1610.0, 8752.0, 113499.0, 855823.0, 60008.0, 6007.0, 1202.0, 365.0, 178.0, 95.0, 46.0, 30.0, 18.0, 17.0, 8.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5234375, -1.465728759765625, -1.40802001953125, -1.350311279296875, -1.2926025390625, -1.234893798828125, -1.17718505859375, -1.119476318359375, -1.061767578125, -1.004058837890625, -0.94635009765625, -0.888641357421875, -0.8309326171875, -0.773223876953125, -0.71551513671875, -0.657806396484375, -0.60009765625, -0.542388916015625, -0.48468017578125, -0.426971435546875, -0.3692626953125, -0.311553955078125, -0.25384521484375, -0.196136474609375, -0.138427734375, -0.080718994140625, -0.02301025390625, 0.034698486328125, 0.0924072265625, 0.150115966796875, 0.20782470703125, 0.265533447265625, 0.3232421875, 0.380950927734375, 0.43865966796875, 0.496368408203125, 0.5540771484375, 0.611785888671875, 0.66949462890625, 0.727203369140625, 0.784912109375, 0.842620849609375, 0.90032958984375, 0.958038330078125, 1.0157470703125, 1.073455810546875, 1.13116455078125, 1.188873291015625, 1.24658203125, 1.304290771484375, 1.36199951171875, 1.419708251953125, 1.4774169921875, 1.535125732421875, 1.59283447265625, 1.650543212890625, 1.708251953125, 1.765960693359375, 1.82366943359375, 1.881378173828125, 1.9390869140625, 1.996795654296875, 2.05450439453125, 2.112213134765625, 2.169921875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 1.0, 9.0, 12.0, 20.0, 27.0, 41.0, 51.0, 85.0, 111.0, 113.0, 140.0, 133.0, 81.0, 58.0, 39.0, 32.0, 20.0, 12.0, 6.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56494140625, -0.5354843139648438, -0.5060272216796875, -0.47657012939453125, -0.447113037109375, -0.41765594482421875, -0.3881988525390625, -0.35874176025390625, -0.32928466796875, -0.29982757568359375, -0.2703704833984375, -0.24091339111328125, -0.211456298828125, -0.18199920654296875, -0.1525421142578125, -0.12308502197265625, -0.0936279296875, -0.06417083740234375, -0.0347137451171875, -0.00525665283203125, 0.024200439453125, 0.05365753173828125, 0.0831146240234375, 0.11257171630859375, 0.14202880859375, 0.17148590087890625, 0.2009429931640625, 0.23040008544921875, 0.259857177734375, 0.28931427001953125, 0.3187713623046875, 0.34822845458984375, 0.377685546875, 0.40714263916015625, 0.4365997314453125, 0.46605682373046875, 0.495513916015625, 0.5249710083007812, 0.5544281005859375, 0.5838851928710938, 0.61334228515625, 0.6427993774414062, 0.6722564697265625, 0.7017135620117188, 0.731170654296875, 0.7606277465820312, 0.7900848388671875, 0.8195419311523438, 0.8489990234375, 0.8784561157226562, 0.9079132080078125, 0.9373703002929688, 0.966827392578125, 0.9962844848632812, 1.0257415771484375, 1.0551986694335938, 1.08465576171875, 1.1141128540039062, 1.1435699462890625, 1.1730270385742188, 1.202484130859375, 1.2319412231445312, 1.2613983154296875, 1.2908554077148438, 1.3203125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 17.0, 40.0, 111.0, 216.0, 321.0, 174.0, 76.0, 32.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.068765640258789, -11.287035942077637, -10.505306243896484, -9.723577499389648, -8.941847801208496, -8.160118103027344, -7.37838888168335, -6.5966596603393555, -5.814929962158203, -5.033200263977051, -4.251471042633057, -3.4697415828704834, -2.68801212310791, -1.906282663345337, -1.1245532035827637, -0.34282398223876953, 0.4389057159423828, 1.220635175704956, 2.0023646354675293, 2.7840940952301025, 3.565823554992676, 4.347553253173828, 5.129282474517822, 5.911011695861816, 6.692741394042969, 7.474471092224121, 8.256200790405273, 9.03792953491211, 9.819659233093262, 10.601388931274414, 11.38311767578125, 12.164847373962402, 12.946578979492188, 13.72830867767334, 14.510038375854492, 15.291767120361328, 16.073497772216797, 16.855226516723633, 17.63695526123047, 18.418685913085938, 19.200414657592773, 19.98214340209961, 20.763874053955078, 21.545602798461914, 22.32733154296875, 23.10906219482422, 23.890790939331055, 24.67251968383789, 25.45425033569336, 26.235979080200195, 27.017709732055664, 27.7994384765625, 28.58116912841797, 29.362897872924805, 30.14462661743164, 30.92635726928711, 31.708086013793945, 32.48981475830078, 33.27154541015625, 34.05327606201172, 34.83500289916992, 35.61673355102539, 36.39846420288086, 37.18019104003906, 37.96192169189453]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 6.0, 4.0, 5.0, 8.0, 6.0, 13.0, 19.0, 13.0, 17.0, 19.0, 20.0, 28.0, 20.0, 29.0, 38.0, 39.0, 30.0, 41.0, 45.0, 38.0, 51.0, 32.0, 46.0, 40.0, 39.0, 46.0, 28.0, 42.0, 32.0, 23.0, 24.0, 23.0, 27.0, 17.0, 21.0, 12.0, 11.0, 9.0, 7.0, 9.0, 2.0, 5.0, 3.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.174185752868652, -5.975380897521973, -5.776576519012451, -5.5777716636657715, -5.37896728515625, -5.18016242980957, -4.981357574462891, -4.782553195953369, -4.583748817443848, -4.384943962097168, -4.1861395835876465, -3.987334728240967, -3.7885303497314453, -3.5897254943847656, -3.390920877456665, -3.1921162605285645, -2.9933114051818848, -2.794506788253784, -2.5957021713256836, -2.396897315979004, -2.1980929374694824, -1.9992882013320923, -1.8004834651947021, -1.6016788482666016, -1.402874231338501, -1.2040696144104004, -1.0052649974822998, -0.8064602613449097, -0.6076556444168091, -0.4088510274887085, -0.21004629135131836, -0.011241674423217773, 0.18756341934204102, 0.386368066072464, 0.585172712802887, 0.7839773893356323, 0.9827820062637329, 1.1815866231918335, 1.3803913593292236, 1.5791959762573242, 1.7780005931854248, 1.9768052101135254, 2.175609827041626, 2.3744144439697266, 2.5732192993164062, 2.7720236778259277, 2.9708285331726074, 3.169633150100708, 3.3684377670288086, 3.567242383956909, 3.7660470008850098, 3.9648518562316895, 4.163656234741211, 4.362461090087891, 4.56126594543457, 4.760070323944092, 4.958874702453613, 5.157679557800293, 5.3564839363098145, 5.555288791656494, 5.754093170166016, 5.952898025512695, 6.151702880859375, 6.3505072593688965, 6.549312114715576]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 9.0, 8.0, 8.0, 9.0, 11.0, 24.0, 36.0, 52.0, 80.0, 132.0, 239.0, 461.0, 1318.0, 4155.0, 18081.0, 452383.0, 3683279.0, 25534.0, 5238.0, 1654.0, 637.0, 308.0, 188.0, 113.0, 84.0, 58.0, 39.0, 30.0, 19.0, 23.0, 22.0, 9.0, 7.0, 6.0, 3.0, 6.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.69921875, -4.5614013671875, -4.423583984375, -4.2857666015625, -4.14794921875, -4.0101318359375, -3.872314453125, -3.7344970703125, -3.5966796875, -3.4588623046875, -3.321044921875, -3.1832275390625, -3.04541015625, -2.9075927734375, -2.769775390625, -2.6319580078125, -2.494140625, -2.3563232421875, -2.218505859375, -2.0806884765625, -1.94287109375, -1.8050537109375, -1.667236328125, -1.5294189453125, -1.3916015625, -1.2537841796875, -1.115966796875, -0.9781494140625, -0.84033203125, -0.7025146484375, -0.564697265625, -0.4268798828125, -0.2890625, -0.1512451171875, -0.013427734375, 0.1243896484375, 0.26220703125, 0.4000244140625, 0.537841796875, 0.6756591796875, 0.8134765625, 0.9512939453125, 1.089111328125, 1.2269287109375, 1.36474609375, 1.5025634765625, 1.640380859375, 1.7781982421875, 1.916015625, 2.0538330078125, 2.191650390625, 2.3294677734375, 2.46728515625, 2.6051025390625, 2.742919921875, 2.8807373046875, 3.0185546875, 3.1563720703125, 3.294189453125, 3.4320068359375, 3.56982421875, 3.7076416015625, 3.845458984375, 3.9832763671875, 4.12109375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 8.0, 15.0, 13.0, 21.0, 25.0, 40.0, 45.0, 68.0, 69.0, 87.0, 86.0, 86.0, 72.0, 85.0, 64.0, 61.0, 47.0, 34.0, 22.0, 9.0, 12.0, 6.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.454833984375, -0.4397926330566406, -0.42475128173828125, -0.4097099304199219, -0.3946685791015625, -0.3796272277832031, -0.36458587646484375, -0.3495445251464844, -0.334503173828125, -0.3194618225097656, -0.30442047119140625, -0.2893791198730469, -0.2743377685546875, -0.2592964172363281, -0.24425506591796875, -0.22921371459960938, -0.21417236328125, -0.19913101196289062, -0.18408966064453125, -0.16904830932617188, -0.1540069580078125, -0.13896560668945312, -0.12392425537109375, -0.10888290405273438, -0.093841552734375, -0.07880020141601562, -0.06375885009765625, -0.048717498779296875, -0.0336761474609375, -0.018634796142578125, -0.00359344482421875, 0.011447906494140625, 0.0264892578125, 0.041530609130859375, 0.05657196044921875, 0.07161331176757812, 0.0866546630859375, 0.10169601440429688, 0.11673736572265625, 0.13177871704101562, 0.146820068359375, 0.16186141967773438, 0.17690277099609375, 0.19194412231445312, 0.2069854736328125, 0.22202682495117188, 0.23706817626953125, 0.2521095275878906, 0.26715087890625, 0.2821922302246094, 0.29723358154296875, 0.3122749328613281, 0.3273162841796875, 0.3423576354980469, 0.35739898681640625, 0.3724403381347656, 0.387481689453125, 0.4025230407714844, 0.41756439208984375, 0.4326057434082031, 0.4476470947265625, 0.4626884460449219, 0.47772979736328125, 0.4927711486816406, 0.5078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 7.0, 6.0, 12.0, 11.0, 20.0, 36.0, 45.0, 72.0, 118.0, 198.0, 320.0, 545.0, 892.0, 1615.0, 3346.0, 7419.0, 19648.0, 70440.0, 1489584.0, 2484813.0, 77961.0, 21003.0, 8015.0, 3686.0, 1916.0, 1016.0, 551.0, 363.0, 199.0, 133.0, 102.0, 63.0, 41.0, 28.0, 13.0, 13.0, 10.0, 4.0, 2.0, 3.0, 2.0, 6.0, 1.0, 2.0, 1.0], "bins": [-2.365234375, -2.30303955078125, -2.2408447265625, -2.17864990234375, -2.116455078125, -2.05426025390625, -1.9920654296875, -1.92987060546875, -1.86767578125, -1.80548095703125, -1.7432861328125, -1.68109130859375, -1.618896484375, -1.55670166015625, -1.4945068359375, -1.43231201171875, -1.3701171875, -1.30792236328125, -1.2457275390625, -1.18353271484375, -1.121337890625, -1.05914306640625, -0.9969482421875, -0.93475341796875, -0.87255859375, -0.81036376953125, -0.7481689453125, -0.68597412109375, -0.623779296875, -0.56158447265625, -0.4993896484375, -0.43719482421875, -0.375, -0.31280517578125, -0.2506103515625, -0.18841552734375, -0.126220703125, -0.06402587890625, -0.0018310546875, 0.06036376953125, 0.12255859375, 0.18475341796875, 0.2469482421875, 0.30914306640625, 0.371337890625, 0.43353271484375, 0.4957275390625, 0.55792236328125, 0.6201171875, 0.68231201171875, 0.7445068359375, 0.80670166015625, 0.868896484375, 0.93109130859375, 0.9932861328125, 1.05548095703125, 1.11767578125, 1.17987060546875, 1.2420654296875, 1.30426025390625, 1.366455078125, 1.42864990234375, 1.4908447265625, 1.55303955078125, 1.615234375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 15.0, 10.0, 21.0, 40.0, 35.0, 68.0, 183.0, 468.0, 2085.0, 686.0, 180.0, 97.0, 46.0, 35.0, 20.0, 14.0, 13.0, 9.0, 7.0, 10.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94189453125, -0.9089431762695312, -0.8759918212890625, -0.8430404663085938, -0.810089111328125, -0.7771377563476562, -0.7441864013671875, -0.7112350463867188, -0.67828369140625, -0.6453323364257812, -0.6123809814453125, -0.5794296264648438, -0.546478271484375, -0.5135269165039062, -0.4805755615234375, -0.44762420654296875, -0.4146728515625, -0.38172149658203125, -0.3487701416015625, -0.31581878662109375, -0.282867431640625, -0.24991607666015625, -0.2169647216796875, -0.18401336669921875, -0.15106201171875, -0.11811065673828125, -0.0851593017578125, -0.05220794677734375, -0.019256591796875, 0.01369476318359375, 0.0466461181640625, 0.07959747314453125, 0.112548828125, 0.14550018310546875, 0.1784515380859375, 0.21140289306640625, 0.244354248046875, 0.27730560302734375, 0.3102569580078125, 0.34320831298828125, 0.37615966796875, 0.40911102294921875, 0.4420623779296875, 0.47501373291015625, 0.507965087890625, 0.5409164428710938, 0.5738677978515625, 0.6068191528320312, 0.6397705078125, 0.6727218627929688, 0.7056732177734375, 0.7386245727539062, 0.771575927734375, 0.8045272827148438, 0.8374786376953125, 0.8704299926757812, 0.90338134765625, 0.9363327026367188, 0.9692840576171875, 1.0022354125976562, 1.035186767578125, 1.0681381225585938, 1.1010894775390625, 1.1340408325195312, 1.1669921875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 36.0, 106.0, 288.0, 328.0, 148.0, 54.0, 23.0, 9.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.847047805786133, -11.43986701965332, -11.032686233520508, -10.625505447387695, -10.2183256149292, -9.811144828796387, -9.403964042663574, -8.996783256530762, -8.589603424072266, -8.182422637939453, -7.775242328643799, -7.368061542510986, -6.960881233215332, -6.5537004470825195, -6.146519660949707, -5.7393388748168945, -5.332158088684082, -4.9249773025512695, -4.517796993255615, -4.110616207122803, -3.7034356594085693, -3.296255111694336, -2.8890743255615234, -2.48189377784729, -2.0747132301330566, -1.6675326824188232, -1.2603520154953003, -0.8531713485717773, -0.44599080085754395, -0.03881025314331055, 0.36837053298950195, 0.7755510807037354, 1.1827316284179688, 1.5899121761322021, 1.997092843055725, 2.404273509979248, 2.8114540576934814, 3.218634605407715, 3.6258153915405273, 4.03299617767334, 4.440176486968994, 4.847357273101807, 5.254537582397461, 5.661718368530273, 6.068899154663086, 6.47607946395874, 6.883260250091553, 7.290440559387207, 7.6976213455200195, 8.104802131652832, 8.511982917785645, 8.91916275024414, 9.326343536376953, 9.733524322509766, 10.140705108642578, 10.54788589477539, 10.955066680908203, 11.362247467041016, 11.769428253173828, 12.17660903930664, 12.583788871765137, 12.99096965789795, 13.398150444030762, 13.805331230163574, 14.21251106262207]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 3.0, 11.0, 10.0, 17.0, 16.0, 14.0, 13.0, 17.0, 33.0, 32.0, 49.0, 33.0, 48.0, 56.0, 58.0, 57.0, 49.0, 41.0, 59.0, 54.0, 51.0, 41.0, 37.0, 43.0, 32.0, 21.0, 28.0, 22.0, 20.0, 14.0, 5.0, 8.0, 2.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.402423858642578, -3.296762228012085, -3.191100597381592, -3.0854389667510986, -2.9797773361206055, -2.874115467071533, -2.76845383644104, -2.662792205810547, -2.5571305751800537, -2.4514689445495605, -2.3458073139190674, -2.240145683288574, -2.134483814239502, -2.028822422027588, -1.9231605529785156, -1.8174989223480225, -1.7118372917175293, -1.6061756610870361, -1.500514030456543, -1.3948522806167603, -1.289190649986267, -1.183529019355774, -1.0778672695159912, -0.972205638885498, -0.8665440082550049, -0.7608823776245117, -0.6552206873893738, -0.5495589971542358, -0.4438973665237427, -0.3382357358932495, -0.23257404565811157, -0.12691235542297363, -0.02125072479248047, 0.08441093564033508, 0.19007259607315063, 0.2957342565059662, 0.40139591693878174, 0.5070575475692749, 0.6127192378044128, 0.7183809280395508, 0.824042558670044, 0.9297041893005371, 1.0353658199310303, 1.141027569770813, 1.2466892004013062, 1.3523508310317993, 1.458012580871582, 1.5636742115020752, 1.6693358421325684, 1.7749974727630615, 1.8806591033935547, 1.9863208532333374, 2.091982364654541, 2.1976442337036133, 2.3033058643341064, 2.4089674949645996, 2.5146291255950928, 2.620290756225586, 2.725952386856079, 2.8316140174865723, 2.9372758865356445, 3.0429372787475586, 3.148599147796631, 3.254260778427124, 3.359922409057617]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 2.0, 3.0, 15.0, 12.0, 11.0, 20.0, 56.0, 58.0, 80.0, 164.0, 288.0, 617.0, 1353.0, 3865.0, 15188.0, 117427.0, 792467.0, 97288.0, 13539.0, 3518.0, 1237.0, 575.0, 292.0, 167.0, 101.0, 56.0, 52.0, 37.0, 18.0, 9.0, 12.0, 9.0, 5.0, 9.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.75390625, -3.638275146484375, -3.52264404296875, -3.407012939453125, -3.2913818359375, -3.175750732421875, -3.06011962890625, -2.944488525390625, -2.828857421875, -2.713226318359375, -2.59759521484375, -2.481964111328125, -2.3663330078125, -2.250701904296875, -2.13507080078125, -2.019439697265625, -1.90380859375, -1.788177490234375, -1.67254638671875, -1.556915283203125, -1.4412841796875, -1.325653076171875, -1.21002197265625, -1.094390869140625, -0.978759765625, -0.863128662109375, -0.74749755859375, -0.631866455078125, -0.5162353515625, -0.400604248046875, -0.28497314453125, -0.169342041015625, -0.0537109375, 0.061920166015625, 0.17755126953125, 0.293182373046875, 0.4088134765625, 0.524444580078125, 0.64007568359375, 0.755706787109375, 0.871337890625, 0.986968994140625, 1.10260009765625, 1.218231201171875, 1.3338623046875, 1.449493408203125, 1.56512451171875, 1.680755615234375, 1.79638671875, 1.912017822265625, 2.02764892578125, 2.143280029296875, 2.2589111328125, 2.374542236328125, 2.49017333984375, 2.605804443359375, 2.721435546875, 2.837066650390625, 2.95269775390625, 3.068328857421875, 3.1839599609375, 3.299591064453125, 3.41522216796875, 3.530853271484375, 3.646484375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 7.0, 8.0, 19.0, 17.0, 28.0, 40.0, 58.0, 70.0, 74.0, 100.0, 86.0, 92.0, 81.0, 75.0, 74.0, 50.0, 29.0, 27.0, 19.0, 16.0, 12.0, 2.0, 2.0, 3.0, 1.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44677734375, -0.43021392822265625, -0.4136505126953125, -0.39708709716796875, -0.380523681640625, -0.36396026611328125, -0.3473968505859375, -0.33083343505859375, -0.31427001953125, -0.29770660400390625, -0.2811431884765625, -0.26457977294921875, -0.248016357421875, -0.23145294189453125, -0.2148895263671875, -0.19832611083984375, -0.1817626953125, -0.16519927978515625, -0.1486358642578125, -0.13207244873046875, -0.115509033203125, -0.09894561767578125, -0.0823822021484375, -0.06581878662109375, -0.04925537109375, -0.03269195556640625, -0.0161285400390625, 0.00043487548828125, 0.016998291015625, 0.03356170654296875, 0.0501251220703125, 0.06668853759765625, 0.083251953125, 0.09981536865234375, 0.1163787841796875, 0.13294219970703125, 0.149505615234375, 0.16606903076171875, 0.1826324462890625, 0.19919586181640625, 0.21575927734375, 0.23232269287109375, 0.2488861083984375, 0.26544952392578125, 0.282012939453125, 0.29857635498046875, 0.3151397705078125, 0.33170318603515625, 0.3482666015625, 0.36483001708984375, 0.3813934326171875, 0.39795684814453125, 0.414520263671875, 0.43108367919921875, 0.4476470947265625, 0.46421051025390625, 0.48077392578125, 0.49733734130859375, 0.5139007568359375, 0.5304641723632812, 0.547027587890625, 0.5635910034179688, 0.5801544189453125, 0.5967178344726562, 0.61328125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 6.0, 7.0, 11.0, 9.0, 8.0, 23.0, 24.0, 37.0, 65.0, 107.0, 152.0, 264.0, 549.0, 1125.0, 2496.0, 6729.0, 21732.0, 95293.0, 522385.0, 320087.0, 54820.0, 14188.0, 4674.0, 1865.0, 856.0, 440.0, 222.0, 124.0, 87.0, 51.0, 28.0, 26.0, 21.0, 10.0, 8.0, 4.0, 8.0, 1.0, 7.0, 5.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.73828125, -1.6800079345703125, -1.621734619140625, -1.5634613037109375, -1.50518798828125, -1.4469146728515625, -1.388641357421875, -1.3303680419921875, -1.2720947265625, -1.2138214111328125, -1.155548095703125, -1.0972747802734375, -1.03900146484375, -0.9807281494140625, -0.922454833984375, -0.8641815185546875, -0.805908203125, -0.7476348876953125, -0.689361572265625, -0.6310882568359375, -0.57281494140625, -0.5145416259765625, -0.456268310546875, -0.3979949951171875, -0.3397216796875, -0.2814483642578125, -0.223175048828125, -0.1649017333984375, -0.10662841796875, -0.0483551025390625, 0.009918212890625, 0.0681915283203125, 0.12646484375, 0.1847381591796875, 0.243011474609375, 0.3012847900390625, 0.35955810546875, 0.4178314208984375, 0.476104736328125, 0.5343780517578125, 0.5926513671875, 0.6509246826171875, 0.709197998046875, 0.7674713134765625, 0.82574462890625, 0.8840179443359375, 0.942291259765625, 1.0005645751953125, 1.058837890625, 1.1171112060546875, 1.175384521484375, 1.2336578369140625, 1.29193115234375, 1.3502044677734375, 1.408477783203125, 1.4667510986328125, 1.5250244140625, 1.5832977294921875, 1.641571044921875, 1.6998443603515625, 1.75811767578125, 1.8163909912109375, 1.874664306640625, 1.9329376220703125, 1.9912109375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 4.0, 5.0, 12.0, 7.0, 9.0, 17.0, 17.0, 16.0, 17.0, 16.0, 23.0, 32.0, 36.0, 38.0, 41.0, 48.0, 49.0, 42.0, 53.0, 41.0, 40.0, 43.0, 36.0, 38.0, 44.0, 44.0, 43.0, 29.0, 31.0, 19.0, 18.0, 13.0, 15.0, 13.0, 8.0, 14.0, 5.0, 7.0, 6.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2822265625, -1.2428131103515625, -1.203399658203125, -1.1639862060546875, -1.12457275390625, -1.0851593017578125, -1.045745849609375, -1.0063323974609375, -0.9669189453125, -0.9275054931640625, -0.888092041015625, -0.8486785888671875, -0.80926513671875, -0.7698516845703125, -0.730438232421875, -0.6910247802734375, -0.651611328125, -0.6121978759765625, -0.572784423828125, -0.5333709716796875, -0.49395751953125, -0.4545440673828125, -0.415130615234375, -0.3757171630859375, -0.3363037109375, -0.2968902587890625, -0.257476806640625, -0.2180633544921875, -0.17864990234375, -0.1392364501953125, -0.099822998046875, -0.0604095458984375, -0.02099609375, 0.0184173583984375, 0.057830810546875, 0.0972442626953125, 0.13665771484375, 0.1760711669921875, 0.215484619140625, 0.2548980712890625, 0.2943115234375, 0.3337249755859375, 0.373138427734375, 0.4125518798828125, 0.45196533203125, 0.4913787841796875, 0.530792236328125, 0.5702056884765625, 0.609619140625, 0.6490325927734375, 0.688446044921875, 0.7278594970703125, 0.76727294921875, 0.8066864013671875, 0.846099853515625, 0.8855133056640625, 0.9249267578125, 0.9643402099609375, 1.003753662109375, 1.0431671142578125, 1.08258056640625, 1.1219940185546875, 1.161407470703125, 1.2008209228515625, 1.240234375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 7.0, 12.0, 19.0, 15.0, 33.0, 55.0, 105.0, 228.0, 479.0, 1321.0, 4566.0, 24387.0, 355895.0, 616515.0, 35929.0, 6216.0, 1642.0, 530.0, 241.0, 125.0, 69.0, 34.0, 31.0, 20.0, 17.0, 13.0, 8.0, 4.0, 8.0, 2.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.0322265625, -0.9967498779296875, -0.961273193359375, -0.9257965087890625, -0.89031982421875, -0.8548431396484375, -0.819366455078125, -0.7838897705078125, -0.7484130859375, -0.7129364013671875, -0.677459716796875, -0.6419830322265625, -0.60650634765625, -0.5710296630859375, -0.535552978515625, -0.5000762939453125, -0.464599609375, -0.4291229248046875, -0.393646240234375, -0.3581695556640625, -0.32269287109375, -0.2872161865234375, -0.251739501953125, -0.2162628173828125, -0.1807861328125, -0.1453094482421875, -0.109832763671875, -0.0743560791015625, -0.03887939453125, -0.0034027099609375, 0.032073974609375, 0.0675506591796875, 0.10302734375, 0.1385040283203125, 0.173980712890625, 0.2094573974609375, 0.24493408203125, 0.2804107666015625, 0.315887451171875, 0.3513641357421875, 0.3868408203125, 0.4223175048828125, 0.457794189453125, 0.4932708740234375, 0.52874755859375, 0.5642242431640625, 0.599700927734375, 0.6351776123046875, 0.670654296875, 0.7061309814453125, 0.741607666015625, 0.7770843505859375, 0.81256103515625, 0.8480377197265625, 0.883514404296875, 0.9189910888671875, 0.9544677734375, 0.9899444580078125, 1.025421142578125, 1.0608978271484375, 1.09637451171875, 1.1318511962890625, 1.167327880859375, 1.2028045654296875, 1.23828125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 12.0, 13.0, 20.0, 21.0, 32.0, 72.0, 111.0, 209.0, 182.0, 114.0, 70.0, 46.0, 22.0, 21.0, 14.0, 11.0, 12.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015091896057128906, -0.00014552287757396698, -0.0001401267945766449, -0.00013473071157932281, -0.00012933462858200073, -0.00012393854558467865, -0.00011854246258735657, -0.00011314637959003448, -0.0001077502965927124, -0.00010235421359539032, -9.695813059806824e-05, -9.156204760074615e-05, -8.616596460342407e-05, -8.076988160610199e-05, -7.537379860877991e-05, -6.997771561145782e-05, -6.458163261413574e-05, -5.918554961681366e-05, -5.378946661949158e-05, -4.8393383622169495e-05, -4.299730062484741e-05, -3.760121762752533e-05, -3.220513463020325e-05, -2.6809051632881165e-05, -2.1412968635559082e-05, -1.6016885638237e-05, -1.0620802640914917e-05, -5.2247196435928345e-06, 1.7136335372924805e-07, 5.5674463510513306e-06, 1.0963529348373413e-05, 1.6359612345695496e-05, 2.1755695343017578e-05, 2.715177834033966e-05, 3.254786133766174e-05, 3.7943944334983826e-05, 4.334002733230591e-05, 4.873611032962799e-05, 5.413219332695007e-05, 5.9528276324272156e-05, 6.492435932159424e-05, 7.032044231891632e-05, 7.57165253162384e-05, 8.111260831356049e-05, 8.650869131088257e-05, 9.190477430820465e-05, 9.730085730552673e-05, 0.00010269694030284882, 0.0001080930233001709, 0.00011348910629749298, 0.00011888518929481506, 0.00012428127229213715, 0.00012967735528945923, 0.0001350734382867813, 0.0001404695212841034, 0.00014586560428142548, 0.00015126168727874756, 0.00015665777027606964, 0.00016205385327339172, 0.0001674499362707138, 0.0001728460192680359, 0.00017824210226535797, 0.00018363818526268005, 0.00018903426826000214, 0.00019443035125732422]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 7.0, 6.0, 10.0, 28.0, 24.0, 60.0, 73.0, 99.0, 193.0, 423.0, 929.0, 2782.0, 13661.0, 185350.0, 800559.0, 36331.0, 5241.0, 1496.0, 607.0, 259.0, 143.0, 96.0, 54.0, 53.0, 21.0, 15.0, 10.0, 5.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2705078125, -1.225494384765625, -1.18048095703125, -1.135467529296875, -1.0904541015625, -1.045440673828125, -1.00042724609375, -0.955413818359375, -0.910400390625, -0.865386962890625, -0.82037353515625, -0.775360107421875, -0.7303466796875, -0.685333251953125, -0.64031982421875, -0.595306396484375, -0.55029296875, -0.505279541015625, -0.46026611328125, -0.415252685546875, -0.3702392578125, -0.325225830078125, -0.28021240234375, -0.235198974609375, -0.190185546875, -0.145172119140625, -0.10015869140625, -0.055145263671875, -0.0101318359375, 0.034881591796875, 0.07989501953125, 0.124908447265625, 0.169921875, 0.214935302734375, 0.25994873046875, 0.304962158203125, 0.3499755859375, 0.394989013671875, 0.44000244140625, 0.485015869140625, 0.530029296875, 0.575042724609375, 0.62005615234375, 0.665069580078125, 0.7100830078125, 0.755096435546875, 0.80010986328125, 0.845123291015625, 0.89013671875, 0.935150146484375, 0.98016357421875, 1.025177001953125, 1.0701904296875, 1.115203857421875, 1.16021728515625, 1.205230712890625, 1.250244140625, 1.295257568359375, 1.34027099609375, 1.385284423828125, 1.4302978515625, 1.475311279296875, 1.52032470703125, 1.565338134765625, 1.6103515625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 8.0, 13.0, 18.0, 22.0, 42.0, 42.0, 93.0, 151.0, 190.0, 159.0, 97.0, 40.0, 31.0, 22.0, 21.0, 19.0, 11.0, 3.0, 6.0, 2.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.916015625, -0.8878860473632812, -0.8597564697265625, -0.8316268920898438, -0.803497314453125, -0.7753677368164062, -0.7472381591796875, -0.7191085815429688, -0.69097900390625, -0.6628494262695312, -0.6347198486328125, -0.6065902709960938, -0.578460693359375, -0.5503311157226562, -0.5222015380859375, -0.49407196044921875, -0.4659423828125, -0.43781280517578125, -0.4096832275390625, -0.38155364990234375, -0.353424072265625, -0.32529449462890625, -0.2971649169921875, -0.26903533935546875, -0.24090576171875, -0.21277618408203125, -0.1846466064453125, -0.15651702880859375, -0.128387451171875, -0.10025787353515625, -0.0721282958984375, -0.04399871826171875, -0.015869140625, 0.01226043701171875, 0.0403900146484375, 0.06851959228515625, 0.096649169921875, 0.12477874755859375, 0.1529083251953125, 0.18103790283203125, 0.20916748046875, 0.23729705810546875, 0.2654266357421875, 0.29355621337890625, 0.321685791015625, 0.34981536865234375, 0.3779449462890625, 0.40607452392578125, 0.4342041015625, 0.46233367919921875, 0.4904632568359375, 0.5185928344726562, 0.546722412109375, 0.5748519897460938, 0.6029815673828125, 0.6311111450195312, 0.65924072265625, 0.6873703002929688, 0.7154998779296875, 0.7436294555664062, 0.771759033203125, 0.7998886108398438, 0.8280181884765625, 0.8561477661132812, 0.88427734375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 11.0, 9.0, 34.0, 51.0, 89.0, 128.0, 167.0, 192.0, 143.0, 93.0, 49.0, 18.0, 13.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.13174057006836, -21.66269874572754, -21.19365692138672, -20.7246150970459, -20.255573272705078, -19.786529541015625, -19.317487716674805, -18.848445892333984, -18.379404067993164, -17.910362243652344, -17.441320419311523, -16.972278594970703, -16.503236770629883, -16.034194946289062, -15.565152168273926, -15.096109390258789, -14.627067565917969, -14.158025741577148, -13.688983917236328, -13.219941139221191, -12.750899314880371, -12.28185749053955, -11.81281566619873, -11.343772888183594, -10.87473201751709, -10.40569019317627, -9.93664836883545, -9.467605590820312, -8.998563766479492, -8.529521942138672, -8.060480117797852, -7.591437816619873, -7.1223955154418945, -6.653353691101074, -6.184311389923096, -5.715269565582275, -5.246227264404297, -4.777185440063477, -4.308143615722656, -3.8391013145446777, -3.3700592517852783, -2.901017189025879, -2.4319751262664795, -1.9629331827163696, -1.4938911199569702, -1.0248491764068604, -0.5558071136474609, -0.08676505088806152, 0.3822770118713379, 0.8513190746307373, 1.3203611373901367, 1.7894030809402466, 2.2584452629089355, 2.727487087249756, 3.1965291500091553, 3.6655712127685547, 4.134613037109375, 4.603654861450195, 5.072697162628174, 5.541738986968994, 6.010781288146973, 6.479823112487793, 6.948864936828613, 7.417907238006592, 7.88694953918457]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 4.0, 12.0, 10.0, 15.0, 14.0, 13.0, 15.0, 21.0, 23.0, 27.0, 29.0, 19.0, 35.0, 30.0, 35.0, 33.0, 35.0, 45.0, 40.0, 43.0, 31.0, 35.0, 31.0, 29.0, 38.0, 46.0, 41.0, 30.0, 33.0, 32.0, 24.0, 15.0, 18.0, 11.0, 21.0, 5.0, 10.0, 11.0, 6.0, 10.0, 4.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.049078941345215, -4.876288890838623, -4.703498363494873, -4.530708312988281, -4.357917785644531, -4.1851277351379395, -4.012337684631348, -3.8395471572875977, -3.666757106781006, -3.493966817855835, -3.321176528930664, -3.1483864784240723, -2.9755961894989014, -2.8028059005737305, -2.6300156116485596, -2.4572253227233887, -2.2844350337982178, -2.111644744873047, -1.9388545751571655, -1.7660642862319946, -1.5932741165161133, -1.4204838275909424, -1.2476935386657715, -1.0749033689498901, -0.9021130800247192, -0.7293228507041931, -0.556532621383667, -0.3837423324584961, -0.21095210313796997, -0.03816187381744385, 0.13462841510772705, 0.3074185848236084, 0.4802088737487793, 0.6529991030693054, 0.8257893323898315, 0.9985796213150024, 1.1713697910308838, 1.3441600799560547, 1.5169503688812256, 1.689740538597107, 1.8625308275222778, 2.035320997238159, 2.20811128616333, 2.380901575088501, 2.553691864013672, 2.7264819145202637, 2.8992724418640137, 3.0720624923706055, 3.2448527812957764, 3.4176430702209473, 3.590433359146118, 3.763223648071289, 3.936013698577881, 4.108803749084473, 4.281594276428223, 4.4543843269348145, 4.6271748542785645, 4.799964904785156, 4.972755432128906, 5.145545482635498, 5.318336009979248, 5.49112606048584, 5.66391658782959, 5.836706638336182, 6.009496688842773]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 12.0, 3.0, 9.0, 11.0, 13.0, 27.0, 30.0, 41.0, 75.0, 139.0, 256.0, 586.0, 1617.0, 5729.0, 37030.0, 4058061.0, 78360.0, 8462.0, 2237.0, 757.0, 307.0, 178.0, 96.0, 55.0, 50.0, 24.0, 27.0, 10.0, 26.0, 10.0, 9.0, 9.0, 8.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.609375, -4.463623046875, -4.31787109375, -4.172119140625, -4.0263671875, -3.880615234375, -3.73486328125, -3.589111328125, -3.443359375, -3.297607421875, -3.15185546875, -3.006103515625, -2.8603515625, -2.714599609375, -2.56884765625, -2.423095703125, -2.27734375, -2.131591796875, -1.98583984375, -1.840087890625, -1.6943359375, -1.548583984375, -1.40283203125, -1.257080078125, -1.111328125, -0.965576171875, -0.81982421875, -0.674072265625, -0.5283203125, -0.382568359375, -0.23681640625, -0.091064453125, 0.0546875, 0.200439453125, 0.34619140625, 0.491943359375, 0.6376953125, 0.783447265625, 0.92919921875, 1.074951171875, 1.220703125, 1.366455078125, 1.51220703125, 1.657958984375, 1.8037109375, 1.949462890625, 2.09521484375, 2.240966796875, 2.38671875, 2.532470703125, 2.67822265625, 2.823974609375, 2.9697265625, 3.115478515625, 3.26123046875, 3.406982421875, 3.552734375, 3.698486328125, 3.84423828125, 3.989990234375, 4.1357421875, 4.281494140625, 4.42724609375, 4.572998046875, 4.71875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 1.0, 4.0, 9.0, 19.0, 15.0, 20.0, 33.0, 51.0, 67.0, 68.0, 77.0, 100.0, 82.0, 89.0, 102.0, 65.0, 56.0, 47.0, 24.0, 20.0, 15.0, 18.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447021484375, -0.4301261901855469, -0.41323089599609375, -0.3963356018066406, -0.3794403076171875, -0.3625450134277344, -0.34564971923828125, -0.3287544250488281, -0.311859130859375, -0.2949638366699219, -0.27806854248046875, -0.2611732482910156, -0.2442779541015625, -0.22738265991210938, -0.21048736572265625, -0.19359207153320312, -0.17669677734375, -0.15980148315429688, -0.14290618896484375, -0.12601089477539062, -0.1091156005859375, -0.09222030639648438, -0.07532501220703125, -0.058429718017578125, -0.041534423828125, -0.024639129638671875, -0.00774383544921875, 0.009151458740234375, 0.0260467529296875, 0.042942047119140625, 0.05983734130859375, 0.07673263549804688, 0.0936279296875, 0.11052322387695312, 0.12741851806640625, 0.14431381225585938, 0.1612091064453125, 0.17810440063476562, 0.19499969482421875, 0.21189498901367188, 0.228790283203125, 0.24568557739257812, 0.26258087158203125, 0.2794761657714844, 0.2963714599609375, 0.3132667541503906, 0.33016204833984375, 0.3470573425292969, 0.36395263671875, 0.3808479309082031, 0.39774322509765625, 0.4146385192871094, 0.4315338134765625, 0.4484291076660156, 0.46532440185546875, 0.4822196960449219, 0.499114990234375, 0.5160102844238281, 0.5329055786132812, 0.5498008728027344, 0.5666961669921875, 0.5835914611816406, 0.6004867553710938, 0.6173820495605469, 0.63427734375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 13.0, 17.0, 18.0, 25.0, 55.0, 92.0, 134.0, 233.0, 383.0, 758.0, 1512.0, 3327.0, 9038.0, 39792.0, 3343764.0, 749819.0, 31198.0, 7914.0, 3072.0, 1394.0, 703.0, 382.0, 229.0, 140.0, 97.0, 60.0, 37.0, 25.0, 9.0, 12.0, 6.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.671875, -3.5750732421875, -3.478271484375, -3.3814697265625, -3.28466796875, -3.1878662109375, -3.091064453125, -2.9942626953125, -2.8974609375, -2.8006591796875, -2.703857421875, -2.6070556640625, -2.51025390625, -2.4134521484375, -2.316650390625, -2.2198486328125, -2.123046875, -2.0262451171875, -1.929443359375, -1.8326416015625, -1.73583984375, -1.6390380859375, -1.542236328125, -1.4454345703125, -1.3486328125, -1.2518310546875, -1.155029296875, -1.0582275390625, -0.96142578125, -0.8646240234375, -0.767822265625, -0.6710205078125, -0.57421875, -0.4774169921875, -0.380615234375, -0.2838134765625, -0.18701171875, -0.0902099609375, 0.006591796875, 0.1033935546875, 0.2001953125, 0.2969970703125, 0.393798828125, 0.4906005859375, 0.58740234375, 0.6842041015625, 0.781005859375, 0.8778076171875, 0.974609375, 1.0714111328125, 1.168212890625, 1.2650146484375, 1.36181640625, 1.4586181640625, 1.555419921875, 1.6522216796875, 1.7490234375, 1.8458251953125, 1.942626953125, 2.0394287109375, 2.13623046875, 2.2330322265625, 2.329833984375, 2.4266357421875, 2.5234375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 8.0, 20.0, 18.0, 27.0, 56.0, 118.0, 524.0, 2745.0, 307.0, 96.0, 48.0, 30.0, 17.0, 13.0, 8.0, 8.0, 6.0, 4.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1796875, -1.1408233642578125, -1.101959228515625, -1.0630950927734375, -1.02423095703125, -0.9853668212890625, -0.946502685546875, -0.9076385498046875, -0.8687744140625, -0.8299102783203125, -0.791046142578125, -0.7521820068359375, -0.71331787109375, -0.6744537353515625, -0.635589599609375, -0.5967254638671875, -0.557861328125, -0.5189971923828125, -0.480133056640625, -0.4412689208984375, -0.40240478515625, -0.3635406494140625, -0.324676513671875, -0.2858123779296875, -0.2469482421875, -0.2080841064453125, -0.169219970703125, -0.1303558349609375, -0.09149169921875, -0.0526275634765625, -0.013763427734375, 0.0251007080078125, 0.06396484375, 0.1028289794921875, 0.141693115234375, 0.1805572509765625, 0.21942138671875, 0.2582855224609375, 0.297149658203125, 0.3360137939453125, 0.3748779296875, 0.4137420654296875, 0.452606201171875, 0.4914703369140625, 0.53033447265625, 0.5691986083984375, 0.608062744140625, 0.6469268798828125, 0.685791015625, 0.7246551513671875, 0.763519287109375, 0.8023834228515625, 0.84124755859375, 0.8801116943359375, 0.918975830078125, 0.9578399658203125, 0.9967041015625, 1.0355682373046875, 1.074432373046875, 1.1132965087890625, 1.15216064453125, 1.1910247802734375, 1.229888916015625, 1.2687530517578125, 1.3076171875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 9.0, 21.0, 35.0, 74.0, 131.0, 218.0, 223.0, 121.0, 71.0, 33.0, 21.0, 14.0, 12.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.330661773681641, -5.115939140319824, -4.901216506958008, -4.686493396759033, -4.471770763397217, -4.2570481300354, -4.042325019836426, -3.8276023864746094, -3.612879753112793, -3.3981571197509766, -3.183434247970581, -2.9687113761901855, -2.753988742828369, -2.5392661094665527, -2.3245432376861572, -2.1098203659057617, -1.8950977325439453, -1.6803749799728394, -1.4656522274017334, -1.2509294748306274, -1.0362067222595215, -0.8214839696884155, -0.6067612171173096, -0.3920384645462036, -0.17731571197509766, 0.0374070405960083, 0.25212979316711426, 0.4668525457382202, 0.6815752983093262, 0.8962980508804321, 1.111020803451538, 1.325743556022644, 1.54046630859375, 1.755189061164856, 1.969911813735962, 2.1846346855163574, 2.399357318878174, 2.6140799522399902, 2.8288028240203857, 3.0435256958007812, 3.2582483291625977, 3.472970962524414, 3.6876938343048096, 3.902416706085205, 4.1171393394470215, 4.331861972808838, 4.5465850830078125, 4.761307716369629, 4.976030349731445, 5.190752983093262, 5.405475616455078, 5.620198726654053, 5.834921360015869, 6.0496439933776855, 6.26436710357666, 6.479089736938477, 6.693812370300293, 6.908535003662109, 7.123257637023926, 7.3379807472229, 7.552703380584717, 7.767426013946533, 7.982149124145508, 8.196871757507324, 8.41159439086914]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 9.0, 5.0, 10.0, 7.0, 10.0, 9.0, 7.0, 15.0, 12.0, 19.0, 22.0, 44.0, 35.0, 36.0, 43.0, 31.0, 47.0, 50.0, 52.0, 53.0, 51.0, 53.0, 52.0, 42.0, 39.0, 48.0, 23.0, 32.0, 21.0, 22.0, 25.0, 11.0, 12.0, 19.0, 5.0, 8.0, 6.0, 7.0, 6.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.448403835296631, -2.3606741428375244, -2.272944450378418, -2.1852149963378906, -2.097485303878784, -2.0097556114196777, -1.9220259189605713, -1.8342962265014648, -1.746566653251648, -1.6588369607925415, -1.5711073875427246, -1.4833776950836182, -1.3956480026245117, -1.3079184293746948, -1.2201887369155884, -1.1324591636657715, -1.044729471206665, -0.9569998383522034, -0.8692702054977417, -0.7815405130386353, -0.6938108801841736, -0.6060812473297119, -0.5183515548706055, -0.4306219220161438, -0.34289228916168213, -0.25516265630722046, -0.1674329936504364, -0.07970333099365234, 0.008026301860809326, 0.095755934715271, 0.18348562717437744, 0.2712152600288391, 0.3589451313018799, 0.44667476415634155, 0.5344043970108032, 0.6221340894699097, 0.7098637223243713, 0.797593355178833, 0.8853230476379395, 0.9730526804924011, 1.0607823133468628, 1.1485120058059692, 1.2362415790557861, 1.3239712715148926, 1.411700963973999, 1.499430537223816, 1.5871602296829224, 1.6748898029327393, 1.7626194953918457, 1.8503491878509521, 1.938078761100769, 2.025808334350586, 2.1135380268096924, 2.201267719268799, 2.2889974117279053, 2.3767271041870117, 2.464456558227539, 2.5521862506866455, 2.639915943145752, 2.7276453971862793, 2.8153750896453857, 2.903104782104492, 2.9908344745635986, 3.078564167022705, 3.1662938594818115]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 6.0, 11.0, 12.0, 19.0, 19.0, 22.0, 43.0, 61.0, 85.0, 170.0, 296.0, 540.0, 1234.0, 3015.0, 9783.0, 50418.0, 548556.0, 384013.0, 37128.0, 8178.0, 2621.0, 1059.0, 527.0, 262.0, 158.0, 96.0, 54.0, 37.0, 42.0, 18.0, 20.0, 13.0, 6.0, 8.0, 4.0, 2.0, 0.0, 5.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.080078125, -2.977142333984375, -2.87420654296875, -2.771270751953125, -2.6683349609375, -2.565399169921875, -2.46246337890625, -2.359527587890625, -2.256591796875, -2.153656005859375, -2.05072021484375, -1.947784423828125, -1.8448486328125, -1.741912841796875, -1.63897705078125, -1.536041259765625, -1.43310546875, -1.330169677734375, -1.22723388671875, -1.124298095703125, -1.0213623046875, -0.918426513671875, -0.81549072265625, -0.712554931640625, -0.609619140625, -0.506683349609375, -0.40374755859375, -0.300811767578125, -0.1978759765625, -0.094940185546875, 0.00799560546875, 0.110931396484375, 0.2138671875, 0.316802978515625, 0.41973876953125, 0.522674560546875, 0.6256103515625, 0.728546142578125, 0.83148193359375, 0.934417724609375, 1.037353515625, 1.140289306640625, 1.24322509765625, 1.346160888671875, 1.4490966796875, 1.552032470703125, 1.65496826171875, 1.757904052734375, 1.86083984375, 1.963775634765625, 2.06671142578125, 2.169647216796875, 2.2725830078125, 2.375518798828125, 2.47845458984375, 2.581390380859375, 2.684326171875, 2.787261962890625, 2.89019775390625, 2.993133544921875, 3.0960693359375, 3.199005126953125, 3.30194091796875, 3.404876708984375, 3.5078125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 9.0, 17.0, 28.0, 39.0, 39.0, 41.0, 60.0, 79.0, 82.0, 80.0, 89.0, 88.0, 77.0, 70.0, 58.0, 42.0, 29.0, 22.0, 8.0, 14.0, 8.0, 3.0, 4.0, 3.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.498046875, -0.48040008544921875, -0.4627532958984375, -0.44510650634765625, -0.427459716796875, -0.40981292724609375, -0.3921661376953125, -0.37451934814453125, -0.35687255859375, -0.33922576904296875, -0.3215789794921875, -0.30393218994140625, -0.286285400390625, -0.26863861083984375, -0.2509918212890625, -0.23334503173828125, -0.2156982421875, -0.19805145263671875, -0.1804046630859375, -0.16275787353515625, -0.145111083984375, -0.12746429443359375, -0.1098175048828125, -0.09217071533203125, -0.07452392578125, -0.05687713623046875, -0.0392303466796875, -0.02158355712890625, -0.003936767578125, 0.01371002197265625, 0.0313568115234375, 0.04900360107421875, 0.066650390625, 0.08429718017578125, 0.1019439697265625, 0.11959075927734375, 0.137237548828125, 0.15488433837890625, 0.1725311279296875, 0.19017791748046875, 0.20782470703125, 0.22547149658203125, 0.2431182861328125, 0.26076507568359375, 0.278411865234375, 0.29605865478515625, 0.3137054443359375, 0.33135223388671875, 0.3489990234375, 0.36664581298828125, 0.3842926025390625, 0.40193939208984375, 0.419586181640625, 0.43723297119140625, 0.4548797607421875, 0.47252655029296875, 0.49017333984375, 0.5078201293945312, 0.5254669189453125, 0.5431137084960938, 0.560760498046875, 0.5784072875976562, 0.5960540771484375, 0.6137008666992188, 0.63134765625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 1.0, 5.0, 2.0, 6.0, 9.0, 12.0, 17.0, 19.0, 26.0, 47.0, 69.0, 130.0, 251.0, 400.0, 880.0, 1791.0, 4183.0, 11441.0, 38003.0, 164196.0, 537513.0, 217914.0, 48738.0, 13768.0, 4958.0, 2127.0, 944.0, 481.0, 213.0, 150.0, 77.0, 42.0, 42.0, 21.0, 15.0, 6.0, 16.0, 8.0, 3.0, 8.0, 3.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.69140625, -1.6378631591796875, -1.584320068359375, -1.5307769775390625, -1.47723388671875, -1.4236907958984375, -1.370147705078125, -1.3166046142578125, -1.2630615234375, -1.2095184326171875, -1.155975341796875, -1.1024322509765625, -1.04888916015625, -0.9953460693359375, -0.941802978515625, -0.8882598876953125, -0.834716796875, -0.7811737060546875, -0.727630615234375, -0.6740875244140625, -0.62054443359375, -0.5670013427734375, -0.513458251953125, -0.4599151611328125, -0.4063720703125, -0.3528289794921875, -0.299285888671875, -0.2457427978515625, -0.19219970703125, -0.1386566162109375, -0.085113525390625, -0.0315704345703125, 0.02197265625, 0.0755157470703125, 0.129058837890625, 0.1826019287109375, 0.23614501953125, 0.2896881103515625, 0.343231201171875, 0.3967742919921875, 0.4503173828125, 0.5038604736328125, 0.557403564453125, 0.6109466552734375, 0.66448974609375, 0.7180328369140625, 0.771575927734375, 0.8251190185546875, 0.878662109375, 0.9322052001953125, 0.985748291015625, 1.0392913818359375, 1.09283447265625, 1.1463775634765625, 1.199920654296875, 1.2534637451171875, 1.3070068359375, 1.3605499267578125, 1.414093017578125, 1.4676361083984375, 1.52117919921875, 1.5747222900390625, 1.628265380859375, 1.6818084716796875, 1.7353515625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 16.0, 7.0, 15.0, 20.0, 17.0, 13.0, 22.0, 22.0, 31.0, 27.0, 30.0, 40.0, 43.0, 39.0, 44.0, 51.0, 45.0, 42.0, 33.0, 43.0, 32.0, 45.0, 36.0, 30.0, 31.0, 22.0, 27.0, 24.0, 15.0, 22.0, 19.0, 17.0, 9.0, 9.0, 10.0, 12.0, 4.0, 5.0, 4.0, 2.0, 0.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.24609375, -1.2064361572265625, -1.166778564453125, -1.1271209716796875, -1.08746337890625, -1.0478057861328125, -1.008148193359375, -0.9684906005859375, -0.9288330078125, -0.8891754150390625, -0.849517822265625, -0.8098602294921875, -0.77020263671875, -0.7305450439453125, -0.690887451171875, -0.6512298583984375, -0.611572265625, -0.5719146728515625, -0.532257080078125, -0.4925994873046875, -0.45294189453125, -0.4132843017578125, -0.373626708984375, -0.3339691162109375, -0.2943115234375, -0.2546539306640625, -0.214996337890625, -0.1753387451171875, -0.13568115234375, -0.0960235595703125, -0.056365966796875, -0.0167083740234375, 0.02294921875, 0.0626068115234375, 0.102264404296875, 0.1419219970703125, 0.18157958984375, 0.2212371826171875, 0.260894775390625, 0.3005523681640625, 0.3402099609375, 0.3798675537109375, 0.419525146484375, 0.4591827392578125, 0.49884033203125, 0.5384979248046875, 0.578155517578125, 0.6178131103515625, 0.657470703125, 0.6971282958984375, 0.736785888671875, 0.7764434814453125, 0.81610107421875, 0.8557586669921875, 0.895416259765625, 0.9350738525390625, 0.9747314453125, 1.0143890380859375, 1.054046630859375, 1.0937042236328125, 1.13336181640625, 1.1730194091796875, 1.212677001953125, 1.2523345947265625, 1.2919921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 10.0, 7.0, 6.0, 10.0, 21.0, 25.0, 41.0, 65.0, 116.0, 237.0, 494.0, 1063.0, 2875.0, 9265.0, 42361.0, 347531.0, 556359.0, 68435.0, 13137.0, 3902.0, 1361.0, 558.0, 292.0, 139.0, 95.0, 44.0, 36.0, 17.0, 17.0, 8.0, 7.0, 6.0, 0.0, 3.0, 8.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.7158203125, -0.6942138671875, -0.672607421875, -0.6510009765625, -0.62939453125, -0.6077880859375, -0.586181640625, -0.5645751953125, -0.54296875, -0.5213623046875, -0.499755859375, -0.4781494140625, -0.45654296875, -0.4349365234375, -0.413330078125, -0.3917236328125, -0.3701171875, -0.3485107421875, -0.326904296875, -0.3052978515625, -0.28369140625, -0.2620849609375, -0.240478515625, -0.2188720703125, -0.197265625, -0.1756591796875, -0.154052734375, -0.1324462890625, -0.11083984375, -0.0892333984375, -0.067626953125, -0.0460205078125, -0.0244140625, -0.0028076171875, 0.018798828125, 0.0404052734375, 0.06201171875, 0.0836181640625, 0.105224609375, 0.1268310546875, 0.1484375, 0.1700439453125, 0.191650390625, 0.2132568359375, 0.23486328125, 0.2564697265625, 0.278076171875, 0.2996826171875, 0.3212890625, 0.3428955078125, 0.364501953125, 0.3861083984375, 0.40771484375, 0.4293212890625, 0.450927734375, 0.4725341796875, 0.494140625, 0.5157470703125, 0.537353515625, 0.5589599609375, 0.58056640625, 0.6021728515625, 0.623779296875, 0.6453857421875, 0.6669921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 6.0, 2.0, 7.0, 10.0, 5.0, 14.0, 27.0, 30.0, 42.0, 86.0, 128.0, 171.0, 146.0, 114.0, 73.0, 33.0, 24.0, 25.0, 9.0, 12.0, 9.0, 8.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001500844955444336, -0.00014537759125232697, -0.00014067068696022034, -0.0001359637826681137, -0.00013125687837600708, -0.00012654997408390045, -0.00012184306979179382, -0.0001171361654996872, -0.00011242926120758057, -0.00010772235691547394, -0.00010301545262336731, -9.830854833126068e-05, -9.360164403915405e-05, -8.889473974704742e-05, -8.41878354549408e-05, -7.948093116283417e-05, -7.477402687072754e-05, -7.006712257862091e-05, -6.536021828651428e-05, -6.0653313994407654e-05, -5.5946409702301025e-05, -5.12395054101944e-05, -4.653260111808777e-05, -4.182569682598114e-05, -3.711879253387451e-05, -3.241188824176788e-05, -2.7704983949661255e-05, -2.2998079657554626e-05, -1.8291175365447998e-05, -1.358427107334137e-05, -8.877366781234741e-06, -4.170462489128113e-06, 5.364418029785156e-07, 5.243346095085144e-06, 9.950250387191772e-06, 1.4657154679298401e-05, 1.936405897140503e-05, 2.4070963263511658e-05, 2.8777867555618286e-05, 3.3484771847724915e-05, 3.819167613983154e-05, 4.289858043193817e-05, 4.76054847240448e-05, 5.231238901615143e-05, 5.701929330825806e-05, 6.172619760036469e-05, 6.643310189247131e-05, 7.114000618457794e-05, 7.584691047668457e-05, 8.05538147687912e-05, 8.526071906089783e-05, 8.996762335300446e-05, 9.467452764511108e-05, 9.938143193721771e-05, 0.00010408833622932434, 0.00010879524052143097, 0.0001135021448135376, 0.00011820904910564423, 0.00012291595339775085, 0.00012762285768985748, 0.0001323297619819641, 0.00013703666627407074, 0.00014174357056617737, 0.000146450474858284, 0.00015115737915039062]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 4.0, 10.0, 10.0, 14.0, 16.0, 30.0, 44.0, 59.0, 116.0, 205.0, 405.0, 941.0, 2590.0, 9051.0, 46025.0, 494516.0, 440027.0, 41778.0, 8391.0, 2452.0, 947.0, 404.0, 213.0, 111.0, 68.0, 37.0, 31.0, 13.0, 12.0, 9.0, 8.0, 3.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67822265625, -0.654815673828125, -0.63140869140625, -0.608001708984375, -0.5845947265625, -0.561187744140625, -0.53778076171875, -0.514373779296875, -0.490966796875, -0.467559814453125, -0.44415283203125, -0.420745849609375, -0.3973388671875, -0.373931884765625, -0.35052490234375, -0.327117919921875, -0.3037109375, -0.280303955078125, -0.25689697265625, -0.233489990234375, -0.2100830078125, -0.186676025390625, -0.16326904296875, -0.139862060546875, -0.116455078125, -0.093048095703125, -0.06964111328125, -0.046234130859375, -0.0228271484375, 0.000579833984375, 0.02398681640625, 0.047393798828125, 0.07080078125, 0.094207763671875, 0.11761474609375, 0.141021728515625, 0.1644287109375, 0.187835693359375, 0.21124267578125, 0.234649658203125, 0.258056640625, 0.281463623046875, 0.30487060546875, 0.328277587890625, 0.3516845703125, 0.375091552734375, 0.39849853515625, 0.421905517578125, 0.4453125, 0.468719482421875, 0.49212646484375, 0.515533447265625, 0.5389404296875, 0.562347412109375, 0.58575439453125, 0.609161376953125, 0.632568359375, 0.655975341796875, 0.67938232421875, 0.702789306640625, 0.7261962890625, 0.749603271484375, 0.77301025390625, 0.796417236328125, 0.81982421875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 4.0, 1.0, 5.0, 1.0, 8.0, 6.0, 6.0, 10.0, 11.0, 13.0, 8.0, 30.0, 22.0, 37.0, 68.0, 93.0, 98.0, 117.0, 82.0, 96.0, 85.0, 55.0, 36.0, 28.0, 25.0, 15.0, 8.0, 15.0, 4.0, 3.0, 5.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.487548828125, -0.47306060791015625, -0.4585723876953125, -0.44408416748046875, -0.429595947265625, -0.41510772705078125, -0.4006195068359375, -0.38613128662109375, -0.37164306640625, -0.35715484619140625, -0.3426666259765625, -0.32817840576171875, -0.313690185546875, -0.29920196533203125, -0.2847137451171875, -0.27022552490234375, -0.2557373046875, -0.24124908447265625, -0.2267608642578125, -0.21227264404296875, -0.197784423828125, -0.18329620361328125, -0.1688079833984375, -0.15431976318359375, -0.13983154296875, -0.12534332275390625, -0.1108551025390625, -0.09636688232421875, -0.081878662109375, -0.06739044189453125, -0.0529022216796875, -0.03841400146484375, -0.02392578125, -0.00943756103515625, 0.0050506591796875, 0.01953887939453125, 0.034027099609375, 0.04851531982421875, 0.0630035400390625, 0.07749176025390625, 0.09197998046875, 0.10646820068359375, 0.1209564208984375, 0.13544464111328125, 0.149932861328125, 0.16442108154296875, 0.1789093017578125, 0.19339752197265625, 0.2078857421875, 0.22237396240234375, 0.2368621826171875, 0.25135040283203125, 0.265838623046875, 0.28032684326171875, 0.2948150634765625, 0.30930328369140625, 0.32379150390625, 0.33827972412109375, 0.3527679443359375, 0.36725616455078125, 0.381744384765625, 0.39623260498046875, 0.4107208251953125, 0.42520904541015625, 0.439697265625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 15.0, 16.0, 33.0, 54.0, 99.0, 140.0, 179.0, 183.0, 117.0, 70.0, 52.0, 23.0, 14.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.855772018432617, -15.42529582977295, -14.994818687438965, -14.564342498779297, -14.133865356445312, -13.703389167785645, -13.27291202545166, -12.842435836791992, -12.411958694458008, -11.98148250579834, -11.551005363464355, -11.120529174804688, -10.690052032470703, -10.259575843811035, -9.82909870147705, -9.398622512817383, -8.968145370483398, -8.53766918182373, -8.107192039489746, -7.67671537399292, -7.246238708496094, -6.815762519836426, -6.385285377502441, -5.954809188842773, -5.5243330001831055, -5.093856334686279, -4.663379669189453, -4.232903003692627, -3.802426338195801, -3.3719499111175537, -2.9414732456207275, -2.5109965801239014, -2.080519676208496, -1.65004301071167, -1.2195663452148438, -0.7890897989273071, -0.35861313343048096, 0.07186341285705566, 0.5023400783538818, 0.932816743850708, 1.3632934093475342, 1.7937700748443604, 2.2242467403411865, 2.6547231674194336, 3.0851998329162598, 3.515676498413086, 3.946153163909912, 4.376629829406738, 4.8071064949035645, 5.237583160400391, 5.668059825897217, 6.098536491394043, 6.529013156890869, 6.959489822387695, 7.389966011047363, 7.820443153381348, 8.250919342041016, 8.681395530700684, 9.111872673034668, 9.542348861694336, 9.97282600402832, 10.403302192687988, 10.833779335021973, 11.26425552368164, 11.694732666015625]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 7.0, 1.0, 2.0, 6.0, 4.0, 12.0, 9.0, 9.0, 15.0, 13.0, 14.0, 20.0, 23.0, 19.0, 30.0, 26.0, 34.0, 36.0, 37.0, 45.0, 44.0, 56.0, 38.0, 51.0, 40.0, 39.0, 42.0, 43.0, 41.0, 40.0, 33.0, 27.0, 20.0, 34.0, 19.0, 14.0, 14.0, 14.0, 7.0, 6.0, 6.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.959950923919678, -5.761819362640381, -5.563688278198242, -5.365556716918945, -5.167425155639648, -4.969293594360352, -4.771162509918213, -4.573030948638916, -4.374899864196777, -4.1767683029174805, -3.9786369800567627, -3.780505657196045, -3.582374095916748, -3.3842427730560303, -3.1861114501953125, -2.9879798889160156, -2.7898483276367188, -2.591717004776001, -2.393585443496704, -2.1954541206359863, -1.997322678565979, -1.7991912364959717, -1.601059913635254, -1.4029284715652466, -1.2047970294952393, -1.006665587425232, -0.8085342049598694, -0.6104028224945068, -0.4122713804244995, -0.2141399383544922, -0.016008615493774414, 0.1821228265762329, 0.38025474548339844, 0.5783861875534058, 0.7765175700187683, 0.9746489524841309, 1.1727803945541382, 1.3709118366241455, 1.5690431594848633, 1.7671746015548706, 1.965306043624878, 2.1634373664855957, 2.3615689277648926, 2.5597002506256104, 2.757831573486328, 2.955963134765625, 3.1540944576263428, 3.3522257804870605, 3.5503573417663574, 3.748488664627075, 3.946620225906372, 4.14475154876709, 4.342883110046387, 4.541014671325684, 4.739145755767822, 4.937277317047119, 5.135408401489258, 5.333539962768555, 5.531671047210693, 5.72980260848999, 5.927934169769287, 6.126065254211426, 6.324196815490723, 6.5223283767700195, 6.720459938049316]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 11.0, 10.0, 17.0, 19.0, 13.0, 29.0, 60.0, 77.0, 160.0, 292.0, 633.0, 1548.0, 4461.0, 16604.0, 187481.0, 3927645.0, 42074.0, 8124.0, 2648.0, 1094.0, 527.0, 287.0, 148.0, 90.0, 51.0, 40.0, 28.0, 35.0, 19.0, 11.0, 10.0, 4.0, 7.0, 4.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.375, -4.2393798828125, -4.103759765625, -3.9681396484375, -3.83251953125, -3.6968994140625, -3.561279296875, -3.4256591796875, -3.2900390625, -3.1544189453125, -3.018798828125, -2.8831787109375, -2.74755859375, -2.6119384765625, -2.476318359375, -2.3406982421875, -2.205078125, -2.0694580078125, -1.933837890625, -1.7982177734375, -1.66259765625, -1.5269775390625, -1.391357421875, -1.2557373046875, -1.1201171875, -0.9844970703125, -0.848876953125, -0.7132568359375, -0.57763671875, -0.4420166015625, -0.306396484375, -0.1707763671875, -0.03515625, 0.1004638671875, 0.236083984375, 0.3717041015625, 0.50732421875, 0.6429443359375, 0.778564453125, 0.9141845703125, 1.0498046875, 1.1854248046875, 1.321044921875, 1.4566650390625, 1.59228515625, 1.7279052734375, 1.863525390625, 1.9991455078125, 2.134765625, 2.2703857421875, 2.406005859375, 2.5416259765625, 2.67724609375, 2.8128662109375, 2.948486328125, 3.0841064453125, 3.2197265625, 3.3553466796875, 3.490966796875, 3.6265869140625, 3.76220703125, 3.8978271484375, 4.033447265625, 4.1690673828125, 4.3046875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 4.0, 6.0, 15.0, 32.0, 23.0, 45.0, 63.0, 65.0, 68.0, 82.0, 83.0, 74.0, 87.0, 84.0, 60.0, 58.0, 37.0, 28.0, 23.0, 16.0, 13.0, 7.0, 4.0, 6.0, 1.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5078125, -0.49040985107421875, -0.4730072021484375, -0.45560455322265625, -0.438201904296875, -0.42079925537109375, -0.4033966064453125, -0.38599395751953125, -0.36859130859375, -0.35118865966796875, -0.3337860107421875, -0.31638336181640625, -0.298980712890625, -0.28157806396484375, -0.2641754150390625, -0.24677276611328125, -0.2293701171875, -0.21196746826171875, -0.1945648193359375, -0.17716217041015625, -0.159759521484375, -0.14235687255859375, -0.1249542236328125, -0.10755157470703125, -0.09014892578125, -0.07274627685546875, -0.0553436279296875, -0.03794097900390625, -0.020538330078125, -0.00313568115234375, 0.0142669677734375, 0.03166961669921875, 0.049072265625, 0.06647491455078125, 0.0838775634765625, 0.10128021240234375, 0.118682861328125, 0.13608551025390625, 0.1534881591796875, 0.17089080810546875, 0.18829345703125, 0.20569610595703125, 0.2230987548828125, 0.24050140380859375, 0.257904052734375, 0.27530670166015625, 0.2927093505859375, 0.31011199951171875, 0.3275146484375, 0.34491729736328125, 0.3623199462890625, 0.37972259521484375, 0.397125244140625, 0.41452789306640625, 0.4319305419921875, 0.44933319091796875, 0.46673583984375, 0.48413848876953125, 0.5015411376953125, 0.5189437866210938, 0.536346435546875, 0.5537490844726562, 0.5711517333984375, 0.5885543823242188, 0.60595703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 7.0, 9.0, 17.0, 21.0, 41.0, 64.0, 84.0, 147.0, 245.0, 403.0, 645.0, 1226.0, 2224.0, 4301.0, 9600.0, 24731.0, 98217.0, 3522723.0, 448675.0, 51024.0, 16115.0, 6707.0, 3149.0, 1653.0, 901.0, 534.0, 292.0, 191.0, 124.0, 72.0, 48.0, 31.0, 35.0, 12.0, 6.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.72265625, -2.6506195068359375, -2.578582763671875, -2.5065460205078125, -2.43450927734375, -2.3624725341796875, -2.290435791015625, -2.2183990478515625, -2.1463623046875, -2.0743255615234375, -2.002288818359375, -1.9302520751953125, -1.85821533203125, -1.7861785888671875, -1.714141845703125, -1.6421051025390625, -1.570068359375, -1.4980316162109375, -1.425994873046875, -1.3539581298828125, -1.28192138671875, -1.2098846435546875, -1.137847900390625, -1.0658111572265625, -0.9937744140625, -0.9217376708984375, -0.849700927734375, -0.7776641845703125, -0.70562744140625, -0.6335906982421875, -0.561553955078125, -0.4895172119140625, -0.41748046875, -0.3454437255859375, -0.273406982421875, -0.2013702392578125, -0.12933349609375, -0.0572967529296875, 0.014739990234375, 0.0867767333984375, 0.1588134765625, 0.2308502197265625, 0.302886962890625, 0.3749237060546875, 0.44696044921875, 0.5189971923828125, 0.591033935546875, 0.6630706787109375, 0.735107421875, 0.8071441650390625, 0.879180908203125, 0.9512176513671875, 1.02325439453125, 1.0952911376953125, 1.167327880859375, 1.2393646240234375, 1.3114013671875, 1.3834381103515625, 1.455474853515625, 1.5275115966796875, 1.59954833984375, 1.6715850830078125, 1.743621826171875, 1.8156585693359375, 1.8876953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 6.0, 7.0, 2.0, 6.0, 6.0, 12.0, 7.0, 19.0, 22.0, 30.0, 59.0, 62.0, 123.0, 341.0, 2366.0, 577.0, 174.0, 92.0, 44.0, 35.0, 21.0, 14.0, 10.0, 9.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0146484375, -0.9853744506835938, -0.9561004638671875, -0.9268264770507812, -0.897552490234375, -0.8682785034179688, -0.8390045166015625, -0.8097305297851562, -0.78045654296875, -0.7511825561523438, -0.7219085693359375, -0.6926345825195312, -0.663360595703125, -0.6340866088867188, -0.6048126220703125, -0.5755386352539062, -0.5462646484375, -0.5169906616210938, -0.4877166748046875, -0.45844268798828125, -0.429168701171875, -0.39989471435546875, -0.3706207275390625, -0.34134674072265625, -0.31207275390625, -0.28279876708984375, -0.2535247802734375, -0.22425079345703125, -0.194976806640625, -0.16570281982421875, -0.1364288330078125, -0.10715484619140625, -0.077880859375, -0.04860687255859375, -0.0193328857421875, 0.00994110107421875, 0.039215087890625, 0.06848907470703125, 0.0977630615234375, 0.12703704833984375, 0.15631103515625, 0.18558502197265625, 0.2148590087890625, 0.24413299560546875, 0.273406982421875, 0.30268096923828125, 0.3319549560546875, 0.36122894287109375, 0.3905029296875, 0.41977691650390625, 0.4490509033203125, 0.47832489013671875, 0.507598876953125, 0.5368728637695312, 0.5661468505859375, 0.5954208374023438, 0.62469482421875, 0.6539688110351562, 0.6832427978515625, 0.7125167846679688, 0.741790771484375, 0.7710647583007812, 0.8003387451171875, 0.8296127319335938, 0.85888671875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 2.0, 13.0, 20.0, 82.0, 165.0, 305.0, 260.0, 85.0, 44.0, 16.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4218854904174805, -6.096843242645264, -5.771800994873047, -5.44675874710083, -5.121716499328613, -4.7966742515563965, -4.47163200378418, -4.146589756011963, -3.821547508239746, -3.4965052604675293, -3.1714630126953125, -2.8464207649230957, -2.521378517150879, -2.196336269378662, -1.8712940216064453, -1.5462517738342285, -1.2212095260620117, -0.8961672782897949, -0.5711250305175781, -0.24608278274536133, 0.07895946502685547, 0.40400171279907227, 0.7290439605712891, 1.0540862083435059, 1.3791284561157227, 1.7041707038879395, 2.0292129516601562, 2.354255199432373, 2.67929744720459, 3.0043396949768066, 3.3293819427490234, 3.6544241905212402, 3.9794654846191406, 4.304507732391357, 4.629549980163574, 4.954592227935791, 5.279634475708008, 5.604676723480225, 5.929718971252441, 6.254761219024658, 6.579803466796875, 6.904845714569092, 7.229887962341309, 7.554930210113525, 7.879972457885742, 8.205015182495117, 8.530056953430176, 8.855098724365234, 9.18014144897461, 9.505184173583984, 9.830225944519043, 10.155267715454102, 10.480310440063477, 10.805353164672852, 11.13039493560791, 11.455436706542969, 11.780479431152344, 12.105522155761719, 12.430563926696777, 12.755605697631836, 13.080648422241211, 13.405691146850586, 13.730732917785645, 14.055774688720703, 14.380817413330078]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 2.0, 8.0, 9.0, 6.0, 8.0, 19.0, 18.0, 21.0, 18.0, 25.0, 32.0, 20.0, 41.0, 25.0, 44.0, 35.0, 34.0, 39.0, 39.0, 50.0, 45.0, 46.0, 35.0, 53.0, 45.0, 31.0, 27.0, 30.0, 36.0, 17.0, 28.0, 16.0, 14.0, 11.0, 17.0, 16.0, 6.0, 10.0, 8.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.838697671890259, -2.761110782623291, -2.6835241317749023, -2.6059372425079346, -2.528350591659546, -2.450763702392578, -2.3731770515441895, -2.2955901622772217, -2.218003273010254, -2.140416383743286, -2.0628297328948975, -1.9852429628372192, -1.907656192779541, -1.8300693035125732, -1.752482533454895, -1.6748957633972168, -1.5973091125488281, -1.51972234249115, -1.4421355724334717, -1.3645488023757935, -1.2869620323181152, -1.2093751430511475, -1.1317883729934692, -1.054201602935791, -0.9766148328781128, -0.8990280628204346, -0.8214412927627563, -0.7438544631004333, -0.6662676930427551, -0.5886809229850769, -0.5110940933227539, -0.4335073232650757, -0.35592055320739746, -0.27833378314971924, -0.20074698328971863, -0.12316019833087921, -0.045573413372039795, 0.03201335668563843, 0.10960015654563904, 0.18718695640563965, 0.26477372646331787, 0.3423604965209961, 0.4199472963809967, 0.4975340962409973, 0.5751208662986755, 0.6527076363563538, 0.7302944660186768, 0.807881236076355, 0.8854680061340332, 0.9630547761917114, 1.0406415462493896, 1.1182283163070679, 1.195815086364746, 1.2734019756317139, 1.350988745689392, 1.4285755157470703, 1.5061622858047485, 1.5837490558624268, 1.661335825920105, 1.7389225959777832, 1.816509485244751, 1.8940961360931396, 1.9716830253601074, 2.049269676208496, 2.126856565475464]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 7.0, 12.0, 11.0, 33.0, 49.0, 44.0, 88.0, 104.0, 167.0, 263.0, 445.0, 805.0, 1630.0, 3900.0, 11052.0, 43049.0, 229758.0, 566465.0, 146725.0, 29580.0, 8113.0, 3093.0, 1405.0, 685.0, 382.0, 244.0, 148.0, 92.0, 58.0, 50.0, 32.0, 21.0, 13.0, 12.0, 4.0, 4.0, 4.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9296875, -2.844451904296875, -2.75921630859375, -2.673980712890625, -2.5887451171875, -2.503509521484375, -2.41827392578125, -2.333038330078125, -2.247802734375, -2.162567138671875, -2.07733154296875, -1.992095947265625, -1.9068603515625, -1.821624755859375, -1.73638916015625, -1.651153564453125, -1.56591796875, -1.480682373046875, -1.39544677734375, -1.310211181640625, -1.2249755859375, -1.139739990234375, -1.05450439453125, -0.969268798828125, -0.884033203125, -0.798797607421875, -0.71356201171875, -0.628326416015625, -0.5430908203125, -0.457855224609375, -0.37261962890625, -0.287384033203125, -0.2021484375, -0.116912841796875, -0.03167724609375, 0.053558349609375, 0.1387939453125, 0.224029541015625, 0.30926513671875, 0.394500732421875, 0.479736328125, 0.564971923828125, 0.65020751953125, 0.735443115234375, 0.8206787109375, 0.905914306640625, 0.99114990234375, 1.076385498046875, 1.16162109375, 1.246856689453125, 1.33209228515625, 1.417327880859375, 1.5025634765625, 1.587799072265625, 1.67303466796875, 1.758270263671875, 1.843505859375, 1.928741455078125, 2.01397705078125, 2.099212646484375, 2.1844482421875, 2.269683837890625, 2.35491943359375, 2.440155029296875, 2.525390625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 4.0, 12.0, 9.0, 9.0, 20.0, 28.0, 36.0, 51.0, 51.0, 64.0, 58.0, 67.0, 89.0, 79.0, 64.0, 65.0, 55.0, 57.0, 48.0, 32.0, 24.0, 19.0, 22.0, 12.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.5283203125, -0.51129150390625, -0.4942626953125, -0.47723388671875, -0.460205078125, -0.44317626953125, -0.4261474609375, -0.40911865234375, -0.39208984375, -0.37506103515625, -0.3580322265625, -0.34100341796875, -0.323974609375, -0.30694580078125, -0.2899169921875, -0.27288818359375, -0.255859375, -0.23883056640625, -0.2218017578125, -0.20477294921875, -0.187744140625, -0.17071533203125, -0.1536865234375, -0.13665771484375, -0.11962890625, -0.10260009765625, -0.0855712890625, -0.06854248046875, -0.051513671875, -0.03448486328125, -0.0174560546875, -0.00042724609375, 0.0166015625, 0.03363037109375, 0.0506591796875, 0.06768798828125, 0.084716796875, 0.10174560546875, 0.1187744140625, 0.13580322265625, 0.15283203125, 0.16986083984375, 0.1868896484375, 0.20391845703125, 0.220947265625, 0.23797607421875, 0.2550048828125, 0.27203369140625, 0.2890625, 0.30609130859375, 0.3231201171875, 0.34014892578125, 0.357177734375, 0.37420654296875, 0.3912353515625, 0.40826416015625, 0.42529296875, 0.44232177734375, 0.4593505859375, 0.47637939453125, 0.493408203125, 0.51043701171875, 0.5274658203125, 0.54449462890625, 0.5615234375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 7.0, 8.0, 9.0, 20.0, 21.0, 27.0, 31.0, 48.0, 92.0, 122.0, 197.0, 238.0, 428.0, 667.0, 1175.0, 2054.0, 3973.0, 8227.0, 18135.0, 42032.0, 107004.0, 266111.0, 335961.0, 154835.0, 60106.0, 24725.0, 10814.0, 5128.0, 2685.0, 1375.0, 847.0, 490.0, 312.0, 199.0, 137.0, 78.0, 61.0, 51.0, 30.0, 22.0, 15.0, 14.0, 9.0, 11.0, 9.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1826171875, -1.1434478759765625, -1.104278564453125, -1.0651092529296875, -1.02593994140625, -0.9867706298828125, -0.947601318359375, -0.9084320068359375, -0.8692626953125, -0.8300933837890625, -0.790924072265625, -0.7517547607421875, -0.71258544921875, -0.6734161376953125, -0.634246826171875, -0.5950775146484375, -0.555908203125, -0.5167388916015625, -0.477569580078125, -0.4384002685546875, -0.39923095703125, -0.3600616455078125, -0.320892333984375, -0.2817230224609375, -0.2425537109375, -0.2033843994140625, -0.164215087890625, -0.1250457763671875, -0.08587646484375, -0.0467071533203125, -0.007537841796875, 0.0316314697265625, 0.07080078125, 0.1099700927734375, 0.149139404296875, 0.1883087158203125, 0.22747802734375, 0.2666473388671875, 0.305816650390625, 0.3449859619140625, 0.3841552734375, 0.4233245849609375, 0.462493896484375, 0.5016632080078125, 0.54083251953125, 0.5800018310546875, 0.619171142578125, 0.6583404541015625, 0.697509765625, 0.7366790771484375, 0.775848388671875, 0.8150177001953125, 0.85418701171875, 0.8933563232421875, 0.932525634765625, 0.9716949462890625, 1.0108642578125, 1.0500335693359375, 1.089202880859375, 1.1283721923828125, 1.16754150390625, 1.2067108154296875, 1.245880126953125, 1.2850494384765625, 1.32421875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 11.0, 12.0, 12.0, 13.0, 18.0, 25.0, 16.0, 27.0, 30.0, 30.0, 37.0, 42.0, 37.0, 47.0, 50.0, 57.0, 38.0, 56.0, 52.0, 46.0, 44.0, 47.0, 31.0, 30.0, 26.0, 17.0, 24.0, 19.0, 20.0, 24.0, 16.0, 12.0, 6.0, 2.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6904296875, -1.6351470947265625, -1.579864501953125, -1.5245819091796875, -1.46929931640625, -1.4140167236328125, -1.358734130859375, -1.3034515380859375, -1.2481689453125, -1.1928863525390625, -1.137603759765625, -1.0823211669921875, -1.02703857421875, -0.9717559814453125, -0.916473388671875, -0.8611907958984375, -0.805908203125, -0.7506256103515625, -0.695343017578125, -0.6400604248046875, -0.58477783203125, -0.5294952392578125, -0.474212646484375, -0.4189300537109375, -0.3636474609375, -0.3083648681640625, -0.253082275390625, -0.1977996826171875, -0.14251708984375, -0.0872344970703125, -0.031951904296875, 0.0233306884765625, 0.07861328125, 0.1338958740234375, 0.189178466796875, 0.2444610595703125, 0.29974365234375, 0.3550262451171875, 0.410308837890625, 0.4655914306640625, 0.5208740234375, 0.5761566162109375, 0.631439208984375, 0.6867218017578125, 0.74200439453125, 0.7972869873046875, 0.852569580078125, 0.9078521728515625, 0.963134765625, 1.0184173583984375, 1.073699951171875, 1.1289825439453125, 1.18426513671875, 1.2395477294921875, 1.294830322265625, 1.3501129150390625, 1.4053955078125, 1.4606781005859375, 1.515960693359375, 1.5712432861328125, 1.62652587890625, 1.6818084716796875, 1.737091064453125, 1.7923736572265625, 1.84765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 10.0, 7.0, 11.0, 10.0, 20.0, 35.0, 68.0, 101.0, 174.0, 265.0, 495.0, 956.0, 1999.0, 5078.0, 17794.0, 106133.0, 694279.0, 183555.0, 26045.0, 6649.0, 2360.0, 1136.0, 555.0, 337.0, 185.0, 102.0, 67.0, 45.0, 35.0, 21.0, 10.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.23828125, -1.2044677734375, -1.170654296875, -1.1368408203125, -1.10302734375, -1.0692138671875, -1.035400390625, -1.0015869140625, -0.9677734375, -0.9339599609375, -0.900146484375, -0.8663330078125, -0.83251953125, -0.7987060546875, -0.764892578125, -0.7310791015625, -0.697265625, -0.6634521484375, -0.629638671875, -0.5958251953125, -0.56201171875, -0.5281982421875, -0.494384765625, -0.4605712890625, -0.4267578125, -0.3929443359375, -0.359130859375, -0.3253173828125, -0.29150390625, -0.2576904296875, -0.223876953125, -0.1900634765625, -0.15625, -0.1224365234375, -0.088623046875, -0.0548095703125, -0.02099609375, 0.0128173828125, 0.046630859375, 0.0804443359375, 0.1142578125, 0.1480712890625, 0.181884765625, 0.2156982421875, 0.24951171875, 0.2833251953125, 0.317138671875, 0.3509521484375, 0.384765625, 0.4185791015625, 0.452392578125, 0.4862060546875, 0.52001953125, 0.5538330078125, 0.587646484375, 0.6214599609375, 0.6552734375, 0.6890869140625, 0.722900390625, 0.7567138671875, 0.79052734375, 0.8243408203125, 0.858154296875, 0.8919677734375, 0.92578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 12.0, 15.0, 16.0, 31.0, 32.0, 37.0, 50.0, 79.0, 93.0, 115.0, 122.0, 83.0, 81.0, 50.0, 41.0, 32.0, 23.0, 22.0, 11.0, 7.0, 6.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011920928955078125, -0.000115223228931427, -0.00011123716831207275, -0.0001072511076927185, -0.00010326504707336426, -9.927898645401001e-05, -9.529292583465576e-05, -9.130686521530151e-05, -8.732080459594727e-05, -8.333474397659302e-05, -7.934868335723877e-05, -7.536262273788452e-05, -7.137656211853027e-05, -6.739050149917603e-05, -6.340444087982178e-05, -5.941838026046753e-05, -5.543231964111328e-05, -5.144625902175903e-05, -4.7460198402404785e-05, -4.347413778305054e-05, -3.948807716369629e-05, -3.550201654434204e-05, -3.151595592498779e-05, -2.7529895305633545e-05, -2.3543834686279297e-05, -1.955777406692505e-05, -1.55717134475708e-05, -1.1585652828216553e-05, -7.599592208862305e-06, -3.6135315895080566e-06, 3.725290298461914e-07, 4.3585896492004395e-06, 8.344650268554688e-06, 1.2330710887908936e-05, 1.6316771507263184e-05, 2.030283212661743e-05, 2.428889274597168e-05, 2.8274953365325928e-05, 3.2261013984680176e-05, 3.6247074604034424e-05, 4.023313522338867e-05, 4.421919584274292e-05, 4.820525646209717e-05, 5.2191317081451416e-05, 5.6177377700805664e-05, 6.016343832015991e-05, 6.414949893951416e-05, 6.813555955886841e-05, 7.212162017822266e-05, 7.61076807975769e-05, 8.009374141693115e-05, 8.40798020362854e-05, 8.806586265563965e-05, 9.20519232749939e-05, 9.603798389434814e-05, 0.00010002404451370239, 0.00010401010513305664, 0.00010799616575241089, 0.00011198222637176514, 0.00011596828699111938, 0.00011995434761047363, 0.00012394040822982788, 0.00012792646884918213, 0.00013191252946853638, 0.00013589859008789062]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 9.0, 8.0, 11.0, 20.0, 22.0, 34.0, 50.0, 82.0, 155.0, 208.0, 462.0, 1000.0, 2785.0, 10472.0, 65227.0, 735368.0, 204023.0, 20978.0, 4669.0, 1549.0, 655.0, 297.0, 166.0, 89.0, 64.0, 47.0, 32.0, 17.0, 14.0, 7.0, 5.0, 6.0, 6.0, 2.0, 5.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.72265625, -1.6744232177734375, -1.626190185546875, -1.5779571533203125, -1.52972412109375, -1.4814910888671875, -1.433258056640625, -1.3850250244140625, -1.3367919921875, -1.2885589599609375, -1.240325927734375, -1.1920928955078125, -1.14385986328125, -1.0956268310546875, -1.047393798828125, -0.9991607666015625, -0.950927734375, -0.9026947021484375, -0.854461669921875, -0.8062286376953125, -0.75799560546875, -0.7097625732421875, -0.661529541015625, -0.6132965087890625, -0.5650634765625, -0.5168304443359375, -0.468597412109375, -0.4203643798828125, -0.37213134765625, -0.3238983154296875, -0.275665283203125, -0.2274322509765625, -0.17919921875, -0.1309661865234375, -0.082733154296875, -0.0345001220703125, 0.01373291015625, 0.0619659423828125, 0.110198974609375, 0.1584320068359375, 0.2066650390625, 0.2548980712890625, 0.303131103515625, 0.3513641357421875, 0.39959716796875, 0.4478302001953125, 0.496063232421875, 0.5442962646484375, 0.592529296875, 0.6407623291015625, 0.688995361328125, 0.7372283935546875, 0.78546142578125, 0.8336944580078125, 0.881927490234375, 0.9301605224609375, 0.9783935546875, 1.0266265869140625, 1.074859619140625, 1.1230926513671875, 1.17132568359375, 1.2195587158203125, 1.267791748046875, 1.3160247802734375, 1.3642578125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 1.0, 3.0, 10.0, 14.0, 12.0, 11.0, 29.0, 32.0, 64.0, 69.0, 134.0, 116.0, 138.0, 106.0, 66.0, 53.0, 40.0, 19.0, 22.0, 18.0, 10.0, 5.0, 8.0, 5.0, 6.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7939453125, -0.7579193115234375, -0.721893310546875, -0.6858673095703125, -0.64984130859375, -0.6138153076171875, -0.577789306640625, -0.5417633056640625, -0.5057373046875, -0.4697113037109375, -0.433685302734375, -0.3976593017578125, -0.36163330078125, -0.3256072998046875, -0.289581298828125, -0.2535552978515625, -0.217529296875, -0.1815032958984375, -0.145477294921875, -0.1094512939453125, -0.07342529296875, -0.0373992919921875, -0.001373291015625, 0.0346527099609375, 0.0706787109375, 0.1067047119140625, 0.142730712890625, 0.1787567138671875, 0.21478271484375, 0.2508087158203125, 0.286834716796875, 0.3228607177734375, 0.35888671875, 0.3949127197265625, 0.430938720703125, 0.4669647216796875, 0.50299072265625, 0.5390167236328125, 0.575042724609375, 0.6110687255859375, 0.6470947265625, 0.6831207275390625, 0.719146728515625, 0.7551727294921875, 0.79119873046875, 0.8272247314453125, 0.863250732421875, 0.8992767333984375, 0.935302734375, 0.9713287353515625, 1.007354736328125, 1.0433807373046875, 1.07940673828125, 1.1154327392578125, 1.151458740234375, 1.1874847412109375, 1.2235107421875, 1.2595367431640625, 1.295562744140625, 1.3315887451171875, 1.36761474609375, 1.4036407470703125, 1.439666748046875, 1.4756927490234375, 1.51171875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 10.0, 13.0, 41.0, 73.0, 171.0, 248.0, 202.0, 123.0, 67.0, 28.0, 12.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.453231811523438, -12.651277542114258, -11.849323272705078, -11.047369956970215, -10.245415687561035, -9.443461418151855, -8.641508102416992, -7.8395538330078125, -7.037599563598633, -6.235645294189453, -5.433691501617432, -4.63173770904541, -3.8297834396362305, -3.027829170227051, -2.2258753776550293, -1.4239215850830078, -0.6219673156738281, 0.17998671531677246, 0.981940746307373, 1.7838947772979736, 2.585848808288574, 3.387803077697754, 4.189756870269775, 4.991710662841797, 5.793664932250977, 6.595619201660156, 7.397572994232178, 8.1995267868042, 9.001481056213379, 9.803435325622559, 10.605388641357422, 11.407342910766602, 12.209297180175781, 13.011251449584961, 13.81320571899414, 14.615159034729004, 15.417113304138184, 16.219066619873047, 17.021020889282227, 17.822975158691406, 18.624929428100586, 19.426883697509766, 20.228837966918945, 21.030792236328125, 21.832744598388672, 22.634700775146484, 23.43665313720703, 24.23860740661621, 25.04056167602539, 25.84251594543457, 26.64447021484375, 27.44642448425293, 28.24837875366211, 29.050331115722656, 29.852285385131836, 30.654239654541016, 31.456193923950195, 32.258148193359375, 33.06010055541992, 33.862056732177734, 34.66400909423828, 35.465965270996094, 36.26791763305664, 37.06986999511719, 37.871826171875]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 11.0, 4.0, 4.0, 2.0, 13.0, 4.0, 12.0, 12.0, 11.0, 20.0, 22.0, 22.0, 23.0, 25.0, 24.0, 28.0, 41.0, 34.0, 38.0, 34.0, 38.0, 33.0, 33.0, 39.0, 41.0, 34.0, 39.0, 46.0, 35.0, 29.0, 29.0, 34.0, 26.0, 19.0, 20.0, 20.0, 18.0, 11.0, 12.0, 13.0, 10.0, 6.0, 6.0, 6.0, 9.0, 5.0, 1.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-8.649946212768555, -8.391485214233398, -8.133024215698242, -7.874563694000244, -7.616103172302246, -7.35764217376709, -7.099181175231934, -6.840720176696777, -6.582259654998779, -6.323798656463623, -6.065338134765625, -5.806877136230469, -5.5484161376953125, -5.2899556159973145, -5.031494617462158, -4.77303409576416, -4.514573097229004, -4.256112098693848, -3.9976515769958496, -3.7391905784606934, -3.480729818344116, -3.222269058227539, -2.963808059692383, -2.7053472995758057, -2.4468865394592285, -2.1884257793426514, -1.9299649000167847, -1.671504020690918, -1.4130432605743408, -1.1545825004577637, -0.896121621131897, -0.6376607418060303, -0.3791999816894531, -0.1207391619682312, 0.13772165775299072, 0.39618247747421265, 0.6546432971954346, 0.9131040573120117, 1.1715649366378784, 1.4300258159637451, 1.6884865760803223, 1.9469473361968994, 2.2054080963134766, 2.463869094848633, 2.72232985496521, 2.980790615081787, 3.2392516136169434, 3.4977123737335205, 3.7561731338500977, 4.014634132385254, 4.273094654083252, 4.531555652618408, 4.790016174316406, 5.0484771728515625, 5.306938171386719, 5.565399169921875, 5.823859691619873, 6.082320690155029, 6.340781211853027, 6.599242210388184, 6.85770320892334, 7.116163730621338, 7.374624729156494, 7.633085250854492, 7.891546249389648]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 3.0, 6.0, 7.0, 9.0, 18.0, 23.0, 26.0, 40.0, 69.0, 135.0, 221.0, 466.0, 996.0, 2392.0, 6302.0, 20065.0, 126046.0, 3900478.0, 108570.0, 18398.0, 5692.0, 2255.0, 942.0, 466.0, 248.0, 110.0, 83.0, 55.0, 44.0, 32.0, 15.0, 17.0, 15.0, 10.0, 7.0, 4.0, 3.0, 6.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.140625, -4.0205078125, -3.900390625, -3.7802734375, -3.66015625, -3.5400390625, -3.419921875, -3.2998046875, -3.1796875, -3.0595703125, -2.939453125, -2.8193359375, -2.69921875, -2.5791015625, -2.458984375, -2.3388671875, -2.21875, -2.0986328125, -1.978515625, -1.8583984375, -1.73828125, -1.6181640625, -1.498046875, -1.3779296875, -1.2578125, -1.1376953125, -1.017578125, -0.8974609375, -0.77734375, -0.6572265625, -0.537109375, -0.4169921875, -0.296875, -0.1767578125, -0.056640625, 0.0634765625, 0.18359375, 0.3037109375, 0.423828125, 0.5439453125, 0.6640625, 0.7841796875, 0.904296875, 1.0244140625, 1.14453125, 1.2646484375, 1.384765625, 1.5048828125, 1.625, 1.7451171875, 1.865234375, 1.9853515625, 2.10546875, 2.2255859375, 2.345703125, 2.4658203125, 2.5859375, 2.7060546875, 2.826171875, 2.9462890625, 3.06640625, 3.1865234375, 3.306640625, 3.4267578125, 3.546875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 9.0, 17.0, 17.0, 15.0, 17.0, 26.0, 37.0, 26.0, 51.0, 54.0, 64.0, 52.0, 69.0, 79.0, 71.0, 53.0, 50.0, 43.0, 44.0, 45.0, 41.0, 29.0, 22.0, 22.0, 11.0, 10.0, 7.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.53662109375, -0.5196609497070312, -0.5027008056640625, -0.48574066162109375, -0.468780517578125, -0.45182037353515625, -0.4348602294921875, -0.41790008544921875, -0.40093994140625, -0.38397979736328125, -0.3670196533203125, -0.35005950927734375, -0.333099365234375, -0.31613922119140625, -0.2991790771484375, -0.28221893310546875, -0.2652587890625, -0.24829864501953125, -0.2313385009765625, -0.21437835693359375, -0.197418212890625, -0.18045806884765625, -0.1634979248046875, -0.14653778076171875, -0.12957763671875, -0.11261749267578125, -0.0956573486328125, -0.07869720458984375, -0.061737060546875, -0.04477691650390625, -0.0278167724609375, -0.01085662841796875, 0.006103515625, 0.02306365966796875, 0.0400238037109375, 0.05698394775390625, 0.073944091796875, 0.09090423583984375, 0.1078643798828125, 0.12482452392578125, 0.14178466796875, 0.15874481201171875, 0.1757049560546875, 0.19266510009765625, 0.209625244140625, 0.22658538818359375, 0.2435455322265625, 0.26050567626953125, 0.2774658203125, 0.29442596435546875, 0.3113861083984375, 0.32834625244140625, 0.345306396484375, 0.36226654052734375, 0.3792266845703125, 0.39618682861328125, 0.41314697265625, 0.43010711669921875, 0.4470672607421875, 0.46402740478515625, 0.480987548828125, 0.49794769287109375, 0.5149078369140625, 0.5318679809570312, 0.548828125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 8.0, 18.0, 20.0, 31.0, 46.0, 72.0, 134.0, 207.0, 381.0, 685.0, 1373.0, 2818.0, 6995.0, 21173.0, 96751.0, 3620301.0, 379282.0, 43344.0, 12034.0, 4462.0, 1920.0, 991.0, 540.0, 260.0, 156.0, 100.0, 60.0, 41.0, 23.0, 25.0, 9.0, 10.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.57421875, -3.474273681640625, -3.37432861328125, -3.274383544921875, -3.1744384765625, -3.074493408203125, -2.97454833984375, -2.874603271484375, -2.774658203125, -2.674713134765625, -2.57476806640625, -2.474822998046875, -2.3748779296875, -2.274932861328125, -2.17498779296875, -2.075042724609375, -1.97509765625, -1.875152587890625, -1.77520751953125, -1.675262451171875, -1.5753173828125, -1.475372314453125, -1.37542724609375, -1.275482177734375, -1.175537109375, -1.075592041015625, -0.97564697265625, -0.875701904296875, -0.7757568359375, -0.675811767578125, -0.57586669921875, -0.475921630859375, -0.3759765625, -0.276031494140625, -0.17608642578125, -0.076141357421875, 0.0238037109375, 0.123748779296875, 0.22369384765625, 0.323638916015625, 0.423583984375, 0.523529052734375, 0.62347412109375, 0.723419189453125, 0.8233642578125, 0.923309326171875, 1.02325439453125, 1.123199462890625, 1.22314453125, 1.323089599609375, 1.42303466796875, 1.522979736328125, 1.6229248046875, 1.722869873046875, 1.82281494140625, 1.922760009765625, 2.022705078125, 2.122650146484375, 2.22259521484375, 2.322540283203125, 2.4224853515625, 2.522430419921875, 2.62237548828125, 2.722320556640625, 2.822265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 5.0, 3.0, 11.0, 5.0, 7.0, 12.0, 14.0, 17.0, 24.0, 43.0, 48.0, 97.0, 193.0, 598.0, 2221.0, 374.0, 134.0, 79.0, 49.0, 30.0, 27.0, 20.0, 16.0, 7.0, 9.0, 6.0, 7.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.142578125, -1.1022491455078125, -1.061920166015625, -1.0215911865234375, -0.98126220703125, -0.9409332275390625, -0.900604248046875, -0.8602752685546875, -0.8199462890625, -0.7796173095703125, -0.739288330078125, -0.6989593505859375, -0.65863037109375, -0.6183013916015625, -0.577972412109375, -0.5376434326171875, -0.497314453125, -0.4569854736328125, -0.416656494140625, -0.3763275146484375, -0.33599853515625, -0.2956695556640625, -0.255340576171875, -0.2150115966796875, -0.1746826171875, -0.1343536376953125, -0.094024658203125, -0.0536956787109375, -0.01336669921875, 0.0269622802734375, 0.067291259765625, 0.1076202392578125, 0.14794921875, 0.1882781982421875, 0.228607177734375, 0.2689361572265625, 0.30926513671875, 0.3495941162109375, 0.389923095703125, 0.4302520751953125, 0.4705810546875, 0.5109100341796875, 0.551239013671875, 0.5915679931640625, 0.63189697265625, 0.6722259521484375, 0.712554931640625, 0.7528839111328125, 0.793212890625, 0.8335418701171875, 0.873870849609375, 0.9141998291015625, 0.95452880859375, 0.9948577880859375, 1.035186767578125, 1.0755157470703125, 1.1158447265625, 1.1561737060546875, 1.196502685546875, 1.2368316650390625, 1.27716064453125, 1.3174896240234375, 1.357818603515625, 1.3981475830078125, 1.4384765625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 8.0, 15.0, 6.0, 33.0, 78.0, 180.0, 257.0, 222.0, 123.0, 50.0, 15.0, 8.0, 7.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.920326232910156, -14.491230010986328, -14.062132835388184, -13.633036613464355, -13.203940391540527, -12.774843215942383, -12.345746994018555, -11.916650772094727, -11.487554550170898, -11.05845832824707, -10.629361152648926, -10.200264930725098, -9.77116870880127, -9.342071533203125, -8.912975311279297, -8.483879089355469, -8.054781913757324, -7.625685214996338, -7.19658899307251, -6.767492294311523, -6.338396072387695, -5.909299373626709, -5.480202674865723, -5.0511064529418945, -4.622009754180908, -4.192913055419922, -3.7638168334960938, -3.3347201347351074, -2.9056236743927, -2.476527214050293, -2.0474305152893066, -1.6183340549468994, -1.1892375946044922, -0.7601410746574402, -0.3310445547103882, 0.0980520248413086, 0.5271484851837158, 0.956244945526123, 1.3853416442871094, 1.8144381046295166, 2.243534564971924, 2.672631025314331, 3.1017274856567383, 3.5308241844177246, 3.959920644760132, 4.389017105102539, 4.818113803863525, 5.247210502624512, 5.67630672454834, 6.105403423309326, 6.534499645233154, 6.963596343994141, 7.392692565917969, 7.821789264678955, 8.250885963439941, 8.67998218536377, 9.109079360961914, 9.538175582885742, 9.967272758483887, 10.396368980407715, 10.825465202331543, 11.254562377929688, 11.683658599853516, 12.112754821777344, 12.541851043701172]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 5.0, 8.0, 7.0, 8.0, 17.0, 6.0, 12.0, 21.0, 14.0, 15.0, 18.0, 21.0, 32.0, 25.0, 43.0, 38.0, 38.0, 26.0, 41.0, 47.0, 26.0, 38.0, 44.0, 37.0, 29.0, 47.0, 29.0, 47.0, 32.0, 28.0, 27.0, 28.0, 21.0, 13.0, 14.0, 19.0, 10.0, 10.0, 15.0, 9.0, 4.0, 7.0, 5.0, 5.0, 1.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0], "bins": [-3.4667015075683594, -3.363508939743042, -3.2603163719177246, -3.157123565673828, -3.0539309978485107, -2.9507384300231934, -2.847545862197876, -2.7443532943725586, -2.641160726547241, -2.537968158721924, -2.4347755908966064, -2.331583023071289, -2.2283902168273926, -2.125197649002075, -2.022005081176758, -1.9188125133514404, -1.8156198263168335, -1.7124272584915161, -1.6092345714569092, -1.5060420036315918, -1.4028494358062744, -1.299656867980957, -1.19646418094635, -1.0932716131210327, -0.9900789856910706, -0.8868863582611084, -0.783693790435791, -0.6805011630058289, -0.5773085355758667, -0.4741159677505493, -0.37092334032058716, -0.2677307724952698, -0.16453814506530762, -0.06134553998708725, 0.04184706509113312, 0.14503967761993408, 0.24823227524757385, 0.3514248728752136, 0.4546175003051758, 0.5578100681304932, 0.6610026955604553, 0.7641953229904175, 0.8673878908157349, 0.970580518245697, 1.0737731456756592, 1.1769657135009766, 1.280158281326294, 1.3833508491516113, 1.4865435361862183, 1.5897361040115356, 1.6929287910461426, 1.79612135887146, 1.8993139266967773, 2.0025064945220947, 2.105699062347412, 2.2088918685913086, 2.312084436416626, 2.4152770042419434, 2.5184695720672607, 2.621662139892578, 2.7248549461364746, 2.828047513961792, 2.9312400817871094, 3.0344326496124268, 3.137625217437744]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 5.0, 5.0, 5.0, 10.0, 6.0, 18.0, 24.0, 20.0, 33.0, 71.0, 101.0, 135.0, 207.0, 343.0, 539.0, 897.0, 1849.0, 4229.0, 11004.0, 33464.0, 116797.0, 377571.0, 349159.0, 104442.0, 29820.0, 9929.0, 3844.0, 1810.0, 878.0, 449.0, 299.0, 197.0, 118.0, 88.0, 58.0, 49.0, 25.0, 22.0, 13.0, 13.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.68359375, -2.599609375, -2.515625, -2.431640625, -2.34765625, -2.263671875, -2.1796875, -2.095703125, -2.01171875, -1.927734375, -1.84375, -1.759765625, -1.67578125, -1.591796875, -1.5078125, -1.423828125, -1.33984375, -1.255859375, -1.171875, -1.087890625, -1.00390625, -0.919921875, -0.8359375, -0.751953125, -0.66796875, -0.583984375, -0.5, -0.416015625, -0.33203125, -0.248046875, -0.1640625, -0.080078125, 0.00390625, 0.087890625, 0.171875, 0.255859375, 0.33984375, 0.423828125, 0.5078125, 0.591796875, 0.67578125, 0.759765625, 0.84375, 0.927734375, 1.01171875, 1.095703125, 1.1796875, 1.263671875, 1.34765625, 1.431640625, 1.515625, 1.599609375, 1.68359375, 1.767578125, 1.8515625, 1.935546875, 2.01953125, 2.103515625, 2.1875, 2.271484375, 2.35546875, 2.439453125, 2.5234375, 2.607421875, 2.69140625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 4.0, 4.0, 6.0, 11.0, 12.0, 26.0, 29.0, 30.0, 49.0, 36.0, 49.0, 53.0, 56.0, 60.0, 59.0, 65.0, 58.0, 48.0, 63.0, 58.0, 40.0, 34.0, 33.0, 19.0, 23.0, 23.0, 15.0, 10.0, 10.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.54345703125, -0.5260696411132812, -0.5086822509765625, -0.49129486083984375, -0.473907470703125, -0.45652008056640625, -0.4391326904296875, -0.42174530029296875, -0.40435791015625, -0.38697052001953125, -0.3695831298828125, -0.35219573974609375, -0.334808349609375, -0.31742095947265625, -0.3000335693359375, -0.28264617919921875, -0.2652587890625, -0.24787139892578125, -0.2304840087890625, -0.21309661865234375, -0.195709228515625, -0.17832183837890625, -0.1609344482421875, -0.14354705810546875, -0.12615966796875, -0.10877227783203125, -0.0913848876953125, -0.07399749755859375, -0.056610107421875, -0.03922271728515625, -0.0218353271484375, -0.00444793701171875, 0.012939453125, 0.03032684326171875, 0.0477142333984375, 0.06510162353515625, 0.082489013671875, 0.09987640380859375, 0.1172637939453125, 0.13465118408203125, 0.15203857421875, 0.16942596435546875, 0.1868133544921875, 0.20420074462890625, 0.221588134765625, 0.23897552490234375, 0.2563629150390625, 0.27375030517578125, 0.2911376953125, 0.30852508544921875, 0.3259124755859375, 0.34329986572265625, 0.360687255859375, 0.37807464599609375, 0.3954620361328125, 0.41284942626953125, 0.43023681640625, 0.44762420654296875, 0.4650115966796875, 0.48239898681640625, 0.499786376953125, 0.5171737670898438, 0.5345611572265625, 0.5519485473632812, 0.5693359375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 7.0, 4.0, 6.0, 23.0, 24.0, 41.0, 49.0, 88.0, 155.0, 247.0, 498.0, 956.0, 2147.0, 5759.0, 16654.0, 55956.0, 218752.0, 492267.0, 183621.0, 47905.0, 14372.0, 5103.0, 1951.0, 923.0, 445.0, 253.0, 117.0, 97.0, 48.0, 35.0, 19.0, 14.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.25390625, -2.177337646484375, -2.10076904296875, -2.024200439453125, -1.9476318359375, -1.871063232421875, -1.79449462890625, -1.717926025390625, -1.641357421875, -1.564788818359375, -1.48822021484375, -1.411651611328125, -1.3350830078125, -1.258514404296875, -1.18194580078125, -1.105377197265625, -1.02880859375, -0.952239990234375, -0.87567138671875, -0.799102783203125, -0.7225341796875, -0.645965576171875, -0.56939697265625, -0.492828369140625, -0.416259765625, -0.339691162109375, -0.26312255859375, -0.186553955078125, -0.1099853515625, -0.033416748046875, 0.04315185546875, 0.119720458984375, 0.1962890625, 0.272857666015625, 0.34942626953125, 0.425994873046875, 0.5025634765625, 0.579132080078125, 0.65570068359375, 0.732269287109375, 0.808837890625, 0.885406494140625, 0.96197509765625, 1.038543701171875, 1.1151123046875, 1.191680908203125, 1.26824951171875, 1.344818115234375, 1.42138671875, 1.497955322265625, 1.57452392578125, 1.651092529296875, 1.7276611328125, 1.804229736328125, 1.88079833984375, 1.957366943359375, 2.033935546875, 2.110504150390625, 2.18707275390625, 2.263641357421875, 2.3402099609375, 2.416778564453125, 2.49334716796875, 2.569915771484375, 2.646484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 6.0, 6.0, 8.0, 12.0, 13.0, 15.0, 15.0, 13.0, 27.0, 27.0, 33.0, 31.0, 37.0, 23.0, 49.0, 47.0, 46.0, 52.0, 47.0, 53.0, 49.0, 46.0, 40.0, 45.0, 37.0, 31.0, 25.0, 19.0, 21.0, 26.0, 16.0, 22.0, 9.0, 11.0, 8.0, 5.0, 5.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.7626953125, -1.6974334716796875, -1.632171630859375, -1.5669097900390625, -1.50164794921875, -1.4363861083984375, -1.371124267578125, -1.3058624267578125, -1.2406005859375, -1.1753387451171875, -1.110076904296875, -1.0448150634765625, -0.97955322265625, -0.9142913818359375, -0.849029541015625, -0.7837677001953125, -0.718505859375, -0.6532440185546875, -0.587982177734375, -0.5227203369140625, -0.45745849609375, -0.3921966552734375, -0.326934814453125, -0.2616729736328125, -0.1964111328125, -0.1311492919921875, -0.065887451171875, -0.0006256103515625, 0.06463623046875, 0.1298980712890625, 0.195159912109375, 0.2604217529296875, 0.32568359375, 0.3909454345703125, 0.456207275390625, 0.5214691162109375, 0.58673095703125, 0.6519927978515625, 0.717254638671875, 0.7825164794921875, 0.8477783203125, 0.9130401611328125, 0.978302001953125, 1.0435638427734375, 1.10882568359375, 1.1740875244140625, 1.239349365234375, 1.3046112060546875, 1.369873046875, 1.4351348876953125, 1.500396728515625, 1.5656585693359375, 1.63092041015625, 1.6961822509765625, 1.761444091796875, 1.8267059326171875, 1.8919677734375, 1.9572296142578125, 2.022491455078125, 2.0877532958984375, 2.15301513671875, 2.2182769775390625, 2.283538818359375, 2.3488006591796875, 2.4140625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 6.0, 3.0, 10.0, 21.0, 36.0, 55.0, 125.0, 232.0, 497.0, 998.0, 2678.0, 8101.0, 35122.0, 248874.0, 622199.0, 103412.0, 18013.0, 4964.0, 1719.0, 748.0, 367.0, 178.0, 80.0, 41.0, 30.0, 17.0, 7.0, 2.0, 8.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.56640625, -1.5178985595703125, -1.469390869140625, -1.4208831787109375, -1.37237548828125, -1.3238677978515625, -1.275360107421875, -1.2268524169921875, -1.1783447265625, -1.1298370361328125, -1.081329345703125, -1.0328216552734375, -0.98431396484375, -0.9358062744140625, -0.887298583984375, -0.8387908935546875, -0.790283203125, -0.7417755126953125, -0.693267822265625, -0.6447601318359375, -0.59625244140625, -0.5477447509765625, -0.499237060546875, -0.4507293701171875, -0.4022216796875, -0.3537139892578125, -0.305206298828125, -0.2566986083984375, -0.20819091796875, -0.1596832275390625, -0.111175537109375, -0.0626678466796875, -0.01416015625, 0.0343475341796875, 0.082855224609375, 0.1313629150390625, 0.17987060546875, 0.2283782958984375, 0.276885986328125, 0.3253936767578125, 0.3739013671875, 0.4224090576171875, 0.470916748046875, 0.5194244384765625, 0.56793212890625, 0.6164398193359375, 0.664947509765625, 0.7134552001953125, 0.761962890625, 0.8104705810546875, 0.858978271484375, 0.9074859619140625, 0.95599365234375, 1.0045013427734375, 1.053009033203125, 1.1015167236328125, 1.1500244140625, 1.1985321044921875, 1.247039794921875, 1.2955474853515625, 1.34405517578125, 1.3925628662109375, 1.441070556640625, 1.4895782470703125, 1.5380859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 7.0, 12.0, 13.0, 16.0, 30.0, 29.0, 51.0, 57.0, 88.0, 129.0, 155.0, 122.0, 88.0, 61.0, 38.0, 27.0, 24.0, 17.0, 16.0, 7.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002906322479248047, -0.00028218701481819153, -0.00027374178171157837, -0.0002652965486049652, -0.00025685131549835205, -0.0002484060823917389, -0.00023996084928512573, -0.00023151561617851257, -0.00022307038307189941, -0.00021462514996528625, -0.0002061799168586731, -0.00019773468375205994, -0.00018928945064544678, -0.00018084421753883362, -0.00017239898443222046, -0.0001639537513256073, -0.00015550851821899414, -0.00014706328511238098, -0.00013861805200576782, -0.00013017281889915466, -0.0001217275857925415, -0.00011328235268592834, -0.00010483711957931519, -9.639188647270203e-05, -8.794665336608887e-05, -7.950142025947571e-05, -7.105618715286255e-05, -6.261095404624939e-05, -5.416572093963623e-05, -4.572048783302307e-05, -3.727525472640991e-05, -2.8830021619796753e-05, -2.0384788513183594e-05, -1.1939555406570435e-05, -3.4943222999572754e-06, 4.950910806655884e-06, 1.3396143913269043e-05, 2.1841377019882202e-05, 3.028661012649536e-05, 3.873184323310852e-05, 4.717707633972168e-05, 5.562230944633484e-05, 6.4067542552948e-05, 7.251277565956116e-05, 8.095800876617432e-05, 8.940324187278748e-05, 9.784847497940063e-05, 0.0001062937080860138, 0.00011473894119262695, 0.0001231841742992401, 0.00013162940740585327, 0.00014007464051246643, 0.0001485198736190796, 0.00015696510672569275, 0.0001654103398323059, 0.00017385557293891907, 0.00018230080604553223, 0.00019074603915214539, 0.00019919127225875854, 0.0002076365053653717, 0.00021608173847198486, 0.00022452697157859802, 0.00023297220468521118, 0.00024141743779182434, 0.0002498626708984375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 7.0, 8.0, 15.0, 11.0, 26.0, 36.0, 64.0, 132.0, 192.0, 312.0, 628.0, 1597.0, 4679.0, 20202.0, 159130.0, 708228.0, 128674.0, 17655.0, 4138.0, 1448.0, 658.0, 297.0, 146.0, 95.0, 52.0, 38.0, 23.0, 21.0, 12.0, 9.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0], "bins": [-2.181640625, -2.124908447265625, -2.06817626953125, -2.011444091796875, -1.9547119140625, -1.897979736328125, -1.84124755859375, -1.784515380859375, -1.727783203125, -1.671051025390625, -1.61431884765625, -1.557586669921875, -1.5008544921875, -1.444122314453125, -1.38739013671875, -1.330657958984375, -1.27392578125, -1.217193603515625, -1.16046142578125, -1.103729248046875, -1.0469970703125, -0.990264892578125, -0.93353271484375, -0.876800537109375, -0.820068359375, -0.763336181640625, -0.70660400390625, -0.649871826171875, -0.5931396484375, -0.536407470703125, -0.47967529296875, -0.422943115234375, -0.3662109375, -0.309478759765625, -0.25274658203125, -0.196014404296875, -0.1392822265625, -0.082550048828125, -0.02581787109375, 0.030914306640625, 0.087646484375, 0.144378662109375, 0.20111083984375, 0.257843017578125, 0.3145751953125, 0.371307373046875, 0.42803955078125, 0.484771728515625, 0.54150390625, 0.598236083984375, 0.65496826171875, 0.711700439453125, 0.7684326171875, 0.825164794921875, 0.88189697265625, 0.938629150390625, 0.995361328125, 1.052093505859375, 1.10882568359375, 1.165557861328125, 1.2222900390625, 1.279022216796875, 1.33575439453125, 1.392486572265625, 1.44921875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 10.0, 6.0, 11.0, 15.0, 15.0, 25.0, 35.0, 56.0, 62.0, 86.0, 107.0, 121.0, 87.0, 87.0, 69.0, 38.0, 50.0, 30.0, 11.0, 19.0, 17.0, 11.0, 6.0, 5.0, 5.0, 4.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.1088104248046875, -1.063323974609375, -1.0178375244140625, -0.97235107421875, -0.9268646240234375, -0.881378173828125, -0.8358917236328125, -0.7904052734375, -0.7449188232421875, -0.699432373046875, -0.6539459228515625, -0.60845947265625, -0.5629730224609375, -0.517486572265625, -0.4720001220703125, -0.426513671875, -0.3810272216796875, -0.335540771484375, -0.2900543212890625, -0.24456787109375, -0.1990814208984375, -0.153594970703125, -0.1081085205078125, -0.0626220703125, -0.0171356201171875, 0.028350830078125, 0.0738372802734375, 0.11932373046875, 0.1648101806640625, 0.210296630859375, 0.2557830810546875, 0.30126953125, 0.3467559814453125, 0.392242431640625, 0.4377288818359375, 0.48321533203125, 0.5287017822265625, 0.574188232421875, 0.6196746826171875, 0.6651611328125, 0.7106475830078125, 0.756134033203125, 0.8016204833984375, 0.84710693359375, 0.8925933837890625, 0.938079833984375, 0.9835662841796875, 1.029052734375, 1.0745391845703125, 1.120025634765625, 1.1655120849609375, 1.21099853515625, 1.2564849853515625, 1.301971435546875, 1.3474578857421875, 1.3929443359375, 1.4384307861328125, 1.483917236328125, 1.5294036865234375, 1.57489013671875, 1.6203765869140625, 1.665863037109375, 1.7113494873046875, 1.7568359375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 3.0, 11.0, 21.0, 13.0, 16.0, 39.0, 62.0, 71.0, 101.0, 108.0, 111.0, 103.0, 96.0, 80.0, 54.0, 33.0, 23.0, 12.0, 13.0, 11.0, 8.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.366525650024414, -12.869441032409668, -12.372356414794922, -11.87527084350586, -11.378186225891113, -10.881101608276367, -10.384016036987305, -9.886931419372559, -9.389846801757812, -8.892762184143066, -8.39567756652832, -7.898591995239258, -7.401507377624512, -6.904422760009766, -6.407337665557861, -5.910252571105957, -5.413167953491211, -4.916083335876465, -4.4189982414245605, -3.9219133853912354, -3.42482852935791, -2.927743673324585, -2.4306588172912598, -1.9335739612579346, -1.4364891052246094, -0.9394042491912842, -0.442319393157959, 0.05476546287536621, 0.5518503189086914, 1.0489351749420166, 1.5460200309753418, 2.043104887008667, 2.540189743041992, 3.0372745990753174, 3.5343594551086426, 4.031444549560547, 4.528529167175293, 5.025613784790039, 5.522698879241943, 6.019783973693848, 6.516868591308594, 7.01395320892334, 7.511038303375244, 8.008123397827148, 8.505208015441895, 9.00229263305664, 9.499378204345703, 9.99646282196045, 10.493547439575195, 10.990632057189941, 11.487716674804688, 11.98480224609375, 12.481886863708496, 12.978971481323242, 13.476057052612305, 13.97314167022705, 14.470226287841797, 14.967310905456543, 15.464395523071289, 15.961481094360352, 16.45856475830078, 16.955650329589844, 17.452735900878906, 17.949819564819336, 18.4469051361084]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 7.0, 13.0, 14.0, 10.0, 17.0, 8.0, 15.0, 26.0, 27.0, 31.0, 23.0, 40.0, 42.0, 42.0, 59.0, 43.0, 50.0, 61.0, 40.0, 48.0, 51.0, 32.0, 34.0, 37.0, 42.0, 20.0, 20.0, 23.0, 20.0, 17.0, 15.0, 11.0, 16.0, 6.0, 4.0, 7.0, 9.0, 4.0, 7.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.76424789428711, -9.410740852355957, -9.057234764099121, -8.703727722167969, -8.350220680236816, -7.996714115142822, -7.643207550048828, -7.289700508117676, -6.936193943023682, -6.5826873779296875, -6.229180335998535, -5.875673770904541, -5.522167205810547, -5.1686601638793945, -4.8151535987854, -4.461647033691406, -4.108139991760254, -3.7546331882476807, -3.4011263847351074, -3.0476198196411133, -2.69411301612854, -2.340606212615967, -1.9870996475219727, -1.6335928440093994, -1.2800860404968262, -0.9265792965888977, -0.5730725526809692, -0.21956586837768555, 0.1339409351348877, 0.48744773864746094, 0.8409543037414551, 1.1944611072540283, 1.5479679107666016, 1.9014747142791748, 2.254981517791748, 2.608488082885742, 2.9619948863983154, 3.3155016899108887, 3.669008255004883, 4.022515296936035, 4.376021862030029, 4.729528427124023, 5.083035469055176, 5.43654203414917, 5.790048599243164, 6.143555641174316, 6.4970622062683105, 6.850568771362305, 7.204075813293457, 7.557582378387451, 7.9110894203186035, 8.264595985412598, 8.61810302734375, 8.971609115600586, 9.325116157531738, 9.67862319946289, 10.032129287719727, 10.385636329650879, 10.739142417907715, 11.092649459838867, 11.44615650177002, 11.799663543701172, 12.153169631958008, 12.50667667388916, 12.860183715820312]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 10.0, 22.0, 58.0, 93.0, 135.0, 299.0, 578.0, 1294.0, 3091.0, 10447.0, 141955.0, 4011523.0, 17491.0, 4191.0, 1595.0, 711.0, 335.0, 184.0, 95.0, 66.0, 30.0, 27.0, 18.0, 12.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4375, -5.24432373046875, -5.0511474609375, -4.85797119140625, -4.664794921875, -4.47161865234375, -4.2784423828125, -4.08526611328125, -3.89208984375, -3.69891357421875, -3.5057373046875, -3.31256103515625, -3.119384765625, -2.92620849609375, -2.7330322265625, -2.53985595703125, -2.3466796875, -2.15350341796875, -1.9603271484375, -1.76715087890625, -1.573974609375, -1.38079833984375, -1.1876220703125, -0.99444580078125, -0.80126953125, -0.60809326171875, -0.4149169921875, -0.22174072265625, -0.028564453125, 0.16461181640625, 0.3577880859375, 0.55096435546875, 0.744140625, 0.93731689453125, 1.1304931640625, 1.32366943359375, 1.516845703125, 1.71002197265625, 1.9031982421875, 2.09637451171875, 2.28955078125, 2.48272705078125, 2.6759033203125, 2.86907958984375, 3.062255859375, 3.25543212890625, 3.4486083984375, 3.64178466796875, 3.8349609375, 4.02813720703125, 4.2213134765625, 4.41448974609375, 4.607666015625, 4.80084228515625, 4.9940185546875, 5.18719482421875, 5.38037109375, 5.57354736328125, 5.7667236328125, 5.95989990234375, 6.153076171875, 6.34625244140625, 6.5394287109375, 6.73260498046875, 6.92578125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 10.0, 11.0, 11.0, 20.0, 18.0, 32.0, 32.0, 33.0, 38.0, 53.0, 34.0, 53.0, 58.0, 47.0, 58.0, 51.0, 63.0, 53.0, 45.0, 47.0, 27.0, 32.0, 29.0, 26.0, 30.0, 18.0, 18.0, 10.0, 11.0, 6.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5556640625, -0.537628173828125, -0.51959228515625, -0.501556396484375, -0.4835205078125, -0.465484619140625, -0.44744873046875, -0.429412841796875, -0.411376953125, -0.393341064453125, -0.37530517578125, -0.357269287109375, -0.3392333984375, -0.321197509765625, -0.30316162109375, -0.285125732421875, -0.26708984375, -0.249053955078125, -0.23101806640625, -0.212982177734375, -0.1949462890625, -0.176910400390625, -0.15887451171875, -0.140838623046875, -0.122802734375, -0.104766845703125, -0.08673095703125, -0.068695068359375, -0.0506591796875, -0.032623291015625, -0.01458740234375, 0.003448486328125, 0.021484375, 0.039520263671875, 0.05755615234375, 0.075592041015625, 0.0936279296875, 0.111663818359375, 0.12969970703125, 0.147735595703125, 0.165771484375, 0.183807373046875, 0.20184326171875, 0.219879150390625, 0.2379150390625, 0.255950927734375, 0.27398681640625, 0.292022705078125, 0.31005859375, 0.328094482421875, 0.34613037109375, 0.364166259765625, 0.3822021484375, 0.400238037109375, 0.41827392578125, 0.436309814453125, 0.454345703125, 0.472381591796875, 0.49041748046875, 0.508453369140625, 0.5264892578125, 0.544525146484375, 0.56256103515625, 0.580596923828125, 0.5986328125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 11.0, 8.0, 16.0, 23.0, 32.0, 51.0, 74.0, 102.0, 152.0, 212.0, 322.0, 474.0, 772.0, 1144.0, 1957.0, 3675.0, 7920.0, 22343.0, 132063.0, 3928085.0, 65237.0, 15395.0, 6282.0, 3067.0, 1752.0, 1030.0, 671.0, 444.0, 307.0, 199.0, 147.0, 104.0, 75.0, 44.0, 29.0, 22.0, 20.0, 10.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.009765625, -2.91375732421875, -2.8177490234375, -2.72174072265625, -2.625732421875, -2.52972412109375, -2.4337158203125, -2.33770751953125, -2.24169921875, -2.14569091796875, -2.0496826171875, -1.95367431640625, -1.857666015625, -1.76165771484375, -1.6656494140625, -1.56964111328125, -1.4736328125, -1.37762451171875, -1.2816162109375, -1.18560791015625, -1.089599609375, -0.99359130859375, -0.8975830078125, -0.80157470703125, -0.70556640625, -0.60955810546875, -0.5135498046875, -0.41754150390625, -0.321533203125, -0.22552490234375, -0.1295166015625, -0.03350830078125, 0.0625, 0.15850830078125, 0.2545166015625, 0.35052490234375, 0.446533203125, 0.54254150390625, 0.6385498046875, 0.73455810546875, 0.83056640625, 0.92657470703125, 1.0225830078125, 1.11859130859375, 1.214599609375, 1.31060791015625, 1.4066162109375, 1.50262451171875, 1.5986328125, 1.69464111328125, 1.7906494140625, 1.88665771484375, 1.982666015625, 2.07867431640625, 2.1746826171875, 2.27069091796875, 2.36669921875, 2.46270751953125, 2.5587158203125, 2.65472412109375, 2.750732421875, 2.84674072265625, 2.9427490234375, 3.03875732421875, 3.134765625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 4.0, 11.0, 15.0, 19.0, 41.0, 60.0, 146.0, 3015.0, 497.0, 99.0, 43.0, 34.0, 17.0, 12.0, 8.0, 4.0, 5.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.56201171875, -0.5432052612304688, -0.5243988037109375, -0.5055923461914062, -0.486785888671875, -0.46797943115234375, -0.4491729736328125, -0.43036651611328125, -0.41156005859375, -0.39275360107421875, -0.3739471435546875, -0.35514068603515625, -0.336334228515625, -0.31752777099609375, -0.2987213134765625, -0.27991485595703125, -0.2611083984375, -0.24230194091796875, -0.2234954833984375, -0.20468902587890625, -0.185882568359375, -0.16707611083984375, -0.1482696533203125, -0.12946319580078125, -0.11065673828125, -0.09185028076171875, -0.0730438232421875, -0.05423736572265625, -0.035430908203125, -0.01662445068359375, 0.0021820068359375, 0.02098846435546875, 0.039794921875, 0.05860137939453125, 0.0774078369140625, 0.09621429443359375, 0.115020751953125, 0.13382720947265625, 0.1526336669921875, 0.17144012451171875, 0.19024658203125, 0.20905303955078125, 0.2278594970703125, 0.24666595458984375, 0.265472412109375, 0.28427886962890625, 0.3030853271484375, 0.32189178466796875, 0.3406982421875, 0.35950469970703125, 0.3783111572265625, 0.39711761474609375, 0.415924072265625, 0.43473052978515625, 0.4535369873046875, 0.47234344482421875, 0.49114990234375, 0.5099563598632812, 0.5287628173828125, 0.5475692749023438, 0.566375732421875, 0.5851821899414062, 0.6039886474609375, 0.6227951049804688, 0.6416015625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 10.0, 14.0, 24.0, 39.0, 72.0, 101.0, 138.0, 140.0, 122.0, 104.0, 82.0, 56.0, 34.0, 25.0, 16.0, 6.0, 7.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5385429859161377, -3.4232499599456787, -3.3079566955566406, -3.1926636695861816, -3.0773706436157227, -2.9620776176452637, -2.8467845916748047, -2.7314913272857666, -2.6161983013153076, -2.5009052753448486, -2.3856120109558105, -2.2703189849853516, -2.1550259590148926, -2.0397329330444336, -1.924439787864685, -1.8091466426849365, -1.6938536167144775, -1.5785605907440186, -1.46326744556427, -1.3479743003845215, -1.2326812744140625, -1.1173882484436035, -1.002095103263855, -0.8868020176887512, -0.7715089321136475, -0.6562158465385437, -0.5409227609634399, -0.4256296753883362, -0.3103365898132324, -0.19504350423812866, -0.0797504186630249, 0.03554266691207886, 0.15083599090576172, 0.2661290764808655, 0.38142216205596924, 0.496715247631073, 0.6120083332061768, 0.7273014187812805, 0.8425945043563843, 0.957887589931488, 1.0731806755065918, 1.1884737014770508, 1.3037668466567993, 1.4190599918365479, 1.5343530178070068, 1.6496460437774658, 1.7649391889572144, 1.880232334136963, 1.9955253601074219, 2.110818386077881, 2.22611141204834, 2.341404676437378, 2.456697702407837, 2.571990728378296, 2.687283992767334, 2.802577018737793, 2.917870044708252, 3.033163070678711, 3.14845609664917, 3.263749361038208, 3.379042387008667, 3.494335412979126, 3.609628677368164, 3.724921703338623, 3.840214729309082]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 10.0, 14.0, 7.0, 10.0, 20.0, 21.0, 23.0, 22.0, 16.0, 28.0, 31.0, 36.0, 41.0, 33.0, 31.0, 50.0, 33.0, 38.0, 53.0, 46.0, 39.0, 22.0, 43.0, 34.0, 42.0, 34.0, 27.0, 25.0, 26.0, 26.0, 16.0, 19.0, 15.0, 13.0, 10.0, 7.0, 9.0, 4.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.326143503189087, -1.2843542098999023, -1.2425650358200073, -1.2007757425308228, -1.1589865684509277, -1.1171972751617432, -1.0754081010818481, -1.0336188077926636, -0.9918296337127686, -0.9500404000282288, -0.908251166343689, -0.8664619326591492, -0.8246726989746094, -0.7828834652900696, -0.7410942316055298, -0.6993049383163452, -0.6575157046318054, -0.6157264709472656, -0.5739372372627258, -0.532148003578186, -0.49035876989364624, -0.44856953620910645, -0.40678027272224426, -0.36499103903770447, -0.3232018053531647, -0.2814125716686249, -0.23962333798408508, -0.1978340893983841, -0.1560448557138443, -0.1142556220293045, -0.07246637344360352, -0.03067713975906372, 0.011112093925476074, 0.05290133133530617, 0.09469056874513626, 0.13647980988025665, 0.17826904356479645, 0.22005827724933624, 0.26184752583503723, 0.303636759519577, 0.3454259932041168, 0.3872152268886566, 0.4290044605731964, 0.4707937240600586, 0.5125829577445984, 0.5543721914291382, 0.596161425113678, 0.6379506587982178, 0.6797398924827576, 0.7215291261672974, 0.7633183598518372, 0.805107593536377, 0.8468968272209167, 0.8886860609054565, 0.9304753541946411, 0.9722645282745361, 1.0140538215637207, 1.0558431148529053, 1.0976322889328003, 1.1394215822219849, 1.1812107563018799, 1.2230000495910645, 1.2647892236709595, 1.306578516960144, 1.348367691040039]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 7.0, 4.0, 6.0, 3.0, 7.0, 7.0, 17.0, 24.0, 28.0, 46.0, 64.0, 97.0, 123.0, 183.0, 287.0, 494.0, 747.0, 1404.0, 2528.0, 4816.0, 9699.0, 21099.0, 47029.0, 107881.0, 215145.0, 279670.0, 191212.0, 90952.0, 39527.0, 17562.0, 8350.0, 4192.0, 2195.0, 1218.0, 705.0, 421.0, 276.0, 162.0, 107.0, 76.0, 54.0, 32.0, 33.0, 17.0, 17.0, 11.0, 12.0, 7.0, 4.0, 3.0, 2.0, 4.0, 0.0, 3.0, 3.0], "bins": [-2.09765625, -2.0366668701171875, -1.975677490234375, -1.9146881103515625, -1.85369873046875, -1.7927093505859375, -1.731719970703125, -1.6707305908203125, -1.6097412109375, -1.5487518310546875, -1.487762451171875, -1.4267730712890625, -1.36578369140625, -1.3047943115234375, -1.243804931640625, -1.1828155517578125, -1.121826171875, -1.0608367919921875, -0.999847412109375, -0.9388580322265625, -0.87786865234375, -0.8168792724609375, -0.755889892578125, -0.6949005126953125, -0.6339111328125, -0.5729217529296875, -0.511932373046875, -0.4509429931640625, -0.38995361328125, -0.3289642333984375, -0.267974853515625, -0.2069854736328125, -0.14599609375, -0.0850067138671875, -0.024017333984375, 0.0369720458984375, 0.09796142578125, 0.1589508056640625, 0.219940185546875, 0.2809295654296875, 0.3419189453125, 0.4029083251953125, 0.463897705078125, 0.5248870849609375, 0.58587646484375, 0.6468658447265625, 0.707855224609375, 0.7688446044921875, 0.829833984375, 0.8908233642578125, 0.951812744140625, 1.0128021240234375, 1.07379150390625, 1.1347808837890625, 1.195770263671875, 1.2567596435546875, 1.3177490234375, 1.3787384033203125, 1.439727783203125, 1.5007171630859375, 1.56170654296875, 1.6226959228515625, 1.683685302734375, 1.7446746826171875, 1.8056640625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 9.0, 11.0, 8.0, 18.0, 13.0, 26.0, 21.0, 35.0, 36.0, 31.0, 32.0, 41.0, 44.0, 56.0, 35.0, 45.0, 58.0, 48.0, 44.0, 56.0, 47.0, 49.0, 32.0, 33.0, 33.0, 21.0, 19.0, 23.0, 17.0, 15.0, 8.0, 12.0, 5.0, 4.0, 6.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.5556640625, -0.5374526977539062, -0.5192413330078125, -0.5010299682617188, -0.482818603515625, -0.46460723876953125, -0.4463958740234375, -0.42818450927734375, -0.40997314453125, -0.39176177978515625, -0.3735504150390625, -0.35533905029296875, -0.337127685546875, -0.31891632080078125, -0.3007049560546875, -0.28249359130859375, -0.2642822265625, -0.24607086181640625, -0.2278594970703125, -0.20964813232421875, -0.191436767578125, -0.17322540283203125, -0.1550140380859375, -0.13680267333984375, -0.11859130859375, -0.10037994384765625, -0.0821685791015625, -0.06395721435546875, -0.045745849609375, -0.02753448486328125, -0.0093231201171875, 0.00888824462890625, 0.027099609375, 0.04531097412109375, 0.0635223388671875, 0.08173370361328125, 0.099945068359375, 0.11815643310546875, 0.1363677978515625, 0.15457916259765625, 0.17279052734375, 0.19100189208984375, 0.2092132568359375, 0.22742462158203125, 0.245635986328125, 0.26384735107421875, 0.2820587158203125, 0.30027008056640625, 0.3184814453125, 0.33669281005859375, 0.3549041748046875, 0.37311553955078125, 0.391326904296875, 0.40953826904296875, 0.4277496337890625, 0.44596099853515625, 0.46417236328125, 0.48238372802734375, 0.5005950927734375, 0.5188064575195312, 0.537017822265625, 0.5552291870117188, 0.5734405517578125, 0.5916519165039062, 0.60986328125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 5.0, 1.0, 4.0, 4.0, 8.0, 9.0, 17.0, 19.0, 27.0, 48.0, 74.0, 129.0, 228.0, 486.0, 1101.0, 2948.0, 8414.0, 29370.0, 124487.0, 479158.0, 305398.0, 69884.0, 17785.0, 5361.0, 1898.0, 822.0, 353.0, 189.0, 116.0, 78.0, 45.0, 27.0, 19.0, 14.0, 7.0, 6.0, 7.0, 8.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.865234375, -2.76910400390625, -2.6729736328125, -2.57684326171875, -2.480712890625, -2.38458251953125, -2.2884521484375, -2.19232177734375, -2.09619140625, -2.00006103515625, -1.9039306640625, -1.80780029296875, -1.711669921875, -1.61553955078125, -1.5194091796875, -1.42327880859375, -1.3271484375, -1.23101806640625, -1.1348876953125, -1.03875732421875, -0.942626953125, -0.84649658203125, -0.7503662109375, -0.65423583984375, -0.55810546875, -0.46197509765625, -0.3658447265625, -0.26971435546875, -0.173583984375, -0.07745361328125, 0.0186767578125, 0.11480712890625, 0.2109375, 0.30706787109375, 0.4031982421875, 0.49932861328125, 0.595458984375, 0.69158935546875, 0.7877197265625, 0.88385009765625, 0.97998046875, 1.07611083984375, 1.1722412109375, 1.26837158203125, 1.364501953125, 1.46063232421875, 1.5567626953125, 1.65289306640625, 1.7490234375, 1.84515380859375, 1.9412841796875, 2.03741455078125, 2.133544921875, 2.22967529296875, 2.3258056640625, 2.42193603515625, 2.51806640625, 2.61419677734375, 2.7103271484375, 2.80645751953125, 2.902587890625, 2.99871826171875, 3.0948486328125, 3.19097900390625, 3.287109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 8.0, 5.0, 13.0, 10.0, 17.0, 21.0, 19.0, 30.0, 34.0, 40.0, 52.0, 50.0, 55.0, 70.0, 63.0, 57.0, 60.0, 64.0, 54.0, 54.0, 46.0, 36.0, 31.0, 26.0, 21.0, 15.0, 14.0, 13.0, 14.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.69140625, -4.574737548828125, -4.45806884765625, -4.341400146484375, -4.2247314453125, -4.108062744140625, -3.99139404296875, -3.874725341796875, -3.758056640625, -3.641387939453125, -3.52471923828125, -3.408050537109375, -3.2913818359375, -3.174713134765625, -3.05804443359375, -2.941375732421875, -2.82470703125, -2.708038330078125, -2.59136962890625, -2.474700927734375, -2.3580322265625, -2.241363525390625, -2.12469482421875, -2.008026123046875, -1.891357421875, -1.774688720703125, -1.65802001953125, -1.541351318359375, -1.4246826171875, -1.308013916015625, -1.19134521484375, -1.074676513671875, -0.9580078125, -0.841339111328125, -0.72467041015625, -0.608001708984375, -0.4913330078125, -0.374664306640625, -0.25799560546875, -0.141326904296875, -0.024658203125, 0.092010498046875, 0.20867919921875, 0.325347900390625, 0.4420166015625, 0.558685302734375, 0.67535400390625, 0.792022705078125, 0.90869140625, 1.025360107421875, 1.14202880859375, 1.258697509765625, 1.3753662109375, 1.492034912109375, 1.60870361328125, 1.725372314453125, 1.842041015625, 1.958709716796875, 2.07537841796875, 2.192047119140625, 2.3087158203125, 2.425384521484375, 2.54205322265625, 2.658721923828125, 2.775390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 9.0, 8.0, 5.0, 9.0, 23.0, 21.0, 35.0, 53.0, 83.0, 168.0, 273.0, 695.0, 1768.0, 6403.0, 37264.0, 591485.0, 374327.0, 27920.0, 5268.0, 1462.0, 628.0, 260.0, 153.0, 69.0, 46.0, 26.0, 27.0, 20.0, 10.0, 9.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.146484375, -3.053741455078125, -2.96099853515625, -2.868255615234375, -2.7755126953125, -2.682769775390625, -2.59002685546875, -2.497283935546875, -2.404541015625, -2.311798095703125, -2.21905517578125, -2.126312255859375, -2.0335693359375, -1.940826416015625, -1.84808349609375, -1.755340576171875, -1.66259765625, -1.569854736328125, -1.47711181640625, -1.384368896484375, -1.2916259765625, -1.198883056640625, -1.10614013671875, -1.013397216796875, -0.920654296875, -0.827911376953125, -0.73516845703125, -0.642425537109375, -0.5496826171875, -0.456939697265625, -0.36419677734375, -0.271453857421875, -0.1787109375, -0.085968017578125, 0.00677490234375, 0.099517822265625, 0.1922607421875, 0.285003662109375, 0.37774658203125, 0.470489501953125, 0.563232421875, 0.655975341796875, 0.74871826171875, 0.841461181640625, 0.9342041015625, 1.026947021484375, 1.11968994140625, 1.212432861328125, 1.30517578125, 1.397918701171875, 1.49066162109375, 1.583404541015625, 1.6761474609375, 1.768890380859375, 1.86163330078125, 1.954376220703125, 2.047119140625, 2.139862060546875, 2.23260498046875, 2.325347900390625, 2.4180908203125, 2.510833740234375, 2.60357666015625, 2.696319580078125, 2.7890625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 15.0, 13.0, 9.0, 21.0, 22.0, 29.0, 30.0, 47.0, 58.0, 68.0, 87.0, 81.0, 93.0, 85.0, 66.0, 57.0, 44.0, 30.0, 29.0, 26.0, 18.0, 9.0, 8.0, 10.0, 7.0, 3.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0], "bins": [-0.00023317337036132812, -0.00022704154253005981, -0.0002209097146987915, -0.0002147778868675232, -0.00020864605903625488, -0.00020251423120498657, -0.00019638240337371826, -0.00019025057554244995, -0.00018411874771118164, -0.00017798691987991333, -0.00017185509204864502, -0.0001657232642173767, -0.0001595914363861084, -0.0001534596085548401, -0.00014732778072357178, -0.00014119595289230347, -0.00013506412506103516, -0.00012893229722976685, -0.00012280046939849854, -0.00011666864156723022, -0.00011053681373596191, -0.0001044049859046936, -9.827315807342529e-05, -9.214133024215698e-05, -8.600950241088867e-05, -7.987767457962036e-05, -7.374584674835205e-05, -6.761401891708374e-05, -6.148219108581543e-05, -5.535036325454712e-05, -4.921853542327881e-05, -4.30867075920105e-05, -3.695487976074219e-05, -3.082305192947388e-05, -2.4691224098205566e-05, -1.8559396266937256e-05, -1.2427568435668945e-05, -6.295740604400635e-06, -1.6391277313232422e-07, 5.967915058135986e-06, 1.2099742889404297e-05, 1.8231570720672607e-05, 2.4363398551940918e-05, 3.049522638320923e-05, 3.662705421447754e-05, 4.275888204574585e-05, 4.889070987701416e-05, 5.502253770828247e-05, 6.115436553955078e-05, 6.728619337081909e-05, 7.34180212020874e-05, 7.954984903335571e-05, 8.568167686462402e-05, 9.181350469589233e-05, 9.794533252716064e-05, 0.00010407716035842896, 0.00011020898818969727, 0.00011634081602096558, 0.0001224726438522339, 0.0001286044716835022, 0.0001347362995147705, 0.00014086812734603882, 0.00014699995517730713, 0.00015313178300857544, 0.00015926361083984375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 7.0, 17.0, 21.0, 30.0, 61.0, 78.0, 161.0, 296.0, 561.0, 1535.0, 4394.0, 18272.0, 124366.0, 732299.0, 138926.0, 19771.0, 4890.0, 1493.0, 628.0, 316.0, 181.0, 96.0, 57.0, 28.0, 15.0, 16.0, 17.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.328125, -2.2542724609375, -2.180419921875, -2.1065673828125, -2.03271484375, -1.9588623046875, -1.885009765625, -1.8111572265625, -1.7373046875, -1.6634521484375, -1.589599609375, -1.5157470703125, -1.44189453125, -1.3680419921875, -1.294189453125, -1.2203369140625, -1.146484375, -1.0726318359375, -0.998779296875, -0.9249267578125, -0.85107421875, -0.7772216796875, -0.703369140625, -0.6295166015625, -0.5556640625, -0.4818115234375, -0.407958984375, -0.3341064453125, -0.26025390625, -0.1864013671875, -0.112548828125, -0.0386962890625, 0.03515625, 0.1090087890625, 0.182861328125, 0.2567138671875, 0.33056640625, 0.4044189453125, 0.478271484375, 0.5521240234375, 0.6259765625, 0.6998291015625, 0.773681640625, 0.8475341796875, 0.92138671875, 0.9952392578125, 1.069091796875, 1.1429443359375, 1.216796875, 1.2906494140625, 1.364501953125, 1.4383544921875, 1.51220703125, 1.5860595703125, 1.659912109375, 1.7337646484375, 1.8076171875, 1.8814697265625, 1.955322265625, 2.0291748046875, 2.10302734375, 2.1768798828125, 2.250732421875, 2.3245849609375, 2.3984375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 7.0, 9.0, 5.0, 11.0, 13.0, 9.0, 21.0, 24.0, 31.0, 47.0, 61.0, 104.0, 139.0, 138.0, 108.0, 66.0, 67.0, 36.0, 30.0, 23.0, 16.0, 10.0, 9.0, 7.0, 6.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.384765625, -3.29827880859375, -3.2117919921875, -3.12530517578125, -3.038818359375, -2.95233154296875, -2.8658447265625, -2.77935791015625, -2.69287109375, -2.60638427734375, -2.5198974609375, -2.43341064453125, -2.346923828125, -2.26043701171875, -2.1739501953125, -2.08746337890625, -2.0009765625, -1.91448974609375, -1.8280029296875, -1.74151611328125, -1.655029296875, -1.56854248046875, -1.4820556640625, -1.39556884765625, -1.30908203125, -1.22259521484375, -1.1361083984375, -1.04962158203125, -0.963134765625, -0.87664794921875, -0.7901611328125, -0.70367431640625, -0.6171875, -0.53070068359375, -0.4442138671875, -0.35772705078125, -0.271240234375, -0.18475341796875, -0.0982666015625, -0.01177978515625, 0.07470703125, 0.16119384765625, 0.2476806640625, 0.33416748046875, 0.420654296875, 0.50714111328125, 0.5936279296875, 0.68011474609375, 0.7666015625, 0.85308837890625, 0.9395751953125, 1.02606201171875, 1.112548828125, 1.19903564453125, 1.2855224609375, 1.37200927734375, 1.45849609375, 1.54498291015625, 1.6314697265625, 1.71795654296875, 1.804443359375, 1.89093017578125, 1.9774169921875, 2.06390380859375, 2.150390625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 7.0, 11.0, 18.0, 46.0, 50.0, 126.0, 160.0, 172.0, 153.0, 119.0, 66.0, 40.0, 23.0, 10.0, 4.0, 2.0, 3.0], "bins": [-68.13705444335938, -66.88511657714844, -65.63318634033203, -64.3812484741211, -63.12931442260742, -61.87738037109375, -60.62544250488281, -59.37350845336914, -58.12157440185547, -56.8696403503418, -55.617706298828125, -54.36576843261719, -53.113834381103516, -51.861900329589844, -50.609962463378906, -49.358028411865234, -48.10609436035156, -46.85416030883789, -45.60222625732422, -44.35028839111328, -43.09835433959961, -41.84642028808594, -40.594482421875, -39.34254837036133, -38.090614318847656, -36.838680267333984, -35.58674621582031, -34.334808349609375, -33.0828742980957, -31.83094024658203, -30.579004287719727, -29.327068328857422, -28.075136184692383, -26.823200225830078, -25.571266174316406, -24.319332122802734, -23.06739616394043, -21.815460205078125, -20.563526153564453, -19.31159210205078, -18.059656143188477, -16.807720184326172, -15.5557861328125, -14.303851127624512, -13.051916122436523, -11.799981117248535, -10.548046112060547, -9.296111106872559, -8.04417610168457, -6.792241096496582, -5.540306091308594, -4.2883710861206055, -3.036436080932617, -1.784501075744629, -0.5325660705566406, 0.7193689346313477, 1.971303939819336, 3.223238945007324, 4.4751739501953125, 5.727108955383301, 6.979043960571289, 8.230978965759277, 9.482913970947266, 10.734848976135254, 11.986783981323242]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 6.0, 1.0, 5.0, 3.0, 3.0, 3.0, 9.0, 13.0, 12.0, 23.0, 20.0, 35.0, 34.0, 23.0, 40.0, 46.0, 38.0, 58.0, 64.0, 58.0, 64.0, 68.0, 58.0, 47.0, 45.0, 32.0, 38.0, 25.0, 22.0, 26.0, 14.0, 14.0, 14.0, 9.0, 9.0, 5.0, 13.0, 4.0, 1.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.822039604187012, -15.275516510009766, -14.728992462158203, -14.182469367980957, -13.635946273803711, -13.089422225952148, -12.542899131774902, -11.996376037597656, -11.449851989746094, -10.903328895568848, -10.356804847717285, -9.810281753540039, -9.263758659362793, -8.717235565185547, -8.170711517333984, -7.624188423156738, -7.077665328979492, -6.531141757965088, -5.984618663787842, -5.4380950927734375, -4.891571998596191, -4.345048427581787, -3.798524856567383, -3.2520015239715576, -2.7054781913757324, -2.1589548587799072, -1.6124314069747925, -1.0659079551696777, -0.5193846225738525, 0.027138710021972656, 0.573662281036377, 1.1201856136322021, 1.666707992553711, 2.213231325149536, 2.7597546577453613, 3.3062782287597656, 3.852801561355591, 4.399324893951416, 4.94584846496582, 5.492371559143066, 6.038895130157471, 6.585418701171875, 7.131941795349121, 7.678465366363525, 8.22498893737793, 8.771512031555176, 9.318035125732422, 9.864559173583984, 10.41108226776123, 10.957605361938477, 11.504129409790039, 12.050652503967285, 12.597175598144531, 13.143699645996094, 13.69022274017334, 14.236745834350586, 14.783269882202148, 15.329792976379395, 15.876317024230957, 16.422840118408203, 16.969364166259766, 17.515886306762695, 18.062410354614258, 18.60893440246582, 19.15545654296875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 9.0, 11.0, 13.0, 23.0, 39.0, 74.0, 149.0, 397.0, 956.0, 2531.0, 10113.0, 152855.0, 4003942.0, 17367.0, 3673.0, 1172.0, 504.0, 183.0, 116.0, 62.0, 40.0, 16.0, 13.0, 10.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-9.671875, -9.43682861328125, -9.2017822265625, -8.96673583984375, -8.731689453125, -8.49664306640625, -8.2615966796875, -8.02655029296875, -7.79150390625, -7.55645751953125, -7.3214111328125, -7.08636474609375, -6.851318359375, -6.61627197265625, -6.3812255859375, -6.14617919921875, -5.9111328125, -5.67608642578125, -5.4410400390625, -5.20599365234375, -4.970947265625, -4.73590087890625, -4.5008544921875, -4.26580810546875, -4.03076171875, -3.79571533203125, -3.5606689453125, -3.32562255859375, -3.090576171875, -2.85552978515625, -2.6204833984375, -2.38543701171875, -2.150390625, -1.91534423828125, -1.6802978515625, -1.44525146484375, -1.210205078125, -0.97515869140625, -0.7401123046875, -0.50506591796875, -0.27001953125, -0.03497314453125, 0.2000732421875, 0.43511962890625, 0.670166015625, 0.90521240234375, 1.1402587890625, 1.37530517578125, 1.6103515625, 1.84539794921875, 2.0804443359375, 2.31549072265625, 2.550537109375, 2.78558349609375, 3.0206298828125, 3.25567626953125, 3.49072265625, 3.72576904296875, 3.9608154296875, 4.19586181640625, 4.430908203125, 4.66595458984375, 4.9010009765625, 5.13604736328125, 5.37109375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 0.0, 1.0, 5.0, 9.0, 8.0, 7.0, 7.0, 9.0, 20.0, 23.0, 21.0, 44.0, 39.0, 53.0, 64.0, 68.0, 59.0, 72.0, 73.0, 69.0, 67.0, 45.0, 47.0, 45.0, 29.0, 34.0, 21.0, 14.0, 18.0, 10.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5556640625, -0.5292205810546875, -0.502777099609375, -0.4763336181640625, -0.44989013671875, -0.4234466552734375, -0.397003173828125, -0.3705596923828125, -0.3441162109375, -0.3176727294921875, -0.291229248046875, -0.2647857666015625, -0.23834228515625, -0.2118988037109375, -0.185455322265625, -0.1590118408203125, -0.132568359375, -0.1061248779296875, -0.079681396484375, -0.0532379150390625, -0.02679443359375, -0.0003509521484375, 0.026092529296875, 0.0525360107421875, 0.0789794921875, 0.1054229736328125, 0.131866455078125, 0.1583099365234375, 0.18475341796875, 0.2111968994140625, 0.237640380859375, 0.2640838623046875, 0.29052734375, 0.3169708251953125, 0.343414306640625, 0.3698577880859375, 0.39630126953125, 0.4227447509765625, 0.449188232421875, 0.4756317138671875, 0.5020751953125, 0.5285186767578125, 0.554962158203125, 0.5814056396484375, 0.60784912109375, 0.6342926025390625, 0.660736083984375, 0.6871795654296875, 0.713623046875, 0.7400665283203125, 0.766510009765625, 0.7929534912109375, 0.81939697265625, 0.8458404541015625, 0.872283935546875, 0.8987274169921875, 0.9251708984375, 0.9516143798828125, 0.978057861328125, 1.0045013427734375, 1.03094482421875, 1.0573883056640625, 1.083831787109375, 1.1102752685546875, 1.13671875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 16.0, 16.0, 28.0, 30.0, 51.0, 67.0, 110.0, 163.0, 225.0, 364.0, 506.0, 859.0, 1360.0, 2054.0, 3743.0, 7524.0, 17184.0, 54924.0, 3519421.0, 509083.0, 45460.0, 15385.0, 6782.0, 3474.0, 1962.0, 1215.0, 746.0, 487.0, 326.0, 242.0, 152.0, 98.0, 74.0, 43.0, 44.0, 28.0, 11.0, 10.0, 8.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08203125, -2.95843505859375, -2.8348388671875, -2.71124267578125, -2.587646484375, -2.46405029296875, -2.3404541015625, -2.21685791015625, -2.09326171875, -1.96966552734375, -1.8460693359375, -1.72247314453125, -1.598876953125, -1.47528076171875, -1.3516845703125, -1.22808837890625, -1.1044921875, -0.98089599609375, -0.8572998046875, -0.73370361328125, -0.610107421875, -0.48651123046875, -0.3629150390625, -0.23931884765625, -0.11572265625, 0.00787353515625, 0.1314697265625, 0.25506591796875, 0.378662109375, 0.50225830078125, 0.6258544921875, 0.74945068359375, 0.873046875, 0.99664306640625, 1.1202392578125, 1.24383544921875, 1.367431640625, 1.49102783203125, 1.6146240234375, 1.73822021484375, 1.86181640625, 1.98541259765625, 2.1090087890625, 2.23260498046875, 2.356201171875, 2.47979736328125, 2.6033935546875, 2.72698974609375, 2.8505859375, 2.97418212890625, 3.0977783203125, 3.22137451171875, 3.344970703125, 3.46856689453125, 3.5921630859375, 3.71575927734375, 3.83935546875, 3.96295166015625, 4.0865478515625, 4.21014404296875, 4.333740234375, 4.45733642578125, 4.5809326171875, 4.70452880859375, 4.828125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 7.0, 8.0, 7.0, 18.0, 15.0, 26.0, 37.0, 85.0, 230.0, 3097.0, 273.0, 102.0, 49.0, 21.0, 31.0, 13.0, 14.0, 5.0, 5.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0322265625, -0.9961090087890625, -0.959991455078125, -0.9238739013671875, -0.88775634765625, -0.8516387939453125, -0.815521240234375, -0.7794036865234375, -0.7432861328125, -0.7071685791015625, -0.671051025390625, -0.6349334716796875, -0.59881591796875, -0.5626983642578125, -0.526580810546875, -0.4904632568359375, -0.454345703125, -0.4182281494140625, -0.382110595703125, -0.3459930419921875, -0.30987548828125, -0.2737579345703125, -0.237640380859375, -0.2015228271484375, -0.1654052734375, -0.1292877197265625, -0.093170166015625, -0.0570526123046875, -0.02093505859375, 0.0151824951171875, 0.051300048828125, 0.0874176025390625, 0.12353515625, 0.1596527099609375, 0.195770263671875, 0.2318878173828125, 0.26800537109375, 0.3041229248046875, 0.340240478515625, 0.3763580322265625, 0.4124755859375, 0.4485931396484375, 0.484710693359375, 0.5208282470703125, 0.55694580078125, 0.5930633544921875, 0.629180908203125, 0.6652984619140625, 0.701416015625, 0.7375335693359375, 0.773651123046875, 0.8097686767578125, 0.84588623046875, 0.8820037841796875, 0.918121337890625, 0.9542388916015625, 0.9903564453125, 1.0264739990234375, 1.062591552734375, 1.0987091064453125, 1.13482666015625, 1.1709442138671875, 1.207061767578125, 1.2431793212890625, 1.279296875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 1.0, 3.0, 4.0, 7.0, 18.0, 29.0, 29.0, 56.0, 90.0, 137.0, 149.0, 137.0, 110.0, 80.0, 66.0, 24.0, 19.0, 22.0, 12.0, 3.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.178412437438965, -3.970205783843994, -3.7619991302490234, -3.5537924766540527, -3.345585823059082, -3.1373791694641113, -2.9291725158691406, -2.72096586227417, -2.512759208679199, -2.3045525550842285, -2.096345901489258, -1.888139247894287, -1.6799325942993164, -1.4717258214950562, -1.2635191679000854, -1.0553125143051147, -0.8471057415008545, -0.6388990879058838, -0.4306924045085907, -0.2224857211112976, -0.014279067516326904, 0.19392764568328857, 0.4021342992782593, 0.61034095287323, 0.8185476064682007, 1.0267542600631714, 1.234960913658142, 1.4431676864624023, 1.651374340057373, 1.8595809936523438, 2.0677876472473145, 2.275994300842285, 2.484200954437256, 2.6924076080322266, 2.9006142616271973, 3.108820915222168, 3.3170275688171387, 3.5252342224121094, 3.73344087600708, 3.941647529602051, 4.1498541831970215, 4.358060836791992, 4.566267490386963, 4.774474143981934, 4.982680797576904, 5.190887451171875, 5.399094104766846, 5.607300758361816, 5.815507888793945, 6.023714542388916, 6.231921195983887, 6.440127849578857, 6.648334503173828, 6.856541156768799, 7.0647478103637695, 7.27295446395874, 7.481161117553711, 7.689367771148682, 7.897574424743652, 8.105781555175781, 8.313987731933594, 8.522194862365723, 8.730401039123535, 8.938608169555664, 9.146814346313477]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 10.0, 13.0, 18.0, 16.0, 19.0, 24.0, 33.0, 31.0, 26.0, 26.0, 48.0, 36.0, 30.0, 36.0, 52.0, 43.0, 41.0, 39.0, 34.0, 39.0, 35.0, 34.0, 43.0, 31.0, 29.0, 34.0, 27.0, 31.0, 22.0, 20.0, 9.0, 10.0, 10.0, 10.0, 5.0, 1.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-3.6049296855926514, -3.502578020095825, -3.400226354598999, -3.297874689102173, -3.1955230236053467, -3.0931713581085205, -2.9908194541931152, -2.888467788696289, -2.786116123199463, -2.6837644577026367, -2.5814127922058105, -2.4790611267089844, -2.376709461212158, -2.274357795715332, -2.172006130218506, -2.0696544647216797, -1.9673027992248535, -1.8649511337280273, -1.7625994682312012, -1.660247802734375, -1.5578961372375488, -1.4555444717407227, -1.353192687034607, -1.2508410215377808, -1.1484893560409546, -1.0461376905441284, -0.9437860250473022, -0.8414342999458313, -0.7390826344490051, -0.636730968952179, -0.534379243850708, -0.43202757835388184, -0.32967591285705566, -0.2273242324590683, -0.12497255206108093, -0.022620856761932373, 0.0797308087348938, 0.18208247423171997, 0.2844341993331909, 0.3867858648300171, 0.48913753032684326, 0.5914891958236694, 0.6938408613204956, 0.7961925864219666, 0.8985442519187927, 1.0008959770202637, 1.1032476425170898, 1.205599308013916, 1.3079509735107422, 1.4103026390075684, 1.5126543045043945, 1.6150059700012207, 1.7173576354980469, 1.819709300994873, 1.9220610857009888, 2.0244126319885254, 2.1267642974853516, 2.2291159629821777, 2.331467628479004, 2.43381929397583, 2.5361709594726562, 2.6385226249694824, 2.7408742904663086, 2.8432259559631348, 2.94557785987854]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 8.0, 14.0, 13.0, 18.0, 41.0, 57.0, 67.0, 91.0, 127.0, 233.0, 332.0, 558.0, 952.0, 1720.0, 3135.0, 6007.0, 12197.0, 26250.0, 57703.0, 126920.0, 241633.0, 270604.0, 160139.0, 74361.0, 33581.0, 15563.0, 7271.0, 3905.0, 2064.0, 1159.0, 633.0, 399.0, 262.0, 173.0, 113.0, 79.0, 50.0, 32.0, 30.0, 15.0, 9.0, 4.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 3.0], "bins": [-1.9404296875, -1.8836212158203125, -1.826812744140625, -1.7700042724609375, -1.71319580078125, -1.6563873291015625, -1.599578857421875, -1.5427703857421875, -1.4859619140625, -1.4291534423828125, -1.372344970703125, -1.3155364990234375, -1.25872802734375, -1.2019195556640625, -1.145111083984375, -1.0883026123046875, -1.031494140625, -0.9746856689453125, -0.917877197265625, -0.8610687255859375, -0.80426025390625, -0.7474517822265625, -0.690643310546875, -0.6338348388671875, -0.5770263671875, -0.5202178955078125, -0.463409423828125, -0.4066009521484375, -0.34979248046875, -0.2929840087890625, -0.236175537109375, -0.1793670654296875, -0.12255859375, -0.0657501220703125, -0.008941650390625, 0.0478668212890625, 0.10467529296875, 0.1614837646484375, 0.218292236328125, 0.2751007080078125, 0.3319091796875, 0.3887176513671875, 0.445526123046875, 0.5023345947265625, 0.55914306640625, 0.6159515380859375, 0.672760009765625, 0.7295684814453125, 0.786376953125, 0.8431854248046875, 0.899993896484375, 0.9568023681640625, 1.01361083984375, 1.0704193115234375, 1.127227783203125, 1.1840362548828125, 1.2408447265625, 1.2976531982421875, 1.354461669921875, 1.4112701416015625, 1.46807861328125, 1.5248870849609375, 1.581695556640625, 1.6385040283203125, 1.6953125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 4.0, 8.0, 9.0, 13.0, 16.0, 21.0, 12.0, 25.0, 31.0, 43.0, 47.0, 49.0, 42.0, 62.0, 66.0, 68.0, 64.0, 67.0, 56.0, 57.0, 42.0, 38.0, 34.0, 23.0, 21.0, 22.0, 22.0, 13.0, 6.0, 6.0, 8.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7900390625, -0.758056640625, -0.72607421875, -0.694091796875, -0.662109375, -0.630126953125, -0.59814453125, -0.566162109375, -0.5341796875, -0.502197265625, -0.47021484375, -0.438232421875, -0.40625, -0.374267578125, -0.34228515625, -0.310302734375, -0.2783203125, -0.246337890625, -0.21435546875, -0.182373046875, -0.150390625, -0.118408203125, -0.08642578125, -0.054443359375, -0.0224609375, 0.009521484375, 0.04150390625, 0.073486328125, 0.10546875, 0.137451171875, 0.16943359375, 0.201416015625, 0.2333984375, 0.265380859375, 0.29736328125, 0.329345703125, 0.361328125, 0.393310546875, 0.42529296875, 0.457275390625, 0.4892578125, 0.521240234375, 0.55322265625, 0.585205078125, 0.6171875, 0.649169921875, 0.68115234375, 0.713134765625, 0.7451171875, 0.777099609375, 0.80908203125, 0.841064453125, 0.873046875, 0.905029296875, 0.93701171875, 0.968994140625, 1.0009765625, 1.032958984375, 1.06494140625, 1.096923828125, 1.12890625, 1.160888671875, 1.19287109375, 1.224853515625, 1.2568359375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 16.0, 15.0, 21.0, 35.0, 71.0, 123.0, 288.0, 687.0, 2061.0, 8697.0, 58974.0, 639457.0, 303170.0, 27640.0, 5041.0, 1366.0, 448.0, 187.0, 120.0, 53.0, 40.0, 16.0, 15.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.70703125, -7.51348876953125, -7.3199462890625, -7.12640380859375, -6.932861328125, -6.73931884765625, -6.5457763671875, -6.35223388671875, -6.15869140625, -5.96514892578125, -5.7716064453125, -5.57806396484375, -5.384521484375, -5.19097900390625, -4.9974365234375, -4.80389404296875, -4.6103515625, -4.41680908203125, -4.2232666015625, -4.02972412109375, -3.836181640625, -3.64263916015625, -3.4490966796875, -3.25555419921875, -3.06201171875, -2.86846923828125, -2.6749267578125, -2.48138427734375, -2.287841796875, -2.09429931640625, -1.9007568359375, -1.70721435546875, -1.513671875, -1.32012939453125, -1.1265869140625, -0.93304443359375, -0.739501953125, -0.54595947265625, -0.3524169921875, -0.15887451171875, 0.03466796875, 0.22821044921875, 0.4217529296875, 0.61529541015625, 0.808837890625, 1.00238037109375, 1.1959228515625, 1.38946533203125, 1.5830078125, 1.77655029296875, 1.9700927734375, 2.16363525390625, 2.357177734375, 2.55072021484375, 2.7442626953125, 2.93780517578125, 3.13134765625, 3.32489013671875, 3.5184326171875, 3.71197509765625, 3.905517578125, 4.09906005859375, 4.2926025390625, 4.48614501953125, 4.6796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 8.0, 7.0, 15.0, 12.0, 12.0, 24.0, 24.0, 24.0, 31.0, 44.0, 58.0, 59.0, 60.0, 61.0, 75.0, 61.0, 48.0, 61.0, 47.0, 43.0, 48.0, 38.0, 25.0, 22.0, 18.0, 15.0, 12.0, 4.0, 12.0, 5.0, 4.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.30078125, -6.1280517578125, -5.955322265625, -5.7825927734375, -5.60986328125, -5.4371337890625, -5.264404296875, -5.0916748046875, -4.9189453125, -4.7462158203125, -4.573486328125, -4.4007568359375, -4.22802734375, -4.0552978515625, -3.882568359375, -3.7098388671875, -3.537109375, -3.3643798828125, -3.191650390625, -3.0189208984375, -2.84619140625, -2.6734619140625, -2.500732421875, -2.3280029296875, -2.1552734375, -1.9825439453125, -1.809814453125, -1.6370849609375, -1.46435546875, -1.2916259765625, -1.118896484375, -0.9461669921875, -0.7734375, -0.6007080078125, -0.427978515625, -0.2552490234375, -0.08251953125, 0.0902099609375, 0.262939453125, 0.4356689453125, 0.6083984375, 0.7811279296875, 0.953857421875, 1.1265869140625, 1.29931640625, 1.4720458984375, 1.644775390625, 1.8175048828125, 1.990234375, 2.1629638671875, 2.335693359375, 2.5084228515625, 2.68115234375, 2.8538818359375, 3.026611328125, 3.1993408203125, 3.3720703125, 3.5447998046875, 3.717529296875, 3.8902587890625, 4.06298828125, 4.2357177734375, 4.408447265625, 4.5811767578125, 4.75390625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 9.0, 6.0, 8.0, 19.0, 34.0, 54.0, 121.0, 181.0, 488.0, 1262.0, 5231.0, 51124.0, 856430.0, 122118.0, 8663.0, 1749.0, 538.0, 239.0, 113.0, 75.0, 32.0, 22.0, 17.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -4.07403564453125, -3.9410400390625, -3.80804443359375, -3.675048828125, -3.54205322265625, -3.4090576171875, -3.27606201171875, -3.14306640625, -3.01007080078125, -2.8770751953125, -2.74407958984375, -2.611083984375, -2.47808837890625, -2.3450927734375, -2.21209716796875, -2.0791015625, -1.94610595703125, -1.8131103515625, -1.68011474609375, -1.547119140625, -1.41412353515625, -1.2811279296875, -1.14813232421875, -1.01513671875, -0.88214111328125, -0.7491455078125, -0.61614990234375, -0.483154296875, -0.35015869140625, -0.2171630859375, -0.08416748046875, 0.048828125, 0.18182373046875, 0.3148193359375, 0.44781494140625, 0.580810546875, 0.71380615234375, 0.8468017578125, 0.97979736328125, 1.11279296875, 1.24578857421875, 1.3787841796875, 1.51177978515625, 1.644775390625, 1.77777099609375, 1.9107666015625, 2.04376220703125, 2.1767578125, 2.30975341796875, 2.4427490234375, 2.57574462890625, 2.708740234375, 2.84173583984375, 2.9747314453125, 3.10772705078125, 3.24072265625, 3.37371826171875, 3.5067138671875, 3.63970947265625, 3.772705078125, 3.90570068359375, 4.0386962890625, 4.17169189453125, 4.3046875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 6.0, 2.0, 1.0, 6.0, 14.0, 9.0, 26.0, 28.0, 40.0, 51.0, 86.0, 119.0, 126.0, 125.0, 111.0, 110.0, 44.0, 38.0, 24.0, 18.0, 10.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.0005655288696289062, -0.0005529113113880157, -0.0005402937531471252, -0.0005276761949062347, -0.0005150586366653442, -0.0005024410784244537, -0.0004898235201835632, -0.00047720596194267273, -0.0004645884037017822, -0.0004519708454608917, -0.0004393532872200012, -0.0004267357289791107, -0.0004141181707382202, -0.0004015006124973297, -0.0003888830542564392, -0.0003762654960155487, -0.0003636479377746582, -0.0003510303795337677, -0.0003384128212928772, -0.0003257952630519867, -0.0003131777048110962, -0.0003005601465702057, -0.0002879425883293152, -0.0002753250300884247, -0.0002627074718475342, -0.0002500899136066437, -0.00023747235536575317, -0.00022485479712486267, -0.00021223723888397217, -0.00019961968064308167, -0.00018700212240219116, -0.00017438456416130066, -0.00016176700592041016, -0.00014914944767951965, -0.00013653188943862915, -0.00012391433119773865, -0.00011129677295684814, -9.867921471595764e-05, -8.606165647506714e-05, -7.344409823417664e-05, -6.082653999328613e-05, -4.820898175239563e-05, -3.559142351150513e-05, -2.2973865270614624e-05, -1.0356307029724121e-05, 2.261251211166382e-06, 1.4878809452056885e-05, 2.7496367692947388e-05, 4.011392593383789e-05, 5.2731484174728394e-05, 6.53490424156189e-05, 7.79666006565094e-05, 9.05841588973999e-05, 0.0001032017171382904, 0.00011581927537918091, 0.0001284368336200714, 0.00014105439186096191, 0.00015367195010185242, 0.00016628950834274292, 0.00017890706658363342, 0.00019152462482452393, 0.00020414218306541443, 0.00021675974130630493, 0.00022937729954719543, 0.00024199485778808594]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 8.0, 14.0, 18.0, 26.0, 45.0, 92.0, 210.0, 480.0, 1962.0, 29210.0, 974053.0, 39279.0, 2181.0, 530.0, 206.0, 107.0, 49.0, 31.0, 20.0, 11.0, 8.0, 5.0, 2.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6640625, -8.4503173828125, -8.236572265625, -8.0228271484375, -7.80908203125, -7.5953369140625, -7.381591796875, -7.1678466796875, -6.9541015625, -6.7403564453125, -6.526611328125, -6.3128662109375, -6.09912109375, -5.8853759765625, -5.671630859375, -5.4578857421875, -5.244140625, -5.0303955078125, -4.816650390625, -4.6029052734375, -4.38916015625, -4.1754150390625, -3.961669921875, -3.7479248046875, -3.5341796875, -3.3204345703125, -3.106689453125, -2.8929443359375, -2.67919921875, -2.4654541015625, -2.251708984375, -2.0379638671875, -1.82421875, -1.6104736328125, -1.396728515625, -1.1829833984375, -0.96923828125, -0.7554931640625, -0.541748046875, -0.3280029296875, -0.1142578125, 0.0994873046875, 0.313232421875, 0.5269775390625, 0.74072265625, 0.9544677734375, 1.168212890625, 1.3819580078125, 1.595703125, 1.8094482421875, 2.023193359375, 2.2369384765625, 2.45068359375, 2.6644287109375, 2.878173828125, 3.0919189453125, 3.3056640625, 3.5194091796875, 3.733154296875, 3.9468994140625, 4.16064453125, 4.3743896484375, 4.588134765625, 4.8018798828125, 5.015625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 9.0, 17.0, 27.0, 69.0, 173.0, 306.0, 235.0, 109.0, 32.0, 21.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.890625, -10.662567138671875, -10.43450927734375, -10.206451416015625, -9.9783935546875, -9.750335693359375, -9.52227783203125, -9.294219970703125, -9.066162109375, -8.838104248046875, -8.61004638671875, -8.381988525390625, -8.1539306640625, -7.925872802734375, -7.69781494140625, -7.469757080078125, -7.24169921875, -7.013641357421875, -6.78558349609375, -6.557525634765625, -6.3294677734375, -6.101409912109375, -5.87335205078125, -5.645294189453125, -5.417236328125, -5.189178466796875, -4.96112060546875, -4.733062744140625, -4.5050048828125, -4.276947021484375, -4.04888916015625, -3.820831298828125, -3.5927734375, -3.364715576171875, -3.13665771484375, -2.908599853515625, -2.6805419921875, -2.452484130859375, -2.22442626953125, -1.996368408203125, -1.768310546875, -1.540252685546875, -1.31219482421875, -1.084136962890625, -0.8560791015625, -0.628021240234375, -0.39996337890625, -0.171905517578125, 0.05615234375, 0.284210205078125, 0.51226806640625, 0.740325927734375, 0.9683837890625, 1.196441650390625, 1.42449951171875, 1.652557373046875, 1.880615234375, 2.108673095703125, 2.33673095703125, 2.564788818359375, 2.7928466796875, 3.020904541015625, 3.24896240234375, 3.477020263671875, 3.705078125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 11.0, 27.0, 116.0, 362.0, 359.0, 121.0, 13.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.034568786621094, -43.15842819213867, -39.282283782958984, -35.40614318847656, -31.530000686645508, -27.653858184814453, -23.77771759033203, -19.901575088500977, -16.025432586669922, -12.149290084838867, -8.273148536682129, -4.397006988525391, -0.5208644866943359, 3.3552780151367188, 7.231418609619141, 11.107561111450195, 14.98370361328125, 18.859846115112305, 22.73598861694336, 26.61212921142578, 30.488271713256836, 34.36441421508789, 38.24055480957031, 42.11669921875, 45.99283981323242, 49.868980407714844, 53.74512481689453, 57.62126541137695, 61.497406005859375, 65.37355041503906, 69.24969482421875, 73.1258316040039, 77.00196838378906, 80.87811279296875, 84.7542495727539, 88.6303939819336, 92.50653839111328, 96.38267517089844, 100.25881958007812, 104.13496398925781, 108.0111083984375, 111.88725280761719, 115.76338958740234, 119.63953399658203, 123.51567840576172, 127.39181518554688, 131.26795959472656, 135.14410400390625, 139.02023315429688, 142.89637756347656, 146.77252197265625, 150.64865112304688, 154.52479553222656, 158.40093994140625, 162.27708435058594, 166.15322875976562, 170.0293731689453, 173.905517578125, 177.7816619873047, 181.65780639648438, 185.533935546875, 189.4100799560547, 193.28622436523438, 197.16236877441406, 201.03851318359375]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 4.0, 2.0, 9.0, 9.0, 17.0, 10.0, 16.0, 22.0, 19.0, 26.0, 29.0, 39.0, 36.0, 52.0, 44.0, 38.0, 60.0, 44.0, 77.0, 55.0, 52.0, 47.0, 37.0, 37.0, 34.0, 30.0, 25.0, 24.0, 21.0, 15.0, 10.0, 8.0, 17.0, 5.0, 5.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.857677459716797, -22.127111434936523, -21.39654541015625, -20.665979385375977, -19.935413360595703, -19.20484733581543, -18.474281311035156, -17.743715286254883, -17.01314926147461, -16.282583236694336, -15.552017211914062, -14.821451187133789, -14.090885162353516, -13.360319137573242, -12.629753112792969, -11.899187088012695, -11.168621063232422, -10.438055038452148, -9.707489013671875, -8.976922988891602, -8.246356964111328, -7.515790939331055, -6.785224914550781, -6.054658889770508, -5.324092864990234, -4.593526840209961, -3.8629608154296875, -3.132394790649414, -2.4018287658691406, -1.6712627410888672, -0.9406967163085938, -0.2101306915283203, 0.5204334259033203, 1.2509994506835938, 1.9815654754638672, 2.7121315002441406, 3.442697525024414, 4.1732635498046875, 4.903829574584961, 5.634395599365234, 6.364961624145508, 7.095527648925781, 7.826093673706055, 8.556659698486328, 9.287225723266602, 10.017791748046875, 10.748357772827148, 11.478923797607422, 12.209489822387695, 12.940055847167969, 13.670621871948242, 14.401187896728516, 15.131753921508789, 15.862319946289062, 16.592885971069336, 17.32345199584961, 18.054018020629883, 18.784584045410156, 19.51515007019043, 20.245716094970703, 20.976282119750977, 21.70684814453125, 22.437414169311523, 23.167980194091797, 23.89854621887207]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 1.0, 2.0, 5.0, 9.0, 16.0, 23.0, 30.0, 58.0, 103.0, 202.0, 397.0, 794.0, 1750.0, 5336.0, 42106.0, 4122099.0, 15591.0, 3337.0, 1195.0, 566.0, 254.0, 163.0, 85.0, 51.0, 31.0, 15.0, 12.0, 13.0, 7.0, 11.0, 2.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.8046875, -8.5322265625, -8.259765625, -7.9873046875, -7.71484375, -7.4423828125, -7.169921875, -6.8974609375, -6.625, -6.3525390625, -6.080078125, -5.8076171875, -5.53515625, -5.2626953125, -4.990234375, -4.7177734375, -4.4453125, -4.1728515625, -3.900390625, -3.6279296875, -3.35546875, -3.0830078125, -2.810546875, -2.5380859375, -2.265625, -1.9931640625, -1.720703125, -1.4482421875, -1.17578125, -0.9033203125, -0.630859375, -0.3583984375, -0.0859375, 0.1865234375, 0.458984375, 0.7314453125, 1.00390625, 1.2763671875, 1.548828125, 1.8212890625, 2.09375, 2.3662109375, 2.638671875, 2.9111328125, 3.18359375, 3.4560546875, 3.728515625, 4.0009765625, 4.2734375, 4.5458984375, 4.818359375, 5.0908203125, 5.36328125, 5.6357421875, 5.908203125, 6.1806640625, 6.453125, 6.7255859375, 6.998046875, 7.2705078125, 7.54296875, 7.8154296875, 8.087890625, 8.3603515625, 8.6328125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 11.0, 18.0, 30.0, 31.0, 39.0, 43.0, 58.0, 72.0, 84.0, 87.0, 87.0, 93.0, 79.0, 54.0, 56.0, 33.0, 25.0, 28.0, 16.0, 12.0, 12.0, 5.0, 6.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1611328125, -1.1131591796875, -1.065185546875, -1.0172119140625, -0.96923828125, -0.9212646484375, -0.873291015625, -0.8253173828125, -0.77734375, -0.7293701171875, -0.681396484375, -0.6334228515625, -0.58544921875, -0.5374755859375, -0.489501953125, -0.4415283203125, -0.3935546875, -0.3455810546875, -0.297607421875, -0.2496337890625, -0.20166015625, -0.1536865234375, -0.105712890625, -0.0577392578125, -0.009765625, 0.0382080078125, 0.086181640625, 0.1341552734375, 0.18212890625, 0.2301025390625, 0.278076171875, 0.3260498046875, 0.3740234375, 0.4219970703125, 0.469970703125, 0.5179443359375, 0.56591796875, 0.6138916015625, 0.661865234375, 0.7098388671875, 0.7578125, 0.8057861328125, 0.853759765625, 0.9017333984375, 0.94970703125, 0.9976806640625, 1.045654296875, 1.0936279296875, 1.1416015625, 1.1895751953125, 1.237548828125, 1.2855224609375, 1.33349609375, 1.3814697265625, 1.429443359375, 1.4774169921875, 1.525390625, 1.5733642578125, 1.621337890625, 1.6693115234375, 1.71728515625, 1.7652587890625, 1.813232421875, 1.8612060546875, 1.9091796875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 4.0, 16.0, 12.0, 25.0, 27.0, 27.0, 76.0, 92.0, 158.0, 273.0, 360.0, 573.0, 1011.0, 1859.0, 3846.0, 9980.0, 48790.0, 4070440.0, 39832.0, 9016.0, 3551.0, 1744.0, 994.0, 514.0, 346.0, 244.0, 141.0, 81.0, 66.0, 55.0, 40.0, 31.0, 13.0, 13.0, 9.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.41015625, -6.17669677734375, -5.9432373046875, -5.70977783203125, -5.476318359375, -5.24285888671875, -5.0093994140625, -4.77593994140625, -4.54248046875, -4.30902099609375, -4.0755615234375, -3.84210205078125, -3.608642578125, -3.37518310546875, -3.1417236328125, -2.90826416015625, -2.6748046875, -2.44134521484375, -2.2078857421875, -1.97442626953125, -1.740966796875, -1.50750732421875, -1.2740478515625, -1.04058837890625, -0.80712890625, -0.57366943359375, -0.3402099609375, -0.10675048828125, 0.126708984375, 0.36016845703125, 0.5936279296875, 0.82708740234375, 1.060546875, 1.29400634765625, 1.5274658203125, 1.76092529296875, 1.994384765625, 2.22784423828125, 2.4613037109375, 2.69476318359375, 2.92822265625, 3.16168212890625, 3.3951416015625, 3.62860107421875, 3.862060546875, 4.09552001953125, 4.3289794921875, 4.56243896484375, 4.7958984375, 5.02935791015625, 5.2628173828125, 5.49627685546875, 5.729736328125, 5.96319580078125, 6.1966552734375, 6.43011474609375, 6.66357421875, 6.89703369140625, 7.1304931640625, 7.36395263671875, 7.597412109375, 7.83087158203125, 8.0643310546875, 8.29779052734375, 8.53125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 12.0, 11.0, 22.0, 37.0, 76.0, 3630.0, 167.0, 52.0, 19.0, 10.0, 6.0, 3.0, 3.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.41796875, -1.3607177734375, -1.303466796875, -1.2462158203125, -1.18896484375, -1.1317138671875, -1.074462890625, -1.0172119140625, -0.9599609375, -0.9027099609375, -0.845458984375, -0.7882080078125, -0.73095703125, -0.6737060546875, -0.616455078125, -0.5592041015625, -0.501953125, -0.4447021484375, -0.387451171875, -0.3302001953125, -0.27294921875, -0.2156982421875, -0.158447265625, -0.1011962890625, -0.0439453125, 0.0133056640625, 0.070556640625, 0.1278076171875, 0.18505859375, 0.2423095703125, 0.299560546875, 0.3568115234375, 0.4140625, 0.4713134765625, 0.528564453125, 0.5858154296875, 0.64306640625, 0.7003173828125, 0.757568359375, 0.8148193359375, 0.8720703125, 0.9293212890625, 0.986572265625, 1.0438232421875, 1.10107421875, 1.1583251953125, 1.215576171875, 1.2728271484375, 1.330078125, 1.3873291015625, 1.444580078125, 1.5018310546875, 1.55908203125, 1.6163330078125, 1.673583984375, 1.7308349609375, 1.7880859375, 1.8453369140625, 1.902587890625, 1.9598388671875, 2.01708984375, 2.0743408203125, 2.131591796875, 2.1888427734375, 2.24609375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 10.0, 15.0, 28.0, 45.0, 84.0, 119.0, 137.0, 148.0, 116.0, 105.0, 55.0, 42.0, 33.0, 20.0, 10.0, 4.0, 8.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.686426162719727, -6.486286640167236, -6.286147117614746, -6.086007118225098, -5.885867595672607, -5.685728073120117, -5.485588550567627, -5.285449028015137, -5.085309028625488, -4.885169506072998, -4.685029983520508, -4.484889984130859, -4.284750461578369, -4.084610939025879, -3.8844714164733887, -3.6843318939208984, -3.484192371368408, -3.284052848815918, -3.0839130878448486, -2.8837735652923584, -2.683633804321289, -2.483494281768799, -2.2833547592163086, -2.0832152366638184, -1.883075475692749, -1.6829358339309692, -1.4827961921691895, -1.2826566696166992, -1.0825170278549194, -0.8823773860931396, -0.6822378635406494, -0.48209822177886963, -0.28195905685424805, -0.08181944489479065, 0.11832016706466675, 0.31845974922180176, 0.5185993909835815, 0.7187390327453613, 0.9188785552978516, 1.1190181970596313, 1.3191578388214111, 1.519297480583191, 1.7194371223449707, 1.919576644897461, 2.119716167449951, 2.3198559284210205, 2.5199954509735107, 2.72013521194458, 2.9202747344970703, 3.1204142570495605, 3.32055401802063, 3.52069354057312, 3.7208333015441895, 3.9209728240966797, 4.12111234664917, 4.32125186920166, 4.521391868591309, 4.721531391143799, 4.921670913696289, 5.1218109130859375, 5.321950435638428, 5.522089958190918, 5.722229480743408, 5.922369003295898, 6.122508525848389]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 7.0, 6.0, 10.0, 17.0, 9.0, 7.0, 18.0, 17.0, 23.0, 20.0, 17.0, 28.0, 33.0, 40.0, 45.0, 39.0, 49.0, 46.0, 40.0, 43.0, 38.0, 40.0, 35.0, 47.0, 51.0, 24.0, 37.0, 30.0, 23.0, 27.0, 19.0, 25.0, 19.0, 19.0, 15.0, 9.0, 7.0, 6.0, 3.0, 2.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.822389602661133, -2.73347806930542, -2.644566297531128, -2.555654764175415, -2.466742992401123, -2.37783145904541, -2.2889199256896973, -2.2000083923339844, -2.1110966205596924, -2.0221850872039795, -1.9332733154296875, -1.8443617820739746, -1.7554501295089722, -1.6665384769439697, -1.5776269435882568, -1.4887152910232544, -1.399803638458252, -1.3108919858932495, -1.221980333328247, -1.1330687999725342, -1.0441571474075317, -0.9552454948425293, -0.8663339018821716, -0.777422308921814, -0.6885106563568115, -0.5995990037918091, -0.5106874108314514, -0.42177578806877136, -0.3328641653060913, -0.24395254254341125, -0.1550409197807312, -0.06612932682037354, 0.022782325744628906, 0.11169394850730896, 0.200605571269989, 0.28951719403266907, 0.3784288167953491, 0.4673404395580292, 0.5562520623207092, 0.6451636552810669, 0.7340753078460693, 0.8229869604110718, 0.9118985533714294, 1.000810146331787, 1.0897217988967896, 1.178633451461792, 1.2675449848175049, 1.3564566373825073, 1.4453682899475098, 1.5342799425125122, 1.6231915950775146, 1.7121031284332275, 1.80101478099823, 1.8899264335632324, 1.9788379669189453, 2.067749500274658, 2.15666127204895, 2.245572805404663, 2.334484577178955, 2.423396110534668, 2.512307643890381, 2.601219415664673, 2.6901309490203857, 2.7790427207946777, 2.8679542541503906]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 3.0, 11.0, 9.0, 8.0, 16.0, 18.0, 40.0, 43.0, 61.0, 108.0, 121.0, 262.0, 409.0, 746.0, 1490.0, 3424.0, 8094.0, 21670.0, 65901.0, 210980.0, 427685.0, 207354.0, 63953.0, 21452.0, 7999.0, 3320.0, 1518.0, 756.0, 433.0, 200.0, 148.0, 93.0, 62.0, 48.0, 35.0, 26.0, 19.0, 11.0, 3.0, 5.0, 6.0, 3.0, 7.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.83984375, -2.749664306640625, -2.65948486328125, -2.569305419921875, -2.4791259765625, -2.388946533203125, -2.29876708984375, -2.208587646484375, -2.118408203125, -2.028228759765625, -1.93804931640625, -1.847869873046875, -1.7576904296875, -1.667510986328125, -1.57733154296875, -1.487152099609375, -1.39697265625, -1.306793212890625, -1.21661376953125, -1.126434326171875, -1.0362548828125, -0.946075439453125, -0.85589599609375, -0.765716552734375, -0.675537109375, -0.585357666015625, -0.49517822265625, -0.404998779296875, -0.3148193359375, -0.224639892578125, -0.13446044921875, -0.044281005859375, 0.0458984375, 0.136077880859375, 0.22625732421875, 0.316436767578125, 0.4066162109375, 0.496795654296875, 0.58697509765625, 0.677154541015625, 0.767333984375, 0.857513427734375, 0.94769287109375, 1.037872314453125, 1.1280517578125, 1.218231201171875, 1.30841064453125, 1.398590087890625, 1.48876953125, 1.578948974609375, 1.66912841796875, 1.759307861328125, 1.8494873046875, 1.939666748046875, 2.02984619140625, 2.120025634765625, 2.210205078125, 2.300384521484375, 2.39056396484375, 2.480743408203125, 2.5709228515625, 2.661102294921875, 2.75128173828125, 2.841461181640625, 2.931640625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 3.0, 10.0, 11.0, 11.0, 18.0, 24.0, 38.0, 42.0, 49.0, 56.0, 65.0, 71.0, 51.0, 71.0, 77.0, 64.0, 52.0, 67.0, 40.0, 40.0, 38.0, 31.0, 15.0, 15.0, 14.0, 6.0, 5.0, 2.0, 3.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3916015625, -1.3461456298828125, -1.300689697265625, -1.2552337646484375, -1.20977783203125, -1.1643218994140625, -1.118865966796875, -1.0734100341796875, -1.0279541015625, -0.9824981689453125, -0.937042236328125, -0.8915863037109375, -0.84613037109375, -0.8006744384765625, -0.755218505859375, -0.7097625732421875, -0.664306640625, -0.6188507080078125, -0.573394775390625, -0.5279388427734375, -0.48248291015625, -0.4370269775390625, -0.391571044921875, -0.3461151123046875, -0.3006591796875, -0.2552032470703125, -0.209747314453125, -0.1642913818359375, -0.11883544921875, -0.0733795166015625, -0.027923583984375, 0.0175323486328125, 0.06298828125, 0.1084442138671875, 0.153900146484375, 0.1993560791015625, 0.24481201171875, 0.2902679443359375, 0.335723876953125, 0.3811798095703125, 0.4266357421875, 0.4720916748046875, 0.517547607421875, 0.5630035400390625, 0.60845947265625, 0.6539154052734375, 0.699371337890625, 0.7448272705078125, 0.790283203125, 0.8357391357421875, 0.881195068359375, 0.9266510009765625, 0.97210693359375, 1.0175628662109375, 1.063018798828125, 1.1084747314453125, 1.1539306640625, 1.1993865966796875, 1.244842529296875, 1.2902984619140625, 1.33575439453125, 1.3812103271484375, 1.426666259765625, 1.4721221923828125, 1.517578125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 6.0, 10.0, 15.0, 22.0, 42.0, 59.0, 92.0, 178.0, 355.0, 670.0, 1750.0, 6183.0, 34155.0, 306668.0, 612162.0, 70813.0, 10818.0, 2679.0, 924.0, 396.0, 215.0, 115.0, 66.0, 47.0, 27.0, 24.0, 21.0, 10.0, 8.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.375, -4.2078857421875, -4.040771484375, -3.8736572265625, -3.70654296875, -3.5394287109375, -3.372314453125, -3.2052001953125, -3.0380859375, -2.8709716796875, -2.703857421875, -2.5367431640625, -2.36962890625, -2.2025146484375, -2.035400390625, -1.8682861328125, -1.701171875, -1.5340576171875, -1.366943359375, -1.1998291015625, -1.03271484375, -0.8656005859375, -0.698486328125, -0.5313720703125, -0.3642578125, -0.1971435546875, -0.030029296875, 0.1370849609375, 0.30419921875, 0.4713134765625, 0.638427734375, 0.8055419921875, 0.97265625, 1.1397705078125, 1.306884765625, 1.4739990234375, 1.64111328125, 1.8082275390625, 1.975341796875, 2.1424560546875, 2.3095703125, 2.4766845703125, 2.643798828125, 2.8109130859375, 2.97802734375, 3.1451416015625, 3.312255859375, 3.4793701171875, 3.646484375, 3.8135986328125, 3.980712890625, 4.1478271484375, 4.31494140625, 4.4820556640625, 4.649169921875, 4.8162841796875, 4.9833984375, 5.1505126953125, 5.317626953125, 5.4847412109375, 5.65185546875, 5.8189697265625, 5.986083984375, 6.1531982421875, 6.3203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 9.0, 12.0, 11.0, 19.0, 14.0, 20.0, 26.0, 25.0, 23.0, 38.0, 33.0, 40.0, 59.0, 50.0, 61.0, 54.0, 58.0, 51.0, 51.0, 52.0, 42.0, 45.0, 50.0, 29.0, 22.0, 20.0, 19.0, 11.0, 9.0, 14.0, 8.0, 5.0, 7.0, 3.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.46875, -5.27874755859375, -5.0887451171875, -4.89874267578125, -4.708740234375, -4.51873779296875, -4.3287353515625, -4.13873291015625, -3.94873046875, -3.75872802734375, -3.5687255859375, -3.37872314453125, -3.188720703125, -2.99871826171875, -2.8087158203125, -2.61871337890625, -2.4287109375, -2.23870849609375, -2.0487060546875, -1.85870361328125, -1.668701171875, -1.47869873046875, -1.2886962890625, -1.09869384765625, -0.90869140625, -0.71868896484375, -0.5286865234375, -0.33868408203125, -0.148681640625, 0.04132080078125, 0.2313232421875, 0.42132568359375, 0.611328125, 0.80133056640625, 0.9913330078125, 1.18133544921875, 1.371337890625, 1.56134033203125, 1.7513427734375, 1.94134521484375, 2.13134765625, 2.32135009765625, 2.5113525390625, 2.70135498046875, 2.891357421875, 3.08135986328125, 3.2713623046875, 3.46136474609375, 3.6513671875, 3.84136962890625, 4.0313720703125, 4.22137451171875, 4.411376953125, 4.60137939453125, 4.7913818359375, 4.98138427734375, 5.17138671875, 5.36138916015625, 5.5513916015625, 5.74139404296875, 5.931396484375, 6.12139892578125, 6.3114013671875, 6.50140380859375, 6.69140625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 11.0, 7.0, 18.0, 22.0, 38.0, 29.0, 68.0, 95.0, 190.0, 307.0, 622.0, 1484.0, 4594.0, 23470.0, 407671.0, 571666.0, 29920.0, 5190.0, 1644.0, 633.0, 315.0, 214.0, 124.0, 70.0, 36.0, 32.0, 23.0, 15.0, 10.0, 9.0, 6.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.923828125, -2.8265380859375, -2.729248046875, -2.6319580078125, -2.53466796875, -2.4373779296875, -2.340087890625, -2.2427978515625, -2.1455078125, -2.0482177734375, -1.950927734375, -1.8536376953125, -1.75634765625, -1.6590576171875, -1.561767578125, -1.4644775390625, -1.3671875, -1.2698974609375, -1.172607421875, -1.0753173828125, -0.97802734375, -0.8807373046875, -0.783447265625, -0.6861572265625, -0.5888671875, -0.4915771484375, -0.394287109375, -0.2969970703125, -0.19970703125, -0.1024169921875, -0.005126953125, 0.0921630859375, 0.189453125, 0.2867431640625, 0.384033203125, 0.4813232421875, 0.57861328125, 0.6759033203125, 0.773193359375, 0.8704833984375, 0.9677734375, 1.0650634765625, 1.162353515625, 1.2596435546875, 1.35693359375, 1.4542236328125, 1.551513671875, 1.6488037109375, 1.74609375, 1.8433837890625, 1.940673828125, 2.0379638671875, 2.13525390625, 2.2325439453125, 2.329833984375, 2.4271240234375, 2.5244140625, 2.6217041015625, 2.718994140625, 2.8162841796875, 2.91357421875, 3.0108642578125, 3.108154296875, 3.2054443359375, 3.302734375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 4.0, 8.0, 13.0, 25.0, 36.0, 52.0, 72.0, 76.0, 127.0, 128.0, 146.0, 115.0, 59.0, 57.0, 38.0, 20.0, 16.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025963783264160156, -0.00024629756808280945, -0.00023295730352401733, -0.00021961703896522522, -0.0002062767744064331, -0.000192936509847641, -0.00017959624528884888, -0.00016625598073005676, -0.00015291571617126465, -0.00013957545161247253, -0.00012623518705368042, -0.0001128949224948883, -9.955465793609619e-05, -8.621439337730408e-05, -7.287412881851196e-05, -5.953386425971985e-05, -4.6193599700927734e-05, -3.285333514213562e-05, -1.9513070583343506e-05, -6.172806024551392e-06, 7.167458534240723e-06, 2.0507723093032837e-05, 3.384798765182495e-05, 4.7188252210617065e-05, 6.052851676940918e-05, 7.38687813282013e-05, 8.720904588699341e-05, 0.00010054931044578552, 0.00011388957500457764, 0.00012722983956336975, 0.00014057010412216187, 0.00015391036868095398, 0.0001672506332397461, 0.0001805908977985382, 0.00019393116235733032, 0.00020727142691612244, 0.00022061169147491455, 0.00023395195603370667, 0.0002472922205924988, 0.0002606324851512909, 0.000273972749710083, 0.0002873130142688751, 0.00030065327882766724, 0.00031399354338645935, 0.00032733380794525146, 0.0003406740725040436, 0.0003540143370628357, 0.0003673546016216278, 0.0003806948661804199, 0.00039403513073921204, 0.00040737539529800415, 0.00042071565985679626, 0.0004340559244155884, 0.0004473961889743805, 0.0004607364535331726, 0.0004740767180919647, 0.00048741698265075684, 0.000500757247209549, 0.0005140975117683411, 0.0005274377763271332, 0.0005407780408859253, 0.0005541183054447174, 0.0005674585700035095, 0.0005807988345623016, 0.0005941390991210938]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 11.0, 5.0, 10.0, 18.0, 17.0, 34.0, 56.0, 99.0, 258.0, 593.0, 1712.0, 6597.0, 59015.0, 884947.0, 84156.0, 7934.0, 1934.0, 659.0, 243.0, 109.0, 54.0, 28.0, 24.0, 12.0, 12.0, 3.0, 5.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.140625, -4.0093994140625, -3.878173828125, -3.7469482421875, -3.61572265625, -3.4844970703125, -3.353271484375, -3.2220458984375, -3.0908203125, -2.9595947265625, -2.828369140625, -2.6971435546875, -2.56591796875, -2.4346923828125, -2.303466796875, -2.1722412109375, -2.041015625, -1.9097900390625, -1.778564453125, -1.6473388671875, -1.51611328125, -1.3848876953125, -1.253662109375, -1.1224365234375, -0.9912109375, -0.8599853515625, -0.728759765625, -0.5975341796875, -0.46630859375, -0.3350830078125, -0.203857421875, -0.0726318359375, 0.05859375, 0.1898193359375, 0.321044921875, 0.4522705078125, 0.58349609375, 0.7147216796875, 0.845947265625, 0.9771728515625, 1.1083984375, 1.2396240234375, 1.370849609375, 1.5020751953125, 1.63330078125, 1.7645263671875, 1.895751953125, 2.0269775390625, 2.158203125, 2.2894287109375, 2.420654296875, 2.5518798828125, 2.68310546875, 2.8143310546875, 2.945556640625, 3.0767822265625, 3.2080078125, 3.3392333984375, 3.470458984375, 3.6016845703125, 3.73291015625, 3.8641357421875, 3.995361328125, 4.1265869140625, 4.2578125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 11.0, 18.0, 26.0, 34.0, 53.0, 73.0, 94.0, 116.0, 116.0, 109.0, 72.0, 80.0, 54.0, 38.0, 23.0, 13.0, 14.0, 4.0, 6.0, 5.0, 5.0, 7.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.365234375, -2.275848388671875, -2.18646240234375, -2.097076416015625, -2.0076904296875, -1.918304443359375, -1.82891845703125, -1.739532470703125, -1.650146484375, -1.560760498046875, -1.47137451171875, -1.381988525390625, -1.2926025390625, -1.203216552734375, -1.11383056640625, -1.024444580078125, -0.93505859375, -0.845672607421875, -0.75628662109375, -0.666900634765625, -0.5775146484375, -0.488128662109375, -0.39874267578125, -0.309356689453125, -0.219970703125, -0.130584716796875, -0.04119873046875, 0.048187255859375, 0.1375732421875, 0.226959228515625, 0.31634521484375, 0.405731201171875, 0.4951171875, 0.584503173828125, 0.67388916015625, 0.763275146484375, 0.8526611328125, 0.942047119140625, 1.03143310546875, 1.120819091796875, 1.210205078125, 1.299591064453125, 1.38897705078125, 1.478363037109375, 1.5677490234375, 1.657135009765625, 1.74652099609375, 1.835906982421875, 1.92529296875, 2.014678955078125, 2.10406494140625, 2.193450927734375, 2.2828369140625, 2.372222900390625, 2.46160888671875, 2.550994873046875, 2.640380859375, 2.729766845703125, 2.81915283203125, 2.908538818359375, 2.9979248046875, 3.087310791015625, 3.17669677734375, 3.266082763671875, 3.35546875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 11.0, 100.0, 370.0, 407.0, 93.0, 25.0, 3.0, 1.0, 1.0, 1.0], "bins": [-240.26705932617188, -236.05662536621094, -231.84619140625, -227.63575744628906, -223.42532348632812, -219.21487426757812, -215.00445556640625, -210.79400634765625, -206.5835723876953, -202.37313842773438, -198.16270446777344, -193.9522705078125, -189.74183654785156, -185.53140258789062, -181.32095336914062, -177.1105194091797, -172.90008544921875, -168.6896514892578, -164.47921752929688, -160.26878356933594, -156.058349609375, -151.847900390625, -147.63748168945312, -143.42703247070312, -139.21661376953125, -135.0061798095703, -130.79574584960938, -126.58531188964844, -122.37487030029297, -118.16443634033203, -113.9540023803711, -109.74356842041016, -105.53313446044922, -101.32270050048828, -97.11226654052734, -92.90182495117188, -88.69139099121094, -84.48095703125, -80.27052307128906, -76.06008911132812, -71.84964752197266, -67.63921356201172, -63.428775787353516, -59.21834182739258, -55.007904052734375, -50.79747009277344, -46.5870361328125, -42.37660217285156, -38.166168212890625, -33.95573425292969, -29.745296478271484, -25.534862518310547, -21.324426651000977, -17.113990783691406, -12.903556823730469, -8.693120956420898, -4.482683181762695, -0.2722477912902832, 3.938187599182129, 8.148622512817383, 12.359058380126953, 16.569494247436523, 20.77992820739746, 24.99036407470703, 29.2007999420166]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 4.0, 2.0, 6.0, 7.0, 12.0, 17.0, 14.0, 24.0, 28.0, 34.0, 47.0, 54.0, 43.0, 59.0, 46.0, 89.0, 60.0, 71.0, 51.0, 51.0, 57.0, 50.0, 44.0, 26.0, 20.0, 24.0, 19.0, 13.0, 10.0, 6.0, 2.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.46742248535156, -37.43059539794922, -36.393768310546875, -35.35694122314453, -34.32011413574219, -33.28328323364258, -32.246456146240234, -31.20962905883789, -30.172801971435547, -29.135974884033203, -28.09914779663086, -27.062318801879883, -26.02549171447754, -24.988664627075195, -23.95183563232422, -22.915008544921875, -21.87818145751953, -20.841354370117188, -19.804527282714844, -18.767698287963867, -17.730871200561523, -16.69404411315918, -15.65721607208252, -14.62038803100586, -13.583560943603516, -12.546733856201172, -11.509905815124512, -10.473077774047852, -9.436250686645508, -8.399423599243164, -7.362595558166504, -6.325767993927002, -5.288944244384766, -4.252116680145264, -3.2152891159057617, -2.1784615516662598, -1.1416339874267578, -0.10480642318725586, 0.9320211410522461, 1.968848705291748, 3.00567626953125, 4.042503833770752, 5.079331398010254, 6.116158962249756, 7.152986526489258, 8.189813613891602, 9.226641654968262, 10.263469696044922, 11.300296783447266, 12.33712387084961, 13.37395191192627, 14.41077995300293, 15.447607040405273, 16.484434127807617, 17.521263122558594, 18.558090209960938, 19.59491729736328, 20.631744384765625, 21.66857147216797, 22.705400466918945, 23.74222755432129, 24.779054641723633, 25.81588363647461, 26.852710723876953, 27.889537811279297]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 13.0, 6.0, 18.0, 26.0, 37.0, 57.0, 86.0, 155.0, 243.0, 516.0, 1195.0, 2982.0, 9567.0, 95161.0, 4050680.0, 25130.0, 5237.0, 1707.0, 698.0, 349.0, 163.0, 89.0, 59.0, 44.0, 21.0, 10.0, 10.0, 6.0, 4.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.0, -4.80206298828125, -4.6041259765625, -4.40618896484375, -4.208251953125, -4.01031494140625, -3.8123779296875, -3.61444091796875, -3.41650390625, -3.21856689453125, -3.0206298828125, -2.82269287109375, -2.624755859375, -2.42681884765625, -2.2288818359375, -2.03094482421875, -1.8330078125, -1.63507080078125, -1.4371337890625, -1.23919677734375, -1.041259765625, -0.84332275390625, -0.6453857421875, -0.44744873046875, -0.24951171875, -0.05157470703125, 0.1463623046875, 0.34429931640625, 0.542236328125, 0.74017333984375, 0.9381103515625, 1.13604736328125, 1.333984375, 1.53192138671875, 1.7298583984375, 1.92779541015625, 2.125732421875, 2.32366943359375, 2.5216064453125, 2.71954345703125, 2.91748046875, 3.11541748046875, 3.3133544921875, 3.51129150390625, 3.709228515625, 3.90716552734375, 4.1051025390625, 4.30303955078125, 4.5009765625, 4.69891357421875, 4.8968505859375, 5.09478759765625, 5.292724609375, 5.49066162109375, 5.6885986328125, 5.88653564453125, 6.08447265625, 6.28240966796875, 6.4803466796875, 6.67828369140625, 6.876220703125, 7.07415771484375, 7.2720947265625, 7.47003173828125, 7.66796875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 5.0, 8.0, 9.0, 24.0, 38.0, 49.0, 61.0, 71.0, 101.0, 99.0, 121.0, 110.0, 84.0, 69.0, 48.0, 37.0, 20.0, 11.0, 11.0, 6.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.416015625, -2.3471832275390625, -2.278350830078125, -2.2095184326171875, -2.14068603515625, -2.0718536376953125, -2.003021240234375, -1.9341888427734375, -1.8653564453125, -1.7965240478515625, -1.727691650390625, -1.6588592529296875, -1.59002685546875, -1.5211944580078125, -1.452362060546875, -1.3835296630859375, -1.314697265625, -1.2458648681640625, -1.177032470703125, -1.1082000732421875, -1.03936767578125, -0.9705352783203125, -0.901702880859375, -0.8328704833984375, -0.7640380859375, -0.6952056884765625, -0.626373291015625, -0.5575408935546875, -0.48870849609375, -0.4198760986328125, -0.351043701171875, -0.2822113037109375, -0.21337890625, -0.1445465087890625, -0.075714111328125, -0.0068817138671875, 0.06195068359375, 0.1307830810546875, 0.199615478515625, 0.2684478759765625, 0.3372802734375, 0.4061126708984375, 0.474945068359375, 0.5437774658203125, 0.61260986328125, 0.6814422607421875, 0.750274658203125, 0.8191070556640625, 0.887939453125, 0.9567718505859375, 1.025604248046875, 1.0944366455078125, 1.16326904296875, 1.2321014404296875, 1.300933837890625, 1.3697662353515625, 1.4385986328125, 1.5074310302734375, 1.576263427734375, 1.6450958251953125, 1.71392822265625, 1.7827606201171875, 1.851593017578125, 1.9204254150390625, 1.9892578125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 16.0, 20.0, 31.0, 30.0, 50.0, 53.0, 90.0, 120.0, 197.0, 284.0, 478.0, 789.0, 1373.0, 2659.0, 6049.0, 16002.0, 63934.0, 3877381.0, 179110.0, 28108.0, 9113.0, 3822.0, 1893.0, 1012.0, 563.0, 346.0, 241.0, 167.0, 115.0, 67.0, 41.0, 40.0, 23.0, 17.0, 13.0, 12.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.5, -3.36395263671875, -3.2279052734375, -3.09185791015625, -2.955810546875, -2.81976318359375, -2.6837158203125, -2.54766845703125, -2.41162109375, -2.27557373046875, -2.1395263671875, -2.00347900390625, -1.867431640625, -1.73138427734375, -1.5953369140625, -1.45928955078125, -1.3232421875, -1.18719482421875, -1.0511474609375, -0.91510009765625, -0.779052734375, -0.64300537109375, -0.5069580078125, -0.37091064453125, -0.23486328125, -0.09881591796875, 0.0372314453125, 0.17327880859375, 0.309326171875, 0.44537353515625, 0.5814208984375, 0.71746826171875, 0.853515625, 0.98956298828125, 1.1256103515625, 1.26165771484375, 1.397705078125, 1.53375244140625, 1.6697998046875, 1.80584716796875, 1.94189453125, 2.07794189453125, 2.2139892578125, 2.35003662109375, 2.486083984375, 2.62213134765625, 2.7581787109375, 2.89422607421875, 3.0302734375, 3.16632080078125, 3.3023681640625, 3.43841552734375, 3.574462890625, 3.71051025390625, 3.8465576171875, 3.98260498046875, 4.11865234375, 4.25469970703125, 4.3907470703125, 4.52679443359375, 4.662841796875, 4.79888916015625, 4.9349365234375, 5.07098388671875, 5.20703125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 9.0, 10.0, 5.0, 18.0, 23.0, 35.0, 53.0, 96.0, 252.0, 3183.0, 170.0, 63.0, 41.0, 32.0, 21.0, 14.0, 8.0, 8.0, 5.0, 6.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.841796875, -1.779144287109375, -1.71649169921875, -1.653839111328125, -1.5911865234375, -1.528533935546875, -1.46588134765625, -1.403228759765625, -1.340576171875, -1.277923583984375, -1.21527099609375, -1.152618408203125, -1.0899658203125, -1.027313232421875, -0.96466064453125, -0.902008056640625, -0.83935546875, -0.776702880859375, -0.71405029296875, -0.651397705078125, -0.5887451171875, -0.526092529296875, -0.46343994140625, -0.400787353515625, -0.338134765625, -0.275482177734375, -0.21282958984375, -0.150177001953125, -0.0875244140625, -0.024871826171875, 0.03778076171875, 0.100433349609375, 0.1630859375, 0.225738525390625, 0.28839111328125, 0.351043701171875, 0.4136962890625, 0.476348876953125, 0.53900146484375, 0.601654052734375, 0.664306640625, 0.726959228515625, 0.78961181640625, 0.852264404296875, 0.9149169921875, 0.977569580078125, 1.04022216796875, 1.102874755859375, 1.16552734375, 1.228179931640625, 1.29083251953125, 1.353485107421875, 1.4161376953125, 1.478790283203125, 1.54144287109375, 1.604095458984375, 1.666748046875, 1.729400634765625, 1.79205322265625, 1.854705810546875, 1.9173583984375, 1.980010986328125, 2.04266357421875, 2.105316162109375, 2.16796875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 8.0, 4.0, 17.0, 25.0, 67.0, 126.0, 199.0, 229.0, 166.0, 94.0, 39.0, 15.0, 8.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.184077262878418, -13.732525825500488, -13.280973434448242, -12.829421997070312, -12.377870559692383, -11.926318168640137, -11.474766731262207, -11.023214340209961, -10.571662902832031, -10.120111465454102, -9.668559074401855, -9.217007637023926, -8.76545524597168, -8.31390380859375, -7.86235237121582, -7.410800457000732, -6.9592485427856445, -6.507696628570557, -6.056144714355469, -5.604593276977539, -5.153041362762451, -4.701489448547363, -4.249938011169434, -3.7983860969543457, -3.346834182739258, -2.89528226852417, -2.443730592727661, -1.9921787977218628, -1.5406270027160645, -1.0890750885009766, -0.6375234127044678, -0.18597173690795898, 0.2655811309814453, 0.7171329259872437, 1.168684720993042, 1.6202365159988403, 2.0717883110046387, 2.5233402252197266, 2.9748919010162354, 3.426443576812744, 3.877995491027832, 4.32954740524292, 4.781099319458008, 5.2326507568359375, 5.684202671051025, 6.135754585266113, 6.587306022644043, 7.038857936859131, 7.490409851074219, 7.941961765289307, 8.393513679504395, 8.845065116882324, 9.29661750793457, 9.7481689453125, 10.19972038269043, 10.65127182006836, 11.102824211120605, 11.554375648498535, 12.005928039550781, 12.457479476928711, 12.90903091430664, 13.360583305358887, 13.812134742736816, 14.263687133789062, 14.715238571166992]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 5.0, 8.0, 10.0, 6.0, 15.0, 21.0, 25.0, 25.0, 26.0, 27.0, 39.0, 36.0, 37.0, 33.0, 35.0, 46.0, 55.0, 46.0, 48.0, 38.0, 34.0, 48.0, 41.0, 32.0, 46.0, 39.0, 24.0, 28.0, 22.0, 18.0, 19.0, 11.0, 14.0, 13.0, 5.0, 5.0, 8.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.659075736999512, -4.512619972229004, -4.366164207458496, -4.219708442687988, -4.0732526779174805, -3.9267966747283936, -3.7803406715393066, -3.633884906768799, -3.487429141998291, -3.340973377227783, -3.1945176124572754, -3.0480616092681885, -2.9016058444976807, -2.755150079727173, -2.608694076538086, -2.462238311767578, -2.3157825469970703, -2.1693267822265625, -2.0228710174560547, -1.8764150142669678, -1.72995924949646, -1.5835034847259521, -1.4370476007461548, -1.2905917167663574, -1.1441359519958496, -0.997680127620697, -0.8512243032455444, -0.7047684788703918, -0.5583126544952393, -0.41185683012008667, -0.2654010057449341, -0.11894512176513672, 0.027510643005371094, 0.17396646738052368, 0.32042229175567627, 0.46687811613082886, 0.6133339405059814, 0.759789764881134, 0.9062455892562866, 1.052701473236084, 1.1991572380065918, 1.3456130027770996, 1.492068886756897, 1.6385247707366943, 1.7849805355072021, 1.93143630027771, 2.077892303466797, 2.2243480682373047, 2.3708038330078125, 2.5172595977783203, 2.663715362548828, 2.810171365737915, 2.956627130508423, 3.1030828952789307, 3.2495388984680176, 3.3959946632385254, 3.542450428009033, 3.688906192779541, 3.835361957550049, 3.9818179607391357, 4.128273963928223, 4.2747297286987305, 4.421185493469238, 4.567641258239746, 4.714097023010254]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 9.0, 12.0, 31.0, 72.0, 120.0, 332.0, 984.0, 3573.0, 21613.0, 241951.0, 680691.0, 86226.0, 9810.0, 2085.0, 603.0, 213.0, 114.0, 47.0, 30.0, 17.0, 7.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.86328125, -7.657958984375, -7.45263671875, -7.247314453125, -7.0419921875, -6.836669921875, -6.63134765625, -6.426025390625, -6.220703125, -6.015380859375, -5.81005859375, -5.604736328125, -5.3994140625, -5.194091796875, -4.98876953125, -4.783447265625, -4.578125, -4.372802734375, -4.16748046875, -3.962158203125, -3.7568359375, -3.551513671875, -3.34619140625, -3.140869140625, -2.935546875, -2.730224609375, -2.52490234375, -2.319580078125, -2.1142578125, -1.908935546875, -1.70361328125, -1.498291015625, -1.29296875, -1.087646484375, -0.88232421875, -0.677001953125, -0.4716796875, -0.266357421875, -0.06103515625, 0.144287109375, 0.349609375, 0.554931640625, 0.76025390625, 0.965576171875, 1.1708984375, 1.376220703125, 1.58154296875, 1.786865234375, 1.9921875, 2.197509765625, 2.40283203125, 2.608154296875, 2.8134765625, 3.018798828125, 3.22412109375, 3.429443359375, 3.634765625, 3.840087890625, 4.04541015625, 4.250732421875, 4.4560546875, 4.661376953125, 4.86669921875, 5.072021484375, 5.27734375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 3.0, 9.0, 15.0, 13.0, 36.0, 41.0, 56.0, 76.0, 93.0, 97.0, 110.0, 102.0, 98.0, 75.0, 56.0, 37.0, 22.0, 19.0, 19.0, 8.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.62109375, -2.5492401123046875, -2.477386474609375, -2.4055328369140625, -2.33367919921875, -2.2618255615234375, -2.189971923828125, -2.1181182861328125, -2.0462646484375, -1.9744110107421875, -1.902557373046875, -1.8307037353515625, -1.75885009765625, -1.6869964599609375, -1.615142822265625, -1.5432891845703125, -1.471435546875, -1.3995819091796875, -1.327728271484375, -1.2558746337890625, -1.18402099609375, -1.1121673583984375, -1.040313720703125, -0.9684600830078125, -0.8966064453125, -0.8247528076171875, -0.752899169921875, -0.6810455322265625, -0.60919189453125, -0.5373382568359375, -0.465484619140625, -0.3936309814453125, -0.32177734375, -0.2499237060546875, -0.178070068359375, -0.1062164306640625, -0.03436279296875, 0.0374908447265625, 0.109344482421875, 0.1811981201171875, 0.2530517578125, 0.3249053955078125, 0.396759033203125, 0.4686126708984375, 0.54046630859375, 0.6123199462890625, 0.684173583984375, 0.7560272216796875, 0.827880859375, 0.8997344970703125, 0.971588134765625, 1.0434417724609375, 1.11529541015625, 1.1871490478515625, 1.259002685546875, 1.3308563232421875, 1.4027099609375, 1.4745635986328125, 1.546417236328125, 1.6182708740234375, 1.69012451171875, 1.7619781494140625, 1.833831787109375, 1.9056854248046875, 1.9775390625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 3.0, 8.0, 5.0, 8.0, 19.0, 23.0, 27.0, 48.0, 82.0, 118.0, 174.0, 335.0, 621.0, 1312.0, 3346.0, 10667.0, 49647.0, 328849.0, 538967.0, 89430.0, 16803.0, 4545.0, 1697.0, 762.0, 404.0, 240.0, 129.0, 89.0, 54.0, 48.0, 35.0, 19.0, 15.0, 6.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.90625, -4.77056884765625, -4.6348876953125, -4.49920654296875, -4.363525390625, -4.22784423828125, -4.0921630859375, -3.95648193359375, -3.82080078125, -3.68511962890625, -3.5494384765625, -3.41375732421875, -3.278076171875, -3.14239501953125, -3.0067138671875, -2.87103271484375, -2.7353515625, -2.59967041015625, -2.4639892578125, -2.32830810546875, -2.192626953125, -2.05694580078125, -1.9212646484375, -1.78558349609375, -1.64990234375, -1.51422119140625, -1.3785400390625, -1.24285888671875, -1.107177734375, -0.97149658203125, -0.8358154296875, -0.70013427734375, -0.564453125, -0.42877197265625, -0.2930908203125, -0.15740966796875, -0.021728515625, 0.11395263671875, 0.2496337890625, 0.38531494140625, 0.52099609375, 0.65667724609375, 0.7923583984375, 0.92803955078125, 1.063720703125, 1.19940185546875, 1.3350830078125, 1.47076416015625, 1.6064453125, 1.74212646484375, 1.8778076171875, 2.01348876953125, 2.149169921875, 2.28485107421875, 2.4205322265625, 2.55621337890625, 2.69189453125, 2.82757568359375, 2.9632568359375, 3.09893798828125, 3.234619140625, 3.37030029296875, 3.5059814453125, 3.64166259765625, 3.77734375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 7.0, 9.0, 6.0, 9.0, 11.0, 10.0, 17.0, 13.0, 27.0, 24.0, 34.0, 29.0, 39.0, 45.0, 54.0, 42.0, 56.0, 55.0, 48.0, 59.0, 46.0, 57.0, 42.0, 45.0, 34.0, 30.0, 24.0, 22.0, 16.0, 10.0, 17.0, 22.0, 11.0, 6.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.65625, -5.4912109375, -5.326171875, -5.1611328125, -4.99609375, -4.8310546875, -4.666015625, -4.5009765625, -4.3359375, -4.1708984375, -4.005859375, -3.8408203125, -3.67578125, -3.5107421875, -3.345703125, -3.1806640625, -3.015625, -2.8505859375, -2.685546875, -2.5205078125, -2.35546875, -2.1904296875, -2.025390625, -1.8603515625, -1.6953125, -1.5302734375, -1.365234375, -1.2001953125, -1.03515625, -0.8701171875, -0.705078125, -0.5400390625, -0.375, -0.2099609375, -0.044921875, 0.1201171875, 0.28515625, 0.4501953125, 0.615234375, 0.7802734375, 0.9453125, 1.1103515625, 1.275390625, 1.4404296875, 1.60546875, 1.7705078125, 1.935546875, 2.1005859375, 2.265625, 2.4306640625, 2.595703125, 2.7607421875, 2.92578125, 3.0908203125, 3.255859375, 3.4208984375, 3.5859375, 3.7509765625, 3.916015625, 4.0810546875, 4.24609375, 4.4111328125, 4.576171875, 4.7412109375, 4.90625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 9.0, 9.0, 10.0, 22.0, 19.0, 28.0, 92.0, 175.0, 413.0, 989.0, 4112.0, 30756.0, 665431.0, 325858.0, 16437.0, 2750.0, 779.0, 325.0, 142.0, 60.0, 56.0, 28.0, 16.0, 12.0, 5.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.71484375, -2.6450042724609375, -2.575164794921875, -2.5053253173828125, -2.43548583984375, -2.3656463623046875, -2.295806884765625, -2.2259674072265625, -2.1561279296875, -2.0862884521484375, -2.016448974609375, -1.9466094970703125, -1.87677001953125, -1.8069305419921875, -1.737091064453125, -1.6672515869140625, -1.597412109375, -1.5275726318359375, -1.457733154296875, -1.3878936767578125, -1.31805419921875, -1.2482147216796875, -1.178375244140625, -1.1085357666015625, -1.0386962890625, -0.9688568115234375, -0.899017333984375, -0.8291778564453125, -0.75933837890625, -0.6894989013671875, -0.619659423828125, -0.5498199462890625, -0.47998046875, -0.4101409912109375, -0.340301513671875, -0.2704620361328125, -0.20062255859375, -0.1307830810546875, -0.060943603515625, 0.0088958740234375, 0.0787353515625, 0.1485748291015625, 0.218414306640625, 0.2882537841796875, 0.35809326171875, 0.4279327392578125, 0.497772216796875, 0.5676116943359375, 0.637451171875, 0.7072906494140625, 0.777130126953125, 0.8469696044921875, 0.91680908203125, 0.9866485595703125, 1.056488037109375, 1.1263275146484375, 1.1961669921875, 1.2660064697265625, 1.335845947265625, 1.4056854248046875, 1.47552490234375, 1.5453643798828125, 1.615203857421875, 1.6850433349609375, 1.7548828125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 10.0, 5.0, 8.0, 12.0, 8.0, 17.0, 24.0, 25.0, 30.0, 31.0, 37.0, 58.0, 72.0, 56.0, 74.0, 78.0, 96.0, 71.0, 77.0, 48.0, 37.0, 37.0, 24.0, 9.0, 8.0, 15.0, 6.0, 7.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002162456512451172, -0.00020909495651721954, -0.0002019442617893219, -0.00019479356706142426, -0.0001876428723335266, -0.00018049217760562897, -0.00017334148287773132, -0.00016619078814983368, -0.00015904009342193604, -0.0001518893986940384, -0.00014473870396614075, -0.0001375880092382431, -0.00013043731451034546, -0.00012328661978244781, -0.00011613592505455017, -0.00010898523032665253, -0.00010183453559875488, -9.468384087085724e-05, -8.75331461429596e-05, -8.038245141506195e-05, -7.32317566871643e-05, -6.608106195926666e-05, -5.893036723136902e-05, -5.1779672503471375e-05, -4.462897777557373e-05, -3.7478283047676086e-05, -3.0327588319778442e-05, -2.31768935918808e-05, -1.6026198863983154e-05, -8.87550413608551e-06, -1.7248094081878662e-06, 5.425885319709778e-06, 1.2576580047607422e-05, 1.9727274775505066e-05, 2.687796950340271e-05, 3.4028664231300354e-05, 4.1179358959198e-05, 4.833005368709564e-05, 5.5480748414993286e-05, 6.263144314289093e-05, 6.978213787078857e-05, 7.693283259868622e-05, 8.408352732658386e-05, 9.12342220544815e-05, 9.838491678237915e-05, 0.0001055356115102768, 0.00011268630623817444, 0.00011983700096607208, 0.00012698769569396973, 0.00013413839042186737, 0.00014128908514976501, 0.00014843977987766266, 0.0001555904746055603, 0.00016274116933345795, 0.0001698918640613556, 0.00017704255878925323, 0.00018419325351715088, 0.00019134394824504852, 0.00019849464297294617, 0.0002056453377008438, 0.00021279603242874146, 0.0002199467271566391, 0.00022709742188453674, 0.0002342481166124344, 0.00024139881134033203]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 12.0, 10.0, 22.0, 46.0, 55.0, 145.0, 282.0, 623.0, 1870.0, 9430.0, 177368.0, 811795.0, 40487.0, 4369.0, 1161.0, 422.0, 210.0, 95.0, 49.0, 33.0, 19.0, 24.0, 6.0, 0.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.328125, -2.245819091796875, -2.16351318359375, -2.081207275390625, -1.9989013671875, -1.916595458984375, -1.83428955078125, -1.751983642578125, -1.669677734375, -1.587371826171875, -1.50506591796875, -1.422760009765625, -1.3404541015625, -1.258148193359375, -1.17584228515625, -1.093536376953125, -1.01123046875, -0.928924560546875, -0.84661865234375, -0.764312744140625, -0.6820068359375, -0.599700927734375, -0.51739501953125, -0.435089111328125, -0.352783203125, -0.270477294921875, -0.18817138671875, -0.105865478515625, -0.0235595703125, 0.058746337890625, 0.14105224609375, 0.223358154296875, 0.3056640625, 0.387969970703125, 0.47027587890625, 0.552581787109375, 0.6348876953125, 0.717193603515625, 0.79949951171875, 0.881805419921875, 0.964111328125, 1.046417236328125, 1.12872314453125, 1.211029052734375, 1.2933349609375, 1.375640869140625, 1.45794677734375, 1.540252685546875, 1.62255859375, 1.704864501953125, 1.78717041015625, 1.869476318359375, 1.9517822265625, 2.034088134765625, 2.11639404296875, 2.198699951171875, 2.281005859375, 2.363311767578125, 2.44561767578125, 2.527923583984375, 2.6102294921875, 2.692535400390625, 2.77484130859375, 2.857147216796875, 2.939453125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 11.0, 15.0, 19.0, 34.0, 36.0, 51.0, 67.0, 71.0, 90.0, 88.0, 101.0, 85.0, 71.0, 68.0, 49.0, 44.0, 25.0, 21.0, 16.0, 9.0, 13.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0380859375, -0.9887847900390625, -0.939483642578125, -0.8901824951171875, -0.84088134765625, -0.7915802001953125, -0.742279052734375, -0.6929779052734375, -0.6436767578125, -0.5943756103515625, -0.545074462890625, -0.4957733154296875, -0.44647216796875, -0.3971710205078125, -0.347869873046875, -0.2985687255859375, -0.249267578125, -0.1999664306640625, -0.150665283203125, -0.1013641357421875, -0.05206298828125, -0.0027618408203125, 0.046539306640625, 0.0958404541015625, 0.1451416015625, 0.1944427490234375, 0.243743896484375, 0.2930450439453125, 0.34234619140625, 0.3916473388671875, 0.440948486328125, 0.4902496337890625, 0.53955078125, 0.5888519287109375, 0.638153076171875, 0.6874542236328125, 0.73675537109375, 0.7860565185546875, 0.835357666015625, 0.8846588134765625, 0.9339599609375, 0.9832611083984375, 1.032562255859375, 1.0818634033203125, 1.13116455078125, 1.1804656982421875, 1.229766845703125, 1.2790679931640625, 1.328369140625, 1.3776702880859375, 1.426971435546875, 1.4762725830078125, 1.52557373046875, 1.5748748779296875, 1.624176025390625, 1.6734771728515625, 1.7227783203125, 1.7720794677734375, 1.821380615234375, 1.8706817626953125, 1.91998291015625, 1.9692840576171875, 2.018585205078125, 2.0678863525390625, 2.1171875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 8.0, 13.0, 27.0, 71.0, 132.0, 197.0, 243.0, 166.0, 77.0, 45.0, 16.0, 10.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.57719802856445, -38.83559799194336, -37.09400177001953, -35.35240173339844, -33.610801696777344, -31.869205474853516, -30.127605438232422, -28.38600730895996, -26.6444091796875, -24.90281105041504, -23.161212921142578, -21.419612884521484, -19.678014755249023, -17.936416625976562, -16.19481658935547, -14.453218460083008, -12.711620330810547, -10.970022201538086, -9.228423118591309, -7.4868245124816895, -5.74522590637207, -4.003627777099609, -2.262028694152832, -0.5204296112060547, 1.2211685180664062, 2.9627671241760254, 4.7043657302856445, 6.445964336395264, 8.187562942504883, 9.929161071777344, 11.670760154724121, 13.412359237670898, 15.153953552246094, 16.895551681518555, 18.637149810791016, 20.37874984741211, 22.12034797668457, 23.86194610595703, 25.603546142578125, 27.345144271850586, 29.086742401123047, 30.828340530395508, 32.56993865966797, 34.31153869628906, 36.053138732910156, 37.794734954833984, 39.53633499145508, 41.277931213378906, 43.01953125, 44.761131286621094, 46.50272750854492, 48.244327545166016, 49.985923767089844, 51.72752380371094, 53.46912384033203, 55.210723876953125, 56.95232009887695, 58.69392013549805, 60.435516357421875, 62.17711639404297, 63.91871643066406, 65.66030883789062, 67.40190887451172, 69.14350891113281, 70.8851089477539]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 10.0, 10.0, 7.0, 17.0, 16.0, 20.0, 29.0, 31.0, 44.0, 41.0, 50.0, 59.0, 79.0, 69.0, 74.0, 62.0, 86.0, 46.0, 49.0, 36.0, 36.0, 27.0, 21.0, 17.0, 22.0, 13.0, 13.0, 7.0, 6.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.024574279785156, -30.084320068359375, -29.144065856933594, -28.203811645507812, -27.26355743408203, -26.32330322265625, -25.3830509185791, -24.44279670715332, -23.50254249572754, -22.562288284301758, -21.622034072875977, -20.681779861450195, -19.741527557373047, -18.801273345947266, -17.861019134521484, -16.920764923095703, -15.980510711669922, -15.04025650024414, -14.10000228881836, -13.159749031066895, -12.219494819641113, -11.279240608215332, -10.338987350463867, -9.398733139038086, -8.458478927612305, -7.518224716186523, -6.5779709815979, -5.637717247009277, -4.697463035583496, -3.757208824157715, -2.816955089569092, -1.8767013549804688, -0.9364471435546875, 0.0038068294525146484, 0.9440608024597168, 1.884314775466919, 2.824568748474121, 3.7648229598999023, 4.705076694488525, 5.645330429077148, 6.58558464050293, 7.525838851928711, 8.466093063354492, 9.406346321105957, 10.346600532531738, 11.28685474395752, 12.227108001708984, 13.167362213134766, 14.107616424560547, 15.047870635986328, 15.98812484741211, 16.92837905883789, 17.868633270263672, 18.808887481689453, 19.7491397857666, 20.689393997192383, 21.629648208618164, 22.569902420043945, 23.510156631469727, 24.450410842895508, 25.390663146972656, 26.330917358398438, 27.27117156982422, 28.21142578125, 29.15167999267578]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 11.0, 13.0, 29.0, 58.0, 136.0, 223.0, 470.0, 1214.0, 3637.0, 16445.0, 136630.0, 3826631.0, 183923.0, 18504.0, 4048.0, 1276.0, 530.0, 214.0, 115.0, 62.0, 43.0, 17.0, 16.0, 14.0, 7.0, 8.0, 1.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.75390625, -5.61199951171875, -5.4700927734375, -5.32818603515625, -5.186279296875, -5.04437255859375, -4.9024658203125, -4.76055908203125, -4.61865234375, -4.47674560546875, -4.3348388671875, -4.19293212890625, -4.051025390625, -3.90911865234375, -3.7672119140625, -3.62530517578125, -3.4833984375, -3.34149169921875, -3.1995849609375, -3.05767822265625, -2.915771484375, -2.77386474609375, -2.6319580078125, -2.49005126953125, -2.34814453125, -2.20623779296875, -2.0643310546875, -1.92242431640625, -1.780517578125, -1.63861083984375, -1.4967041015625, -1.35479736328125, -1.212890625, -1.07098388671875, -0.9290771484375, -0.78717041015625, -0.645263671875, -0.50335693359375, -0.3614501953125, -0.21954345703125, -0.07763671875, 0.06427001953125, 0.2061767578125, 0.34808349609375, 0.489990234375, 0.63189697265625, 0.7738037109375, 0.91571044921875, 1.0576171875, 1.19952392578125, 1.3414306640625, 1.48333740234375, 1.625244140625, 1.76715087890625, 1.9090576171875, 2.05096435546875, 2.19287109375, 2.33477783203125, 2.4766845703125, 2.61859130859375, 2.760498046875, 2.90240478515625, 3.0443115234375, 3.18621826171875, 3.328125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 6.0, 12.0, 10.0, 12.0, 15.0, 18.0, 24.0, 26.0, 32.0, 29.0, 36.0, 36.0, 41.0, 58.0, 52.0, 49.0, 64.0, 58.0, 51.0, 51.0, 55.0, 53.0, 43.0, 33.0, 24.0, 23.0, 17.0, 11.0, 14.0, 18.0, 9.0, 7.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81884765625, -0.7853927612304688, -0.7519378662109375, -0.7184829711914062, -0.685028076171875, -0.6515731811523438, -0.6181182861328125, -0.5846633911132812, -0.55120849609375, -0.5177536010742188, -0.4842987060546875, -0.45084381103515625, -0.417388916015625, -0.38393402099609375, -0.3504791259765625, -0.31702423095703125, -0.2835693359375, -0.25011444091796875, -0.2166595458984375, -0.18320465087890625, -0.149749755859375, -0.11629486083984375, -0.0828399658203125, -0.04938507080078125, -0.01593017578125, 0.01752471923828125, 0.0509796142578125, 0.08443450927734375, 0.117889404296875, 0.15134429931640625, 0.1847991943359375, 0.21825408935546875, 0.251708984375, 0.28516387939453125, 0.3186187744140625, 0.35207366943359375, 0.385528564453125, 0.41898345947265625, 0.4524383544921875, 0.48589324951171875, 0.51934814453125, 0.5528030395507812, 0.5862579345703125, 0.6197128295898438, 0.653167724609375, 0.6866226196289062, 0.7200775146484375, 0.7535324096679688, 0.7869873046875, 0.8204421997070312, 0.8538970947265625, 0.8873519897460938, 0.920806884765625, 0.9542617797851562, 0.9877166748046875, 1.0211715698242188, 1.05462646484375, 1.0880813598632812, 1.1215362548828125, 1.1549911499023438, 1.188446044921875, 1.2219009399414062, 1.2553558349609375, 1.2888107299804688, 1.322265625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 9.0, 4.0, 4.0, 11.0, 13.0, 32.0, 53.0, 85.0, 213.0, 603.0, 1720.0, 6592.0, 37055.0, 1020777.0, 3061310.0, 53612.0, 8680.0, 2248.0, 687.0, 288.0, 142.0, 57.0, 31.0, 15.0, 17.0, 9.0, 3.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.109375, -5.94464111328125, -5.7799072265625, -5.61517333984375, -5.450439453125, -5.28570556640625, -5.1209716796875, -4.95623779296875, -4.79150390625, -4.62677001953125, -4.4620361328125, -4.29730224609375, -4.132568359375, -3.96783447265625, -3.8031005859375, -3.63836669921875, -3.4736328125, -3.30889892578125, -3.1441650390625, -2.97943115234375, -2.814697265625, -2.64996337890625, -2.4852294921875, -2.32049560546875, -2.15576171875, -1.99102783203125, -1.8262939453125, -1.66156005859375, -1.496826171875, -1.33209228515625, -1.1673583984375, -1.00262451171875, -0.837890625, -0.67315673828125, -0.5084228515625, -0.34368896484375, -0.178955078125, -0.01422119140625, 0.1505126953125, 0.31524658203125, 0.47998046875, 0.64471435546875, 0.8094482421875, 0.97418212890625, 1.138916015625, 1.30364990234375, 1.4683837890625, 1.63311767578125, 1.7978515625, 1.96258544921875, 2.1273193359375, 2.29205322265625, 2.456787109375, 2.62152099609375, 2.7862548828125, 2.95098876953125, 3.11572265625, 3.28045654296875, 3.4451904296875, 3.60992431640625, 3.774658203125, 3.93939208984375, 4.1041259765625, 4.26885986328125, 4.43359375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 9.0, 13.0, 7.0, 6.0, 11.0, 16.0, 28.0, 32.0, 41.0, 79.0, 124.0, 225.0, 416.0, 861.0, 1002.0, 494.0, 256.0, 119.0, 103.0, 54.0, 47.0, 30.0, 17.0, 12.0, 15.0, 12.0, 9.0, 11.0, 8.0, 3.0, 2.0, 0.0, 4.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-3.62890625, -3.528472900390625, -3.42803955078125, -3.327606201171875, -3.2271728515625, -3.126739501953125, -3.02630615234375, -2.925872802734375, -2.825439453125, -2.725006103515625, -2.62457275390625, -2.524139404296875, -2.4237060546875, -2.323272705078125, -2.22283935546875, -2.122406005859375, -2.02197265625, -1.921539306640625, -1.82110595703125, -1.720672607421875, -1.6202392578125, -1.519805908203125, -1.41937255859375, -1.318939208984375, -1.218505859375, -1.118072509765625, -1.01763916015625, -0.917205810546875, -0.8167724609375, -0.716339111328125, -0.61590576171875, -0.515472412109375, -0.4150390625, -0.314605712890625, -0.21417236328125, -0.113739013671875, -0.0133056640625, 0.087127685546875, 0.18756103515625, 0.287994384765625, 0.388427734375, 0.488861083984375, 0.58929443359375, 0.689727783203125, 0.7901611328125, 0.890594482421875, 0.99102783203125, 1.091461181640625, 1.19189453125, 1.292327880859375, 1.39276123046875, 1.493194580078125, 1.5936279296875, 1.694061279296875, 1.79449462890625, 1.894927978515625, 1.995361328125, 2.095794677734375, 2.19622802734375, 2.296661376953125, 2.3970947265625, 2.497528076171875, 2.59796142578125, 2.698394775390625, 2.798828125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 9.0, 12.0, 23.0, 42.0, 87.0, 137.0, 183.0, 166.0, 120.0, 76.0, 44.0, 29.0, 22.0, 11.0, 4.0, 6.0, 2.0, 6.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.98832893371582, -21.048076629638672, -20.107824325561523, -19.167572021484375, -18.227319717407227, -17.287067413330078, -16.346813201904297, -15.406561851501465, -14.466309547424316, -13.526057243347168, -12.58580493927002, -11.645551681518555, -10.705299377441406, -9.765047073364258, -8.82479476928711, -7.884542465209961, -6.9442901611328125, -6.004037857055664, -5.063785552978516, -4.123532772064209, -3.1832804679870605, -2.243028163909912, -1.3027753829956055, -0.36252307891845703, 0.5777292251586914, 1.5179816484451294, 2.4582340717315674, 3.398486614227295, 4.338738918304443, 5.278991222381592, 6.219244003295898, 7.159496307373047, 8.099750518798828, 9.040002822875977, 9.980255126953125, 10.920507431030273, 11.860759735107422, 12.80101203918457, 13.741265296936035, 14.681517601013184, 15.621769905090332, 16.562023162841797, 17.502275466918945, 18.442527770996094, 19.382780075073242, 20.32303237915039, 21.26328468322754, 22.203536987304688, 23.143789291381836, 24.084041595458984, 25.024293899536133, 25.96454620361328, 26.90479850769043, 27.845050811767578, 28.78530502319336, 29.725555419921875, 30.665809631347656, 31.606061935424805, 32.54631423950195, 33.486568450927734, 34.42681884765625, 35.36707305908203, 36.30732345581055, 37.24757766723633, 38.187828063964844]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 0.0, 5.0, 1.0, 6.0, 13.0, 8.0, 14.0, 19.0, 20.0, 24.0, 19.0, 41.0, 32.0, 46.0, 39.0, 47.0, 48.0, 41.0, 49.0, 51.0, 43.0, 50.0, 49.0, 40.0, 44.0, 45.0, 34.0, 28.0, 31.0, 21.0, 24.0, 19.0, 17.0, 12.0, 8.0, 6.0, 8.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.75447654724121, -17.229167938232422, -16.703859329223633, -16.178550720214844, -15.653243064880371, -15.127934455871582, -14.60262680053711, -14.07731819152832, -13.552009582519531, -13.026700973510742, -12.501392364501953, -11.97608470916748, -11.450776100158691, -10.925467491149902, -10.40015983581543, -9.87485122680664, -9.349542617797852, -8.824234008789062, -8.298925399780273, -7.773617744445801, -7.248309135437012, -6.723000526428223, -6.197692394256592, -5.672384262084961, -5.147075653076172, -4.621767044067383, -4.096458911895752, -3.571150541305542, -3.045842170715332, -2.520533800125122, -1.995225429534912, -1.4699170589447021, -0.9446067810058594, -0.4192984104156494, 0.10600996017456055, 0.6313183307647705, 1.1566267013549805, 1.6819350719451904, 2.2072434425354004, 2.7325518131256104, 3.2578601837158203, 3.7831685543060303, 4.30847692489624, 4.833785057067871, 5.35909366607666, 5.884402275085449, 6.40971040725708, 6.935018539428711, 7.4603271484375, 7.985635757446289, 8.510944366455078, 9.03625202178955, 9.56156063079834, 10.086869239807129, 10.612176895141602, 11.13748550415039, 11.66279411315918, 12.188102722167969, 12.713411331176758, 13.23871898651123, 13.76402759552002, 14.289336204528809, 14.814643859863281, 15.33995246887207, 15.86526107788086]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 12.0, 11.0, 17.0, 27.0, 43.0, 63.0, 95.0, 182.0, 277.0, 488.0, 924.0, 1767.0, 3445.0, 7497.0, 17993.0, 46448.0, 131397.0, 332543.0, 312439.0, 119821.0, 42857.0, 16419.0, 6857.0, 3243.0, 1642.0, 891.0, 470.0, 263.0, 169.0, 91.0, 65.0, 40.0, 16.0, 24.0, 11.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.265625, -2.1873779296875, -2.109130859375, -2.0308837890625, -1.95263671875, -1.8743896484375, -1.796142578125, -1.7178955078125, -1.6396484375, -1.5614013671875, -1.483154296875, -1.4049072265625, -1.32666015625, -1.2484130859375, -1.170166015625, -1.0919189453125, -1.013671875, -0.9354248046875, -0.857177734375, -0.7789306640625, -0.70068359375, -0.6224365234375, -0.544189453125, -0.4659423828125, -0.3876953125, -0.3094482421875, -0.231201171875, -0.1529541015625, -0.07470703125, 0.0035400390625, 0.081787109375, 0.1600341796875, 0.23828125, 0.3165283203125, 0.394775390625, 0.4730224609375, 0.55126953125, 0.6295166015625, 0.707763671875, 0.7860107421875, 0.8642578125, 0.9425048828125, 1.020751953125, 1.0989990234375, 1.17724609375, 1.2554931640625, 1.333740234375, 1.4119873046875, 1.490234375, 1.5684814453125, 1.646728515625, 1.7249755859375, 1.80322265625, 1.8814697265625, 1.959716796875, 2.0379638671875, 2.1162109375, 2.1944580078125, 2.272705078125, 2.3509521484375, 2.42919921875, 2.5074462890625, 2.585693359375, 2.6639404296875, 2.7421875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 5.0, 4.0, 12.0, 7.0, 11.0, 10.0, 13.0, 21.0, 22.0, 22.0, 15.0, 39.0, 35.0, 29.0, 32.0, 44.0, 46.0, 53.0, 46.0, 56.0, 60.0, 47.0, 45.0, 43.0, 41.0, 30.0, 31.0, 27.0, 21.0, 23.0, 24.0, 18.0, 15.0, 16.0, 8.0, 9.0, 2.0, 0.0, 7.0, 5.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78125, -0.75054931640625, -0.7198486328125, -0.68914794921875, -0.658447265625, -0.62774658203125, -0.5970458984375, -0.56634521484375, -0.53564453125, -0.50494384765625, -0.4742431640625, -0.44354248046875, -0.412841796875, -0.38214111328125, -0.3514404296875, -0.32073974609375, -0.2900390625, -0.25933837890625, -0.2286376953125, -0.19793701171875, -0.167236328125, -0.13653564453125, -0.1058349609375, -0.07513427734375, -0.04443359375, -0.01373291015625, 0.0169677734375, 0.04766845703125, 0.078369140625, 0.10906982421875, 0.1397705078125, 0.17047119140625, 0.201171875, 0.23187255859375, 0.2625732421875, 0.29327392578125, 0.323974609375, 0.35467529296875, 0.3853759765625, 0.41607666015625, 0.44677734375, 0.47747802734375, 0.5081787109375, 0.53887939453125, 0.569580078125, 0.60028076171875, 0.6309814453125, 0.66168212890625, 0.6923828125, 0.72308349609375, 0.7537841796875, 0.78448486328125, 0.815185546875, 0.84588623046875, 0.8765869140625, 0.90728759765625, 0.93798828125, 0.96868896484375, 0.9993896484375, 1.03009033203125, 1.060791015625, 1.09149169921875, 1.1221923828125, 1.15289306640625, 1.18359375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 1.0, 5.0, 9.0, 16.0, 13.0, 21.0, 29.0, 36.0, 52.0, 67.0, 102.0, 159.0, 245.0, 429.0, 639.0, 1159.0, 2183.0, 4659.0, 13489.0, 54155.0, 292327.0, 542365.0, 100901.0, 22124.0, 6851.0, 2867.0, 1453.0, 830.0, 487.0, 284.0, 193.0, 120.0, 77.0, 60.0, 37.0, 34.0, 15.0, 14.0, 13.0, 8.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.23828125, -3.13446044921875, -3.0306396484375, -2.92681884765625, -2.822998046875, -2.71917724609375, -2.6153564453125, -2.51153564453125, -2.40771484375, -2.30389404296875, -2.2000732421875, -2.09625244140625, -1.992431640625, -1.88861083984375, -1.7847900390625, -1.68096923828125, -1.5771484375, -1.47332763671875, -1.3695068359375, -1.26568603515625, -1.161865234375, -1.05804443359375, -0.9542236328125, -0.85040283203125, -0.74658203125, -0.64276123046875, -0.5389404296875, -0.43511962890625, -0.331298828125, -0.22747802734375, -0.1236572265625, -0.01983642578125, 0.083984375, 0.18780517578125, 0.2916259765625, 0.39544677734375, 0.499267578125, 0.60308837890625, 0.7069091796875, 0.81072998046875, 0.91455078125, 1.01837158203125, 1.1221923828125, 1.22601318359375, 1.329833984375, 1.43365478515625, 1.5374755859375, 1.64129638671875, 1.7451171875, 1.84893798828125, 1.9527587890625, 2.05657958984375, 2.160400390625, 2.26422119140625, 2.3680419921875, 2.47186279296875, 2.57568359375, 2.67950439453125, 2.7833251953125, 2.88714599609375, 2.990966796875, 3.09478759765625, 3.1986083984375, 3.30242919921875, 3.40625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 1.0, 2.0, 7.0, 9.0, 9.0, 14.0, 19.0, 17.0, 30.0, 29.0, 29.0, 44.0, 44.0, 40.0, 49.0, 54.0, 41.0, 50.0, 49.0, 51.0, 62.0, 63.0, 54.0, 44.0, 33.0, 32.0, 21.0, 29.0, 13.0, 13.0, 12.0, 4.0, 12.0, 5.0, 7.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.7890625, -5.63079833984375, -5.4725341796875, -5.31427001953125, -5.156005859375, -4.99774169921875, -4.8394775390625, -4.68121337890625, -4.52294921875, -4.36468505859375, -4.2064208984375, -4.04815673828125, -3.889892578125, -3.73162841796875, -3.5733642578125, -3.41510009765625, -3.2568359375, -3.09857177734375, -2.9403076171875, -2.78204345703125, -2.623779296875, -2.46551513671875, -2.3072509765625, -2.14898681640625, -1.99072265625, -1.83245849609375, -1.6741943359375, -1.51593017578125, -1.357666015625, -1.19940185546875, -1.0411376953125, -0.88287353515625, -0.724609375, -0.56634521484375, -0.4080810546875, -0.24981689453125, -0.091552734375, 0.06671142578125, 0.2249755859375, 0.38323974609375, 0.54150390625, 0.69976806640625, 0.8580322265625, 1.01629638671875, 1.174560546875, 1.33282470703125, 1.4910888671875, 1.64935302734375, 1.8076171875, 1.96588134765625, 2.1241455078125, 2.28240966796875, 2.440673828125, 2.59893798828125, 2.7572021484375, 2.91546630859375, 3.07373046875, 3.23199462890625, 3.3902587890625, 3.54852294921875, 3.706787109375, 3.86505126953125, 4.0233154296875, 4.18157958984375, 4.33984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 8.0, 10.0, 12.0, 11.0, 21.0, 26.0, 38.0, 77.0, 110.0, 185.0, 386.0, 854.0, 2508.0, 11663.0, 136747.0, 823484.0, 61907.0, 7191.0, 1853.0, 683.0, 305.0, 159.0, 96.0, 75.0, 41.0, 26.0, 24.0, 14.0, 15.0, 4.0, 3.0, 9.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.658203125, -1.59283447265625, -1.5274658203125, -1.46209716796875, -1.396728515625, -1.33135986328125, -1.2659912109375, -1.20062255859375, -1.13525390625, -1.06988525390625, -1.0045166015625, -0.93914794921875, -0.873779296875, -0.80841064453125, -0.7430419921875, -0.67767333984375, -0.6123046875, -0.54693603515625, -0.4815673828125, -0.41619873046875, -0.350830078125, -0.28546142578125, -0.2200927734375, -0.15472412109375, -0.08935546875, -0.02398681640625, 0.0413818359375, 0.10675048828125, 0.172119140625, 0.23748779296875, 0.3028564453125, 0.36822509765625, 0.43359375, 0.49896240234375, 0.5643310546875, 0.62969970703125, 0.695068359375, 0.76043701171875, 0.8258056640625, 0.89117431640625, 0.95654296875, 1.02191162109375, 1.0872802734375, 1.15264892578125, 1.218017578125, 1.28338623046875, 1.3487548828125, 1.41412353515625, 1.4794921875, 1.54486083984375, 1.6102294921875, 1.67559814453125, 1.740966796875, 1.80633544921875, 1.8717041015625, 1.93707275390625, 2.00244140625, 2.06781005859375, 2.1331787109375, 2.19854736328125, 2.263916015625, 2.32928466796875, 2.3946533203125, 2.46002197265625, 2.525390625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 4.0, 15.0, 14.0, 27.0, 22.0, 40.0, 39.0, 58.0, 78.0, 72.0, 118.0, 109.0, 91.0, 57.0, 55.0, 41.0, 39.0, 25.0, 19.0, 22.0, 9.0, 11.0, 5.0, 3.0, 2.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00032973289489746094, -0.00032123737037181854, -0.00031274184584617615, -0.00030424632132053375, -0.00029575079679489136, -0.00028725527226924896, -0.00027875974774360657, -0.00027026422321796417, -0.0002617686986923218, -0.0002532731741666794, -0.000244777649641037, -0.0002362821251153946, -0.0002277866005897522, -0.0002192910760641098, -0.0002107955515384674, -0.000202300027012825, -0.00019380450248718262, -0.00018530897796154022, -0.00017681345343589783, -0.00016831792891025543, -0.00015982240438461304, -0.00015132687985897064, -0.00014283135533332825, -0.00013433583080768585, -0.00012584030628204346, -0.00011734478175640106, -0.00010884925723075867, -0.00010035373270511627, -9.185820817947388e-05, -8.336268365383148e-05, -7.486715912818909e-05, -6.637163460254669e-05, -5.78761100769043e-05, -4.93805855512619e-05, -4.088506102561951e-05, -3.238953649997711e-05, -2.3894011974334717e-05, -1.5398487448692322e-05, -6.902962923049927e-06, 1.5925616025924683e-06, 1.0088086128234863e-05, 1.8583610653877258e-05, 2.7079135179519653e-05, 3.557465970516205e-05, 4.407018423080444e-05, 5.256570875644684e-05, 6.106123328208923e-05, 6.955675780773163e-05, 7.805228233337402e-05, 8.654780685901642e-05, 9.504333138465881e-05, 0.00010353885591030121, 0.0001120343804359436, 0.000120529904961586, 0.0001290254294872284, 0.0001375209540128708, 0.00014601647853851318, 0.00015451200306415558, 0.00016300752758979797, 0.00017150305211544037, 0.00017999857664108276, 0.00018849410116672516, 0.00019698962569236755, 0.00020548515021800995, 0.00021398067474365234]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 11.0, 4.0, 9.0, 9.0, 16.0, 26.0, 29.0, 42.0, 49.0, 72.0, 115.0, 219.0, 346.0, 693.0, 1547.0, 4079.0, 15089.0, 104815.0, 733908.0, 159110.0, 19838.0, 4876.0, 1885.0, 718.0, 389.0, 221.0, 149.0, 81.0, 56.0, 44.0, 25.0, 24.0, 22.0, 12.0, 6.0, 8.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8115234375, -1.7620086669921875, -1.712493896484375, -1.6629791259765625, -1.61346435546875, -1.5639495849609375, -1.514434814453125, -1.4649200439453125, -1.4154052734375, -1.3658905029296875, -1.316375732421875, -1.2668609619140625, -1.21734619140625, -1.1678314208984375, -1.118316650390625, -1.0688018798828125, -1.019287109375, -0.9697723388671875, -0.920257568359375, -0.8707427978515625, -0.82122802734375, -0.7717132568359375, -0.722198486328125, -0.6726837158203125, -0.6231689453125, -0.5736541748046875, -0.524139404296875, -0.4746246337890625, -0.42510986328125, -0.3755950927734375, -0.326080322265625, -0.2765655517578125, -0.22705078125, -0.1775360107421875, -0.128021240234375, -0.0785064697265625, -0.02899169921875, 0.0205230712890625, 0.070037841796875, 0.1195526123046875, 0.1690673828125, 0.2185821533203125, 0.268096923828125, 0.3176116943359375, 0.36712646484375, 0.4166412353515625, 0.466156005859375, 0.5156707763671875, 0.565185546875, 0.6147003173828125, 0.664215087890625, 0.7137298583984375, 0.76324462890625, 0.8127593994140625, 0.862274169921875, 0.9117889404296875, 0.9613037109375, 1.0108184814453125, 1.060333251953125, 1.1098480224609375, 1.15936279296875, 1.2088775634765625, 1.258392333984375, 1.3079071044921875, 1.357421875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 4.0, 7.0, 12.0, 24.0, 23.0, 21.0, 34.0, 39.0, 56.0, 63.0, 81.0, 84.0, 83.0, 76.0, 75.0, 70.0, 59.0, 41.0, 33.0, 32.0, 21.0, 13.0, 7.0, 9.0, 8.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5927734375, -1.545074462890625, -1.49737548828125, -1.449676513671875, -1.4019775390625, -1.354278564453125, -1.30657958984375, -1.258880615234375, -1.211181640625, -1.163482666015625, -1.11578369140625, -1.068084716796875, -1.0203857421875, -0.972686767578125, -0.92498779296875, -0.877288818359375, -0.82958984375, -0.781890869140625, -0.73419189453125, -0.686492919921875, -0.6387939453125, -0.591094970703125, -0.54339599609375, -0.495697021484375, -0.447998046875, -0.400299072265625, -0.35260009765625, -0.304901123046875, -0.2572021484375, -0.209503173828125, -0.16180419921875, -0.114105224609375, -0.06640625, -0.018707275390625, 0.02899169921875, 0.076690673828125, 0.1243896484375, 0.172088623046875, 0.21978759765625, 0.267486572265625, 0.315185546875, 0.362884521484375, 0.41058349609375, 0.458282470703125, 0.5059814453125, 0.553680419921875, 0.60137939453125, 0.649078369140625, 0.69677734375, 0.744476318359375, 0.79217529296875, 0.839874267578125, 0.8875732421875, 0.935272216796875, 0.98297119140625, 1.030670166015625, 1.078369140625, 1.126068115234375, 1.17376708984375, 1.221466064453125, 1.2691650390625, 1.316864013671875, 1.36456298828125, 1.412261962890625, 1.4599609375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 6.0, 16.0, 29.0, 56.0, 87.0, 139.0, 177.0, 198.0, 119.0, 70.0, 36.0, 20.0, 18.0, 12.0, 4.0, 8.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.88990020751953, -36.91172790527344, -35.93355941772461, -34.955387115478516, -33.97721481323242, -32.999046325683594, -32.0208740234375, -31.04270362854004, -30.064533233642578, -29.086362838745117, -28.108190536499023, -27.130020141601562, -26.1518497467041, -25.17367935180664, -24.195507049560547, -23.217336654663086, -22.239164352416992, -21.26099395751953, -20.282821655273438, -19.304651260375977, -18.326480865478516, -17.348308563232422, -16.37013816833496, -15.3919677734375, -14.413796424865723, -13.435625076293945, -12.457454681396484, -11.479283332824707, -10.50111198425293, -9.522941589355469, -8.544770240783691, -7.566599369049072, -6.588428497314453, -5.610257625579834, -4.632086753845215, -3.6539154052734375, -2.6757445335388184, -1.6975736618041992, -0.7194023132324219, 0.25876855850219727, 1.2369394302368164, 2.2151103019714355, 3.193281412124634, 4.171452522277832, 5.149623394012451, 6.12779426574707, 7.105965614318848, 8.084136962890625, 9.062307357788086, 10.040478706359863, 11.018649101257324, 11.996820449829102, 12.974990844726562, 13.95316219329834, 14.931333541870117, 15.909503936767578, 16.887676239013672, 17.865846633911133, 18.844018936157227, 19.822189331054688, 20.80035972595215, 21.77853012084961, 22.756702423095703, 23.734872817993164, 24.713043212890625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 6.0, 9.0, 4.0, 7.0, 11.0, 13.0, 13.0, 17.0, 16.0, 21.0, 24.0, 35.0, 29.0, 27.0, 30.0, 35.0, 42.0, 43.0, 58.0, 45.0, 55.0, 44.0, 54.0, 39.0, 42.0, 31.0, 26.0, 27.0, 34.0, 18.0, 23.0, 18.0, 17.0, 17.0, 14.0, 9.0, 6.0, 8.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-17.36117935180664, -16.849042892456055, -16.33690643310547, -15.824769973754883, -15.312633514404297, -14.800497055053711, -14.288360595703125, -13.776224136352539, -13.264087677001953, -12.751951217651367, -12.239814758300781, -11.727678298950195, -11.21554183959961, -10.703405380249023, -10.191268920898438, -9.679132461547852, -9.166996002197266, -8.65485954284668, -8.142723083496094, -7.630586624145508, -7.118450164794922, -6.606313705444336, -6.09417724609375, -5.582040786743164, -5.069904327392578, -4.557767868041992, -4.045631408691406, -3.5334949493408203, -3.0213584899902344, -2.5092220306396484, -1.9970855712890625, -1.4849491119384766, -0.9728145599365234, -0.4606781005859375, 0.05145835876464844, 0.5635948181152344, 1.0757312774658203, 1.5878677368164062, 2.100004196166992, 2.612140655517578, 3.124277114868164, 3.63641357421875, 4.148550033569336, 4.660686492919922, 5.172822952270508, 5.684959411621094, 6.19709587097168, 6.709232330322266, 7.221368789672852, 7.7335052490234375, 8.245641708374023, 8.75777816772461, 9.269914627075195, 9.782051086425781, 10.294187545776367, 10.806324005126953, 11.318460464477539, 11.830596923828125, 12.342733383178711, 12.854869842529297, 13.367006301879883, 13.879142761230469, 14.391279220581055, 14.90341567993164, 15.415552139282227]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 8.0, 10.0, 24.0, 31.0, 35.0, 96.0, 182.0, 444.0, 1672.0, 13722.0, 3916003.0, 254689.0, 5755.0, 1017.0, 284.0, 135.0, 68.0, 35.0, 20.0, 15.0, 8.0, 8.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9609375, -8.70367431640625, -8.4464111328125, -8.18914794921875, -7.931884765625, -7.67462158203125, -7.4173583984375, -7.16009521484375, -6.90283203125, -6.64556884765625, -6.3883056640625, -6.13104248046875, -5.873779296875, -5.61651611328125, -5.3592529296875, -5.10198974609375, -4.8447265625, -4.58746337890625, -4.3302001953125, -4.07293701171875, -3.815673828125, -3.55841064453125, -3.3011474609375, -3.04388427734375, -2.78662109375, -2.52935791015625, -2.2720947265625, -2.01483154296875, -1.757568359375, -1.50030517578125, -1.2430419921875, -0.98577880859375, -0.728515625, -0.47125244140625, -0.2139892578125, 0.04327392578125, 0.300537109375, 0.55780029296875, 0.8150634765625, 1.07232666015625, 1.32958984375, 1.58685302734375, 1.8441162109375, 2.10137939453125, 2.358642578125, 2.61590576171875, 2.8731689453125, 3.13043212890625, 3.3876953125, 3.64495849609375, 3.9022216796875, 4.15948486328125, 4.416748046875, 4.67401123046875, 4.9312744140625, 5.18853759765625, 5.44580078125, 5.70306396484375, 5.9603271484375, 6.21759033203125, 6.474853515625, 6.73211669921875, 6.9893798828125, 7.24664306640625, 7.50390625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 8.0, 15.0, 20.0, 21.0, 31.0, 35.0, 45.0, 59.0, 64.0, 76.0, 68.0, 88.0, 75.0, 82.0, 68.0, 50.0, 44.0, 36.0, 28.0, 35.0, 14.0, 9.0, 7.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5537109375, -1.5057525634765625, -1.457794189453125, -1.4098358154296875, -1.36187744140625, -1.3139190673828125, -1.265960693359375, -1.2180023193359375, -1.1700439453125, -1.1220855712890625, -1.074127197265625, -1.0261688232421875, -0.97821044921875, -0.9302520751953125, -0.882293701171875, -0.8343353271484375, -0.786376953125, -0.7384185791015625, -0.690460205078125, -0.6425018310546875, -0.59454345703125, -0.5465850830078125, -0.498626708984375, -0.4506683349609375, -0.4027099609375, -0.3547515869140625, -0.306793212890625, -0.2588348388671875, -0.21087646484375, -0.1629180908203125, -0.114959716796875, -0.0670013427734375, -0.01904296875, 0.0289154052734375, 0.076873779296875, 0.1248321533203125, 0.17279052734375, 0.2207489013671875, 0.268707275390625, 0.3166656494140625, 0.3646240234375, 0.4125823974609375, 0.460540771484375, 0.5084991455078125, 0.55645751953125, 0.6044158935546875, 0.652374267578125, 0.7003326416015625, 0.748291015625, 0.7962493896484375, 0.844207763671875, 0.8921661376953125, 0.94012451171875, 0.9880828857421875, 1.036041259765625, 1.0839996337890625, 1.1319580078125, 1.1799163818359375, 1.227874755859375, 1.2758331298828125, 1.32379150390625, 1.3717498779296875, 1.419708251953125, 1.4676666259765625, 1.515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 9.0, 7.0, 22.0, 42.0, 48.0, 77.0, 116.0, 191.0, 320.0, 510.0, 869.0, 1517.0, 2981.0, 6069.0, 15004.0, 47028.0, 309536.0, 3457861.0, 280138.0, 44739.0, 14621.0, 6167.0, 2765.0, 1587.0, 842.0, 461.0, 290.0, 171.0, 94.0, 62.0, 41.0, 26.0, 19.0, 9.0, 13.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.94140625, -2.86077880859375, -2.7801513671875, -2.69952392578125, -2.618896484375, -2.53826904296875, -2.4576416015625, -2.37701416015625, -2.29638671875, -2.21575927734375, -2.1351318359375, -2.05450439453125, -1.973876953125, -1.89324951171875, -1.8126220703125, -1.73199462890625, -1.6513671875, -1.57073974609375, -1.4901123046875, -1.40948486328125, -1.328857421875, -1.24822998046875, -1.1676025390625, -1.08697509765625, -1.00634765625, -0.92572021484375, -0.8450927734375, -0.76446533203125, -0.683837890625, -0.60321044921875, -0.5225830078125, -0.44195556640625, -0.361328125, -0.28070068359375, -0.2000732421875, -0.11944580078125, -0.038818359375, 0.04180908203125, 0.1224365234375, 0.20306396484375, 0.28369140625, 0.36431884765625, 0.4449462890625, 0.52557373046875, 0.606201171875, 0.68682861328125, 0.7674560546875, 0.84808349609375, 0.9287109375, 1.00933837890625, 1.0899658203125, 1.17059326171875, 1.251220703125, 1.33184814453125, 1.4124755859375, 1.49310302734375, 1.57373046875, 1.65435791015625, 1.7349853515625, 1.81561279296875, 1.896240234375, 1.97686767578125, 2.0574951171875, 2.13812255859375, 2.21875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 5.0, 5.0, 8.0, 13.0, 13.0, 27.0, 24.0, 54.0, 91.0, 174.0, 374.0, 1095.0, 1256.0, 484.0, 204.0, 90.0, 43.0, 33.0, 16.0, 15.0, 10.0, 7.0, 5.0, 5.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.14453125, -4.03265380859375, -3.9207763671875, -3.80889892578125, -3.697021484375, -3.58514404296875, -3.4732666015625, -3.36138916015625, -3.24951171875, -3.13763427734375, -3.0257568359375, -2.91387939453125, -2.802001953125, -2.69012451171875, -2.5782470703125, -2.46636962890625, -2.3544921875, -2.24261474609375, -2.1307373046875, -2.01885986328125, -1.906982421875, -1.79510498046875, -1.6832275390625, -1.57135009765625, -1.45947265625, -1.34759521484375, -1.2357177734375, -1.12384033203125, -1.011962890625, -0.90008544921875, -0.7882080078125, -0.67633056640625, -0.564453125, -0.45257568359375, -0.3406982421875, -0.22882080078125, -0.116943359375, -0.00506591796875, 0.1068115234375, 0.21868896484375, 0.33056640625, 0.44244384765625, 0.5543212890625, 0.66619873046875, 0.778076171875, 0.88995361328125, 1.0018310546875, 1.11370849609375, 1.2255859375, 1.33746337890625, 1.4493408203125, 1.56121826171875, 1.673095703125, 1.78497314453125, 1.8968505859375, 2.00872802734375, 2.12060546875, 2.23248291015625, 2.3443603515625, 2.45623779296875, 2.568115234375, 2.67999267578125, 2.7918701171875, 2.90374755859375, 3.015625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 10.0, 20.0, 46.0, 133.0, 301.0, 301.0, 116.0, 34.0, 17.0, 6.0, 2.0, 6.0, 4.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.278968811035156, -52.9849739074707, -51.690975189208984, -50.39698028564453, -49.10298156738281, -47.80898666381836, -46.514991760253906, -45.22099304199219, -43.926998138427734, -42.63300323486328, -41.33900451660156, -40.04500961303711, -38.751014709472656, -37.45701599121094, -36.163021087646484, -34.86902618408203, -33.57502746582031, -32.28103256225586, -30.98703384399414, -29.693038940429688, -28.3990421295166, -27.105045318603516, -25.811050415039062, -24.517053604125977, -23.22305679321289, -21.929059982299805, -20.63506317138672, -19.341068267822266, -18.04707145690918, -16.753074645996094, -15.459078788757324, -14.165082931518555, -12.871086120605469, -11.577089309692383, -10.283093452453613, -8.989097595214844, -7.695100784301758, -6.40110445022583, -5.107108116149902, -3.813112258911133, -2.519115447998047, -1.2251191139221191, 0.0688772201538086, 1.3628735542297363, 2.656869888305664, 3.950866222381592, 5.2448625564575195, 6.538858413696289, 7.832855224609375, 9.126852035522461, 10.42084789276123, 11.71484375, 13.008840560913086, 14.302837371826172, 15.596833229064941, 16.89082908630371, 18.184825897216797, 19.478822708129883, 20.77281951904297, 22.066814422607422, 23.360811233520508, 24.654808044433594, 25.948802947998047, 27.242799758911133, 28.53679656982422]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 9.0, 6.0, 10.0, 12.0, 11.0, 15.0, 22.0, 30.0, 27.0, 29.0, 34.0, 43.0, 50.0, 47.0, 51.0, 57.0, 50.0, 53.0, 58.0, 36.0, 43.0, 51.0, 45.0, 36.0, 35.0, 25.0, 31.0, 14.0, 15.0, 17.0, 7.0, 6.0, 4.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.61648941040039, -13.207945823669434, -12.799402236938477, -12.390857696533203, -11.982314109802246, -11.573770523071289, -11.165226936340332, -10.756683349609375, -10.348138809204102, -9.939595222473145, -9.531051635742188, -9.122507095336914, -8.713963508605957, -8.305419921875, -7.896876335144043, -7.488332271575928, -7.079788684844971, -6.671245098114014, -6.262701034545898, -5.854157447814941, -5.445613384246826, -5.037069797515869, -4.628525733947754, -4.219982147216797, -3.8114383220672607, -3.4028944969177246, -2.9943506717681885, -2.5858068466186523, -2.1772632598876953, -1.7687194347381592, -1.360175609588623, -0.9516317844390869, -0.5430879592895508, -0.13454416394233704, 0.2739996314048767, 0.6825433969497681, 1.0910872220993042, 1.4996309280395508, 1.908174753189087, 2.316718578338623, 2.725262403488159, 3.1338062286376953, 3.5423500537872314, 3.9508938789367676, 4.359437465667725, 4.76798152923584, 5.176525115966797, 5.585068702697754, 5.993612766265869, 6.402156352996826, 6.810700416564941, 7.219244003295898, 7.627788066864014, 8.036331176757812, 8.444875717163086, 8.853419303894043, 9.261962890625, 9.670506477355957, 10.079050064086914, 10.487594604492188, 10.896138191223145, 11.304681777954102, 11.713225364685059, 12.121768951416016, 12.530313491821289]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 13.0, 12.0, 20.0, 28.0, 40.0, 64.0, 109.0, 149.0, 257.0, 480.0, 833.0, 1505.0, 3100.0, 6720.0, 15431.0, 39453.0, 108448.0, 309147.0, 354240.0, 129062.0, 46449.0, 18021.0, 7418.0, 3594.0, 1789.0, 899.0, 518.0, 287.0, 184.0, 92.0, 58.0, 44.0, 23.0, 18.0, 16.0, 14.0, 4.0, 5.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.19140625, -2.113372802734375, -2.03533935546875, -1.957305908203125, -1.8792724609375, -1.801239013671875, -1.72320556640625, -1.645172119140625, -1.567138671875, -1.489105224609375, -1.41107177734375, -1.333038330078125, -1.2550048828125, -1.176971435546875, -1.09893798828125, -1.020904541015625, -0.94287109375, -0.864837646484375, -0.78680419921875, -0.708770751953125, -0.6307373046875, -0.552703857421875, -0.47467041015625, -0.396636962890625, -0.318603515625, -0.240570068359375, -0.16253662109375, -0.084503173828125, -0.0064697265625, 0.071563720703125, 0.14959716796875, 0.227630615234375, 0.3056640625, 0.383697509765625, 0.46173095703125, 0.539764404296875, 0.6177978515625, 0.695831298828125, 0.77386474609375, 0.851898193359375, 0.929931640625, 1.007965087890625, 1.08599853515625, 1.164031982421875, 1.2420654296875, 1.320098876953125, 1.39813232421875, 1.476165771484375, 1.55419921875, 1.632232666015625, 1.71026611328125, 1.788299560546875, 1.8663330078125, 1.944366455078125, 2.02239990234375, 2.100433349609375, 2.178466796875, 2.256500244140625, 2.33453369140625, 2.412567138671875, 2.4906005859375, 2.568634033203125, 2.64666748046875, 2.724700927734375, 2.802734375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 9.0, 14.0, 13.0, 15.0, 27.0, 27.0, 20.0, 32.0, 42.0, 41.0, 44.0, 56.0, 49.0, 45.0, 66.0, 50.0, 61.0, 59.0, 48.0, 48.0, 44.0, 32.0, 26.0, 21.0, 22.0, 21.0, 17.0, 11.0, 13.0, 6.0, 10.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.4892578125, -1.4535446166992188, -1.4178314208984375, -1.3821182250976562, -1.346405029296875, -1.3106918334960938, -1.2749786376953125, -1.2392654418945312, -1.20355224609375, -1.1678390502929688, -1.1321258544921875, -1.0964126586914062, -1.060699462890625, -1.0249862670898438, -0.9892730712890625, -0.9535598754882812, -0.9178466796875, -0.8821334838867188, -0.8464202880859375, -0.8107070922851562, -0.774993896484375, -0.7392807006835938, -0.7035675048828125, -0.6678543090820312, -0.63214111328125, -0.5964279174804688, -0.5607147216796875, -0.5250015258789062, -0.489288330078125, -0.45357513427734375, -0.4178619384765625, -0.38214874267578125, -0.346435546875, -0.31072235107421875, -0.2750091552734375, -0.23929595947265625, -0.203582763671875, -0.16786956787109375, -0.1321563720703125, -0.09644317626953125, -0.06072998046875, -0.02501678466796875, 0.0106964111328125, 0.04640960693359375, 0.082122802734375, 0.11783599853515625, 0.1535491943359375, 0.18926239013671875, 0.2249755859375, 0.26068878173828125, 0.2964019775390625, 0.33211517333984375, 0.367828369140625, 0.40354156494140625, 0.4392547607421875, 0.47496795654296875, 0.51068115234375, 0.5463943481445312, 0.5821075439453125, 0.6178207397460938, 0.653533935546875, 0.6892471313476562, 0.7249603271484375, 0.7606735229492188, 0.79638671875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 6.0, 5.0, 8.0, 8.0, 10.0, 12.0, 32.0, 34.0, 37.0, 71.0, 116.0, 145.0, 242.0, 440.0, 849.0, 1995.0, 6117.0, 25868.0, 151380.0, 669992.0, 154587.0, 26290.0, 6241.0, 2074.0, 874.0, 409.0, 236.0, 148.0, 108.0, 67.0, 43.0, 26.0, 24.0, 16.0, 12.0, 10.0, 4.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.31640625, -3.1912841796875, -3.066162109375, -2.9410400390625, -2.81591796875, -2.6907958984375, -2.565673828125, -2.4405517578125, -2.3154296875, -2.1903076171875, -2.065185546875, -1.9400634765625, -1.81494140625, -1.6898193359375, -1.564697265625, -1.4395751953125, -1.314453125, -1.1893310546875, -1.064208984375, -0.9390869140625, -0.81396484375, -0.6888427734375, -0.563720703125, -0.4385986328125, -0.3134765625, -0.1883544921875, -0.063232421875, 0.0618896484375, 0.18701171875, 0.3121337890625, 0.437255859375, 0.5623779296875, 0.6875, 0.8126220703125, 0.937744140625, 1.0628662109375, 1.18798828125, 1.3131103515625, 1.438232421875, 1.5633544921875, 1.6884765625, 1.8135986328125, 1.938720703125, 2.0638427734375, 2.18896484375, 2.3140869140625, 2.439208984375, 2.5643310546875, 2.689453125, 2.8145751953125, 2.939697265625, 3.0648193359375, 3.18994140625, 3.3150634765625, 3.440185546875, 3.5653076171875, 3.6904296875, 3.8155517578125, 3.940673828125, 4.0657958984375, 4.19091796875, 4.3160400390625, 4.441162109375, 4.5662841796875, 4.69140625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 5.0, 8.0, 14.0, 6.0, 12.0, 19.0, 18.0, 22.0, 26.0, 25.0, 32.0, 38.0, 34.0, 36.0, 34.0, 42.0, 38.0, 60.0, 42.0, 43.0, 46.0, 36.0, 39.0, 38.0, 41.0, 41.0, 25.0, 26.0, 26.0, 16.0, 22.0, 15.0, 17.0, 4.0, 15.0, 10.0, 11.0, 5.0, 4.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.435546875, -3.3251953125, -3.21484375, -3.1044921875, -2.994140625, -2.8837890625, -2.7734375, -2.6630859375, -2.552734375, -2.4423828125, -2.33203125, -2.2216796875, -2.111328125, -2.0009765625, -1.890625, -1.7802734375, -1.669921875, -1.5595703125, -1.44921875, -1.3388671875, -1.228515625, -1.1181640625, -1.0078125, -0.8974609375, -0.787109375, -0.6767578125, -0.56640625, -0.4560546875, -0.345703125, -0.2353515625, -0.125, -0.0146484375, 0.095703125, 0.2060546875, 0.31640625, 0.4267578125, 0.537109375, 0.6474609375, 0.7578125, 0.8681640625, 0.978515625, 1.0888671875, 1.19921875, 1.3095703125, 1.419921875, 1.5302734375, 1.640625, 1.7509765625, 1.861328125, 1.9716796875, 2.08203125, 2.1923828125, 2.302734375, 2.4130859375, 2.5234375, 2.6337890625, 2.744140625, 2.8544921875, 2.96484375, 3.0751953125, 3.185546875, 3.2958984375, 3.40625, 3.5166015625, 3.626953125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 2.0, 2.0, 5.0, 6.0, 9.0, 16.0, 21.0, 32.0, 36.0, 55.0, 83.0, 102.0, 228.0, 416.0, 778.0, 2047.0, 6587.0, 33757.0, 419538.0, 536545.0, 37231.0, 7044.0, 2123.0, 856.0, 384.0, 230.0, 113.0, 79.0, 52.0, 43.0, 31.0, 21.0, 21.0, 15.0, 5.0, 9.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0], "bins": [-2.09375, -2.0322113037109375, -1.970672607421875, -1.9091339111328125, -1.84759521484375, -1.7860565185546875, -1.724517822265625, -1.6629791259765625, -1.6014404296875, -1.5399017333984375, -1.478363037109375, -1.4168243408203125, -1.35528564453125, -1.2937469482421875, -1.232208251953125, -1.1706695556640625, -1.109130859375, -1.0475921630859375, -0.986053466796875, -0.9245147705078125, -0.86297607421875, -0.8014373779296875, -0.739898681640625, -0.6783599853515625, -0.6168212890625, -0.5552825927734375, -0.493743896484375, -0.4322052001953125, -0.37066650390625, -0.3091278076171875, -0.247589111328125, -0.1860504150390625, -0.12451171875, -0.0629730224609375, -0.001434326171875, 0.0601043701171875, 0.12164306640625, 0.1831817626953125, 0.244720458984375, 0.3062591552734375, 0.3677978515625, 0.4293365478515625, 0.490875244140625, 0.5524139404296875, 0.61395263671875, 0.6754913330078125, 0.737030029296875, 0.7985687255859375, 0.860107421875, 0.9216461181640625, 0.983184814453125, 1.0447235107421875, 1.10626220703125, 1.1678009033203125, 1.229339599609375, 1.2908782958984375, 1.3524169921875, 1.4139556884765625, 1.475494384765625, 1.5370330810546875, 1.59857177734375, 1.6601104736328125, 1.721649169921875, 1.7831878662109375, 1.8447265625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 16.0, 22.0, 53.0, 84.0, 185.0, 241.0, 164.0, 108.0, 51.0, 22.0, 26.0, 7.0, 9.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0010929107666015625, -0.001069914549589157, -0.0010469183325767517, -0.0010239221155643463, -0.001000925898551941, -0.0009779296815395355, -0.0009549334645271301, -0.0009319372475147247, -0.0009089410305023193, -0.0008859448134899139, -0.0008629485964775085, -0.0008399523794651031, -0.0008169561624526978, -0.0007939599454402924, -0.000770963728427887, -0.0007479675114154816, -0.0007249712944030762, -0.0007019750773906708, -0.0006789788603782654, -0.00065598264336586, -0.0006329864263534546, -0.0006099902093410492, -0.0005869939923286438, -0.0005639977753162384, -0.000541001558303833, -0.0005180053412914276, -0.0004950091242790222, -0.0004720129072666168, -0.0004490166902542114, -0.00042602047324180603, -0.00040302425622940063, -0.00038002803921699524, -0.00035703182220458984, -0.00033403560519218445, -0.00031103938817977905, -0.00028804317116737366, -0.00026504695415496826, -0.00024205073714256287, -0.00021905452013015747, -0.00019605830311775208, -0.00017306208610534668, -0.00015006586909294128, -0.0001270696520805359, -0.00010407343506813049, -8.10772180557251e-05, -5.80810010433197e-05, -3.508478403091431e-05, -1.2088567018508911e-05, 1.0907649993896484e-05, 3.390386700630188e-05, 5.6900084018707275e-05, 7.989630103111267e-05, 0.00010289251804351807, 0.00012588873505592346, 0.00014888495206832886, 0.00017188116908073425, 0.00019487738609313965, 0.00021787360310554504, 0.00024086982011795044, 0.00026386603713035583, 0.00028686225414276123, 0.0003098584711551666, 0.000332854688167572, 0.0003558509051799774, 0.0003788471221923828]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 17.0, 19.0, 27.0, 36.0, 53.0, 100.0, 169.0, 351.0, 790.0, 2121.0, 8610.0, 66158.0, 792662.0, 157376.0, 14823.0, 3199.0, 1045.0, 447.0, 225.0, 119.0, 64.0, 42.0, 28.0, 15.0, 8.0, 6.0, 11.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.0919189453125, -2.023681640625, -1.9554443359375, -1.88720703125, -1.8189697265625, -1.750732421875, -1.6824951171875, -1.6142578125, -1.5460205078125, -1.477783203125, -1.4095458984375, -1.34130859375, -1.2730712890625, -1.204833984375, -1.1365966796875, -1.068359375, -1.0001220703125, -0.931884765625, -0.8636474609375, -0.79541015625, -0.7271728515625, -0.658935546875, -0.5906982421875, -0.5224609375, -0.4542236328125, -0.385986328125, -0.3177490234375, -0.24951171875, -0.1812744140625, -0.113037109375, -0.0447998046875, 0.0234375, 0.0916748046875, 0.159912109375, 0.2281494140625, 0.29638671875, 0.3646240234375, 0.432861328125, 0.5010986328125, 0.5693359375, 0.6375732421875, 0.705810546875, 0.7740478515625, 0.84228515625, 0.9105224609375, 0.978759765625, 1.0469970703125, 1.115234375, 1.1834716796875, 1.251708984375, 1.3199462890625, 1.38818359375, 1.4564208984375, 1.524658203125, 1.5928955078125, 1.6611328125, 1.7293701171875, 1.797607421875, 1.8658447265625, 1.93408203125, 2.0023193359375, 2.070556640625, 2.1387939453125, 2.20703125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 7.0, 10.0, 13.0, 13.0, 16.0, 19.0, 21.0, 28.0, 27.0, 45.0, 45.0, 57.0, 73.0, 74.0, 67.0, 67.0, 74.0, 67.0, 53.0, 26.0, 41.0, 29.0, 24.0, 14.0, 23.0, 10.0, 7.0, 14.0, 8.0, 5.0, 3.0, 3.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7265625, -1.6815948486328125, -1.636627197265625, -1.5916595458984375, -1.54669189453125, -1.5017242431640625, -1.456756591796875, -1.4117889404296875, -1.3668212890625, -1.3218536376953125, -1.276885986328125, -1.2319183349609375, -1.18695068359375, -1.1419830322265625, -1.097015380859375, -1.0520477294921875, -1.007080078125, -0.9621124267578125, -0.917144775390625, -0.8721771240234375, -0.82720947265625, -0.7822418212890625, -0.737274169921875, -0.6923065185546875, -0.6473388671875, -0.6023712158203125, -0.557403564453125, -0.5124359130859375, -0.46746826171875, -0.4225006103515625, -0.377532958984375, -0.3325653076171875, -0.28759765625, -0.2426300048828125, -0.197662353515625, -0.1526947021484375, -0.10772705078125, -0.0627593994140625, -0.017791748046875, 0.0271759033203125, 0.0721435546875, 0.1171112060546875, 0.162078857421875, 0.2070465087890625, 0.25201416015625, 0.2969818115234375, 0.341949462890625, 0.3869171142578125, 0.431884765625, 0.4768524169921875, 0.521820068359375, 0.5667877197265625, 0.61175537109375, 0.6567230224609375, 0.701690673828125, 0.7466583251953125, 0.7916259765625, 0.8365936279296875, 0.881561279296875, 0.9265289306640625, 0.97149658203125, 1.0164642333984375, 1.061431884765625, 1.1063995361328125, 1.1513671875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 11.0, 27.0, 62.0, 138.0, 188.0, 260.0, 159.0, 78.0, 48.0, 14.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-63.306217193603516, -62.02650833129883, -60.746795654296875, -59.46708679199219, -58.1873779296875, -56.90766525268555, -55.62795639038086, -54.348243713378906, -53.06853485107422, -51.78882598876953, -50.50911331176758, -49.22940444946289, -47.9496955871582, -46.66998291015625, -45.39027404785156, -44.110565185546875, -42.83085632324219, -41.5511474609375, -40.27143478393555, -38.99172592163086, -37.71201705932617, -36.43230438232422, -35.15259552001953, -33.872886657714844, -32.59317398071289, -31.31346321105957, -30.033754348754883, -28.754043579101562, -27.474332809448242, -26.194622039794922, -24.914913177490234, -23.635202407836914, -22.355491638183594, -21.075780868530273, -19.796072006225586, -18.516361236572266, -17.236650466918945, -15.956940650939941, -14.677230834960938, -13.397520065307617, -12.117810249328613, -10.83810043334961, -9.558389663696289, -8.278679847717285, -6.998969554901123, -5.719259262084961, -4.439549446105957, -3.1598386764526367, -1.8801288604736328, -0.6004186868667603, 0.6792914867401123, 1.9590015411376953, 3.2387118339538574, 4.5184221267700195, 5.798131942749023, 7.077842712402344, 8.357552528381348, 9.637262344360352, 10.916973114013672, 12.196682929992676, 13.47639274597168, 14.756103515625, 16.035812377929688, 17.31552505493164, 18.595233917236328]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 4.0, 7.0, 5.0, 11.0, 10.0, 17.0, 24.0, 21.0, 19.0, 39.0, 33.0, 24.0, 43.0, 44.0, 51.0, 62.0, 82.0, 67.0, 60.0, 51.0, 47.0, 40.0, 51.0, 28.0, 25.0, 34.0, 24.0, 16.0, 20.0, 13.0, 13.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.01881217956543, -21.38681411743164, -20.754817962646484, -20.122821807861328, -19.49082374572754, -18.85882568359375, -18.226829528808594, -17.594833374023438, -16.96283531188965, -16.33083724975586, -15.698841094970703, -15.06684398651123, -14.434846878051758, -13.802849769592285, -13.170852661132812, -12.53885555267334, -11.906858444213867, -11.274861335754395, -10.642864227294922, -10.01086711883545, -9.378870010375977, -8.746872901916504, -8.114875793457031, -7.482878684997559, -6.850881576538086, -6.218884468078613, -5.586887359619141, -4.954890251159668, -4.322893142700195, -3.6908960342407227, -3.05889892578125, -2.4269018173217773, -1.7949066162109375, -1.1629095077514648, -0.5309123992919922, 0.10108470916748047, 0.7330818176269531, 1.3650789260864258, 1.9970760345458984, 2.629073143005371, 3.2610702514648438, 3.8930673599243164, 4.525064468383789, 5.157061576843262, 5.789058685302734, 6.421055793762207, 7.05305290222168, 7.685050010681152, 8.317047119140625, 8.949044227600098, 9.58104133605957, 10.213038444519043, 10.845035552978516, 11.477032661437988, 12.109029769897461, 12.741026878356934, 13.373023986816406, 14.005021095275879, 14.637018203735352, 15.269015312194824, 15.901012420654297, 16.533008575439453, 17.165006637573242, 17.79700469970703, 18.429000854492188]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 4.0, 7.0, 14.0, 19.0, 29.0, 48.0, 72.0, 148.0, 273.0, 556.0, 1035.0, 2658.0, 7449.0, 27200.0, 205931.0, 3347835.0, 540802.0, 43622.0, 10152.0, 3437.0, 1451.0, 709.0, 329.0, 174.0, 83.0, 68.0, 51.0, 26.0, 21.0, 24.0, 9.0, 12.0, 6.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.50390625, -2.427215576171875, -2.35052490234375, -2.273834228515625, -2.1971435546875, -2.120452880859375, -2.04376220703125, -1.967071533203125, -1.890380859375, -1.813690185546875, -1.73699951171875, -1.660308837890625, -1.5836181640625, -1.506927490234375, -1.43023681640625, -1.353546142578125, -1.27685546875, -1.200164794921875, -1.12347412109375, -1.046783447265625, -0.9700927734375, -0.893402099609375, -0.81671142578125, -0.740020751953125, -0.663330078125, -0.586639404296875, -0.50994873046875, -0.433258056640625, -0.3565673828125, -0.279876708984375, -0.20318603515625, -0.126495361328125, -0.0498046875, 0.026885986328125, 0.10357666015625, 0.180267333984375, 0.2569580078125, 0.333648681640625, 0.41033935546875, 0.487030029296875, 0.563720703125, 0.640411376953125, 0.71710205078125, 0.793792724609375, 0.8704833984375, 0.947174072265625, 1.02386474609375, 1.100555419921875, 1.17724609375, 1.253936767578125, 1.33062744140625, 1.407318115234375, 1.4840087890625, 1.560699462890625, 1.63739013671875, 1.714080810546875, 1.790771484375, 1.867462158203125, 1.94415283203125, 2.020843505859375, 2.0975341796875, 2.174224853515625, 2.25091552734375, 2.327606201171875, 2.404296875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 1.0, 8.0, 7.0, 6.0, 5.0, 8.0, 12.0, 14.0, 16.0, 26.0, 34.0, 33.0, 27.0, 33.0, 41.0, 32.0, 49.0, 36.0, 49.0, 44.0, 43.0, 59.0, 47.0, 52.0, 43.0, 41.0, 44.0, 28.0, 25.0, 23.0, 17.0, 21.0, 12.0, 9.0, 11.0, 10.0, 6.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.751953125, -0.7252273559570312, -0.6985015869140625, -0.6717758178710938, -0.645050048828125, -0.6183242797851562, -0.5915985107421875, -0.5648727416992188, -0.53814697265625, -0.5114212036132812, -0.4846954345703125, -0.45796966552734375, -0.431243896484375, -0.40451812744140625, -0.3777923583984375, -0.35106658935546875, -0.3243408203125, -0.29761505126953125, -0.2708892822265625, -0.24416351318359375, -0.217437744140625, -0.19071197509765625, -0.1639862060546875, -0.13726043701171875, -0.11053466796875, -0.08380889892578125, -0.0570831298828125, -0.03035736083984375, -0.003631591796875, 0.02309417724609375, 0.0498199462890625, 0.07654571533203125, 0.103271484375, 0.12999725341796875, 0.1567230224609375, 0.18344879150390625, 0.210174560546875, 0.23690032958984375, 0.2636260986328125, 0.29035186767578125, 0.31707763671875, 0.34380340576171875, 0.3705291748046875, 0.39725494384765625, 0.423980712890625, 0.45070648193359375, 0.4774322509765625, 0.5041580200195312, 0.5308837890625, 0.5576095581054688, 0.5843353271484375, 0.6110610961914062, 0.637786865234375, 0.6645126342773438, 0.6912384033203125, 0.7179641723632812, 0.74468994140625, 0.7714157104492188, 0.7981414794921875, 0.8248672485351562, 0.851593017578125, 0.8783187866210938, 0.9050445556640625, 0.9317703247070312, 0.95849609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 4.0, 9.0, 9.0, 16.0, 36.0, 56.0, 96.0, 153.0, 336.0, 907.0, 2474.0, 9311.0, 52051.0, 1291483.0, 2743678.0, 75479.0, 12515.0, 3386.0, 1187.0, 508.0, 260.0, 130.0, 59.0, 47.0, 42.0, 12.0, 11.0, 6.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.931640625, -2.814727783203125, -2.69781494140625, -2.580902099609375, -2.4639892578125, -2.347076416015625, -2.23016357421875, -2.113250732421875, -1.996337890625, -1.879425048828125, -1.76251220703125, -1.645599365234375, -1.5286865234375, -1.411773681640625, -1.29486083984375, -1.177947998046875, -1.06103515625, -0.944122314453125, -0.82720947265625, -0.710296630859375, -0.5933837890625, -0.476470947265625, -0.35955810546875, -0.242645263671875, -0.125732421875, -0.008819580078125, 0.10809326171875, 0.225006103515625, 0.3419189453125, 0.458831787109375, 0.57574462890625, 0.692657470703125, 0.8095703125, 0.926483154296875, 1.04339599609375, 1.160308837890625, 1.2772216796875, 1.394134521484375, 1.51104736328125, 1.627960205078125, 1.744873046875, 1.861785888671875, 1.97869873046875, 2.095611572265625, 2.2125244140625, 2.329437255859375, 2.44635009765625, 2.563262939453125, 2.68017578125, 2.797088623046875, 2.91400146484375, 3.030914306640625, 3.1478271484375, 3.264739990234375, 3.38165283203125, 3.498565673828125, 3.615478515625, 3.732391357421875, 3.84930419921875, 3.966217041015625, 4.0831298828125, 4.200042724609375, 4.31695556640625, 4.433868408203125, 4.55078125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 6.0, 8.0, 9.0, 14.0, 19.0, 25.0, 39.0, 58.0, 89.0, 154.0, 315.0, 581.0, 1119.0, 748.0, 392.0, 169.0, 94.0, 56.0, 47.0, 33.0, 26.0, 25.0, 18.0, 6.0, 4.0, 4.0, 8.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.68359375, -2.57464599609375, -2.4656982421875, -2.35675048828125, -2.247802734375, -2.13885498046875, -2.0299072265625, -1.92095947265625, -1.81201171875, -1.70306396484375, -1.5941162109375, -1.48516845703125, -1.376220703125, -1.26727294921875, -1.1583251953125, -1.04937744140625, -0.9404296875, -0.83148193359375, -0.7225341796875, -0.61358642578125, -0.504638671875, -0.39569091796875, -0.2867431640625, -0.17779541015625, -0.06884765625, 0.04010009765625, 0.1490478515625, 0.25799560546875, 0.366943359375, 0.47589111328125, 0.5848388671875, 0.69378662109375, 0.802734375, 0.91168212890625, 1.0206298828125, 1.12957763671875, 1.238525390625, 1.34747314453125, 1.4564208984375, 1.56536865234375, 1.67431640625, 1.78326416015625, 1.8922119140625, 2.00115966796875, 2.110107421875, 2.21905517578125, 2.3280029296875, 2.43695068359375, 2.5458984375, 2.65484619140625, 2.7637939453125, 2.87274169921875, 2.981689453125, 3.09063720703125, 3.1995849609375, 3.30853271484375, 3.41748046875, 3.52642822265625, 3.6353759765625, 3.74432373046875, 3.853271484375, 3.96221923828125, 4.0711669921875, 4.18011474609375, 4.2890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 3.0, 7.0, 10.0, 14.0, 35.0, 72.0, 101.0, 144.0, 190.0, 159.0, 111.0, 65.0, 25.0, 18.0, 14.0, 7.0, 3.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-16.693740844726562, -15.918699264526367, -15.143657684326172, -14.368616104125977, -13.593574523925781, -12.818532943725586, -12.04349136352539, -11.268449783325195, -10.493408203125, -9.718366622924805, -8.94332504272461, -8.168283462524414, -7.393241882324219, -6.618200302124023, -5.84315824508667, -5.068116664886475, -4.293074607849121, -3.518033027648926, -2.7429914474487305, -1.967949628829956, -1.1929080486297607, -0.41786646842956543, 0.357175350189209, 1.1322169303894043, 1.9072585105895996, 2.682300090789795, 3.4573416709899902, 4.232383728027344, 5.007425308227539, 5.782466888427734, 6.55750846862793, 7.332550048828125, 8.10759162902832, 8.882633209228516, 9.657674789428711, 10.432716369628906, 11.207757949829102, 11.982799530029297, 12.757841110229492, 13.532882690429688, 14.307924270629883, 15.082965850830078, 15.858007431030273, 16.63304901123047, 17.408090591430664, 18.18313217163086, 18.958173751831055, 19.73321533203125, 20.508258819580078, 21.283300399780273, 22.05834197998047, 22.833383560180664, 23.60842514038086, 24.383466720581055, 25.15850830078125, 25.933549880981445, 26.70859146118164, 27.483633041381836, 28.25867462158203, 29.033716201782227, 29.808757781982422, 30.583799362182617, 31.358840942382812, 32.13388442993164, 32.9089241027832]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 3.0, 3.0, 3.0, 4.0, 3.0, 8.0, 6.0, 5.0, 12.0, 13.0, 16.0, 4.0, 20.0, 25.0, 22.0, 21.0, 31.0, 33.0, 23.0, 41.0, 44.0, 46.0, 29.0, 42.0, 32.0, 58.0, 47.0, 40.0, 33.0, 38.0, 38.0, 34.0, 23.0, 27.0, 25.0, 27.0, 22.0, 17.0, 17.0, 15.0, 12.0, 14.0, 6.0, 4.0, 2.0, 3.0, 3.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-12.627767562866211, -12.270913124084473, -11.914058685302734, -11.557204246520996, -11.200349807739258, -10.84349536895752, -10.486640930175781, -10.12978744506836, -9.772932052612305, -9.416077613830566, -9.059223175048828, -8.70236873626709, -8.345514297485352, -7.988659858703613, -7.631805896759033, -7.274951457977295, -6.918097496032715, -6.561243057250977, -6.204388618469238, -5.8475341796875, -5.490679740905762, -5.133825302124023, -4.776971340179443, -4.420116901397705, -4.063262462615967, -3.7064080238342285, -3.3495535850524902, -2.992699384689331, -2.6358449459075928, -2.2789905071258545, -1.9221363067626953, -1.565281867980957, -1.2084274291992188, -0.8515730500221252, -0.49471867084503174, -0.137864351272583, 0.21899008750915527, 0.5758445262908936, 0.9326987266540527, 1.289553165435791, 1.6464076042175293, 2.0032620429992676, 2.360116481781006, 2.716970682144165, 3.0738251209259033, 3.4306795597076416, 3.787533760070801, 4.144388198852539, 4.501242637634277, 4.858097076416016, 5.214951515197754, 5.571805953979492, 5.9286603927612305, 6.285514831542969, 6.642368793487549, 6.999223232269287, 7.356077671051025, 7.712932109832764, 8.069786071777344, 8.426640510559082, 8.78349494934082, 9.140349388122559, 9.497203826904297, 9.854058265686035, 10.210912704467773]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 5.0, 6.0, 9.0, 12.0, 12.0, 20.0, 21.0, 21.0, 49.0, 82.0, 110.0, 207.0, 311.0, 517.0, 908.0, 1468.0, 2894.0, 5469.0, 11133.0, 24019.0, 52738.0, 116123.0, 236343.0, 286601.0, 166245.0, 76529.0, 34615.0, 15637.0, 7682.0, 3813.0, 2000.0, 1167.0, 673.0, 409.0, 238.0, 139.0, 88.0, 65.0, 58.0, 25.0, 27.0, 20.0, 16.0, 2.0, 9.0, 9.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.6767578125, -1.6247406005859375, -1.572723388671875, -1.5207061767578125, -1.46868896484375, -1.4166717529296875, -1.364654541015625, -1.3126373291015625, -1.2606201171875, -1.2086029052734375, -1.156585693359375, -1.1045684814453125, -1.05255126953125, -1.0005340576171875, -0.948516845703125, -0.8964996337890625, -0.844482421875, -0.7924652099609375, -0.740447998046875, -0.6884307861328125, -0.63641357421875, -0.5843963623046875, -0.532379150390625, -0.4803619384765625, -0.4283447265625, -0.3763275146484375, -0.324310302734375, -0.2722930908203125, -0.22027587890625, -0.1682586669921875, -0.116241455078125, -0.0642242431640625, -0.01220703125, 0.0398101806640625, 0.091827392578125, 0.1438446044921875, 0.19586181640625, 0.2478790283203125, 0.299896240234375, 0.3519134521484375, 0.4039306640625, 0.4559478759765625, 0.507965087890625, 0.5599822998046875, 0.61199951171875, 0.6640167236328125, 0.716033935546875, 0.7680511474609375, 0.820068359375, 0.8720855712890625, 0.924102783203125, 0.9761199951171875, 1.02813720703125, 1.0801544189453125, 1.132171630859375, 1.1841888427734375, 1.2362060546875, 1.2882232666015625, 1.340240478515625, 1.3922576904296875, 1.44427490234375, 1.4962921142578125, 1.548309326171875, 1.6003265380859375, 1.65234375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 5.0, 1.0, 8.0, 2.0, 14.0, 11.0, 13.0, 11.0, 19.0, 18.0, 17.0, 20.0, 27.0, 29.0, 30.0, 28.0, 39.0, 37.0, 39.0, 34.0, 47.0, 39.0, 38.0, 57.0, 33.0, 51.0, 30.0, 34.0, 35.0, 36.0, 26.0, 26.0, 20.0, 21.0, 23.0, 15.0, 19.0, 7.0, 8.0, 14.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.71240234375, -0.6879043579101562, -0.6634063720703125, -0.6389083862304688, -0.614410400390625, -0.5899124145507812, -0.5654144287109375, -0.5409164428710938, -0.51641845703125, -0.49192047119140625, -0.4674224853515625, -0.44292449951171875, -0.418426513671875, -0.39392852783203125, -0.3694305419921875, -0.34493255615234375, -0.3204345703125, -0.29593658447265625, -0.2714385986328125, -0.24694061279296875, -0.222442626953125, -0.19794464111328125, -0.1734466552734375, -0.14894866943359375, -0.12445068359375, -0.09995269775390625, -0.0754547119140625, -0.05095672607421875, -0.026458740234375, -0.00196075439453125, 0.0225372314453125, 0.04703521728515625, 0.071533203125, 0.09603118896484375, 0.1205291748046875, 0.14502716064453125, 0.169525146484375, 0.19402313232421875, 0.2185211181640625, 0.24301910400390625, 0.26751708984375, 0.29201507568359375, 0.3165130615234375, 0.34101104736328125, 0.365509033203125, 0.39000701904296875, 0.4145050048828125, 0.43900299072265625, 0.4635009765625, 0.48799896240234375, 0.5124969482421875, 0.5369949340820312, 0.561492919921875, 0.5859909057617188, 0.6104888916015625, 0.6349868774414062, 0.65948486328125, 0.6839828491210938, 0.7084808349609375, 0.7329788208007812, 0.757476806640625, 0.7819747924804688, 0.8064727783203125, 0.8309707641601562, 0.85546875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 3.0, 9.0, 7.0, 16.0, 27.0, 26.0, 38.0, 53.0, 77.0, 120.0, 189.0, 290.0, 406.0, 662.0, 1152.0, 1982.0, 5218.0, 19397.0, 128252.0, 694499.0, 161507.0, 23405.0, 5797.0, 2322.0, 1125.0, 674.0, 434.0, 257.0, 204.0, 116.0, 79.0, 52.0, 57.0, 29.0, 12.0, 20.0, 7.0, 7.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.353515625, -3.24005126953125, -3.1265869140625, -3.01312255859375, -2.899658203125, -2.78619384765625, -2.6727294921875, -2.55926513671875, -2.44580078125, -2.33233642578125, -2.2188720703125, -2.10540771484375, -1.991943359375, -1.87847900390625, -1.7650146484375, -1.65155029296875, -1.5380859375, -1.42462158203125, -1.3111572265625, -1.19769287109375, -1.084228515625, -0.97076416015625, -0.8572998046875, -0.74383544921875, -0.63037109375, -0.51690673828125, -0.4034423828125, -0.28997802734375, -0.176513671875, -0.06304931640625, 0.0504150390625, 0.16387939453125, 0.27734375, 0.39080810546875, 0.5042724609375, 0.61773681640625, 0.731201171875, 0.84466552734375, 0.9581298828125, 1.07159423828125, 1.18505859375, 1.29852294921875, 1.4119873046875, 1.52545166015625, 1.638916015625, 1.75238037109375, 1.8658447265625, 1.97930908203125, 2.0927734375, 2.20623779296875, 2.3197021484375, 2.43316650390625, 2.546630859375, 2.66009521484375, 2.7735595703125, 2.88702392578125, 3.00048828125, 3.11395263671875, 3.2274169921875, 3.34088134765625, 3.454345703125, 3.56781005859375, 3.6812744140625, 3.79473876953125, 3.908203125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 7.0, 5.0, 9.0, 14.0, 14.0, 19.0, 19.0, 29.0, 34.0, 22.0, 33.0, 56.0, 39.0, 39.0, 49.0, 43.0, 50.0, 44.0, 50.0, 42.0, 56.0, 48.0, 40.0, 29.0, 32.0, 39.0, 29.0, 22.0, 17.0, 15.0, 11.0, 10.0, 7.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.96484375, -3.84490966796875, -3.7249755859375, -3.60504150390625, -3.485107421875, -3.36517333984375, -3.2452392578125, -3.12530517578125, -3.00537109375, -2.88543701171875, -2.7655029296875, -2.64556884765625, -2.525634765625, -2.40570068359375, -2.2857666015625, -2.16583251953125, -2.0458984375, -1.92596435546875, -1.8060302734375, -1.68609619140625, -1.566162109375, -1.44622802734375, -1.3262939453125, -1.20635986328125, -1.08642578125, -0.96649169921875, -0.8465576171875, -0.72662353515625, -0.606689453125, -0.48675537109375, -0.3668212890625, -0.24688720703125, -0.126953125, -0.00701904296875, 0.1129150390625, 0.23284912109375, 0.352783203125, 0.47271728515625, 0.5926513671875, 0.71258544921875, 0.83251953125, 0.95245361328125, 1.0723876953125, 1.19232177734375, 1.312255859375, 1.43218994140625, 1.5521240234375, 1.67205810546875, 1.7919921875, 1.91192626953125, 2.0318603515625, 2.15179443359375, 2.271728515625, 2.39166259765625, 2.5115966796875, 2.63153076171875, 2.75146484375, 2.87139892578125, 2.9913330078125, 3.11126708984375, 3.231201171875, 3.35113525390625, 3.4710693359375, 3.59100341796875, 3.7109375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 13.0, 10.0, 14.0, 17.0, 27.0, 35.0, 67.0, 105.0, 159.0, 231.0, 439.0, 927.0, 2297.0, 7670.0, 46329.0, 696454.0, 261447.0, 23988.0, 5026.0, 1614.0, 721.0, 345.0, 205.0, 132.0, 75.0, 41.0, 43.0, 28.0, 21.0, 15.0, 11.0, 9.0, 8.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.38671875, -1.3417510986328125, -1.296783447265625, -1.2518157958984375, -1.20684814453125, -1.1618804931640625, -1.116912841796875, -1.0719451904296875, -1.0269775390625, -0.9820098876953125, -0.937042236328125, -0.8920745849609375, -0.84710693359375, -0.8021392822265625, -0.757171630859375, -0.7122039794921875, -0.667236328125, -0.6222686767578125, -0.577301025390625, -0.5323333740234375, -0.48736572265625, -0.4423980712890625, -0.397430419921875, -0.3524627685546875, -0.3074951171875, -0.2625274658203125, -0.217559814453125, -0.1725921630859375, -0.12762451171875, -0.0826568603515625, -0.037689208984375, 0.0072784423828125, 0.05224609375, 0.0972137451171875, 0.142181396484375, 0.1871490478515625, 0.23211669921875, 0.2770843505859375, 0.322052001953125, 0.3670196533203125, 0.4119873046875, 0.4569549560546875, 0.501922607421875, 0.5468902587890625, 0.59185791015625, 0.6368255615234375, 0.681793212890625, 0.7267608642578125, 0.771728515625, 0.8166961669921875, 0.861663818359375, 0.9066314697265625, 0.95159912109375, 0.9965667724609375, 1.041534423828125, 1.0865020751953125, 1.1314697265625, 1.1764373779296875, 1.221405029296875, 1.2663726806640625, 1.31134033203125, 1.3563079833984375, 1.401275634765625, 1.4462432861328125, 1.4912109375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 2.0, 7.0, 6.0, 7.0, 17.0, 20.0, 32.0, 40.0, 41.0, 60.0, 83.0, 106.0, 117.0, 105.0, 61.0, 52.0, 49.0, 33.0, 36.0, 21.0, 17.0, 16.0, 11.0, 7.0, 9.0, 4.0, 5.0, 5.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002772808074951172, -0.0002675391733646393, -0.0002577975392341614, -0.00024805590510368347, -0.00023831427097320557, -0.00022857263684272766, -0.00021883100271224976, -0.00020908936858177185, -0.00019934773445129395, -0.00018960610032081604, -0.00017986446619033813, -0.00017012283205986023, -0.00016038119792938232, -0.00015063956379890442, -0.00014089792966842651, -0.0001311562955379486, -0.0001214146614074707, -0.0001116730272769928, -0.00010193139314651489, -9.218975901603699e-05, -8.244812488555908e-05, -7.270649075508118e-05, -6.296485662460327e-05, -5.3223222494125366e-05, -4.348158836364746e-05, -3.3739954233169556e-05, -2.399832010269165e-05, -1.4256685972213745e-05, -4.51505184173584e-06, 5.2265822887420654e-06, 1.496821641921997e-05, 2.4709850549697876e-05, 3.445148468017578e-05, 4.4193118810653687e-05, 5.393475294113159e-05, 6.36763870716095e-05, 7.34180212020874e-05, 8.315965533256531e-05, 9.290128946304321e-05, 0.00010264292359352112, 0.00011238455772399902, 0.00012212619185447693, 0.00013186782598495483, 0.00014160946011543274, 0.00015135109424591064, 0.00016109272837638855, 0.00017083436250686646, 0.00018057599663734436, 0.00019031763076782227, 0.00020005926489830017, 0.00020980089902877808, 0.00021954253315925598, 0.0002292841672897339, 0.0002390258014202118, 0.0002487674355506897, 0.0002585090696811676, 0.0002682507038116455, 0.0002779923379421234, 0.0002877339720726013, 0.0002974756062030792, 0.00030721724033355713, 0.00031695887446403503, 0.00032670050859451294, 0.00033644214272499084, 0.00034618377685546875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 7.0, 1.0, 11.0, 15.0, 11.0, 22.0, 35.0, 59.0, 101.0, 143.0, 279.0, 567.0, 1213.0, 3177.0, 11756.0, 75860.0, 794797.0, 136183.0, 17095.0, 4326.0, 1437.0, 663.0, 312.0, 161.0, 103.0, 57.0, 41.0, 45.0, 22.0, 11.0, 14.0, 9.0, 4.0, 2.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5009765625, -1.4549560546875, -1.408935546875, -1.3629150390625, -1.31689453125, -1.2708740234375, -1.224853515625, -1.1788330078125, -1.1328125, -1.0867919921875, -1.040771484375, -0.9947509765625, -0.94873046875, -0.9027099609375, -0.856689453125, -0.8106689453125, -0.7646484375, -0.7186279296875, -0.672607421875, -0.6265869140625, -0.58056640625, -0.5345458984375, -0.488525390625, -0.4425048828125, -0.396484375, -0.3504638671875, -0.304443359375, -0.2584228515625, -0.21240234375, -0.1663818359375, -0.120361328125, -0.0743408203125, -0.0283203125, 0.0177001953125, 0.063720703125, 0.1097412109375, 0.15576171875, 0.2017822265625, 0.247802734375, 0.2938232421875, 0.33984375, 0.3858642578125, 0.431884765625, 0.4779052734375, 0.52392578125, 0.5699462890625, 0.615966796875, 0.6619873046875, 0.7080078125, 0.7540283203125, 0.800048828125, 0.8460693359375, 0.89208984375, 0.9381103515625, 0.984130859375, 1.0301513671875, 1.076171875, 1.1221923828125, 1.168212890625, 1.2142333984375, 1.26025390625, 1.3062744140625, 1.352294921875, 1.3983154296875, 1.4443359375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 6.0, 11.0, 9.0, 6.0, 13.0, 19.0, 27.0, 19.0, 37.0, 48.0, 64.0, 74.0, 83.0, 85.0, 82.0, 70.0, 64.0, 69.0, 43.0, 36.0, 30.0, 22.0, 18.0, 13.0, 11.0, 5.0, 8.0, 9.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0908203125, -1.0528717041015625, -1.014923095703125, -0.9769744873046875, -0.93902587890625, -0.9010772705078125, -0.863128662109375, -0.8251800537109375, -0.7872314453125, -0.7492828369140625, -0.711334228515625, -0.6733856201171875, -0.63543701171875, -0.5974884033203125, -0.559539794921875, -0.5215911865234375, -0.483642578125, -0.4456939697265625, -0.407745361328125, -0.3697967529296875, -0.33184814453125, -0.2938995361328125, -0.255950927734375, -0.2180023193359375, -0.1800537109375, -0.1421051025390625, -0.104156494140625, -0.0662078857421875, -0.02825927734375, 0.0096893310546875, 0.047637939453125, 0.0855865478515625, 0.12353515625, 0.1614837646484375, 0.199432373046875, 0.2373809814453125, 0.27532958984375, 0.3132781982421875, 0.351226806640625, 0.3891754150390625, 0.4271240234375, 0.4650726318359375, 0.503021240234375, 0.5409698486328125, 0.57891845703125, 0.6168670654296875, 0.654815673828125, 0.6927642822265625, 0.730712890625, 0.7686614990234375, 0.806610107421875, 0.8445587158203125, 0.88250732421875, 0.9204559326171875, 0.958404541015625, 0.9963531494140625, 1.0343017578125, 1.0722503662109375, 1.110198974609375, 1.1481475830078125, 1.18609619140625, 1.2240447998046875, 1.261993408203125, 1.2999420166015625, 1.337890625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 13.0, 14.0, 20.0, 48.0, 104.0, 144.0, 289.0, 174.0, 103.0, 41.0, 22.0, 7.0, 8.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.962188720703125, -45.99844741821289, -45.034706115722656, -44.07096481323242, -43.10722351074219, -42.14348220825195, -41.17974090576172, -40.215999603271484, -39.25225830078125, -38.288516998291016, -37.32477569580078, -36.36103439331055, -35.39729309082031, -34.43355178833008, -33.469810485839844, -32.50606918334961, -31.542325973510742, -30.578584671020508, -29.614843368530273, -28.65110206604004, -27.687360763549805, -26.72361946105957, -25.759876251220703, -24.79613494873047, -23.832393646240234, -22.86865234375, -21.904911041259766, -20.94116973876953, -19.977428436279297, -19.013687133789062, -18.049945831298828, -17.086204528808594, -16.12246322631836, -15.158721923828125, -14.19498062133789, -13.231239318847656, -12.267498016357422, -11.303756713867188, -10.340014457702637, -9.376273155212402, -8.412530899047852, -7.448789596557617, -6.485048294067383, -5.52130651473999, -4.557565212249756, -3.5938239097595215, -2.630082130432129, -1.6663408279418945, -0.7025995254516602, 0.26114189624786377, 1.2248833179473877, 2.188624858856201, 3.1523661613464355, 4.11610746383667, 5.0798492431640625, 6.043590545654297, 7.007331848144531, 7.971073150634766, 8.934814453125, 9.898555755615234, 10.862297058105469, 11.826038360595703, 12.789780616760254, 13.753521919250488, 14.717263221740723]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 14.0, 7.0, 11.0, 9.0, 16.0, 11.0, 16.0, 19.0, 20.0, 35.0, 33.0, 27.0, 25.0, 30.0, 29.0, 36.0, 59.0, 61.0, 56.0, 61.0, 44.0, 44.0, 36.0, 35.0, 20.0, 26.0, 17.0, 15.0, 27.0, 24.0, 18.0, 19.0, 13.0, 8.0, 15.0, 13.0, 8.0, 7.0, 7.0, 6.0, 5.0, 3.0, 1.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-12.562311172485352, -12.178360939025879, -11.794410705566406, -11.410460472106934, -11.026510238647461, -10.642560005187988, -10.258609771728516, -9.874659538269043, -9.49070930480957, -9.106759071350098, -8.722808837890625, -8.338858604431152, -7.95490837097168, -7.570958137512207, -7.187007904052734, -6.803057670593262, -6.419106960296631, -6.035156726837158, -5.6512064933776855, -5.267256259918213, -4.88330602645874, -4.499355792999268, -4.115405082702637, -3.731455087661743, -3.3475048542022705, -2.963554620742798, -2.579604387283325, -2.1956539154052734, -1.8117038011550903, -1.4277535676956177, -1.0438032150268555, -0.6598529815673828, -0.27590274810791016, 0.10804751515388489, 0.49199777841567993, 0.8759480714797974, 1.25989830493927, 1.6438485383987427, 2.027798891067505, 2.4117491245269775, 2.79569935798645, 3.179649591445923, 3.5635998249053955, 3.9475502967834473, 4.33150053024292, 4.715450763702393, 5.099400997161865, 5.483351230621338, 5.8673014640808105, 6.251251697540283, 6.635201930999756, 7.0191521644592285, 7.403102397918701, 7.787052631378174, 8.171003341674805, 8.554953575134277, 8.93890380859375, 9.322854042053223, 9.706804275512695, 10.090754508972168, 10.47470474243164, 10.858654975891113, 11.242605209350586, 11.626555442810059, 12.010505676269531]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 6.0, 15.0, 14.0, 28.0, 41.0, 81.0, 153.0, 329.0, 851.0, 2652.0, 10321.0, 74766.0, 2342433.0, 1694089.0, 56230.0, 8657.0, 2180.0, 752.0, 295.0, 172.0, 83.0, 39.0, 32.0, 17.0, 11.0, 9.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.37109375, -2.29913330078125, -2.2271728515625, -2.15521240234375, -2.083251953125, -2.01129150390625, -1.9393310546875, -1.86737060546875, -1.79541015625, -1.72344970703125, -1.6514892578125, -1.57952880859375, -1.507568359375, -1.43560791015625, -1.3636474609375, -1.29168701171875, -1.2197265625, -1.14776611328125, -1.0758056640625, -1.00384521484375, -0.931884765625, -0.85992431640625, -0.7879638671875, -0.71600341796875, -0.64404296875, -0.57208251953125, -0.5001220703125, -0.42816162109375, -0.356201171875, -0.28424072265625, -0.2122802734375, -0.14031982421875, -0.068359375, 0.00360107421875, 0.0755615234375, 0.14752197265625, 0.219482421875, 0.29144287109375, 0.3634033203125, 0.43536376953125, 0.50732421875, 0.57928466796875, 0.6512451171875, 0.72320556640625, 0.795166015625, 0.86712646484375, 0.9390869140625, 1.01104736328125, 1.0830078125, 1.15496826171875, 1.2269287109375, 1.29888916015625, 1.370849609375, 1.44281005859375, 1.5147705078125, 1.58673095703125, 1.65869140625, 1.73065185546875, 1.8026123046875, 1.87457275390625, 1.946533203125, 2.01849365234375, 2.0904541015625, 2.16241455078125, 2.234375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 7.0, 4.0, 6.0, 11.0, 7.0, 17.0, 22.0, 12.0, 22.0, 24.0, 23.0, 34.0, 24.0, 22.0, 44.0, 37.0, 43.0, 42.0, 50.0, 47.0, 45.0, 54.0, 46.0, 47.0, 44.0, 43.0, 34.0, 30.0, 26.0, 24.0, 23.0, 14.0, 18.0, 13.0, 3.0, 12.0, 8.0, 4.0, 5.0, 3.0, 0.0, 4.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65966796875, -0.6340484619140625, -0.608428955078125, -0.5828094482421875, -0.55718994140625, -0.5315704345703125, -0.505950927734375, -0.4803314208984375, -0.4547119140625, -0.4290924072265625, -0.403472900390625, -0.3778533935546875, -0.35223388671875, -0.3266143798828125, -0.300994873046875, -0.2753753662109375, -0.249755859375, -0.2241363525390625, -0.198516845703125, -0.1728973388671875, -0.14727783203125, -0.1216583251953125, -0.096038818359375, -0.0704193115234375, -0.0447998046875, -0.0191802978515625, 0.006439208984375, 0.0320587158203125, 0.05767822265625, 0.0832977294921875, 0.108917236328125, 0.1345367431640625, 0.16015625, 0.1857757568359375, 0.211395263671875, 0.2370147705078125, 0.26263427734375, 0.2882537841796875, 0.313873291015625, 0.3394927978515625, 0.3651123046875, 0.3907318115234375, 0.416351318359375, 0.4419708251953125, 0.46759033203125, 0.4932098388671875, 0.518829345703125, 0.5444488525390625, 0.570068359375, 0.5956878662109375, 0.621307373046875, 0.6469268798828125, 0.67254638671875, 0.6981658935546875, 0.723785400390625, 0.7494049072265625, 0.7750244140625, 0.8006439208984375, 0.826263427734375, 0.8518829345703125, 0.87750244140625, 0.9031219482421875, 0.928741455078125, 0.9543609619140625, 0.97998046875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 8.0, 6.0, 7.0, 8.0, 12.0, 15.0, 17.0, 37.0, 41.0, 83.0, 113.0, 159.0, 264.0, 481.0, 866.0, 1867.0, 4564.0, 13227.0, 47800.0, 304618.0, 3287082.0, 446566.0, 60656.0, 15962.0, 5310.0, 2187.0, 978.0, 483.0, 280.0, 163.0, 106.0, 76.0, 58.0, 42.0, 43.0, 22.0, 27.0, 16.0, 13.0, 7.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8056640625, -1.7465972900390625, -1.687530517578125, -1.6284637451171875, -1.56939697265625, -1.5103302001953125, -1.451263427734375, -1.3921966552734375, -1.3331298828125, -1.2740631103515625, -1.214996337890625, -1.1559295654296875, -1.09686279296875, -1.0377960205078125, -0.978729248046875, -0.9196624755859375, -0.860595703125, -0.8015289306640625, -0.742462158203125, -0.6833953857421875, -0.62432861328125, -0.5652618408203125, -0.506195068359375, -0.4471282958984375, -0.3880615234375, -0.3289947509765625, -0.269927978515625, -0.2108612060546875, -0.15179443359375, -0.0927276611328125, -0.033660888671875, 0.0254058837890625, 0.08447265625, 0.1435394287109375, 0.202606201171875, 0.2616729736328125, 0.32073974609375, 0.3798065185546875, 0.438873291015625, 0.4979400634765625, 0.5570068359375, 0.6160736083984375, 0.675140380859375, 0.7342071533203125, 0.79327392578125, 0.8523406982421875, 0.911407470703125, 0.9704742431640625, 1.029541015625, 1.0886077880859375, 1.147674560546875, 1.2067413330078125, 1.26580810546875, 1.3248748779296875, 1.383941650390625, 1.4430084228515625, 1.5020751953125, 1.5611419677734375, 1.620208740234375, 1.6792755126953125, 1.73834228515625, 1.7974090576171875, 1.856475830078125, 1.9155426025390625, 1.974609375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 9.0, 6.0, 7.0, 8.0, 16.0, 13.0, 9.0, 21.0, 33.0, 29.0, 48.0, 77.0, 76.0, 140.0, 225.0, 357.0, 570.0, 686.0, 568.0, 371.0, 249.0, 146.0, 102.0, 78.0, 40.0, 31.0, 37.0, 23.0, 23.0, 14.0, 14.0, 10.0, 6.0, 5.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-1.9130859375, -1.8578033447265625, -1.802520751953125, -1.7472381591796875, -1.69195556640625, -1.6366729736328125, -1.581390380859375, -1.5261077880859375, -1.4708251953125, -1.4155426025390625, -1.360260009765625, -1.3049774169921875, -1.24969482421875, -1.1944122314453125, -1.139129638671875, -1.0838470458984375, -1.028564453125, -0.9732818603515625, -0.917999267578125, -0.8627166748046875, -0.80743408203125, -0.7521514892578125, -0.696868896484375, -0.6415863037109375, -0.5863037109375, -0.5310211181640625, -0.475738525390625, -0.4204559326171875, -0.36517333984375, -0.3098907470703125, -0.254608154296875, -0.1993255615234375, -0.14404296875, -0.0887603759765625, -0.033477783203125, 0.0218048095703125, 0.07708740234375, 0.1323699951171875, 0.187652587890625, 0.2429351806640625, 0.2982177734375, 0.3535003662109375, 0.408782958984375, 0.4640655517578125, 0.51934814453125, 0.5746307373046875, 0.629913330078125, 0.6851959228515625, 0.740478515625, 0.7957611083984375, 0.851043701171875, 0.9063262939453125, 0.96160888671875, 1.0168914794921875, 1.072174072265625, 1.1274566650390625, 1.1827392578125, 1.2380218505859375, 1.293304443359375, 1.3485870361328125, 1.40386962890625, 1.4591522216796875, 1.514434814453125, 1.5697174072265625, 1.625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 12.0, 40.0, 95.0, 236.0, 318.0, 186.0, 64.0, 25.0, 7.0, 10.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.70520782470703, -16.62074089050293, -15.536274909973145, -14.45180892944336, -13.367341995239258, -12.282876014709473, -11.198410034179688, -10.113943099975586, -9.0294771194458, -7.945010662078857, -6.860544204711914, -5.776078224182129, -4.6916117668151855, -3.607145309448242, -2.522679328918457, -1.4382128715515137, -0.3537464141845703, 0.7307199239730835, 1.8151862621307373, 2.8996524810791016, 3.984118938446045, 5.068585395812988, 6.153051376342773, 7.237517833709717, 8.32198429107666, 9.406450271606445, 10.490917205810547, 11.575383186340332, 12.659849166870117, 13.744316101074219, 14.828782081604004, 15.913248062133789, 16.99771499633789, 18.082181930541992, 19.16664695739746, 20.251113891601562, 21.335580825805664, 22.420047760009766, 23.504512786865234, 24.588979721069336, 25.673446655273438, 26.75791358947754, 27.842378616333008, 28.92684555053711, 30.01131248474121, 31.095779418945312, 32.18024444580078, 33.26470947265625, 34.34917449951172, 35.43363952636719, 36.51810836791992, 37.60257339477539, 38.68703842163086, 39.771507263183594, 40.85597229003906, 41.94043731689453, 43.024906158447266, 44.109371185302734, 45.19384002685547, 46.27830505371094, 47.362770080566406, 48.44723892211914, 49.53170394897461, 50.61616897583008, 51.70063781738281]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 3.0, 12.0, 12.0, 9.0, 5.0, 11.0, 18.0, 20.0, 20.0, 28.0, 32.0, 33.0, 45.0, 40.0, 44.0, 37.0, 51.0, 65.0, 63.0, 47.0, 50.0, 46.0, 50.0, 36.0, 40.0, 27.0, 37.0, 24.0, 15.0, 12.0, 12.0, 13.0, 15.0, 14.0, 8.0, 4.0, 8.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.922636032104492, -11.611213684082031, -11.299790382385254, -10.988368034362793, -10.676944732666016, -10.365522384643555, -10.054099082946777, -9.742676734924316, -9.431253433227539, -9.119831085205078, -8.8084077835083, -8.49698543548584, -8.185562133789062, -7.874139785766602, -7.562716960906982, -7.251294136047363, -6.939871788024902, -6.628448963165283, -6.317026138305664, -6.005603313446045, -5.694180488586426, -5.382758140563965, -5.071335315704346, -4.759912490844727, -4.448489665985107, -4.137066841125488, -3.825644016265869, -3.514221429824829, -3.20279860496521, -2.891375780105591, -2.579953193664551, -2.2685303688049316, -1.9571075439453125, -1.6456847190856934, -1.3342620134353638, -1.0228393077850342, -0.711416482925415, -0.3999936580657959, -0.08857095241546631, 0.22285175323486328, 0.5342745780944824, 0.8456973433494568, 1.1571201086044312, 1.4685428142547607, 1.7799656391143799, 2.091388463973999, 2.402811050415039, 2.714233875274658, 3.0256567001342773, 3.3370795249938965, 3.6485023498535156, 3.9599249362945557, 4.271347999572754, 4.582770347595215, 4.894193172454834, 5.205615997314453, 5.517038822174072, 5.828461647033691, 6.1398844718933105, 6.45130729675293, 6.762729644775391, 7.074152946472168, 7.385575294494629, 7.696998119354248, 8.008420944213867]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 6.0, 6.0, 8.0, 12.0, 30.0, 26.0, 46.0, 81.0, 150.0, 190.0, 330.0, 497.0, 997.0, 1807.0, 3472.0, 7143.0, 15250.0, 34097.0, 80273.0, 192433.0, 333833.0, 216301.0, 90162.0, 38189.0, 17015.0, 7787.0, 3809.0, 1974.0, 1061.0, 599.0, 356.0, 203.0, 148.0, 85.0, 55.0, 28.0, 35.0, 23.0, 14.0, 9.0, 2.0, 2.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.400390625, -1.3495941162109375, -1.298797607421875, -1.2480010986328125, -1.19720458984375, -1.1464080810546875, -1.095611572265625, -1.0448150634765625, -0.9940185546875, -0.9432220458984375, -0.892425537109375, -0.8416290283203125, -0.79083251953125, -0.7400360107421875, -0.689239501953125, -0.6384429931640625, -0.587646484375, -0.5368499755859375, -0.486053466796875, -0.4352569580078125, -0.38446044921875, -0.3336639404296875, -0.282867431640625, -0.2320709228515625, -0.1812744140625, -0.1304779052734375, -0.079681396484375, -0.0288848876953125, 0.02191162109375, 0.0727081298828125, 0.123504638671875, 0.1743011474609375, 0.22509765625, 0.2758941650390625, 0.326690673828125, 0.3774871826171875, 0.42828369140625, 0.4790802001953125, 0.529876708984375, 0.5806732177734375, 0.6314697265625, 0.6822662353515625, 0.733062744140625, 0.7838592529296875, 0.83465576171875, 0.8854522705078125, 0.936248779296875, 0.9870452880859375, 1.037841796875, 1.0886383056640625, 1.139434814453125, 1.1902313232421875, 1.24102783203125, 1.2918243408203125, 1.342620849609375, 1.3934173583984375, 1.4442138671875, 1.4950103759765625, 1.545806884765625, 1.5966033935546875, 1.64739990234375, 1.6981964111328125, 1.748992919921875, 1.7997894287109375, 1.8505859375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 7.0, 0.0, 7.0, 5.0, 6.0, 13.0, 8.0, 14.0, 12.0, 10.0, 21.0, 18.0, 21.0, 22.0, 27.0, 25.0, 27.0, 36.0, 36.0, 43.0, 36.0, 26.0, 43.0, 35.0, 38.0, 46.0, 41.0, 56.0, 33.0, 36.0, 27.0, 22.0, 22.0, 28.0, 27.0, 31.0, 15.0, 17.0, 11.0, 8.0, 10.0, 11.0, 3.0, 4.0, 5.0, 4.0, 2.0, 7.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.6923828125, -0.6698760986328125, -0.647369384765625, -0.6248626708984375, -0.60235595703125, -0.5798492431640625, -0.557342529296875, -0.5348358154296875, -0.5123291015625, -0.4898223876953125, -0.467315673828125, -0.4448089599609375, -0.42230224609375, -0.3997955322265625, -0.377288818359375, -0.3547821044921875, -0.332275390625, -0.3097686767578125, -0.287261962890625, -0.2647552490234375, -0.24224853515625, -0.2197418212890625, -0.197235107421875, -0.1747283935546875, -0.1522216796875, -0.1297149658203125, -0.107208251953125, -0.0847015380859375, -0.06219482421875, -0.0396881103515625, -0.017181396484375, 0.0053253173828125, 0.02783203125, 0.0503387451171875, 0.072845458984375, 0.0953521728515625, 0.11785888671875, 0.1403656005859375, 0.162872314453125, 0.1853790283203125, 0.2078857421875, 0.2303924560546875, 0.252899169921875, 0.2754058837890625, 0.29791259765625, 0.3204193115234375, 0.342926025390625, 0.3654327392578125, 0.387939453125, 0.4104461669921875, 0.432952880859375, 0.4554595947265625, 0.47796630859375, 0.5004730224609375, 0.522979736328125, 0.5454864501953125, 0.5679931640625, 0.5904998779296875, 0.613006591796875, 0.6355133056640625, 0.65802001953125, 0.6805267333984375, 0.703033447265625, 0.7255401611328125, 0.748046875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 4.0, 6.0, 11.0, 22.0, 24.0, 37.0, 58.0, 79.0, 108.0, 151.0, 251.0, 412.0, 661.0, 1196.0, 2426.0, 6943.0, 32041.0, 217883.0, 668347.0, 93325.0, 15976.0, 4368.0, 1755.0, 928.0, 529.0, 331.0, 223.0, 134.0, 94.0, 86.0, 44.0, 31.0, 20.0, 10.0, 9.0, 12.0, 10.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.265625, -3.157806396484375, -3.04998779296875, -2.942169189453125, -2.8343505859375, -2.726531982421875, -2.61871337890625, -2.510894775390625, -2.403076171875, -2.295257568359375, -2.18743896484375, -2.079620361328125, -1.9718017578125, -1.863983154296875, -1.75616455078125, -1.648345947265625, -1.54052734375, -1.432708740234375, -1.32489013671875, -1.217071533203125, -1.1092529296875, -1.001434326171875, -0.89361572265625, -0.785797119140625, -0.677978515625, -0.570159912109375, -0.46234130859375, -0.354522705078125, -0.2467041015625, -0.138885498046875, -0.03106689453125, 0.076751708984375, 0.1845703125, 0.292388916015625, 0.40020751953125, 0.508026123046875, 0.6158447265625, 0.723663330078125, 0.83148193359375, 0.939300537109375, 1.047119140625, 1.154937744140625, 1.26275634765625, 1.370574951171875, 1.4783935546875, 1.586212158203125, 1.69403076171875, 1.801849365234375, 1.90966796875, 2.017486572265625, 2.12530517578125, 2.233123779296875, 2.3409423828125, 2.448760986328125, 2.55657958984375, 2.664398193359375, 2.772216796875, 2.880035400390625, 2.98785400390625, 3.095672607421875, 3.2034912109375, 3.311309814453125, 3.41912841796875, 3.526947021484375, 3.634765625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 9.0, 6.0, 17.0, 12.0, 14.0, 24.0, 30.0, 36.0, 34.0, 41.0, 42.0, 57.0, 60.0, 55.0, 69.0, 56.0, 57.0, 54.0, 40.0, 47.0, 44.0, 34.0, 33.0, 23.0, 24.0, 25.0, 18.0, 9.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.45703125, -4.3321533203125, -4.207275390625, -4.0823974609375, -3.95751953125, -3.8326416015625, -3.707763671875, -3.5828857421875, -3.4580078125, -3.3331298828125, -3.208251953125, -3.0833740234375, -2.95849609375, -2.8336181640625, -2.708740234375, -2.5838623046875, -2.458984375, -2.3341064453125, -2.209228515625, -2.0843505859375, -1.95947265625, -1.8345947265625, -1.709716796875, -1.5848388671875, -1.4599609375, -1.3350830078125, -1.210205078125, -1.0853271484375, -0.96044921875, -0.8355712890625, -0.710693359375, -0.5858154296875, -0.4609375, -0.3360595703125, -0.211181640625, -0.0863037109375, 0.03857421875, 0.1634521484375, 0.288330078125, 0.4132080078125, 0.5380859375, 0.6629638671875, 0.787841796875, 0.9127197265625, 1.03759765625, 1.1624755859375, 1.287353515625, 1.4122314453125, 1.537109375, 1.6619873046875, 1.786865234375, 1.9117431640625, 2.03662109375, 2.1614990234375, 2.286376953125, 2.4112548828125, 2.5361328125, 2.6610107421875, 2.785888671875, 2.9107666015625, 3.03564453125, 3.1605224609375, 3.285400390625, 3.4102783203125, 3.53515625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 7.0, 10.0, 8.0, 18.0, 16.0, 26.0, 52.0, 74.0, 108.0, 197.0, 399.0, 812.0, 2015.0, 6748.0, 36921.0, 304424.0, 619747.0, 62173.0, 10102.0, 2632.0, 1036.0, 413.0, 255.0, 129.0, 70.0, 44.0, 40.0, 26.0, 11.0, 17.0, 3.0, 6.0, 4.0, 5.0, 0.0, 4.0, 2.0, 1.0, 2.0], "bins": [-1.2177734375, -1.1881637573242188, -1.1585540771484375, -1.1289443969726562, -1.099334716796875, -1.0697250366210938, -1.0401153564453125, -1.0105056762695312, -0.98089599609375, -0.9512863159179688, -0.9216766357421875, -0.8920669555664062, -0.862457275390625, -0.8328475952148438, -0.8032379150390625, -0.7736282348632812, -0.7440185546875, -0.7144088745117188, -0.6847991943359375, -0.6551895141601562, -0.625579833984375, -0.5959701538085938, -0.5663604736328125, -0.5367507934570312, -0.50714111328125, -0.47753143310546875, -0.4479217529296875, -0.41831207275390625, -0.388702392578125, -0.35909271240234375, -0.3294830322265625, -0.29987335205078125, -0.270263671875, -0.24065399169921875, -0.2110443115234375, -0.18143463134765625, -0.151824951171875, -0.12221527099609375, -0.0926055908203125, -0.06299591064453125, -0.03338623046875, -0.00377655029296875, 0.0258331298828125, 0.05544281005859375, 0.085052490234375, 0.11466217041015625, 0.1442718505859375, 0.17388153076171875, 0.2034912109375, 0.23310089111328125, 0.2627105712890625, 0.29232025146484375, 0.321929931640625, 0.35153961181640625, 0.3811492919921875, 0.41075897216796875, 0.44036865234375, 0.46997833251953125, 0.4995880126953125, 0.5291976928710938, 0.558807373046875, 0.5884170532226562, 0.6180267333984375, 0.6476364135742188, 0.67724609375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 4.0, 7.0, 4.0, 6.0, 9.0, 11.0, 9.0, 25.0, 40.0, 46.0, 61.0, 79.0, 89.0, 120.0, 111.0, 109.0, 71.0, 51.0, 35.0, 27.0, 19.0, 13.0, 14.0, 14.0, 7.0, 5.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003390312194824219, -0.00033006444573402405, -0.0003210976719856262, -0.0003121308982372284, -0.00030316412448883057, -0.00029419735074043274, -0.0002852305769920349, -0.0002762638032436371, -0.00026729702949523926, -0.00025833025574684143, -0.0002493634819984436, -0.00024039670825004578, -0.00023142993450164795, -0.00022246316075325012, -0.0002134963870048523, -0.00020452961325645447, -0.00019556283950805664, -0.0001865960657596588, -0.00017762929201126099, -0.00016866251826286316, -0.00015969574451446533, -0.0001507289707660675, -0.00014176219701766968, -0.00013279542326927185, -0.00012382864952087402, -0.0001148618757724762, -0.00010589510202407837, -9.692832827568054e-05, -8.796155452728271e-05, -7.899478077888489e-05, -7.002800703048706e-05, -6.106123328208923e-05, -5.2094459533691406e-05, -4.312768578529358e-05, -3.416091203689575e-05, -2.5194138288497925e-05, -1.6227364540100098e-05, -7.2605907917022705e-06, 1.7061829566955566e-06, 1.0672956705093384e-05, 1.963973045349121e-05, 2.8606504201889038e-05, 3.7573277950286865e-05, 4.654005169868469e-05, 5.550682544708252e-05, 6.447359919548035e-05, 7.344037294387817e-05, 8.2407146692276e-05, 9.137392044067383e-05, 0.00010034069418907166, 0.00010930746793746948, 0.00011827424168586731, 0.00012724101543426514, 0.00013620778918266296, 0.0001451745629310608, 0.00015414133667945862, 0.00016310811042785645, 0.00017207488417625427, 0.0001810416579246521, 0.00019000843167304993, 0.00019897520542144775, 0.00020794197916984558, 0.0002169087529182434, 0.00022587552666664124, 0.00023484230041503906]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 10.0, 9.0, 13.0, 31.0, 34.0, 41.0, 60.0, 100.0, 128.0, 198.0, 326.0, 556.0, 1105.0, 2069.0, 5036.0, 15565.0, 75298.0, 547263.0, 322525.0, 57049.0, 12753.0, 4214.0, 1897.0, 930.0, 489.0, 311.0, 170.0, 103.0, 95.0, 55.0, 30.0, 21.0, 9.0, 10.0, 15.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.7587890625, -0.735015869140625, -0.71124267578125, -0.687469482421875, -0.6636962890625, -0.639923095703125, -0.61614990234375, -0.592376708984375, -0.568603515625, -0.544830322265625, -0.52105712890625, -0.497283935546875, -0.4735107421875, -0.449737548828125, -0.42596435546875, -0.402191162109375, -0.37841796875, -0.354644775390625, -0.33087158203125, -0.307098388671875, -0.2833251953125, -0.259552001953125, -0.23577880859375, -0.212005615234375, -0.188232421875, -0.164459228515625, -0.14068603515625, -0.116912841796875, -0.0931396484375, -0.069366455078125, -0.04559326171875, -0.021820068359375, 0.001953125, 0.025726318359375, 0.04949951171875, 0.073272705078125, 0.0970458984375, 0.120819091796875, 0.14459228515625, 0.168365478515625, 0.192138671875, 0.215911865234375, 0.23968505859375, 0.263458251953125, 0.2872314453125, 0.311004638671875, 0.33477783203125, 0.358551025390625, 0.38232421875, 0.406097412109375, 0.42987060546875, 0.453643798828125, 0.4774169921875, 0.501190185546875, 0.52496337890625, 0.548736572265625, 0.572509765625, 0.596282958984375, 0.62005615234375, 0.643829345703125, 0.6676025390625, 0.691375732421875, 0.71514892578125, 0.738922119140625, 0.7626953125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 8.0, 6.0, 10.0, 7.0, 14.0, 15.0, 19.0, 20.0, 29.0, 30.0, 27.0, 39.0, 46.0, 44.0, 45.0, 51.0, 60.0, 63.0, 71.0, 59.0, 51.0, 62.0, 37.0, 27.0, 28.0, 17.0, 18.0, 17.0, 20.0, 15.0, 18.0, 6.0, 6.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61767578125, -0.5965042114257812, -0.5753326416015625, -0.5541610717773438, -0.532989501953125, -0.5118179321289062, -0.4906463623046875, -0.46947479248046875, -0.44830322265625, -0.42713165283203125, -0.4059600830078125, -0.38478851318359375, -0.363616943359375, -0.34244537353515625, -0.3212738037109375, -0.30010223388671875, -0.2789306640625, -0.25775909423828125, -0.2365875244140625, -0.21541595458984375, -0.194244384765625, -0.17307281494140625, -0.1519012451171875, -0.13072967529296875, -0.10955810546875, -0.08838653564453125, -0.0672149658203125, -0.04604339599609375, -0.024871826171875, -0.00370025634765625, 0.0174713134765625, 0.03864288330078125, 0.059814453125, 0.08098602294921875, 0.1021575927734375, 0.12332916259765625, 0.144500732421875, 0.16567230224609375, 0.1868438720703125, 0.20801544189453125, 0.22918701171875, 0.25035858154296875, 0.2715301513671875, 0.29270172119140625, 0.313873291015625, 0.33504486083984375, 0.3562164306640625, 0.37738800048828125, 0.3985595703125, 0.41973114013671875, 0.4409027099609375, 0.46207427978515625, 0.483245849609375, 0.5044174194335938, 0.5255889892578125, 0.5467605590820312, 0.56793212890625, 0.5891036987304688, 0.6102752685546875, 0.6314468383789062, 0.652618408203125, 0.6737899780273438, 0.6949615478515625, 0.7161331176757812, 0.7373046875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 11.0, 18.0, 24.0, 58.0, 106.0, 185.0, 282.0, 162.0, 79.0, 38.0, 13.0, 7.0, 9.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-42.03028869628906, -41.14311218261719, -40.25593948364258, -39.36876678466797, -38.481590270996094, -37.59441375732422, -36.70724105834961, -35.820068359375, -34.932891845703125, -34.04571533203125, -33.15854263305664, -32.27136993408203, -31.384193420410156, -30.497018814086914, -29.609844207763672, -28.72266960144043, -27.835494995117188, -26.948320388793945, -26.061145782470703, -25.17397117614746, -24.28679656982422, -23.399621963500977, -22.512447357177734, -21.625272750854492, -20.73809814453125, -19.850923538208008, -18.963748931884766, -18.076574325561523, -17.18939971923828, -16.30222511291504, -15.415050506591797, -14.527875900268555, -13.64069938659668, -12.753524780273438, -11.866350173950195, -10.979175567626953, -10.092000961303711, -9.204826354980469, -8.317651748657227, -7.430477142333984, -6.543302536010742, -5.6561279296875, -4.768953323364258, -3.8817787170410156, -2.9946041107177734, -2.1074295043945312, -1.220254898071289, -0.3330802917480469, 0.5540943145751953, 1.4412689208984375, 2.3284435272216797, 3.215618133544922, 4.102792739868164, 4.989967346191406, 5.877141952514648, 6.764316558837891, 7.651491165161133, 8.538665771484375, 9.425840377807617, 10.31301498413086, 11.200189590454102, 12.087364196777344, 12.974538803100586, 13.861713409423828, 14.74888801574707]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 7.0, 5.0, 3.0, 9.0, 7.0, 12.0, 13.0, 12.0, 13.0, 23.0, 19.0, 20.0, 28.0, 27.0, 23.0, 29.0, 32.0, 47.0, 47.0, 62.0, 61.0, 66.0, 46.0, 45.0, 34.0, 39.0, 38.0, 25.0, 35.0, 15.0, 26.0, 21.0, 13.0, 12.0, 15.0, 10.0, 12.0, 7.0, 11.0, 4.0, 4.0, 3.0, 5.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.115571975708008, -11.708925247192383, -11.302278518676758, -10.895631790161133, -10.488985061645508, -10.082338333129883, -9.675691604614258, -9.269044876098633, -8.862398147583008, -8.455751419067383, -8.049104690551758, -7.642457962036133, -7.235811233520508, -6.829164505004883, -6.422517776489258, -6.015871047973633, -5.609224319458008, -5.202577590942383, -4.795930862426758, -4.389284133911133, -3.982637405395508, -3.575990676879883, -3.169343948364258, -2.762697219848633, -2.356050491333008, -1.9494037628173828, -1.5427570343017578, -1.1361103057861328, -0.7294635772705078, -0.3228168487548828, 0.08382987976074219, 0.4904766082763672, 0.8971233367919922, 1.3037700653076172, 1.7104167938232422, 2.117063522338867, 2.523710250854492, 2.930356979370117, 3.337003707885742, 3.743650436401367, 4.150297164916992, 4.556943893432617, 4.963590621948242, 5.370237350463867, 5.776884078979492, 6.183530807495117, 6.590177536010742, 6.996824264526367, 7.403470993041992, 7.810117721557617, 8.216764450073242, 8.623411178588867, 9.030057907104492, 9.436704635620117, 9.843351364135742, 10.249998092651367, 10.656644821166992, 11.063291549682617, 11.469938278198242, 11.876585006713867, 12.283231735229492, 12.689878463745117, 13.096525192260742, 13.503171920776367, 13.909818649291992]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 9.0, 9.0, 24.0, 21.0, 42.0, 66.0, 110.0, 205.0, 351.0, 832.0, 2163.0, 7041.0, 34913.0, 492003.0, 3325531.0, 295979.0, 25935.0, 5634.0, 1807.0, 753.0, 360.0, 173.0, 105.0, 69.0, 49.0, 27.0, 22.0, 13.0, 12.0, 3.0, 5.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.880859375, -1.822845458984375, -1.76483154296875, -1.706817626953125, -1.6488037109375, -1.590789794921875, -1.53277587890625, -1.474761962890625, -1.416748046875, -1.358734130859375, -1.30072021484375, -1.242706298828125, -1.1846923828125, -1.126678466796875, -1.06866455078125, -1.010650634765625, -0.95263671875, -0.894622802734375, -0.83660888671875, -0.778594970703125, -0.7205810546875, -0.662567138671875, -0.60455322265625, -0.546539306640625, -0.488525390625, -0.430511474609375, -0.37249755859375, -0.314483642578125, -0.2564697265625, -0.198455810546875, -0.14044189453125, -0.082427978515625, -0.0244140625, 0.033599853515625, 0.09161376953125, 0.149627685546875, 0.2076416015625, 0.265655517578125, 0.32366943359375, 0.381683349609375, 0.439697265625, 0.497711181640625, 0.55572509765625, 0.613739013671875, 0.6717529296875, 0.729766845703125, 0.78778076171875, 0.845794677734375, 0.90380859375, 0.961822509765625, 1.01983642578125, 1.077850341796875, 1.1358642578125, 1.193878173828125, 1.25189208984375, 1.309906005859375, 1.367919921875, 1.425933837890625, 1.48394775390625, 1.541961669921875, 1.5999755859375, 1.657989501953125, 1.71600341796875, 1.774017333984375, 1.83203125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 13.0, 11.0, 11.0, 12.0, 18.0, 27.0, 20.0, 26.0, 31.0, 27.0, 27.0, 28.0, 39.0, 49.0, 40.0, 41.0, 50.0, 59.0, 45.0, 47.0, 38.0, 30.0, 42.0, 53.0, 28.0, 34.0, 24.0, 30.0, 18.0, 19.0, 10.0, 11.0, 10.0, 8.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.77099609375, -0.7461166381835938, -0.7212371826171875, -0.6963577270507812, -0.671478271484375, -0.6465988159179688, -0.6217193603515625, -0.5968399047851562, -0.57196044921875, -0.5470809936523438, -0.5222015380859375, -0.49732208251953125, -0.472442626953125, -0.44756317138671875, -0.4226837158203125, -0.39780426025390625, -0.3729248046875, -0.34804534912109375, -0.3231658935546875, -0.29828643798828125, -0.273406982421875, -0.24852752685546875, -0.2236480712890625, -0.19876861572265625, -0.17388916015625, -0.14900970458984375, -0.1241302490234375, -0.09925079345703125, -0.074371337890625, -0.04949188232421875, -0.0246124267578125, 0.00026702880859375, 0.025146484375, 0.05002593994140625, 0.0749053955078125, 0.09978485107421875, 0.124664306640625, 0.14954376220703125, 0.1744232177734375, 0.19930267333984375, 0.22418212890625, 0.24906158447265625, 0.2739410400390625, 0.29882049560546875, 0.323699951171875, 0.34857940673828125, 0.3734588623046875, 0.39833831787109375, 0.4232177734375, 0.44809722900390625, 0.4729766845703125, 0.49785614013671875, 0.522735595703125, 0.5476150512695312, 0.5724945068359375, 0.5973739624023438, 0.62225341796875, 0.6471328735351562, 0.6720123291015625, 0.6968917846679688, 0.721771240234375, 0.7466506958007812, 0.7715301513671875, 0.7964096069335938, 0.8212890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 14.0, 8.0, 12.0, 24.0, 30.0, 58.0, 95.0, 105.0, 237.0, 553.0, 1477.0, 5696.0, 36087.0, 884042.0, 3180725.0, 71869.0, 9300.0, 2213.0, 824.0, 352.0, 206.0, 118.0, 84.0, 46.0, 27.0, 22.0, 22.0, 5.0, 10.0, 7.0, 3.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.13671875, -3.0474853515625, -2.958251953125, -2.8690185546875, -2.77978515625, -2.6905517578125, -2.601318359375, -2.5120849609375, -2.4228515625, -2.3336181640625, -2.244384765625, -2.1551513671875, -2.06591796875, -1.9766845703125, -1.887451171875, -1.7982177734375, -1.708984375, -1.6197509765625, -1.530517578125, -1.4412841796875, -1.35205078125, -1.2628173828125, -1.173583984375, -1.0843505859375, -0.9951171875, -0.9058837890625, -0.816650390625, -0.7274169921875, -0.63818359375, -0.5489501953125, -0.459716796875, -0.3704833984375, -0.28125, -0.1920166015625, -0.102783203125, -0.0135498046875, 0.07568359375, 0.1649169921875, 0.254150390625, 0.3433837890625, 0.4326171875, 0.5218505859375, 0.611083984375, 0.7003173828125, 0.78955078125, 0.8787841796875, 0.968017578125, 1.0572509765625, 1.146484375, 1.2357177734375, 1.324951171875, 1.4141845703125, 1.50341796875, 1.5926513671875, 1.681884765625, 1.7711181640625, 1.8603515625, 1.9495849609375, 2.038818359375, 2.1280517578125, 2.21728515625, 2.3065185546875, 2.395751953125, 2.4849853515625, 2.57421875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 11.0, 10.0, 11.0, 21.0, 26.0, 22.0, 34.0, 45.0, 98.0, 128.0, 185.0, 377.0, 627.0, 751.0, 660.0, 422.0, 226.0, 138.0, 79.0, 51.0, 35.0, 33.0, 24.0, 15.0, 11.0, 8.0, 2.0, 4.0, 4.0, 1.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6328125, -1.571380615234375, -1.50994873046875, -1.448516845703125, -1.3870849609375, -1.325653076171875, -1.26422119140625, -1.202789306640625, -1.141357421875, -1.079925537109375, -1.01849365234375, -0.957061767578125, -0.8956298828125, -0.834197998046875, -0.77276611328125, -0.711334228515625, -0.64990234375, -0.588470458984375, -0.52703857421875, -0.465606689453125, -0.4041748046875, -0.342742919921875, -0.28131103515625, -0.219879150390625, -0.158447265625, -0.097015380859375, -0.03558349609375, 0.025848388671875, 0.0872802734375, 0.148712158203125, 0.21014404296875, 0.271575927734375, 0.3330078125, 0.394439697265625, 0.45587158203125, 0.517303466796875, 0.5787353515625, 0.640167236328125, 0.70159912109375, 0.763031005859375, 0.824462890625, 0.885894775390625, 0.94732666015625, 1.008758544921875, 1.0701904296875, 1.131622314453125, 1.19305419921875, 1.254486083984375, 1.31591796875, 1.377349853515625, 1.43878173828125, 1.500213623046875, 1.5616455078125, 1.623077392578125, 1.68450927734375, 1.745941162109375, 1.807373046875, 1.868804931640625, 1.93023681640625, 1.991668701171875, 2.0531005859375, 2.114532470703125, 2.17596435546875, 2.237396240234375, 2.298828125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 10.0, 10.0, 24.0, 66.0, 125.0, 213.0, 239.0, 154.0, 75.0, 34.0, 11.0, 12.0, 10.0, 6.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.545472145080566, -12.797033309936523, -12.048593521118164, -11.300153732299805, -10.551714897155762, -9.803276062011719, -9.05483627319336, -8.306396484375, -7.557957649230957, -6.809518337249756, -6.061079025268555, -5.3126397132873535, -4.564200401306152, -3.815761089324951, -3.06732177734375, -2.318882465362549, -1.5704431533813477, -0.8220038414001465, -0.07356452941894531, 0.6748747825622559, 1.423314094543457, 2.171753406524658, 2.9201927185058594, 3.6686320304870605, 4.417071342468262, 5.165510654449463, 5.913949966430664, 6.662389278411865, 7.410828590393066, 8.15926742553711, 8.907707214355469, 9.656147003173828, 10.404586791992188, 11.153026580810547, 11.90146541595459, 12.649904251098633, 13.398344039916992, 14.146783828735352, 14.895222663879395, 15.643661499023438, 16.392101287841797, 17.140541076660156, 17.888980865478516, 18.637418746948242, 19.3858585357666, 20.13429832458496, 20.882736206054688, 21.631175994873047, 22.379615783691406, 23.128055572509766, 23.876495361328125, 24.62493324279785, 25.37337303161621, 26.12181282043457, 26.870250701904297, 27.618690490722656, 28.367130279541016, 29.115570068359375, 29.864009857177734, 30.61244773864746, 31.36088752746582, 32.10932540893555, 32.857765197753906, 33.606204986572266, 34.354644775390625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 6.0, 9.0, 13.0, 23.0, 21.0, 20.0, 28.0, 34.0, 37.0, 40.0, 47.0, 55.0, 52.0, 51.0, 49.0, 50.0, 53.0, 51.0, 43.0, 46.0, 35.0, 29.0, 46.0, 24.0, 27.0, 16.0, 13.0, 19.0, 17.0, 7.0, 10.0, 6.0, 8.0, 5.0, 6.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.258282661437988, -5.999912261962891, -5.741541862487793, -5.483171463012695, -5.224801063537598, -4.9664306640625, -4.7080607414245605, -4.449690341949463, -4.191319942474365, -3.9329495429992676, -3.67457914352417, -3.4162089824676514, -3.1578385829925537, -2.899468183517456, -2.6410980224609375, -2.38272762298584, -2.124357223510742, -1.8659868240356445, -1.6076165437698364, -1.3492462635040283, -1.0908758640289307, -0.832505464553833, -0.5741351842880249, -0.3157649040222168, -0.05739450454711914, 0.20097583532333374, 0.4593461751937866, 0.7177165150642395, 0.9760868549346924, 1.23445725440979, 1.4928275346755981, 1.7511978149414062, 2.0095672607421875, 2.267937660217285, 2.526308059692383, 2.7846782207489014, 3.043048620223999, 3.3014190196990967, 3.5597891807556152, 3.818159580230713, 4.0765299797058105, 4.334900379180908, 4.593270778656006, 4.8516411781311035, 5.110011100769043, 5.368381500244141, 5.626751899719238, 5.885122299194336, 6.143492698669434, 6.401863098144531, 6.660233497619629, 6.918603897094727, 7.176974296569824, 7.435344696044922, 7.693714618682861, 7.952085018157959, 8.210454940795898, 8.468825340270996, 8.727195739746094, 8.985566139221191, 9.243936538696289, 9.502306938171387, 9.760677337646484, 10.019046783447266, 10.27741813659668]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 1.0, 7.0, 6.0, 10.0, 6.0, 8.0, 27.0, 24.0, 33.0, 62.0, 88.0, 128.0, 192.0, 347.0, 569.0, 956.0, 1644.0, 3022.0, 5800.0, 11887.0, 26329.0, 59870.0, 136719.0, 255048.0, 268942.0, 152363.0, 67537.0, 29392.0, 13451.0, 6427.0, 3288.0, 1856.0, 956.0, 583.0, 343.0, 211.0, 131.0, 86.0, 56.0, 34.0, 34.0, 29.0, 18.0, 9.0, 7.0, 3.0, 6.0, 4.0, 1.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.3251953125, -1.28387451171875, -1.2425537109375, -1.20123291015625, -1.159912109375, -1.11859130859375, -1.0772705078125, -1.03594970703125, -0.99462890625, -0.95330810546875, -0.9119873046875, -0.87066650390625, -0.829345703125, -0.78802490234375, -0.7467041015625, -0.70538330078125, -0.6640625, -0.62274169921875, -0.5814208984375, -0.54010009765625, -0.498779296875, -0.45745849609375, -0.4161376953125, -0.37481689453125, -0.33349609375, -0.29217529296875, -0.2508544921875, -0.20953369140625, -0.168212890625, -0.12689208984375, -0.0855712890625, -0.04425048828125, -0.0029296875, 0.03839111328125, 0.0797119140625, 0.12103271484375, 0.162353515625, 0.20367431640625, 0.2449951171875, 0.28631591796875, 0.32763671875, 0.36895751953125, 0.4102783203125, 0.45159912109375, 0.492919921875, 0.53424072265625, 0.5755615234375, 0.61688232421875, 0.658203125, 0.69952392578125, 0.7408447265625, 0.78216552734375, 0.823486328125, 0.86480712890625, 0.9061279296875, 0.94744873046875, 0.98876953125, 1.03009033203125, 1.0714111328125, 1.11273193359375, 1.154052734375, 1.19537353515625, 1.2366943359375, 1.27801513671875, 1.3193359375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 8.0, 4.0, 12.0, 14.0, 9.0, 15.0, 17.0, 21.0, 19.0, 26.0, 37.0, 23.0, 34.0, 29.0, 30.0, 41.0, 44.0, 45.0, 53.0, 36.0, 45.0, 52.0, 44.0, 35.0, 48.0, 29.0, 30.0, 32.0, 29.0, 21.0, 20.0, 21.0, 19.0, 10.0, 13.0, 7.0, 5.0, 10.0, 3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.86328125, -0.8387222290039062, -0.8141632080078125, -0.7896041870117188, -0.765045166015625, -0.7404861450195312, -0.7159271240234375, -0.6913681030273438, -0.66680908203125, -0.6422500610351562, -0.6176910400390625, -0.5931320190429688, -0.568572998046875, -0.5440139770507812, -0.5194549560546875, -0.49489593505859375, -0.4703369140625, -0.44577789306640625, -0.4212188720703125, -0.39665985107421875, -0.372100830078125, -0.34754180908203125, -0.3229827880859375, -0.29842376708984375, -0.27386474609375, -0.24930572509765625, -0.2247467041015625, -0.20018768310546875, -0.175628662109375, -0.15106964111328125, -0.1265106201171875, -0.10195159912109375, -0.077392578125, -0.05283355712890625, -0.0282745361328125, -0.00371551513671875, 0.020843505859375, 0.04540252685546875, 0.0699615478515625, 0.09452056884765625, 0.11907958984375, 0.14363861083984375, 0.1681976318359375, 0.19275665283203125, 0.217315673828125, 0.24187469482421875, 0.2664337158203125, 0.29099273681640625, 0.3155517578125, 0.34011077880859375, 0.3646697998046875, 0.38922882080078125, 0.413787841796875, 0.43834686279296875, 0.4629058837890625, 0.48746490478515625, 0.51202392578125, 0.5365829467773438, 0.5611419677734375, 0.5857009887695312, 0.610260009765625, 0.6348190307617188, 0.6593780517578125, 0.6839370727539062, 0.70849609375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 9.0, 9.0, 10.0, 11.0, 11.0, 17.0, 34.0, 36.0, 62.0, 97.0, 142.0, 237.0, 439.0, 665.0, 1510.0, 3723.0, 10195.0, 36750.0, 156043.0, 580076.0, 192791.0, 45424.0, 12426.0, 4206.0, 1704.0, 789.0, 418.0, 240.0, 140.0, 84.0, 75.0, 51.0, 31.0, 25.0, 17.0, 12.0, 6.0, 12.0, 9.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2109375, -2.14306640625, -2.0751953125, -2.00732421875, -1.939453125, -1.87158203125, -1.8037109375, -1.73583984375, -1.66796875, -1.60009765625, -1.5322265625, -1.46435546875, -1.396484375, -1.32861328125, -1.2607421875, -1.19287109375, -1.125, -1.05712890625, -0.9892578125, -0.92138671875, -0.853515625, -0.78564453125, -0.7177734375, -0.64990234375, -0.58203125, -0.51416015625, -0.4462890625, -0.37841796875, -0.310546875, -0.24267578125, -0.1748046875, -0.10693359375, -0.0390625, 0.02880859375, 0.0966796875, 0.16455078125, 0.232421875, 0.30029296875, 0.3681640625, 0.43603515625, 0.50390625, 0.57177734375, 0.6396484375, 0.70751953125, 0.775390625, 0.84326171875, 0.9111328125, 0.97900390625, 1.046875, 1.11474609375, 1.1826171875, 1.25048828125, 1.318359375, 1.38623046875, 1.4541015625, 1.52197265625, 1.58984375, 1.65771484375, 1.7255859375, 1.79345703125, 1.861328125, 1.92919921875, 1.9970703125, 2.06494140625, 2.1328125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 6.0, 5.0, 8.0, 11.0, 17.0, 18.0, 13.0, 25.0, 43.0, 32.0, 47.0, 45.0, 53.0, 68.0, 55.0, 66.0, 58.0, 42.0, 59.0, 56.0, 55.0, 36.0, 26.0, 34.0, 22.0, 18.0, 16.0, 23.0, 14.0, 9.0, 2.0, 8.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.662109375, -3.557403564453125, -3.45269775390625, -3.347991943359375, -3.2432861328125, -3.138580322265625, -3.03387451171875, -2.929168701171875, -2.824462890625, -2.719757080078125, -2.61505126953125, -2.510345458984375, -2.4056396484375, -2.300933837890625, -2.19622802734375, -2.091522216796875, -1.98681640625, -1.882110595703125, -1.77740478515625, -1.672698974609375, -1.5679931640625, -1.463287353515625, -1.35858154296875, -1.253875732421875, -1.149169921875, -1.044464111328125, -0.93975830078125, -0.835052490234375, -0.7303466796875, -0.625640869140625, -0.52093505859375, -0.416229248046875, -0.3115234375, -0.206817626953125, -0.10211181640625, 0.002593994140625, 0.1072998046875, 0.212005615234375, 0.31671142578125, 0.421417236328125, 0.526123046875, 0.630828857421875, 0.73553466796875, 0.840240478515625, 0.9449462890625, 1.049652099609375, 1.15435791015625, 1.259063720703125, 1.36376953125, 1.468475341796875, 1.57318115234375, 1.677886962890625, 1.7825927734375, 1.887298583984375, 1.99200439453125, 2.096710205078125, 2.201416015625, 2.306121826171875, 2.41082763671875, 2.515533447265625, 2.6202392578125, 2.724945068359375, 2.82965087890625, 2.934356689453125, 3.0390625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 4.0, 11.0, 17.0, 25.0, 36.0, 78.0, 180.0, 384.0, 953.0, 3400.0, 19205.0, 203813.0, 742946.0, 66477.0, 8064.0, 1838.0, 595.0, 259.0, 121.0, 61.0, 31.0, 31.0, 9.0, 7.0, 1.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1162109375, -1.075286865234375, -1.03436279296875, -0.993438720703125, -0.9525146484375, -0.911590576171875, -0.87066650390625, -0.829742431640625, -0.788818359375, -0.747894287109375, -0.70697021484375, -0.666046142578125, -0.6251220703125, -0.584197998046875, -0.54327392578125, -0.502349853515625, -0.46142578125, -0.420501708984375, -0.37957763671875, -0.338653564453125, -0.2977294921875, -0.256805419921875, -0.21588134765625, -0.174957275390625, -0.134033203125, -0.093109130859375, -0.05218505859375, -0.011260986328125, 0.0296630859375, 0.070587158203125, 0.11151123046875, 0.152435302734375, 0.193359375, 0.234283447265625, 0.27520751953125, 0.316131591796875, 0.3570556640625, 0.397979736328125, 0.43890380859375, 0.479827880859375, 0.520751953125, 0.561676025390625, 0.60260009765625, 0.643524169921875, 0.6844482421875, 0.725372314453125, 0.76629638671875, 0.807220458984375, 0.84814453125, 0.889068603515625, 0.92999267578125, 0.970916748046875, 1.0118408203125, 1.052764892578125, 1.09368896484375, 1.134613037109375, 1.175537109375, 1.216461181640625, 1.25738525390625, 1.298309326171875, 1.3392333984375, 1.380157470703125, 1.42108154296875, 1.462005615234375, 1.5029296875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 4.0, 14.0, 14.0, 18.0, 18.0, 34.0, 39.0, 39.0, 56.0, 68.0, 92.0, 93.0, 92.0, 99.0, 56.0, 48.0, 48.0, 32.0, 23.0, 17.0, 26.0, 15.0, 10.0, 4.0, 3.0, 2.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0002880096435546875, -0.0002794116735458374, -0.0002708137035369873, -0.0002622157335281372, -0.0002536177635192871, -0.000245019793510437, -0.00023642182350158691, -0.00022782385349273682, -0.00021922588348388672, -0.00021062791347503662, -0.00020202994346618652, -0.00019343197345733643, -0.00018483400344848633, -0.00017623603343963623, -0.00016763806343078613, -0.00015904009342193604, -0.00015044212341308594, -0.00014184415340423584, -0.00013324618339538574, -0.00012464821338653564, -0.00011605024337768555, -0.00010745227336883545, -9.885430335998535e-05, -9.025633335113525e-05, -8.165836334228516e-05, -7.306039333343506e-05, -6.446242332458496e-05, -5.586445331573486e-05, -4.7266483306884766e-05, -3.866851329803467e-05, -3.007054328918457e-05, -2.1472573280334473e-05, -1.2874603271484375e-05, -4.276633262634277e-06, 4.32133674621582e-06, 1.2919306755065918e-05, 2.1517276763916016e-05, 3.0115246772766113e-05, 3.871321678161621e-05, 4.731118679046631e-05, 5.5909156799316406e-05, 6.45071268081665e-05, 7.31050968170166e-05, 8.17030668258667e-05, 9.03010368347168e-05, 9.88990068435669e-05, 0.00010749697685241699, 0.00011609494686126709, 0.0001246929168701172, 0.00013329088687896729, 0.00014188885688781738, 0.00015048682689666748, 0.00015908479690551758, 0.00016768276691436768, 0.00017628073692321777, 0.00018487870693206787, 0.00019347667694091797, 0.00020207464694976807, 0.00021067261695861816, 0.00021927058696746826, 0.00022786855697631836, 0.00023646652698516846, 0.00024506449699401855, 0.00025366246700286865, 0.00026226043701171875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 9.0, 8.0, 16.0, 28.0, 45.0, 80.0, 164.0, 353.0, 965.0, 3287.0, 17210.0, 157894.0, 755436.0, 97445.0, 11702.0, 2442.0, 800.0, 329.0, 156.0, 72.0, 41.0, 20.0, 17.0, 11.0, 7.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86865234375, -0.8298721313476562, -0.7910919189453125, -0.7523117065429688, -0.713531494140625, -0.6747512817382812, -0.6359710693359375, -0.5971908569335938, -0.55841064453125, -0.5196304321289062, -0.4808502197265625, -0.44207000732421875, -0.403289794921875, -0.36450958251953125, -0.3257293701171875, -0.28694915771484375, -0.2481689453125, -0.20938873291015625, -0.1706085205078125, -0.13182830810546875, -0.093048095703125, -0.05426788330078125, -0.0154876708984375, 0.02329254150390625, 0.06207275390625, 0.10085296630859375, 0.1396331787109375, 0.17841339111328125, 0.217193603515625, 0.25597381591796875, 0.2947540283203125, 0.33353424072265625, 0.372314453125, 0.41109466552734375, 0.4498748779296875, 0.48865509033203125, 0.527435302734375, 0.5662155151367188, 0.6049957275390625, 0.6437759399414062, 0.68255615234375, 0.7213363647460938, 0.7601165771484375, 0.7988967895507812, 0.837677001953125, 0.8764572143554688, 0.9152374267578125, 0.9540176391601562, 0.9927978515625, 1.0315780639648438, 1.0703582763671875, 1.1091384887695312, 1.147918701171875, 1.1866989135742188, 1.2254791259765625, 1.2642593383789062, 1.30303955078125, 1.3418197631835938, 1.3805999755859375, 1.4193801879882812, 1.458160400390625, 1.4969406127929688, 1.5357208251953125, 1.5745010375976562, 1.61328125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 1.0, 7.0, 7.0, 9.0, 11.0, 14.0, 16.0, 20.0, 21.0, 26.0, 25.0, 33.0, 32.0, 49.0, 40.0, 62.0, 59.0, 47.0, 68.0, 62.0, 62.0, 46.0, 41.0, 57.0, 32.0, 35.0, 24.0, 18.0, 13.0, 14.0, 11.0, 8.0, 3.0, 4.0, 7.0, 8.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.8349609375, -0.81304931640625, -0.7911376953125, -0.76922607421875, -0.747314453125, -0.72540283203125, -0.7034912109375, -0.68157958984375, -0.65966796875, -0.63775634765625, -0.6158447265625, -0.59393310546875, -0.572021484375, -0.55010986328125, -0.5281982421875, -0.50628662109375, -0.484375, -0.46246337890625, -0.4405517578125, -0.41864013671875, -0.396728515625, -0.37481689453125, -0.3529052734375, -0.33099365234375, -0.30908203125, -0.28717041015625, -0.2652587890625, -0.24334716796875, -0.221435546875, -0.19952392578125, -0.1776123046875, -0.15570068359375, -0.1337890625, -0.11187744140625, -0.0899658203125, -0.06805419921875, -0.046142578125, -0.02423095703125, -0.0023193359375, 0.01959228515625, 0.04150390625, 0.06341552734375, 0.0853271484375, 0.10723876953125, 0.129150390625, 0.15106201171875, 0.1729736328125, 0.19488525390625, 0.216796875, 0.23870849609375, 0.2606201171875, 0.28253173828125, 0.304443359375, 0.32635498046875, 0.3482666015625, 0.37017822265625, 0.39208984375, 0.41400146484375, 0.4359130859375, 0.45782470703125, 0.479736328125, 0.50164794921875, 0.5235595703125, 0.54547119140625, 0.5673828125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 8.0, 5.0, 14.0, 30.0, 72.0, 155.0, 314.0, 203.0, 102.0, 56.0, 18.0, 10.0, 5.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.671852111816406, -21.85114860534668, -21.03044319152832, -20.209739685058594, -19.389036178588867, -18.56833267211914, -17.74762725830078, -16.926923751831055, -16.106220245361328, -15.285515785217285, -14.464812278747559, -13.644107818603516, -12.823404312133789, -12.002699851989746, -11.181995391845703, -10.361291885375977, -9.540587425231934, -8.71988296508789, -7.899179458618164, -7.078474998474121, -6.2577714920043945, -5.437067031860352, -4.616363048553467, -3.795659065246582, -2.9749550819396973, -2.1542510986328125, -1.3335469961166382, -0.5128428936004639, 0.3078610897064209, 1.1285653114318848, 1.9492692947387695, 2.7699732780456543, 3.590677261352539, 4.411381244659424, 5.232085227966309, 6.052789688110352, 6.873493194580078, 7.694197654724121, 8.514902114868164, 9.33560562133789, 10.156309127807617, 10.97701358795166, 11.797717094421387, 12.61842155456543, 13.439125061035156, 14.2598295211792, 15.080533981323242, 15.901237487792969, 16.721942901611328, 17.542646408081055, 18.363351821899414, 19.18405532836914, 20.004758834838867, 20.825462341308594, 21.646167755126953, 22.46687126159668, 23.287574768066406, 24.108278274536133, 24.928983688354492, 25.74968719482422, 26.570390701293945, 27.391094207763672, 28.21179962158203, 29.032503128051758, 29.853206634521484]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 5.0, 5.0, 5.0, 6.0, 7.0, 5.0, 7.0, 14.0, 12.0, 15.0, 14.0, 18.0, 17.0, 22.0, 23.0, 28.0, 19.0, 34.0, 29.0, 33.0, 48.0, 59.0, 71.0, 64.0, 81.0, 46.0, 45.0, 27.0, 36.0, 27.0, 23.0, 22.0, 16.0, 19.0, 13.0, 20.0, 21.0, 9.0, 10.0, 6.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.576784133911133, -9.259346008300781, -8.941906929016113, -8.624468803405762, -8.30703067779541, -7.9895920753479, -7.672153472900391, -7.354715347290039, -7.037276744842529, -6.7198381423950195, -6.402400016784668, -6.084961414337158, -5.767522811889648, -5.450084686279297, -5.132646083831787, -4.815207481384277, -4.497769355773926, -4.180330753326416, -3.8628926277160645, -3.5454540252685547, -3.228015661239624, -2.9105772972106934, -2.5931386947631836, -2.275700330734253, -1.9582619667053223, -1.6408236026763916, -1.3233851194381714, -1.0059466361999512, -0.6885082721710205, -0.37106990814208984, -0.05363142490386963, 0.2638070583343506, 0.5812463760375977, 0.8986847996711731, 1.2161232233047485, 1.5335617065429688, 1.8510000705718994, 2.16843843460083, 2.48587703704834, 2.8033154010772705, 3.120753765106201, 3.438192129135132, 3.7556304931640625, 4.073069095611572, 4.390507698059082, 4.707945823669434, 5.025384426116943, 5.342823028564453, 5.660261154174805, 5.9776997566223145, 6.295137882232666, 6.612576484680176, 6.930014610290527, 7.247453212738037, 7.564891815185547, 7.882329940795898, 8.19976806640625, 8.517206192016602, 8.83464527130127, 9.152083396911621, 9.469521522521973, 9.78696060180664, 10.104398727416992, 10.421836853027344, 10.739275932312012]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 9.0, 13.0, 15.0, 26.0, 36.0, 51.0, 100.0, 147.0, 230.0, 500.0, 1091.0, 2932.0, 10086.0, 55258.0, 851831.0, 2989630.0, 248372.0, 24684.0, 5518.0, 1931.0, 836.0, 395.0, 214.0, 133.0, 85.0, 53.0, 27.0, 23.0, 19.0, 9.0, 10.0, 5.0, 6.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6103515625, -1.56048583984375, -1.5106201171875, -1.46075439453125, -1.410888671875, -1.36102294921875, -1.3111572265625, -1.26129150390625, -1.21142578125, -1.16156005859375, -1.1116943359375, -1.06182861328125, -1.011962890625, -0.96209716796875, -0.9122314453125, -0.86236572265625, -0.8125, -0.76263427734375, -0.7127685546875, -0.66290283203125, -0.613037109375, -0.56317138671875, -0.5133056640625, -0.46343994140625, -0.41357421875, -0.36370849609375, -0.3138427734375, -0.26397705078125, -0.214111328125, -0.16424560546875, -0.1143798828125, -0.06451416015625, -0.0146484375, 0.03521728515625, 0.0850830078125, 0.13494873046875, 0.184814453125, 0.23468017578125, 0.2845458984375, 0.33441162109375, 0.38427734375, 0.43414306640625, 0.4840087890625, 0.53387451171875, 0.583740234375, 0.63360595703125, 0.6834716796875, 0.73333740234375, 0.783203125, 0.83306884765625, 0.8829345703125, 0.93280029296875, 0.982666015625, 1.03253173828125, 1.0823974609375, 1.13226318359375, 1.18212890625, 1.23199462890625, 1.2818603515625, 1.33172607421875, 1.381591796875, 1.43145751953125, 1.4813232421875, 1.53118896484375, 1.5810546875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 6.0, 6.0, 14.0, 9.0, 17.0, 17.0, 23.0, 23.0, 27.0, 34.0, 33.0, 27.0, 39.0, 37.0, 48.0, 53.0, 55.0, 45.0, 55.0, 36.0, 39.0, 42.0, 42.0, 36.0, 27.0, 33.0, 30.0, 24.0, 19.0, 22.0, 17.0, 14.0, 8.0, 9.0, 2.0, 5.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.8623046875, -0.837982177734375, -0.81365966796875, -0.789337158203125, -0.7650146484375, -0.740692138671875, -0.71636962890625, -0.692047119140625, -0.667724609375, -0.643402099609375, -0.61907958984375, -0.594757080078125, -0.5704345703125, -0.546112060546875, -0.52178955078125, -0.497467041015625, -0.47314453125, -0.448822021484375, -0.42449951171875, -0.400177001953125, -0.3758544921875, -0.351531982421875, -0.32720947265625, -0.302886962890625, -0.278564453125, -0.254241943359375, -0.22991943359375, -0.205596923828125, -0.1812744140625, -0.156951904296875, -0.13262939453125, -0.108306884765625, -0.083984375, -0.059661865234375, -0.03533935546875, -0.011016845703125, 0.0133056640625, 0.037628173828125, 0.06195068359375, 0.086273193359375, 0.110595703125, 0.134918212890625, 0.15924072265625, 0.183563232421875, 0.2078857421875, 0.232208251953125, 0.25653076171875, 0.280853271484375, 0.30517578125, 0.329498291015625, 0.35382080078125, 0.378143310546875, 0.4024658203125, 0.426788330078125, 0.45111083984375, 0.475433349609375, 0.499755859375, 0.524078369140625, 0.54840087890625, 0.572723388671875, 0.5970458984375, 0.621368408203125, 0.64569091796875, 0.670013427734375, 0.6943359375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 10.0, 6.0, 19.0, 19.0, 37.0, 70.0, 129.0, 276.0, 646.0, 2090.0, 10933.0, 170057.0, 3872837.0, 124064.0, 9783.0, 1998.0, 656.0, 342.0, 132.0, 67.0, 41.0, 22.0, 14.0, 7.0, 7.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.85546875, -3.755218505859375, -3.65496826171875, -3.554718017578125, -3.4544677734375, -3.354217529296875, -3.25396728515625, -3.153717041015625, -3.053466796875, -2.953216552734375, -2.85296630859375, -2.752716064453125, -2.6524658203125, -2.552215576171875, -2.45196533203125, -2.351715087890625, -2.25146484375, -2.151214599609375, -2.05096435546875, -1.950714111328125, -1.8504638671875, -1.750213623046875, -1.64996337890625, -1.549713134765625, -1.449462890625, -1.349212646484375, -1.24896240234375, -1.148712158203125, -1.0484619140625, -0.948211669921875, -0.84796142578125, -0.747711181640625, -0.6474609375, -0.547210693359375, -0.44696044921875, -0.346710205078125, -0.2464599609375, -0.146209716796875, -0.04595947265625, 0.054290771484375, 0.154541015625, 0.254791259765625, 0.35504150390625, 0.455291748046875, 0.5555419921875, 0.655792236328125, 0.75604248046875, 0.856292724609375, 0.95654296875, 1.056793212890625, 1.15704345703125, 1.257293701171875, 1.3575439453125, 1.457794189453125, 1.55804443359375, 1.658294677734375, 1.758544921875, 1.858795166015625, 1.95904541015625, 2.059295654296875, 2.1595458984375, 2.259796142578125, 2.36004638671875, 2.460296630859375, 2.560546875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 11.0, 9.0, 11.0, 19.0, 28.0, 46.0, 48.0, 82.0, 142.0, 226.0, 439.0, 743.0, 803.0, 576.0, 321.0, 198.0, 126.0, 71.0, 46.0, 27.0, 25.0, 19.0, 10.0, 11.0, 10.0, 4.0, 6.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8779296875, -1.8160858154296875, -1.754241943359375, -1.6923980712890625, -1.63055419921875, -1.5687103271484375, -1.506866455078125, -1.4450225830078125, -1.3831787109375, -1.3213348388671875, -1.259490966796875, -1.1976470947265625, -1.13580322265625, -1.0739593505859375, -1.012115478515625, -0.9502716064453125, -0.888427734375, -0.8265838623046875, -0.764739990234375, -0.7028961181640625, -0.64105224609375, -0.5792083740234375, -0.517364501953125, -0.4555206298828125, -0.3936767578125, -0.3318328857421875, -0.269989013671875, -0.2081451416015625, -0.14630126953125, -0.0844573974609375, -0.022613525390625, 0.0392303466796875, 0.10107421875, 0.1629180908203125, 0.224761962890625, 0.2866058349609375, 0.34844970703125, 0.4102935791015625, 0.472137451171875, 0.5339813232421875, 0.5958251953125, 0.6576690673828125, 0.719512939453125, 0.7813568115234375, 0.84320068359375, 0.9050445556640625, 0.966888427734375, 1.0287322998046875, 1.090576171875, 1.1524200439453125, 1.214263916015625, 1.2761077880859375, 1.33795166015625, 1.3997955322265625, 1.461639404296875, 1.5234832763671875, 1.5853271484375, 1.6471710205078125, 1.709014892578125, 1.7708587646484375, 1.83270263671875, 1.8945465087890625, 1.956390380859375, 2.0182342529296875, 2.080078125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 9.0, 18.0, 36.0, 53.0, 129.0, 177.0, 205.0, 169.0, 98.0, 50.0, 29.0, 15.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.004962921142578, -8.413089752197266, -7.821216583251953, -7.229342937469482, -6.63746976852417, -6.045596599578857, -5.453722953796387, -4.861849784851074, -4.269976615905762, -3.678103446960449, -3.0862300395965576, -2.494356632232666, -1.9024834632873535, -1.310610294342041, -0.7187368869781494, -0.1268634796142578, 0.4650096893310547, 1.0568829774856567, 1.6487562656402588, 2.2406296730041504, 2.832502841949463, 3.4243760108947754, 4.016249656677246, 4.608122825622559, 5.199995994567871, 5.791869163513184, 6.383742332458496, 6.975615978240967, 7.567489147186279, 8.15936279296875, 8.751235961914062, 9.343109130859375, 9.934982299804688, 10.52685546875, 11.118728637695312, 11.710601806640625, 12.302474975585938, 12.89434814453125, 13.486222267150879, 14.078095436096191, 14.669968605041504, 15.261841773986816, 15.853714942932129, 16.445589065551758, 17.03746223449707, 17.629335403442383, 18.221208572387695, 18.813081741333008, 19.40495491027832, 19.996828079223633, 20.588701248168945, 21.180574417114258, 21.77244758605957, 22.364320755004883, 22.956193923950195, 23.54806900024414, 24.139942169189453, 24.731815338134766, 25.323688507080078, 25.91556167602539, 26.507434844970703, 27.099308013916016, 27.691181182861328, 28.28305435180664, 28.874927520751953]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 4.0, 6.0, 8.0, 10.0, 19.0, 9.0, 17.0, 17.0, 20.0, 32.0, 29.0, 40.0, 38.0, 41.0, 46.0, 50.0, 45.0, 46.0, 68.0, 57.0, 51.0, 33.0, 52.0, 42.0, 27.0, 22.0, 38.0, 25.0, 25.0, 14.0, 14.0, 18.0, 9.0, 6.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.077053070068359, -6.8152337074279785, -6.553414344787598, -6.291594982147217, -6.029775619506836, -5.767956733703613, -5.506137371063232, -5.244318008422852, -4.982498645782471, -4.72067928314209, -4.458859920501709, -4.197040557861328, -3.9352214336395264, -3.6734020709991455, -3.4115829467773438, -3.149763584136963, -2.887944221496582, -2.626124858856201, -2.3643054962158203, -2.1024863719940186, -1.8406670093536377, -1.5788476467132568, -1.3170284032821655, -1.0552091598510742, -0.7933897972106934, -0.5315704941749573, -0.2697511911392212, -0.007931888103485107, 0.253887414932251, 0.5157067775726318, 0.7775260210037231, 1.0393452644348145, 1.3011655807495117, 1.5629849433898926, 1.8248041868209839, 2.086623430252075, 2.348442792892456, 2.610262155532837, 2.8720812797546387, 3.1339006423950195, 3.3957200050354004, 3.6575393676757812, 3.919358730316162, 4.181178092956543, 4.442996978759766, 4.704816818237305, 4.966635704040527, 5.228455066680908, 5.490274429321289, 5.75209379196167, 6.013913154602051, 6.275732517242432, 6.5375518798828125, 6.799370765686035, 7.061190128326416, 7.323009490966797, 7.584828853607178, 7.846648216247559, 8.108467102050781, 8.37028694152832, 8.632105827331543, 8.893925666809082, 9.155744552612305, 9.417564392089844, 9.679383277893066]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 6.0, 6.0, 16.0, 18.0, 29.0, 33.0, 46.0, 80.0, 118.0, 146.0, 277.0, 464.0, 769.0, 1386.0, 2673.0, 5388.0, 10952.0, 24057.0, 53030.0, 121259.0, 255098.0, 291717.0, 154855.0, 68322.0, 29882.0, 13953.0, 6653.0, 3218.0, 1699.0, 917.0, 555.0, 333.0, 210.0, 104.0, 87.0, 51.0, 38.0, 23.0, 21.0, 16.0, 9.0, 9.0, 6.0, 5.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.2568359375, -1.217742919921875, -1.17864990234375, -1.139556884765625, -1.1004638671875, -1.061370849609375, -1.02227783203125, -0.983184814453125, -0.944091796875, -0.904998779296875, -0.86590576171875, -0.826812744140625, -0.7877197265625, -0.748626708984375, -0.70953369140625, -0.670440673828125, -0.63134765625, -0.592254638671875, -0.55316162109375, -0.514068603515625, -0.4749755859375, -0.435882568359375, -0.39678955078125, -0.357696533203125, -0.318603515625, -0.279510498046875, -0.24041748046875, -0.201324462890625, -0.1622314453125, -0.123138427734375, -0.08404541015625, -0.044952392578125, -0.005859375, 0.033233642578125, 0.07232666015625, 0.111419677734375, 0.1505126953125, 0.189605712890625, 0.22869873046875, 0.267791748046875, 0.306884765625, 0.345977783203125, 0.38507080078125, 0.424163818359375, 0.4632568359375, 0.502349853515625, 0.54144287109375, 0.580535888671875, 0.61962890625, 0.658721923828125, 0.69781494140625, 0.736907958984375, 0.7760009765625, 0.815093994140625, 0.85418701171875, 0.893280029296875, 0.932373046875, 0.971466064453125, 1.01055908203125, 1.049652099609375, 1.0887451171875, 1.127838134765625, 1.16693115234375, 1.206024169921875, 1.2451171875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 5.0, 1.0, 9.0, 2.0, 16.0, 10.0, 9.0, 13.0, 13.0, 17.0, 22.0, 33.0, 32.0, 38.0, 43.0, 36.0, 32.0, 46.0, 57.0, 47.0, 50.0, 43.0, 39.0, 44.0, 43.0, 31.0, 35.0, 41.0, 35.0, 22.0, 20.0, 23.0, 14.0, 10.0, 13.0, 13.0, 9.0, 6.0, 6.0, 8.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.75537109375, -0.7297592163085938, -0.7041473388671875, -0.6785354614257812, -0.652923583984375, -0.6273117065429688, -0.6016998291015625, -0.5760879516601562, -0.55047607421875, -0.5248641967773438, -0.4992523193359375, -0.47364044189453125, -0.448028564453125, -0.42241668701171875, -0.3968048095703125, -0.37119293212890625, -0.3455810546875, -0.31996917724609375, -0.2943572998046875, -0.26874542236328125, -0.243133544921875, -0.21752166748046875, -0.1919097900390625, -0.16629791259765625, -0.14068603515625, -0.11507415771484375, -0.0894622802734375, -0.06385040283203125, -0.038238525390625, -0.01262664794921875, 0.0129852294921875, 0.03859710693359375, 0.064208984375, 0.08982086181640625, 0.1154327392578125, 0.14104461669921875, 0.166656494140625, 0.19226837158203125, 0.2178802490234375, 0.24349212646484375, 0.26910400390625, 0.29471588134765625, 0.3203277587890625, 0.34593963623046875, 0.371551513671875, 0.39716339111328125, 0.4227752685546875, 0.44838714599609375, 0.4739990234375, 0.49961090087890625, 0.5252227783203125, 0.5508346557617188, 0.576446533203125, 0.6020584106445312, 0.6276702880859375, 0.6532821655273438, 0.67889404296875, 0.7045059204101562, 0.7301177978515625, 0.7557296752929688, 0.781341552734375, 0.8069534301757812, 0.8325653076171875, 0.8581771850585938, 0.8837890625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 9.0, 5.0, 9.0, 10.0, 30.0, 32.0, 45.0, 64.0, 83.0, 143.0, 187.0, 318.0, 461.0, 726.0, 1406.0, 2921.0, 8107.0, 27973.0, 124150.0, 624447.0, 195922.0, 42300.0, 11263.0, 3818.0, 1724.0, 906.0, 521.0, 302.0, 193.0, 141.0, 88.0, 60.0, 51.0, 33.0, 23.0, 20.0, 11.0, 16.0, 8.0, 9.0, 1.0, 5.0, 1.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.03515625, -1.96875, -1.90234375, -1.8359375, -1.76953125, -1.703125, -1.63671875, -1.5703125, -1.50390625, -1.4375, -1.37109375, -1.3046875, -1.23828125, -1.171875, -1.10546875, -1.0390625, -0.97265625, -0.90625, -0.83984375, -0.7734375, -0.70703125, -0.640625, -0.57421875, -0.5078125, -0.44140625, -0.375, -0.30859375, -0.2421875, -0.17578125, -0.109375, -0.04296875, 0.0234375, 0.08984375, 0.15625, 0.22265625, 0.2890625, 0.35546875, 0.421875, 0.48828125, 0.5546875, 0.62109375, 0.6875, 0.75390625, 0.8203125, 0.88671875, 0.953125, 1.01953125, 1.0859375, 1.15234375, 1.21875, 1.28515625, 1.3515625, 1.41796875, 1.484375, 1.55078125, 1.6171875, 1.68359375, 1.75, 1.81640625, 1.8828125, 1.94921875, 2.015625, 2.08203125, 2.1484375, 2.21484375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 5.0, 9.0, 11.0, 16.0, 25.0, 14.0, 26.0, 29.0, 36.0, 55.0, 51.0, 47.0, 57.0, 59.0, 78.0, 60.0, 55.0, 52.0, 50.0, 55.0, 38.0, 40.0, 35.0, 32.0, 16.0, 9.0, 13.0, 8.0, 7.0, 6.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.890625, -3.76470947265625, -3.6387939453125, -3.51287841796875, -3.386962890625, -3.26104736328125, -3.1351318359375, -3.00921630859375, -2.88330078125, -2.75738525390625, -2.6314697265625, -2.50555419921875, -2.379638671875, -2.25372314453125, -2.1278076171875, -2.00189208984375, -1.8759765625, -1.75006103515625, -1.6241455078125, -1.49822998046875, -1.372314453125, -1.24639892578125, -1.1204833984375, -0.99456787109375, -0.86865234375, -0.74273681640625, -0.6168212890625, -0.49090576171875, -0.364990234375, -0.23907470703125, -0.1131591796875, 0.01275634765625, 0.138671875, 0.26458740234375, 0.3905029296875, 0.51641845703125, 0.642333984375, 0.76824951171875, 0.8941650390625, 1.02008056640625, 1.14599609375, 1.27191162109375, 1.3978271484375, 1.52374267578125, 1.649658203125, 1.77557373046875, 1.9014892578125, 2.02740478515625, 2.1533203125, 2.27923583984375, 2.4051513671875, 2.53106689453125, 2.656982421875, 2.78289794921875, 2.9088134765625, 3.03472900390625, 3.16064453125, 3.28656005859375, 3.4124755859375, 3.53839111328125, 3.664306640625, 3.79022216796875, 3.9161376953125, 4.04205322265625, 4.16796875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 8.0, 7.0, 9.0, 13.0, 22.0, 18.0, 29.0, 36.0, 67.0, 88.0, 125.0, 212.0, 273.0, 564.0, 1096.0, 2267.0, 5530.0, 14879.0, 46587.0, 193096.0, 638455.0, 100095.0, 27995.0, 9650.0, 3714.0, 1680.0, 815.0, 425.0, 261.0, 159.0, 111.0, 75.0, 72.0, 30.0, 21.0, 14.0, 21.0, 12.0, 6.0, 10.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.7607421875, -0.7403411865234375, -0.719940185546875, -0.6995391845703125, -0.67913818359375, -0.6587371826171875, -0.638336181640625, -0.6179351806640625, -0.5975341796875, -0.5771331787109375, -0.556732177734375, -0.5363311767578125, -0.51593017578125, -0.4955291748046875, -0.475128173828125, -0.4547271728515625, -0.434326171875, -0.4139251708984375, -0.393524169921875, -0.3731231689453125, -0.35272216796875, -0.3323211669921875, -0.311920166015625, -0.2915191650390625, -0.2711181640625, -0.2507171630859375, -0.230316162109375, -0.2099151611328125, -0.18951416015625, -0.1691131591796875, -0.148712158203125, -0.1283111572265625, -0.10791015625, -0.0875091552734375, -0.067108154296875, -0.0467071533203125, -0.02630615234375, -0.0059051513671875, 0.014495849609375, 0.0348968505859375, 0.0552978515625, 0.0756988525390625, 0.096099853515625, 0.1165008544921875, 0.13690185546875, 0.1573028564453125, 0.177703857421875, 0.1981048583984375, 0.218505859375, 0.2389068603515625, 0.259307861328125, 0.2797088623046875, 0.30010986328125, 0.3205108642578125, 0.340911865234375, 0.3613128662109375, 0.3817138671875, 0.4021148681640625, 0.422515869140625, 0.4429168701171875, 0.46331787109375, 0.4837188720703125, 0.504119873046875, 0.5245208740234375, 0.544921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 13.0, 14.0, 13.0, 14.0, 18.0, 20.0, 23.0, 29.0, 44.0, 54.0, 61.0, 78.0, 92.0, 93.0, 64.0, 89.0, 49.0, 45.0, 33.0, 26.0, 30.0, 12.0, 11.0, 10.0, 14.0, 6.0, 4.0, 5.0, 4.0, 1.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001958608627319336, -0.00019012577831745148, -0.00018439069390296936, -0.00017865560948848724, -0.00017292052507400513, -0.000167185440659523, -0.0001614503562450409, -0.00015571527183055878, -0.00014998018741607666, -0.00014424510300159454, -0.00013851001858711243, -0.0001327749341726303, -0.0001270398497581482, -0.00012130476534366608, -0.00011556968092918396, -0.00010983459651470184, -0.00010409951210021973, -9.836442768573761e-05, -9.262934327125549e-05, -8.689425885677338e-05, -8.115917444229126e-05, -7.542409002780914e-05, -6.968900561332703e-05, -6.395392119884491e-05, -5.821883678436279e-05, -5.2483752369880676e-05, -4.674866795539856e-05, -4.101358354091644e-05, -3.5278499126434326e-05, -2.954341471195221e-05, -2.3808330297470093e-05, -1.8073245882987976e-05, -1.233816146850586e-05, -6.603077054023743e-06, -8.67992639541626e-07, 4.867091774940491e-06, 1.0602176189422607e-05, 1.6337260603904724e-05, 2.207234501838684e-05, 2.7807429432868958e-05, 3.3542513847351074e-05, 3.927759826183319e-05, 4.501268267631531e-05, 5.0747767090797424e-05, 5.648285150527954e-05, 6.221793591976166e-05, 6.795302033424377e-05, 7.368810474872589e-05, 7.942318916320801e-05, 8.515827357769012e-05, 9.089335799217224e-05, 9.662844240665436e-05, 0.00010236352682113647, 0.00010809861123561859, 0.00011383369565010071, 0.00011956878006458282, 0.00012530386447906494, 0.00013103894889354706, 0.00013677403330802917, 0.0001425091177225113, 0.0001482442021369934, 0.00015397928655147552, 0.00015971437096595764, 0.00016544945538043976, 0.00017118453979492188]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 13.0, 14.0, 19.0, 35.0, 41.0, 83.0, 94.0, 180.0, 285.0, 459.0, 917.0, 1976.0, 4778.0, 13973.0, 49610.0, 246174.0, 614926.0, 81917.0, 20983.0, 6751.0, 2591.0, 1229.0, 628.0, 292.0, 210.0, 129.0, 83.0, 46.0, 27.0, 19.0, 29.0, 7.0, 7.0, 9.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.68408203125, -0.6628189086914062, -0.6415557861328125, -0.6202926635742188, -0.599029541015625, -0.5777664184570312, -0.5565032958984375, -0.5352401733398438, -0.51397705078125, -0.49271392822265625, -0.4714508056640625, -0.45018768310546875, -0.428924560546875, -0.40766143798828125, -0.3863983154296875, -0.36513519287109375, -0.3438720703125, -0.32260894775390625, -0.3013458251953125, -0.28008270263671875, -0.258819580078125, -0.23755645751953125, -0.2162933349609375, -0.19503021240234375, -0.17376708984375, -0.15250396728515625, -0.1312408447265625, -0.10997772216796875, -0.088714599609375, -0.06745147705078125, -0.0461883544921875, -0.02492523193359375, -0.003662109375, 0.01760101318359375, 0.0388641357421875, 0.06012725830078125, 0.081390380859375, 0.10265350341796875, 0.1239166259765625, 0.14517974853515625, 0.16644287109375, 0.18770599365234375, 0.2089691162109375, 0.23023223876953125, 0.251495361328125, 0.27275848388671875, 0.2940216064453125, 0.31528472900390625, 0.3365478515625, 0.35781097412109375, 0.3790740966796875, 0.40033721923828125, 0.421600341796875, 0.44286346435546875, 0.4641265869140625, 0.48538970947265625, 0.50665283203125, 0.5279159545898438, 0.5491790771484375, 0.5704421997070312, 0.591705322265625, 0.6129684448242188, 0.6342315673828125, 0.6554946899414062, 0.6767578125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 2.0, 8.0, 11.0, 9.0, 12.0, 15.0, 16.0, 31.0, 41.0, 40.0, 71.0, 73.0, 88.0, 85.0, 104.0, 81.0, 69.0, 71.0, 41.0, 27.0, 31.0, 13.0, 13.0, 12.0, 4.0, 8.0, 4.0, 3.0, 8.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83154296875, -0.8071060180664062, -0.7826690673828125, -0.7582321166992188, -0.733795166015625, -0.7093582153320312, -0.6849212646484375, -0.6604843139648438, -0.63604736328125, -0.6116104125976562, -0.5871734619140625, -0.5627365112304688, -0.538299560546875, -0.5138626098632812, -0.4894256591796875, -0.46498870849609375, -0.4405517578125, -0.41611480712890625, -0.3916778564453125, -0.36724090576171875, -0.342803955078125, -0.31836700439453125, -0.2939300537109375, -0.26949310302734375, -0.24505615234375, -0.22061920166015625, -0.1961822509765625, -0.17174530029296875, -0.147308349609375, -0.12287139892578125, -0.0984344482421875, -0.07399749755859375, -0.049560546875, -0.02512359619140625, -0.0006866455078125, 0.02375030517578125, 0.048187255859375, 0.07262420654296875, 0.0970611572265625, 0.12149810791015625, 0.14593505859375, 0.17037200927734375, 0.1948089599609375, 0.21924591064453125, 0.243682861328125, 0.26811981201171875, 0.2925567626953125, 0.31699371337890625, 0.3414306640625, 0.36586761474609375, 0.3903045654296875, 0.41474151611328125, 0.439178466796875, 0.46361541748046875, 0.4880523681640625, 0.5124893188476562, 0.53692626953125, 0.5613632202148438, 0.5858001708984375, 0.6102371215820312, 0.634674072265625, 0.6591110229492188, 0.6835479736328125, 0.7079849243164062, 0.732421875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 9.0, 20.0, 42.0, 91.0, 158.0, 387.0, 153.0, 72.0, 40.0, 14.0, 6.0, 2.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.47957420349121, -15.631742477416992, -14.783909797668457, -13.936078071594238, -13.088245391845703, -12.240413665771484, -11.392581939697266, -10.544750213623047, -9.696917533874512, -8.849085807800293, -8.001253128051758, -7.153421401977539, -6.305589199066162, -5.457756996154785, -4.609925270080566, -3.7620930671691895, -2.9142608642578125, -2.0664286613464355, -1.2185966968536377, -0.37076473236083984, 0.4770674705505371, 1.324899673461914, 2.172731399536133, 3.0205636024475098, 3.8683958053588867, 4.716228008270264, 5.564060211181641, 6.411891937255859, 7.259724140167236, 8.107556343078613, 8.955388069152832, 9.803220748901367, 10.651054382324219, 11.498886108398438, 12.346718788146973, 13.194550514221191, 14.042383193969727, 14.890214920043945, 15.738046646118164, 16.585878372192383, 17.433712005615234, 18.281543731689453, 19.129375457763672, 19.97720718383789, 20.825040817260742, 21.67287254333496, 22.52070426940918, 23.3685359954834, 24.216367721557617, 25.064199447631836, 25.912031173706055, 26.759864807128906, 27.607696533203125, 28.455528259277344, 29.303359985351562, 30.15119171142578, 30.9990234375, 31.84685516357422, 32.69468688964844, 33.542518615722656, 34.390350341796875, 35.238182067871094, 36.08601379394531, 36.9338493347168, 37.781681060791016]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 5.0, 2.0, 1.0, 3.0, 5.0, 6.0, 12.0, 10.0, 14.0, 24.0, 18.0, 27.0, 23.0, 34.0, 33.0, 25.0, 27.0, 46.0, 56.0, 91.0, 96.0, 72.0, 57.0, 43.0, 43.0, 35.0, 30.0, 31.0, 23.0, 20.0, 21.0, 17.0, 10.0, 8.0, 3.0, 7.0, 5.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.414369583129883, -12.051536560058594, -11.688702583312988, -11.3258695602417, -10.963035583496094, -10.600202560424805, -10.237369537353516, -9.87453556060791, -9.511701583862305, -9.148868560791016, -8.78603458404541, -8.423201560974121, -8.060367584228516, -7.697534561157227, -7.334701061248779, -6.971867561340332, -6.609034538269043, -6.246201038360596, -5.883367538452148, -5.520534515380859, -5.157700538635254, -4.794867515563965, -4.432034015655518, -4.06920051574707, -3.706367015838623, -3.343533515930176, -2.9807000160217285, -2.6178667545318604, -2.255033254623413, -1.8921997547149658, -1.5293664932250977, -1.1665329933166504, -0.8036994934082031, -0.44086605310440063, -0.07803261280059814, 0.28480076789855957, 0.6476342678070068, 1.010467767715454, 1.3733010292053223, 1.7361345291137695, 2.098968029022217, 2.461801528930664, 2.8246350288391113, 3.1874682903289795, 3.5503017902374268, 3.913135290145874, 4.275968551635742, 4.6388020515441895, 5.001635551452637, 5.364469051361084, 5.727302551269531, 6.09013557434082, 6.452969551086426, 6.815802574157715, 7.178636074066162, 7.541469573974609, 7.904303073883057, 8.267136573791504, 8.629969596862793, 8.992803573608398, 9.355636596679688, 9.718470573425293, 10.081303596496582, 10.444137573242188, 10.806970596313477]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 11.0, 14.0, 28.0, 27.0, 40.0, 56.0, 94.0, 159.0, 312.0, 609.0, 1287.0, 3261.0, 10315.0, 47231.0, 416061.0, 2712647.0, 896600.0, 83283.0, 14597.0, 4264.0, 1553.0, 803.0, 409.0, 182.0, 134.0, 81.0, 42.0, 40.0, 31.0, 24.0, 21.0, 12.0, 11.0, 6.0, 5.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.4736328125, -1.4270782470703125, -1.380523681640625, -1.3339691162109375, -1.28741455078125, -1.2408599853515625, -1.194305419921875, -1.1477508544921875, -1.1011962890625, -1.0546417236328125, -1.008087158203125, -0.9615325927734375, -0.91497802734375, -0.8684234619140625, -0.821868896484375, -0.7753143310546875, -0.728759765625, -0.6822052001953125, -0.635650634765625, -0.5890960693359375, -0.54254150390625, -0.4959869384765625, -0.449432373046875, -0.4028778076171875, -0.3563232421875, -0.3097686767578125, -0.263214111328125, -0.2166595458984375, -0.17010498046875, -0.1235504150390625, -0.076995849609375, -0.0304412841796875, 0.01611328125, 0.0626678466796875, 0.109222412109375, 0.1557769775390625, 0.20233154296875, 0.2488861083984375, 0.295440673828125, 0.3419952392578125, 0.3885498046875, 0.4351043701171875, 0.481658935546875, 0.5282135009765625, 0.57476806640625, 0.6213226318359375, 0.667877197265625, 0.7144317626953125, 0.760986328125, 0.8075408935546875, 0.854095458984375, 0.9006500244140625, 0.94720458984375, 0.9937591552734375, 1.040313720703125, 1.0868682861328125, 1.1334228515625, 1.1799774169921875, 1.226531982421875, 1.2730865478515625, 1.31964111328125, 1.3661956787109375, 1.412750244140625, 1.4593048095703125, 1.505859375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 4.0, 7.0, 7.0, 15.0, 11.0, 9.0, 17.0, 14.0, 20.0, 21.0, 34.0, 29.0, 39.0, 38.0, 28.0, 22.0, 42.0, 72.0, 47.0, 47.0, 52.0, 42.0, 50.0, 36.0, 53.0, 29.0, 40.0, 32.0, 21.0, 24.0, 19.0, 11.0, 15.0, 11.0, 4.0, 10.0, 8.0, 4.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7490234375, -0.723480224609375, -0.69793701171875, -0.672393798828125, -0.6468505859375, -0.621307373046875, -0.59576416015625, -0.570220947265625, -0.544677734375, -0.519134521484375, -0.49359130859375, -0.468048095703125, -0.4425048828125, -0.416961669921875, -0.39141845703125, -0.365875244140625, -0.34033203125, -0.314788818359375, -0.28924560546875, -0.263702392578125, -0.2381591796875, -0.212615966796875, -0.18707275390625, -0.161529541015625, -0.135986328125, -0.110443115234375, -0.08489990234375, -0.059356689453125, -0.0338134765625, -0.008270263671875, 0.01727294921875, 0.042816162109375, 0.068359375, 0.093902587890625, 0.11944580078125, 0.144989013671875, 0.1705322265625, 0.196075439453125, 0.22161865234375, 0.247161865234375, 0.272705078125, 0.298248291015625, 0.32379150390625, 0.349334716796875, 0.3748779296875, 0.400421142578125, 0.42596435546875, 0.451507568359375, 0.47705078125, 0.502593994140625, 0.52813720703125, 0.553680419921875, 0.5792236328125, 0.604766845703125, 0.63031005859375, 0.655853271484375, 0.681396484375, 0.706939697265625, 0.73248291015625, 0.758026123046875, 0.7835693359375, 0.809112548828125, 0.83465576171875, 0.860198974609375, 0.8857421875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 10.0, 5.0, 15.0, 22.0, 39.0, 64.0, 122.0, 196.0, 410.0, 986.0, 3867.0, 47146.0, 3791599.0, 336237.0, 10488.0, 1827.0, 612.0, 281.0, 123.0, 90.0, 48.0, 40.0, 23.0, 16.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3671875, -4.2337646484375, -4.100341796875, -3.9669189453125, -3.83349609375, -3.7000732421875, -3.566650390625, -3.4332275390625, -3.2998046875, -3.1663818359375, -3.032958984375, -2.8995361328125, -2.76611328125, -2.6326904296875, -2.499267578125, -2.3658447265625, -2.232421875, -2.0989990234375, -1.965576171875, -1.8321533203125, -1.69873046875, -1.5653076171875, -1.431884765625, -1.2984619140625, -1.1650390625, -1.0316162109375, -0.898193359375, -0.7647705078125, -0.63134765625, -0.4979248046875, -0.364501953125, -0.2310791015625, -0.09765625, 0.0357666015625, 0.169189453125, 0.3026123046875, 0.43603515625, 0.5694580078125, 0.702880859375, 0.8363037109375, 0.9697265625, 1.1031494140625, 1.236572265625, 1.3699951171875, 1.50341796875, 1.6368408203125, 1.770263671875, 1.9036865234375, 2.037109375, 2.1705322265625, 2.303955078125, 2.4373779296875, 2.57080078125, 2.7042236328125, 2.837646484375, 2.9710693359375, 3.1044921875, 3.2379150390625, 3.371337890625, 3.5047607421875, 3.63818359375, 3.7716064453125, 3.905029296875, 4.0384521484375, 4.171875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 7.0, 10.0, 9.0, 30.0, 39.0, 50.0, 109.0, 201.0, 412.0, 729.0, 1025.0, 698.0, 321.0, 145.0, 101.0, 59.0, 37.0, 34.0, 19.0, 15.0, 7.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.587890625, -3.489471435546875, -3.39105224609375, -3.292633056640625, -3.1942138671875, -3.095794677734375, -2.99737548828125, -2.898956298828125, -2.800537109375, -2.702117919921875, -2.60369873046875, -2.505279541015625, -2.4068603515625, -2.308441162109375, -2.21002197265625, -2.111602783203125, -2.01318359375, -1.914764404296875, -1.81634521484375, -1.717926025390625, -1.6195068359375, -1.521087646484375, -1.42266845703125, -1.324249267578125, -1.225830078125, -1.127410888671875, -1.02899169921875, -0.930572509765625, -0.8321533203125, -0.733734130859375, -0.63531494140625, -0.536895751953125, -0.4384765625, -0.340057373046875, -0.24163818359375, -0.143218994140625, -0.0447998046875, 0.053619384765625, 0.15203857421875, 0.250457763671875, 0.348876953125, 0.447296142578125, 0.54571533203125, 0.644134521484375, 0.7425537109375, 0.840972900390625, 0.93939208984375, 1.037811279296875, 1.13623046875, 1.234649658203125, 1.33306884765625, 1.431488037109375, 1.5299072265625, 1.628326416015625, 1.72674560546875, 1.825164794921875, 1.923583984375, 2.022003173828125, 2.12042236328125, 2.218841552734375, 2.3172607421875, 2.415679931640625, 2.51409912109375, 2.612518310546875, 2.7109375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 10.0, 10.0, 63.0, 165.0, 328.0, 260.0, 98.0, 38.0, 23.0, 5.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.391866683959961, -7.300963878631592, -6.210061073303223, -5.119158744812012, -4.028255939483643, -2.9373531341552734, -1.8464508056640625, -0.7555480003356934, 0.3353548049926758, 1.4262574911117554, 2.517160177230835, 3.608062744140625, 4.698965549468994, 5.789868354797363, 6.880770683288574, 7.971673488616943, 9.062576293945312, 10.153478622436523, 11.24438190460205, 12.335284233093262, 13.426187515258789, 14.51708984375, 15.607992172241211, 16.698894500732422, 17.789798736572266, 18.880701065063477, 19.971603393554688, 21.06250762939453, 22.153409957885742, 23.244312286376953, 24.335214614868164, 25.426116943359375, 26.517017364501953, 27.607919692993164, 28.698822021484375, 29.78972625732422, 30.88062858581543, 31.97153091430664, 33.06243133544922, 34.15333557128906, 35.244239807128906, 36.33514404296875, 37.42604446411133, 38.51694869995117, 39.60784912109375, 40.698753356933594, 41.78965759277344, 42.880558013916016, 43.971458435058594, 45.06236267089844, 46.153263092041016, 47.24416732788086, 48.33506774902344, 49.42597198486328, 50.516876220703125, 51.6077766418457, 52.69868087768555, 53.78958511352539, 54.88048553466797, 55.97138977050781, 57.06229019165039, 58.153194427490234, 59.24409484863281, 60.334999084472656, 61.4259033203125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 7.0, 2.0, 3.0, 6.0, 4.0, 5.0, 5.0, 7.0, 7.0, 9.0, 10.0, 16.0, 22.0, 19.0, 27.0, 39.0, 34.0, 30.0, 38.0, 43.0, 49.0, 66.0, 60.0, 71.0, 48.0, 52.0, 48.0, 27.0, 31.0, 44.0, 32.0, 21.0, 19.0, 15.0, 22.0, 20.0, 6.0, 11.0, 8.0, 11.0, 6.0, 7.0, 1.0, 5.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.874604225158691, -8.557976722717285, -8.241349220275879, -7.924721717834473, -7.608094215393066, -7.29146671295166, -6.974839210510254, -6.658211708068848, -6.341584205627441, -6.024956703186035, -5.708329200744629, -5.391701698303223, -5.075074195861816, -4.75844669342041, -4.441819190979004, -4.125191688537598, -3.808563709259033, -3.491936206817627, -3.1753087043762207, -2.8586812019348145, -2.542053699493408, -2.225426197052002, -1.9087984561920166, -1.5921709537506104, -1.275543451309204, -0.9589159488677979, -0.6422883868217468, -0.3256608247756958, -0.00903332233428955, 0.3075941801071167, 0.6242218017578125, 0.9408493041992188, 1.257476806640625, 1.5741043090820312, 1.8907318115234375, 2.2073593139648438, 2.52398681640625, 2.8406143188476562, 3.1572420597076416, 3.473869562149048, 3.790497064590454, 4.1071248054504395, 4.423752307891846, 4.740379810333252, 5.057007312774658, 5.3736348152160645, 5.690262317657471, 6.006889820098877, 6.323517322540283, 6.6401448249816895, 6.956772327423096, 7.273399829864502, 7.590027332305908, 7.9066548347473145, 8.223282814025879, 8.539910316467285, 8.856537818908691, 9.173165321350098, 9.489792823791504, 9.80642032623291, 10.123047828674316, 10.439675331115723, 10.756302833557129, 11.072930335998535, 11.389557838439941]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 4.0, 2.0, 8.0, 13.0, 17.0, 16.0, 42.0, 58.0, 83.0, 109.0, 190.0, 303.0, 471.0, 834.0, 1569.0, 2864.0, 5573.0, 11376.0, 24068.0, 56065.0, 136507.0, 301432.0, 285810.0, 125160.0, 51384.0, 22589.0, 10510.0, 5279.0, 2669.0, 1408.0, 853.0, 483.0, 264.0, 175.0, 115.0, 72.0, 42.0, 33.0, 20.0, 24.0, 20.0, 12.0, 9.0, 8.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4873046875, -1.442169189453125, -1.39703369140625, -1.351898193359375, -1.3067626953125, -1.261627197265625, -1.21649169921875, -1.171356201171875, -1.126220703125, -1.081085205078125, -1.03594970703125, -0.990814208984375, -0.9456787109375, -0.900543212890625, -0.85540771484375, -0.810272216796875, -0.76513671875, -0.720001220703125, -0.67486572265625, -0.629730224609375, -0.5845947265625, -0.539459228515625, -0.49432373046875, -0.449188232421875, -0.404052734375, -0.358917236328125, -0.31378173828125, -0.268646240234375, -0.2235107421875, -0.178375244140625, -0.13323974609375, -0.088104248046875, -0.04296875, 0.002166748046875, 0.04730224609375, 0.092437744140625, 0.1375732421875, 0.182708740234375, 0.22784423828125, 0.272979736328125, 0.318115234375, 0.363250732421875, 0.40838623046875, 0.453521728515625, 0.4986572265625, 0.543792724609375, 0.58892822265625, 0.634063720703125, 0.67919921875, 0.724334716796875, 0.76947021484375, 0.814605712890625, 0.8597412109375, 0.904876708984375, 0.95001220703125, 0.995147705078125, 1.040283203125, 1.085418701171875, 1.13055419921875, 1.175689697265625, 1.2208251953125, 1.265960693359375, 1.31109619140625, 1.356231689453125, 1.4013671875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 15.0, 10.0, 12.0, 21.0, 18.0, 27.0, 34.0, 40.0, 40.0, 39.0, 46.0, 59.0, 58.0, 53.0, 69.0, 56.0, 57.0, 44.0, 48.0, 36.0, 29.0, 30.0, 25.0, 21.0, 24.0, 22.0, 14.0, 13.0, 5.0, 7.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.947265625, -0.9149322509765625, -0.882598876953125, -0.8502655029296875, -0.81793212890625, -0.7855987548828125, -0.753265380859375, -0.7209320068359375, -0.6885986328125, -0.6562652587890625, -0.623931884765625, -0.5915985107421875, -0.55926513671875, -0.5269317626953125, -0.494598388671875, -0.4622650146484375, -0.429931640625, -0.3975982666015625, -0.365264892578125, -0.3329315185546875, -0.30059814453125, -0.2682647705078125, -0.235931396484375, -0.2035980224609375, -0.1712646484375, -0.1389312744140625, -0.106597900390625, -0.0742645263671875, -0.04193115234375, -0.0095977783203125, 0.022735595703125, 0.0550689697265625, 0.08740234375, 0.1197357177734375, 0.152069091796875, 0.1844024658203125, 0.21673583984375, 0.2490692138671875, 0.281402587890625, 0.3137359619140625, 0.3460693359375, 0.3784027099609375, 0.410736083984375, 0.4430694580078125, 0.47540283203125, 0.5077362060546875, 0.540069580078125, 0.5724029541015625, 0.604736328125, 0.6370697021484375, 0.669403076171875, 0.7017364501953125, 0.73406982421875, 0.7664031982421875, 0.798736572265625, 0.8310699462890625, 0.8634033203125, 0.8957366943359375, 0.928070068359375, 0.9604034423828125, 0.99273681640625, 1.0250701904296875, 1.057403564453125, 1.0897369384765625, 1.1220703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 3.0, 5.0, 7.0, 17.0, 18.0, 19.0, 20.0, 45.0, 52.0, 75.0, 90.0, 148.0, 192.0, 275.0, 391.0, 623.0, 996.0, 1964.0, 4341.0, 12916.0, 52197.0, 315146.0, 576936.0, 58262.0, 13878.0, 4670.0, 2081.0, 1078.0, 653.0, 404.0, 311.0, 206.0, 126.0, 106.0, 74.0, 61.0, 50.0, 24.0, 31.0, 19.0, 15.0, 6.0, 3.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.537109375, -2.457916259765625, -2.37872314453125, -2.299530029296875, -2.2203369140625, -2.141143798828125, -2.06195068359375, -1.982757568359375, -1.903564453125, -1.824371337890625, -1.74517822265625, -1.665985107421875, -1.5867919921875, -1.507598876953125, -1.42840576171875, -1.349212646484375, -1.27001953125, -1.190826416015625, -1.11163330078125, -1.032440185546875, -0.9532470703125, -0.874053955078125, -0.79486083984375, -0.715667724609375, -0.636474609375, -0.557281494140625, -0.47808837890625, -0.398895263671875, -0.3197021484375, -0.240509033203125, -0.16131591796875, -0.082122802734375, -0.0029296875, 0.076263427734375, 0.15545654296875, 0.234649658203125, 0.3138427734375, 0.393035888671875, 0.47222900390625, 0.551422119140625, 0.630615234375, 0.709808349609375, 0.78900146484375, 0.868194580078125, 0.9473876953125, 1.026580810546875, 1.10577392578125, 1.184967041015625, 1.26416015625, 1.343353271484375, 1.42254638671875, 1.501739501953125, 1.5809326171875, 1.660125732421875, 1.73931884765625, 1.818511962890625, 1.897705078125, 1.976898193359375, 2.05609130859375, 2.135284423828125, 2.2144775390625, 2.293670654296875, 2.37286376953125, 2.452056884765625, 2.53125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 5.0, 2.0, 5.0, 8.0, 6.0, 12.0, 11.0, 11.0, 16.0, 19.0, 21.0, 25.0, 23.0, 35.0, 34.0, 49.0, 44.0, 57.0, 49.0, 55.0, 65.0, 55.0, 57.0, 51.0, 35.0, 44.0, 25.0, 28.0, 26.0, 29.0, 14.0, 18.0, 15.0, 7.0, 8.0, 13.0, 4.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.17578125, -3.07257080078125, -2.9693603515625, -2.86614990234375, -2.762939453125, -2.65972900390625, -2.5565185546875, -2.45330810546875, -2.35009765625, -2.24688720703125, -2.1436767578125, -2.04046630859375, -1.937255859375, -1.83404541015625, -1.7308349609375, -1.62762451171875, -1.5244140625, -1.42120361328125, -1.3179931640625, -1.21478271484375, -1.111572265625, -1.00836181640625, -0.9051513671875, -0.80194091796875, -0.69873046875, -0.59552001953125, -0.4923095703125, -0.38909912109375, -0.285888671875, -0.18267822265625, -0.0794677734375, 0.02374267578125, 0.126953125, 0.23016357421875, 0.3333740234375, 0.43658447265625, 0.539794921875, 0.64300537109375, 0.7462158203125, 0.84942626953125, 0.95263671875, 1.05584716796875, 1.1590576171875, 1.26226806640625, 1.365478515625, 1.46868896484375, 1.5718994140625, 1.67510986328125, 1.7783203125, 1.88153076171875, 1.9847412109375, 2.08795166015625, 2.191162109375, 2.29437255859375, 2.3975830078125, 2.50079345703125, 2.60400390625, 2.70721435546875, 2.8104248046875, 2.91363525390625, 3.016845703125, 3.12005615234375, 3.2232666015625, 3.32647705078125, 3.4296875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 9.0, 6.0, 14.0, 23.0, 35.0, 47.0, 55.0, 102.0, 153.0, 338.0, 716.0, 1724.0, 6063.0, 33057.0, 325285.0, 633021.0, 37557.0, 6938.0, 1908.0, 709.0, 326.0, 177.0, 94.0, 48.0, 60.0, 28.0, 25.0, 13.0, 10.0, 5.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0546875, -1.0245819091796875, -0.994476318359375, -0.9643707275390625, -0.93426513671875, -0.9041595458984375, -0.874053955078125, -0.8439483642578125, -0.8138427734375, -0.7837371826171875, -0.753631591796875, -0.7235260009765625, -0.69342041015625, -0.6633148193359375, -0.633209228515625, -0.6031036376953125, -0.572998046875, -0.5428924560546875, -0.512786865234375, -0.4826812744140625, -0.45257568359375, -0.4224700927734375, -0.392364501953125, -0.3622589111328125, -0.3321533203125, -0.3020477294921875, -0.271942138671875, -0.2418365478515625, -0.21173095703125, -0.1816253662109375, -0.151519775390625, -0.1214141845703125, -0.09130859375, -0.0612030029296875, -0.031097412109375, -0.0009918212890625, 0.02911376953125, 0.0592193603515625, 0.089324951171875, 0.1194305419921875, 0.1495361328125, 0.1796417236328125, 0.209747314453125, 0.2398529052734375, 0.26995849609375, 0.3000640869140625, 0.330169677734375, 0.3602752685546875, 0.390380859375, 0.4204864501953125, 0.450592041015625, 0.4806976318359375, 0.51080322265625, 0.5409088134765625, 0.571014404296875, 0.6011199951171875, 0.6312255859375, 0.6613311767578125, 0.691436767578125, 0.7215423583984375, 0.75164794921875, 0.7817535400390625, 0.811859130859375, 0.8419647216796875, 0.8720703125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 8.0, 4.0, 12.0, 23.0, 34.0, 36.0, 30.0, 33.0, 67.0, 59.0, 93.0, 115.0, 94.0, 82.0, 70.0, 51.0, 41.0, 27.0, 25.0, 17.0, 14.0, 13.0, 10.0, 2.0, 8.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002989768981933594, -0.00029057078063488007, -0.00028216466307640076, -0.00027375854551792145, -0.00026535242795944214, -0.00025694631040096283, -0.0002485401928424835, -0.0002401340752840042, -0.0002317279577255249, -0.0002233218401670456, -0.00021491572260856628, -0.00020650960505008698, -0.00019810348749160767, -0.00018969736993312836, -0.00018129125237464905, -0.00017288513481616974, -0.00016447901725769043, -0.00015607289969921112, -0.0001476667821407318, -0.0001392606645822525, -0.0001308545470237732, -0.00012244842946529388, -0.00011404231190681458, -0.00010563619434833527, -9.723007678985596e-05, -8.882395923137665e-05, -8.041784167289734e-05, -7.201172411441803e-05, -6.360560655593872e-05, -5.519948899745941e-05, -4.67933714389801e-05, -3.8387253880500793e-05, -2.9981136322021484e-05, -2.1575018763542175e-05, -1.3168901205062866e-05, -4.762783646583557e-06, 3.643333911895752e-06, 1.2049451470375061e-05, 2.045556902885437e-05, 2.886168658733368e-05, 3.726780414581299e-05, 4.56739217042923e-05, 5.4080039262771606e-05, 6.248615682125092e-05, 7.089227437973022e-05, 7.929839193820953e-05, 8.770450949668884e-05, 9.611062705516815e-05, 0.00010451674461364746, 0.00011292286217212677, 0.00012132897973060608, 0.0001297350972890854, 0.0001381412148475647, 0.000146547332406044, 0.00015495344996452332, 0.00016335956752300262, 0.00017176568508148193, 0.00018017180263996124, 0.00018857792019844055, 0.00019698403775691986, 0.00020539015531539917, 0.00021379627287387848, 0.0002222023904323578, 0.0002306085079908371, 0.0002390146255493164]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 11.0, 11.0, 14.0, 9.0, 26.0, 41.0, 50.0, 65.0, 104.0, 144.0, 232.0, 344.0, 629.0, 994.0, 1962.0, 4409.0, 12340.0, 46250.0, 215397.0, 643347.0, 88117.0, 21110.0, 6815.0, 2791.0, 1347.0, 752.0, 429.0, 262.0, 167.0, 125.0, 83.0, 44.0, 30.0, 26.0, 24.0, 11.0, 15.0, 8.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.599609375, -0.5820846557617188, -0.5645599365234375, -0.5470352172851562, -0.529510498046875, -0.5119857788085938, -0.4944610595703125, -0.47693634033203125, -0.45941162109375, -0.44188690185546875, -0.4243621826171875, -0.40683746337890625, -0.389312744140625, -0.37178802490234375, -0.3542633056640625, -0.33673858642578125, -0.3192138671875, -0.30168914794921875, -0.2841644287109375, -0.26663970947265625, -0.249114990234375, -0.23159027099609375, -0.2140655517578125, -0.19654083251953125, -0.17901611328125, -0.16149139404296875, -0.1439666748046875, -0.12644195556640625, -0.108917236328125, -0.09139251708984375, -0.0738677978515625, -0.05634307861328125, -0.038818359375, -0.02129364013671875, -0.0037689208984375, 0.01375579833984375, 0.031280517578125, 0.04880523681640625, 0.0663299560546875, 0.08385467529296875, 0.10137939453125, 0.11890411376953125, 0.1364288330078125, 0.15395355224609375, 0.171478271484375, 0.18900299072265625, 0.2065277099609375, 0.22405242919921875, 0.2415771484375, 0.25910186767578125, 0.2766265869140625, 0.29415130615234375, 0.311676025390625, 0.32920074462890625, 0.3467254638671875, 0.36425018310546875, 0.38177490234375, 0.39929962158203125, 0.4168243408203125, 0.43434906005859375, 0.451873779296875, 0.46939849853515625, 0.4869232177734375, 0.5044479370117188, 0.52197265625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 6.0, 10.0, 7.0, 15.0, 10.0, 18.0, 21.0, 27.0, 22.0, 31.0, 34.0, 40.0, 42.0, 42.0, 55.0, 88.0, 57.0, 67.0, 62.0, 61.0, 37.0, 52.0, 31.0, 23.0, 23.0, 26.0, 15.0, 13.0, 8.0, 10.0, 11.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.6171875, -0.5996856689453125, -0.582183837890625, -0.5646820068359375, -0.54718017578125, -0.5296783447265625, -0.512176513671875, -0.4946746826171875, -0.4771728515625, -0.4596710205078125, -0.442169189453125, -0.4246673583984375, -0.40716552734375, -0.3896636962890625, -0.372161865234375, -0.3546600341796875, -0.337158203125, -0.3196563720703125, -0.302154541015625, -0.2846527099609375, -0.26715087890625, -0.2496490478515625, -0.232147216796875, -0.2146453857421875, -0.1971435546875, -0.1796417236328125, -0.162139892578125, -0.1446380615234375, -0.12713623046875, -0.1096343994140625, -0.092132568359375, -0.0746307373046875, -0.05712890625, -0.0396270751953125, -0.022125244140625, -0.0046234130859375, 0.01287841796875, 0.0303802490234375, 0.047882080078125, 0.0653839111328125, 0.0828857421875, 0.1003875732421875, 0.117889404296875, 0.1353912353515625, 0.15289306640625, 0.1703948974609375, 0.187896728515625, 0.2053985595703125, 0.222900390625, 0.2404022216796875, 0.257904052734375, 0.2754058837890625, 0.29290771484375, 0.3104095458984375, 0.327911376953125, 0.3454132080078125, 0.3629150390625, 0.3804168701171875, 0.397918701171875, 0.4154205322265625, 0.43292236328125, 0.4504241943359375, 0.467926025390625, 0.4854278564453125, 0.5029296875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 8.0, 6.0, 26.0, 23.0, 67.0, 158.0, 388.0, 162.0, 90.0, 39.0, 19.0, 9.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-32.272552490234375, -31.393699645996094, -30.514846801757812, -29.63599395751953, -28.757139205932617, -27.878286361694336, -26.999433517456055, -26.120580673217773, -25.24172592163086, -24.362873077392578, -23.484020233154297, -22.605167388916016, -21.7263126373291, -20.84745979309082, -19.96860694885254, -19.089754104614258, -18.210901260375977, -17.332048416137695, -16.453195571899414, -15.574341773986816, -14.695487976074219, -13.816635131835938, -12.937782287597656, -12.058929443359375, -11.180075645446777, -10.301222801208496, -9.422369003295898, -8.543516159057617, -7.664662837982178, -6.785809516906738, -5.906956672668457, -5.028103351593018, -4.149250030517578, -3.2703967094421387, -2.3915436267852783, -1.512690544128418, -0.6338372230529785, 0.24501609802246094, 1.1238689422607422, 2.0027222633361816, 2.881575584411621, 3.7604289054870605, 4.6392822265625, 5.518135070800781, 6.396988391876221, 7.27584171295166, 8.154694557189941, 9.033548355102539, 9.91240119934082, 10.791254043579102, 11.6701078414917, 12.54896068572998, 13.427814483642578, 14.30666732788086, 15.18552017211914, 16.064373016357422, 16.943225860595703, 17.822078704833984, 18.700931549072266, 19.579784393310547, 20.45863914489746, 21.337491989135742, 22.216344833374023, 23.095197677612305, 23.97405242919922]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 10.0, 11.0, 13.0, 13.0, 14.0, 24.0, 27.0, 37.0, 26.0, 32.0, 29.0, 49.0, 78.0, 175.0, 137.0, 46.0, 39.0, 39.0, 31.0, 31.0, 17.0, 25.0, 16.0, 17.0, 17.0, 11.0, 11.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.693618774414062, -13.216774940490723, -12.739931106567383, -12.26308822631836, -11.78624439239502, -11.30940055847168, -10.83255672454834, -10.355712890625, -9.878870010375977, -9.402026176452637, -8.925182342529297, -8.448339462280273, -7.971495628356934, -7.494651794433594, -7.017807960510254, -6.540964603424072, -6.064120769500732, -5.587276935577393, -5.110433578491211, -4.633589744567871, -4.1567463874816895, -3.6799025535583496, -3.203058958053589, -2.726215362548828, -2.2493717670440674, -1.7725281715393066, -1.295684576034546, -0.8188408613204956, -0.34199726581573486, 0.13484644889831543, 0.6116900444030762, 1.088533639907837, 1.5653772354125977, 2.0422208309173584, 2.519064426422119, 2.995908260345459, 3.4727516174316406, 3.9495954513549805, 4.42643928527832, 4.903282642364502, 5.380125999450684, 5.856969833374023, 6.333813190460205, 6.810657024383545, 7.287500381469727, 7.764344215393066, 8.241188049316406, 8.71803092956543, 9.194875717163086, 9.671719551086426, 10.148563385009766, 10.625406265258789, 11.102250099182129, 11.579093933105469, 12.055937767028809, 12.532781600952148, 13.009624481201172, 13.486468315124512, 13.963312149047852, 14.440155029296875, 14.916998863220215, 15.393842697143555, 15.870686531066895, 16.347530364990234, 16.824373245239258]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 3.0, 12.0, 10.0, 16.0, 12.0, 22.0, 32.0, 52.0, 82.0, 133.0, 225.0, 320.0, 495.0, 932.0, 1581.0, 3039.0, 6469.0, 16811.0, 51803.0, 197820.0, 818904.0, 1835094.0, 945474.0, 227536.0, 55396.0, 17473.0, 6934.0, 3294.0, 1640.0, 968.0, 559.0, 382.0, 258.0, 142.0, 117.0, 74.0, 41.0, 23.0, 20.0, 18.0, 14.0, 5.0, 11.0, 12.0, 10.0, 6.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0], "bins": [-1.267578125, -1.2274017333984375, -1.187225341796875, -1.1470489501953125, -1.10687255859375, -1.0666961669921875, -1.026519775390625, -0.9863433837890625, -0.9461669921875, -0.9059906005859375, -0.865814208984375, -0.8256378173828125, -0.78546142578125, -0.7452850341796875, -0.705108642578125, -0.6649322509765625, -0.624755859375, -0.5845794677734375, -0.544403076171875, -0.5042266845703125, -0.46405029296875, -0.4238739013671875, -0.383697509765625, -0.3435211181640625, -0.3033447265625, -0.2631683349609375, -0.222991943359375, -0.1828155517578125, -0.14263916015625, -0.1024627685546875, -0.062286376953125, -0.0221099853515625, 0.01806640625, 0.0582427978515625, 0.098419189453125, 0.1385955810546875, 0.17877197265625, 0.2189483642578125, 0.259124755859375, 0.2993011474609375, 0.3394775390625, 0.3796539306640625, 0.419830322265625, 0.4600067138671875, 0.50018310546875, 0.5403594970703125, 0.580535888671875, 0.6207122802734375, 0.660888671875, 0.7010650634765625, 0.741241455078125, 0.7814178466796875, 0.82159423828125, 0.8617706298828125, 0.901947021484375, 0.9421234130859375, 0.9822998046875, 1.0224761962890625, 1.062652587890625, 1.1028289794921875, 1.14300537109375, 1.1831817626953125, 1.223358154296875, 1.2635345458984375, 1.3037109375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 9.0, 7.0, 11.0, 18.0, 20.0, 27.0, 25.0, 23.0, 29.0, 46.0, 41.0, 51.0, 53.0, 60.0, 50.0, 65.0, 52.0, 49.0, 44.0, 48.0, 41.0, 34.0, 40.0, 31.0, 28.0, 14.0, 15.0, 12.0, 14.0, 11.0, 9.0, 8.0, 2.0, 3.0, 7.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70263671875, -0.6739730834960938, -0.6453094482421875, -0.6166458129882812, -0.587982177734375, -0.5593185424804688, -0.5306549072265625, -0.5019912719726562, -0.47332763671875, -0.44466400146484375, -0.4160003662109375, -0.38733673095703125, -0.358673095703125, -0.33000946044921875, -0.3013458251953125, -0.27268218994140625, -0.2440185546875, -0.21535491943359375, -0.1866912841796875, -0.15802764892578125, -0.129364013671875, -0.10070037841796875, -0.0720367431640625, -0.04337310791015625, -0.01470947265625, 0.01395416259765625, 0.0426177978515625, 0.07128143310546875, 0.099945068359375, 0.12860870361328125, 0.1572723388671875, 0.18593597412109375, 0.214599609375, 0.24326324462890625, 0.2719268798828125, 0.30059051513671875, 0.329254150390625, 0.35791778564453125, 0.3865814208984375, 0.41524505615234375, 0.44390869140625, 0.47257232666015625, 0.5012359619140625, 0.5298995971679688, 0.558563232421875, 0.5872268676757812, 0.6158905029296875, 0.6445541381835938, 0.6732177734375, 0.7018814086914062, 0.7305450439453125, 0.7592086791992188, 0.787872314453125, 0.8165359497070312, 0.8451995849609375, 0.8738632202148438, 0.90252685546875, 0.9311904907226562, 0.9598541259765625, 0.9885177612304688, 1.017181396484375, 1.0458450317382812, 1.0745086669921875, 1.1031723022460938, 1.1318359375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 9.0, 11.0, 10.0, 20.0, 43.0, 68.0, 153.0, 251.0, 628.0, 1675.0, 6606.0, 123414.0, 4012209.0, 42145.0, 4498.0, 1388.0, 561.0, 244.0, 138.0, 68.0, 44.0, 26.0, 20.0, 13.0, 7.0, 5.0, 4.0, 6.0, 1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.45703125, -6.23724365234375, -6.0174560546875, -5.79766845703125, -5.577880859375, -5.35809326171875, -5.1383056640625, -4.91851806640625, -4.69873046875, -4.47894287109375, -4.2591552734375, -4.03936767578125, -3.819580078125, -3.59979248046875, -3.3800048828125, -3.16021728515625, -2.9404296875, -2.72064208984375, -2.5008544921875, -2.28106689453125, -2.061279296875, -1.84149169921875, -1.6217041015625, -1.40191650390625, -1.18212890625, -0.96234130859375, -0.7425537109375, -0.52276611328125, -0.302978515625, -0.08319091796875, 0.1365966796875, 0.35638427734375, 0.576171875, 0.79595947265625, 1.0157470703125, 1.23553466796875, 1.455322265625, 1.67510986328125, 1.8948974609375, 2.11468505859375, 2.33447265625, 2.55426025390625, 2.7740478515625, 2.99383544921875, 3.213623046875, 3.43341064453125, 3.6531982421875, 3.87298583984375, 4.0927734375, 4.31256103515625, 4.5323486328125, 4.75213623046875, 4.971923828125, 5.19171142578125, 5.4114990234375, 5.63128662109375, 5.85107421875, 6.07086181640625, 6.2906494140625, 6.51043701171875, 6.730224609375, 6.95001220703125, 7.1697998046875, 7.38958740234375, 7.609375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 9.0, 13.0, 14.0, 24.0, 34.0, 37.0, 68.0, 92.0, 154.0, 194.0, 322.0, 444.0, 616.0, 615.0, 463.0, 317.0, 221.0, 138.0, 79.0, 77.0, 34.0, 22.0, 34.0, 9.0, 10.0, 6.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.087890625, -1.978363037109375, -1.86883544921875, -1.759307861328125, -1.6497802734375, -1.540252685546875, -1.43072509765625, -1.321197509765625, -1.211669921875, -1.102142333984375, -0.99261474609375, -0.883087158203125, -0.7735595703125, -0.664031982421875, -0.55450439453125, -0.444976806640625, -0.33544921875, -0.225921630859375, -0.11639404296875, -0.006866455078125, 0.1026611328125, 0.212188720703125, 0.32171630859375, 0.431243896484375, 0.540771484375, 0.650299072265625, 0.75982666015625, 0.869354248046875, 0.9788818359375, 1.088409423828125, 1.19793701171875, 1.307464599609375, 1.4169921875, 1.526519775390625, 1.63604736328125, 1.745574951171875, 1.8551025390625, 1.964630126953125, 2.07415771484375, 2.183685302734375, 2.293212890625, 2.402740478515625, 2.51226806640625, 2.621795654296875, 2.7313232421875, 2.840850830078125, 2.95037841796875, 3.059906005859375, 3.16943359375, 3.278961181640625, 3.38848876953125, 3.498016357421875, 3.6075439453125, 3.717071533203125, 3.82659912109375, 3.936126708984375, 4.045654296875, 4.155181884765625, 4.26470947265625, 4.374237060546875, 4.4837646484375, 4.593292236328125, 4.70281982421875, 4.812347412109375, 4.921875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 8.0, 6.0, 17.0, 43.0, 89.0, 212.0, 333.0, 173.0, 66.0, 33.0, 10.0, 5.0, 8.0, 4.0, 1.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.6939582824707, -32.69845199584961, -30.70294761657715, -28.707443237304688, -26.711936950683594, -24.716432571411133, -22.720928192138672, -20.725421905517578, -18.729917526245117, -16.734413146972656, -14.738906860351562, -12.743402481079102, -10.747897148132324, -8.752391815185547, -6.756887435913086, -4.761382102966309, -2.7658767700195312, -0.770371675491333, 1.2251334190368652, 3.2206382751464844, 5.216143608093262, 7.211648941040039, 9.2071533203125, 11.202658653259277, 13.198163986206055, 15.193669319152832, 17.18917465209961, 19.18467903137207, 21.18018341064453, 23.175689697265625, 25.171194076538086, 27.166698455810547, 29.162208557128906, 31.157712936401367, 33.15321731567383, 35.14872360229492, 37.144229888916016, 39.139732360839844, 41.13523864746094, 43.13074493408203, 45.126251220703125, 47.12175750732422, 49.11725997924805, 51.11276626586914, 53.108272552490234, 55.10377502441406, 57.099281311035156, 59.09478759765625, 61.09029006958008, 63.08579635620117, 65.081298828125, 67.0768051147461, 69.07231140136719, 71.06781768798828, 73.06332397460938, 75.05882263183594, 77.05432891845703, 79.04983520507812, 81.04534149169922, 83.04084777832031, 85.03634643554688, 87.03185272216797, 89.02735900878906, 91.02286529541016, 93.01837158203125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 8.0, 11.0, 13.0, 16.0, 13.0, 21.0, 18.0, 20.0, 19.0, 34.0, 38.0, 36.0, 36.0, 36.0, 58.0, 76.0, 69.0, 69.0, 47.0, 51.0, 39.0, 37.0, 43.0, 19.0, 25.0, 21.0, 20.0, 19.0, 15.0, 10.0, 13.0, 16.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.473234176635742, -19.86264419555664, -19.25205421447754, -18.641464233398438, -18.030874252319336, -17.420284271240234, -16.809694290161133, -16.19910430908203, -15.588515281677246, -14.977925300598145, -14.367335319519043, -13.756745338439941, -13.146156311035156, -12.535566329956055, -11.924976348876953, -11.314386367797852, -10.70379638671875, -10.093206405639648, -9.482616424560547, -8.872026443481445, -8.261436462402344, -7.6508469581604, -7.040257453918457, -6.4296674728393555, -5.819077491760254, -5.208487510681152, -4.597897529602051, -3.9873080253601074, -3.376718044281006, -2.7661280632019043, -2.155538320541382, -1.5449485778808594, -0.934356689453125, -0.323766827583313, 0.286823034286499, 0.897412896156311, 1.508002758026123, 2.1185927391052246, 2.729182481765747, 3.3397722244262695, 3.950362205505371, 4.560952186584473, 5.171542167663574, 5.782131671905518, 6.392721652984619, 7.003311634063721, 7.613901138305664, 8.224491119384766, 8.835081100463867, 9.445671081542969, 10.05626106262207, 10.666851043701172, 11.277441024780273, 11.888031005859375, 12.49862003326416, 13.109210014343262, 13.719799995422363, 14.330389976501465, 14.940979957580566, 15.551569938659668, 16.162158966064453, 16.772748947143555, 17.383338928222656, 17.993928909301758, 18.60451889038086]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 3.0, 8.0, 9.0, 15.0, 16.0, 30.0, 37.0, 54.0, 101.0, 171.0, 376.0, 809.0, 2093.0, 5788.0, 19708.0, 92192.0, 635707.0, 234704.0, 40599.0, 10328.0, 3371.0, 1298.0, 532.0, 249.0, 138.0, 89.0, 45.0, 29.0, 18.0, 13.0, 10.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.828125, -2.739044189453125, -2.64996337890625, -2.560882568359375, -2.4718017578125, -2.382720947265625, -2.29364013671875, -2.204559326171875, -2.115478515625, -2.026397705078125, -1.93731689453125, -1.848236083984375, -1.7591552734375, -1.670074462890625, -1.58099365234375, -1.491912841796875, -1.40283203125, -1.313751220703125, -1.22467041015625, -1.135589599609375, -1.0465087890625, -0.957427978515625, -0.86834716796875, -0.779266357421875, -0.690185546875, -0.601104736328125, -0.51202392578125, -0.422943115234375, -0.3338623046875, -0.244781494140625, -0.15570068359375, -0.066619873046875, 0.0224609375, 0.111541748046875, 0.20062255859375, 0.289703369140625, 0.3787841796875, 0.467864990234375, 0.55694580078125, 0.646026611328125, 0.735107421875, 0.824188232421875, 0.91326904296875, 1.002349853515625, 1.0914306640625, 1.180511474609375, 1.26959228515625, 1.358673095703125, 1.44775390625, 1.536834716796875, 1.62591552734375, 1.714996337890625, 1.8040771484375, 1.893157958984375, 1.98223876953125, 2.071319580078125, 2.160400390625, 2.249481201171875, 2.33856201171875, 2.427642822265625, 2.5167236328125, 2.605804443359375, 2.69488525390625, 2.783966064453125, 2.873046875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 5.0, 2.0, 7.0, 13.0, 22.0, 24.0, 34.0, 35.0, 44.0, 55.0, 71.0, 82.0, 71.0, 81.0, 66.0, 67.0, 58.0, 56.0, 47.0, 34.0, 30.0, 25.0, 18.0, 17.0, 11.0, 10.0, 7.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5078125, -1.4566497802734375, -1.405487060546875, -1.3543243408203125, -1.30316162109375, -1.2519989013671875, -1.200836181640625, -1.1496734619140625, -1.0985107421875, -1.0473480224609375, -0.996185302734375, -0.9450225830078125, -0.89385986328125, -0.8426971435546875, -0.791534423828125, -0.7403717041015625, -0.689208984375, -0.6380462646484375, -0.586883544921875, -0.5357208251953125, -0.48455810546875, -0.4333953857421875, -0.382232666015625, -0.3310699462890625, -0.2799072265625, -0.2287445068359375, -0.177581787109375, -0.1264190673828125, -0.07525634765625, -0.0240936279296875, 0.027069091796875, 0.0782318115234375, 0.12939453125, 0.1805572509765625, 0.231719970703125, 0.2828826904296875, 0.33404541015625, 0.3852081298828125, 0.436370849609375, 0.4875335693359375, 0.5386962890625, 0.5898590087890625, 0.641021728515625, 0.6921844482421875, 0.74334716796875, 0.7945098876953125, 0.845672607421875, 0.8968353271484375, 0.947998046875, 0.9991607666015625, 1.050323486328125, 1.1014862060546875, 1.15264892578125, 1.2038116455078125, 1.254974365234375, 1.3061370849609375, 1.3572998046875, 1.4084625244140625, 1.459625244140625, 1.5107879638671875, 1.56195068359375, 1.6131134033203125, 1.664276123046875, 1.7154388427734375, 1.7666015625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 7.0, 4.0, 7.0, 8.0, 5.0, 8.0, 13.0, 14.0, 29.0, 34.0, 60.0, 83.0, 112.0, 213.0, 286.0, 515.0, 1015.0, 2383.0, 7031.0, 31743.0, 700090.0, 266509.0, 27463.0, 6460.0, 2163.0, 967.0, 505.0, 279.0, 191.0, 111.0, 88.0, 51.0, 32.0, 25.0, 16.0, 9.0, 8.0, 5.0, 5.0, 4.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.1015625, -3.01531982421875, -2.9290771484375, -2.84283447265625, -2.756591796875, -2.67034912109375, -2.5841064453125, -2.49786376953125, -2.41162109375, -2.32537841796875, -2.2391357421875, -2.15289306640625, -2.066650390625, -1.98040771484375, -1.8941650390625, -1.80792236328125, -1.7216796875, -1.63543701171875, -1.5491943359375, -1.46295166015625, -1.376708984375, -1.29046630859375, -1.2042236328125, -1.11798095703125, -1.03173828125, -0.94549560546875, -0.8592529296875, -0.77301025390625, -0.686767578125, -0.60052490234375, -0.5142822265625, -0.42803955078125, -0.341796875, -0.25555419921875, -0.1693115234375, -0.08306884765625, 0.003173828125, 0.08941650390625, 0.1756591796875, 0.26190185546875, 0.34814453125, 0.43438720703125, 0.5206298828125, 0.60687255859375, 0.693115234375, 0.77935791015625, 0.8656005859375, 0.95184326171875, 1.0380859375, 1.12432861328125, 1.2105712890625, 1.29681396484375, 1.383056640625, 1.46929931640625, 1.5555419921875, 1.64178466796875, 1.72802734375, 1.81427001953125, 1.9005126953125, 1.98675537109375, 2.072998046875, 2.15924072265625, 2.2454833984375, 2.33172607421875, 2.41796875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 4.0, 6.0, 6.0, 12.0, 11.0, 14.0, 11.0, 11.0, 20.0, 18.0, 14.0, 19.0, 28.0, 29.0, 28.0, 56.0, 58.0, 62.0, 76.0, 78.0, 59.0, 56.0, 48.0, 42.0, 35.0, 21.0, 16.0, 18.0, 20.0, 15.0, 18.0, 12.0, 16.0, 12.0, 13.0, 7.0, 7.0, 2.0, 5.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0], "bins": [-4.78515625, -4.65924072265625, -4.5333251953125, -4.40740966796875, -4.281494140625, -4.15557861328125, -4.0296630859375, -3.90374755859375, -3.77783203125, -3.65191650390625, -3.5260009765625, -3.40008544921875, -3.274169921875, -3.14825439453125, -3.0223388671875, -2.89642333984375, -2.7705078125, -2.64459228515625, -2.5186767578125, -2.39276123046875, -2.266845703125, -2.14093017578125, -2.0150146484375, -1.88909912109375, -1.76318359375, -1.63726806640625, -1.5113525390625, -1.38543701171875, -1.259521484375, -1.13360595703125, -1.0076904296875, -0.88177490234375, -0.755859375, -0.62994384765625, -0.5040283203125, -0.37811279296875, -0.252197265625, -0.12628173828125, -0.0003662109375, 0.12554931640625, 0.25146484375, 0.37738037109375, 0.5032958984375, 0.62921142578125, 0.755126953125, 0.88104248046875, 1.0069580078125, 1.13287353515625, 1.2587890625, 1.38470458984375, 1.5106201171875, 1.63653564453125, 1.762451171875, 1.88836669921875, 2.0142822265625, 2.14019775390625, 2.26611328125, 2.39202880859375, 2.5179443359375, 2.64385986328125, 2.769775390625, 2.89569091796875, 3.0216064453125, 3.14752197265625, 3.2734375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 8.0, 15.0, 16.0, 16.0, 26.0, 34.0, 36.0, 60.0, 89.0, 135.0, 253.0, 520.0, 1129.0, 3118.0, 10839.0, 54129.0, 886679.0, 72276.0, 12830.0, 3697.0, 1282.0, 597.0, 286.0, 156.0, 86.0, 74.0, 39.0, 29.0, 24.0, 7.0, 15.0, 13.0, 10.0, 10.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.66943359375, -0.6442337036132812, -0.6190338134765625, -0.5938339233398438, -0.568634033203125, -0.5434341430664062, -0.5182342529296875, -0.49303436279296875, -0.46783447265625, -0.44263458251953125, -0.4174346923828125, -0.39223480224609375, -0.367034912109375, -0.34183502197265625, -0.3166351318359375, -0.29143524169921875, -0.2662353515625, -0.24103546142578125, -0.2158355712890625, -0.19063568115234375, -0.165435791015625, -0.14023590087890625, -0.1150360107421875, -0.08983612060546875, -0.06463623046875, -0.03943634033203125, -0.0142364501953125, 0.01096343994140625, 0.036163330078125, 0.06136322021484375, 0.0865631103515625, 0.11176300048828125, 0.136962890625, 0.16216278076171875, 0.1873626708984375, 0.21256256103515625, 0.237762451171875, 0.26296234130859375, 0.2881622314453125, 0.31336212158203125, 0.33856201171875, 0.36376190185546875, 0.3889617919921875, 0.41416168212890625, 0.439361572265625, 0.46456146240234375, 0.4897613525390625, 0.5149612426757812, 0.5401611328125, 0.5653610229492188, 0.5905609130859375, 0.6157608032226562, 0.640960693359375, 0.6661605834960938, 0.6913604736328125, 0.7165603637695312, 0.74176025390625, 0.7669601440429688, 0.7921600341796875, 0.8173599243164062, 0.842559814453125, 0.8677597045898438, 0.8929595947265625, 0.9181594848632812, 0.943359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 6.0, 2.0, 8.0, 4.0, 20.0, 15.0, 30.0, 33.0, 58.0, 74.0, 103.0, 146.0, 143.0, 95.0, 60.0, 54.0, 26.0, 27.0, 20.0, 17.0, 6.0, 11.0, 12.0, 3.0, 6.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003075599670410156, -0.00029921717941761017, -0.0002908743917942047, -0.00028253160417079926, -0.0002741888165473938, -0.00026584602892398834, -0.0002575032413005829, -0.00024916045367717743, -0.00024081766605377197, -0.00023247487843036652, -0.00022413209080696106, -0.0002157893031835556, -0.00020744651556015015, -0.0001991037279367447, -0.00019076094031333923, -0.00018241815268993378, -0.00017407536506652832, -0.00016573257744312286, -0.0001573897898197174, -0.00014904700219631195, -0.0001407042145729065, -0.00013236142694950104, -0.00012401863932609558, -0.00011567585170269012, -0.00010733306407928467, -9.899027645587921e-05, -9.064748883247375e-05, -8.23047012090683e-05, -7.396191358566284e-05, -6.561912596225739e-05, -5.727633833885193e-05, -4.893355071544647e-05, -4.0590763092041016e-05, -3.224797546863556e-05, -2.3905187845230103e-05, -1.5562400221824646e-05, -7.2196125984191895e-06, 1.123175024986267e-06, 9.465962648391724e-06, 1.780875027179718e-05, 2.6151537895202637e-05, 3.449432551860809e-05, 4.283711314201355e-05, 5.1179900765419006e-05, 5.952268838882446e-05, 6.786547601222992e-05, 7.620826363563538e-05, 8.455105125904083e-05, 9.289383888244629e-05, 0.00010123662650585175, 0.0001095794141292572, 0.00011792220175266266, 0.00012626498937606812, 0.00013460777699947357, 0.00014295056462287903, 0.00015129335224628448, 0.00015963613986968994, 0.0001679789274930954, 0.00017632171511650085, 0.0001846645027399063, 0.00019300729036331177, 0.00020135007798671722, 0.00020969286561012268, 0.00021803565323352814, 0.0002263784408569336]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 8.0, 6.0, 11.0, 14.0, 25.0, 50.0, 90.0, 198.0, 452.0, 1354.0, 4828.0, 27074.0, 890518.0, 108929.0, 10966.0, 2560.0, 822.0, 311.0, 155.0, 73.0, 37.0, 23.0, 18.0, 4.0, 4.0, 4.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8583984375, -0.8313751220703125, -0.804351806640625, -0.7773284912109375, -0.75030517578125, -0.7232818603515625, -0.696258544921875, -0.6692352294921875, -0.6422119140625, -0.6151885986328125, -0.588165283203125, -0.5611419677734375, -0.53411865234375, -0.5070953369140625, -0.480072021484375, -0.4530487060546875, -0.426025390625, -0.3990020751953125, -0.371978759765625, -0.3449554443359375, -0.31793212890625, -0.2909088134765625, -0.263885498046875, -0.2368621826171875, -0.2098388671875, -0.1828155517578125, -0.155792236328125, -0.1287689208984375, -0.10174560546875, -0.0747222900390625, -0.047698974609375, -0.0206756591796875, 0.00634765625, 0.0333709716796875, 0.060394287109375, 0.0874176025390625, 0.11444091796875, 0.1414642333984375, 0.168487548828125, 0.1955108642578125, 0.2225341796875, 0.2495574951171875, 0.276580810546875, 0.3036041259765625, 0.33062744140625, 0.3576507568359375, 0.384674072265625, 0.4116973876953125, 0.438720703125, 0.4657440185546875, 0.492767333984375, 0.5197906494140625, 0.54681396484375, 0.5738372802734375, 0.600860595703125, 0.6278839111328125, 0.6549072265625, 0.6819305419921875, 0.708953857421875, 0.7359771728515625, 0.76300048828125, 0.7900238037109375, 0.817047119140625, 0.8440704345703125, 0.87109375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 10.0, 11.0, 9.0, 24.0, 26.0, 42.0, 71.0, 122.0, 212.0, 167.0, 101.0, 62.0, 44.0, 25.0, 19.0, 11.0, 11.0, 4.0, 7.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80712890625, -0.7747116088867188, -0.7422943115234375, -0.7098770141601562, -0.677459716796875, -0.6450424194335938, -0.6126251220703125, -0.5802078247070312, -0.54779052734375, -0.5153732299804688, -0.4829559326171875, -0.45053863525390625, -0.418121337890625, -0.38570404052734375, -0.3532867431640625, -0.32086944580078125, -0.2884521484375, -0.25603485107421875, -0.2236175537109375, -0.19120025634765625, -0.158782958984375, -0.12636566162109375, -0.0939483642578125, -0.06153106689453125, -0.02911376953125, 0.00330352783203125, 0.0357208251953125, 0.06813812255859375, 0.100555419921875, 0.13297271728515625, 0.1653900146484375, 0.19780731201171875, 0.230224609375, 0.26264190673828125, 0.2950592041015625, 0.32747650146484375, 0.359893798828125, 0.39231109619140625, 0.4247283935546875, 0.45714569091796875, 0.48956298828125, 0.5219802856445312, 0.5543975830078125, 0.5868148803710938, 0.619232177734375, 0.6516494750976562, 0.6840667724609375, 0.7164840698242188, 0.7489013671875, 0.7813186645507812, 0.8137359619140625, 0.8461532592773438, 0.878570556640625, 0.9109878540039062, 0.9434051513671875, 0.9758224487304688, 1.00823974609375, 1.0406570434570312, 1.0730743408203125, 1.1054916381835938, 1.137908935546875, 1.1703262329101562, 1.2027435302734375, 1.2351608276367188, 1.267578125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 9.0, 14.0, 47.0, 111.0, 365.0, 327.0, 72.0, 27.0, 16.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-60.41972351074219, -59.30076217651367, -58.18180465698242, -57.062843322753906, -55.943885803222656, -54.82492446899414, -53.705963134765625, -52.587005615234375, -51.46804428100586, -50.349082946777344, -49.230125427246094, -48.11116409301758, -46.99220275878906, -45.87324523925781, -44.7542839050293, -43.63532638549805, -42.51636505126953, -41.397403717041016, -40.278446197509766, -39.15948486328125, -38.04052734375, -36.921566009521484, -35.80260467529297, -34.68364715576172, -33.5646858215332, -32.44572448730469, -31.326766967773438, -30.207805633544922, -29.08884620666504, -27.969886779785156, -26.85092544555664, -25.731966018676758, -24.61301040649414, -23.494050979614258, -22.375091552734375, -21.25613021850586, -20.137170791625977, -19.018211364746094, -17.899250030517578, -16.780290603637695, -15.661331176757812, -14.54237174987793, -13.42341136932373, -12.304450988769531, -11.185491561889648, -10.066532135009766, -8.947571754455566, -7.828611850738525, -6.709651947021484, -5.590692043304443, -4.471732139587402, -3.3527722358703613, -2.2338123321533203, -1.1148524284362793, 0.004107475280761719, 1.1230673789978027, 2.2420272827148438, 3.3609871864318848, 4.479947090148926, 5.598906993865967, 6.717866897583008, 7.836826801300049, 8.95578670501709, 10.074747085571289, 11.193706512451172]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 7.0, 6.0, 13.0, 13.0, 12.0, 15.0, 9.0, 23.0, 18.0, 36.0, 24.0, 19.0, 22.0, 44.0, 190.0, 248.0, 53.0, 28.0, 26.0, 25.0, 21.0, 28.0, 18.0, 16.0, 12.0, 7.0, 12.0, 5.0, 8.0, 8.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.198326110839844, -11.779027938842773, -11.35973072052002, -10.94043254852295, -10.521134376525879, -10.101837158203125, -9.682538986206055, -9.263240814208984, -8.843942642211914, -8.424644470214844, -8.00534725189209, -7.5860490798950195, -7.166750907897949, -6.747453212738037, -6.328155517578125, -5.908857345581055, -5.489559650421143, -5.0702619552612305, -4.65096378326416, -4.231666088104248, -3.8123679161071777, -3.3930702209472656, -2.9737722873687744, -2.554474353790283, -2.135176420211792, -1.7158784866333008, -1.2965805530548096, -0.8772827386856079, -0.4579848051071167, -0.03868699073791504, 0.38061094284057617, 0.7999088764190674, 1.2192068099975586, 1.6385047435760498, 2.057802677154541, 2.477100372314453, 2.8963985443115234, 3.3156962394714355, 3.7349941730499268, 4.154292106628418, 4.573590278625488, 4.9928879737854, 5.412186145782471, 5.831483840942383, 6.250782012939453, 6.670079708099365, 7.089377403259277, 7.508675575256348, 7.92797327041626, 8.347270965576172, 8.766569137573242, 9.185867309570312, 9.605164527893066, 10.024462699890137, 10.443760871887207, 10.863058090209961, 11.282356262207031, 11.701654434204102, 12.120951652526855, 12.540249824523926, 12.959547996520996, 13.37884521484375, 13.79814338684082, 14.21744155883789, 14.636739730834961]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 7.0, 10.0, 7.0, 15.0, 14.0, 13.0, 15.0, 17.0, 28.0, 22.0, 38.0, 29.0, 52.0, 67.0, 224.0, 119.0, 51.0, 37.0, 37.0, 32.0, 20.0, 16.0, 15.0, 22.0, 17.0, 11.0, 11.0, 13.0, 9.0, 3.0, 6.0, 4.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79638671875, -0.7628860473632812, -0.7293853759765625, -0.6958847045898438, -0.662384033203125, -0.6288833618164062, -0.5953826904296875, -0.5618820190429688, -0.52838134765625, -0.49488067626953125, -0.4613800048828125, -0.42787933349609375, -0.394378662109375, -0.36087799072265625, -0.3273773193359375, -0.29387664794921875, -0.2603759765625, -0.22687530517578125, -0.1933746337890625, -0.15987396240234375, -0.126373291015625, -0.09287261962890625, -0.0593719482421875, -0.02587127685546875, 0.00762939453125, 0.04113006591796875, 0.0746307373046875, 0.10813140869140625, 0.141632080078125, 0.17513275146484375, 0.2086334228515625, 0.24213409423828125, 0.275634765625, 0.30913543701171875, 0.3426361083984375, 0.37613677978515625, 0.409637451171875, 0.44313812255859375, 0.4766387939453125, 0.5101394653320312, 0.54364013671875, 0.5771408081054688, 0.6106414794921875, 0.6441421508789062, 0.677642822265625, 0.7111434936523438, 0.7446441650390625, 0.7781448364257812, 0.8116455078125, 0.8451461791992188, 0.8786468505859375, 0.9121475219726562, 0.945648193359375, 0.9791488647460938, 1.0126495361328125, 1.0461502075195312, 1.07965087890625, 1.1131515502929688, 1.1466522216796875, 1.1801528930664062, 1.213653564453125, 1.2471542358398438, 1.2806549072265625, 1.3141555786132812, 1.34765625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 14.0, 14.0, 14.0, 15.0, 8.0, 18.0, 36.0, 60.0, 132.0, 238.0, 492.0, 1477.0, 5672.0, 196711.0, 8174326.0, 6720.0, 1600.0, 539.0, 207.0, 120.0, 68.0, 26.0, 25.0, 18.0, 10.0, 6.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.052157402038574, -12.690153121948242, -12.328149795532227, -11.966145515441895, -11.604141235351562, -11.24213695526123, -10.880132675170898, -10.518129348754883, -10.15612506866455, -9.794120788574219, -9.432117462158203, -9.070113182067871, -8.708108901977539, -8.346104621887207, -7.984100818634033, -7.622097015380859, -7.260092735290527, -6.898088455200195, -6.5360846519470215, -6.174080848693848, -5.812076568603516, -5.450072288513184, -5.08806848526001, -4.726064682006836, -4.364060401916504, -4.002056121826172, -3.640052318572998, -3.278048276901245, -2.916044235229492, -2.5540401935577393, -2.1920361518859863, -1.8300321102142334, -1.4680290222167969, -1.106024980545044, -0.744020938873291, -0.3820168972015381, -0.020012855529785156, 0.3419911861419678, 0.7039952278137207, 1.0659992694854736, 1.4280033111572266, 1.7900073528289795, 2.1520113945007324, 2.5140154361724854, 2.8760194778442383, 3.238023519515991, 3.600027561187744, 3.962031602859497, 4.32403564453125, 4.686039924621582, 5.048043727874756, 5.41004753112793, 5.772051811218262, 6.134056091308594, 6.496059894561768, 6.858063697814941, 7.220067977905273, 7.5820722579956055, 7.944076061248779, 8.306079864501953, 8.668084144592285, 9.030088424682617, 9.392091751098633, 9.754096031188965, 10.116100311279297]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 1.0, 4.0, 6.0, 3.0, 3.0, 5.0, 4.0, 5.0, 6.0, 2.0, 8.0, 7.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-11.049534797668457, -10.772295951843262, -10.495057106018066, -10.217818260192871, -9.940579414367676, -9.66334056854248, -9.386101722717285, -9.108863830566406, -8.831624984741211, -8.554386138916016, -8.27714729309082, -7.999908447265625, -7.72266960144043, -7.445430755615234, -7.168192386627197, -6.890953540802002, -6.613714218139648, -6.336475372314453, -6.059236526489258, -5.7819976806640625, -5.504758834838867, -5.227519989013672, -4.950281620025635, -4.6730427742004395, -4.395803928375244, -4.118565082550049, -3.8413262367248535, -3.5640876293182373, -3.286848783493042, -3.0096099376678467, -2.7323713302612305, -2.455132484436035, -2.177894115447998, -1.9006552696228027, -1.623416543006897, -1.3461778163909912, -1.068938970565796, -0.7917001247406006, -0.5144613981246948, -0.23722267150878906, 0.04001617431640625, 0.3172549605369568, 0.5944937467575073, 0.8717325329780579, 1.1489713191986084, 1.4262101650238037, 1.7034488916397095, 1.9806876182556152, 2.2579264640808105, 2.535165309906006, 2.812404155731201, 3.0896427631378174, 3.3668816089630127, 3.644120454788208, 3.921359062194824, 4.1985979080200195, 4.475836753845215, 4.75307559967041, 5.0303144454956055, 5.307553291320801, 5.584792137145996, 5.862030982971191, 6.1392693519592285, 6.416508197784424, 6.693747043609619]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 10.0, 7.0, 10.0, 14.0, 32.0, 38.0, 68.0, 105.0, 212.0, 637.0, 2515.0, 15599.0, 145855.0, 313839.0, 38476.0, 5139.0, 1059.0, 343.0, 129.0, 73.0, 40.0, 22.0, 18.0, 6.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.09375, -13.51171875, -12.9296875, -12.34765625, -11.765625, -11.18359375, -10.6015625, -10.01953125, -9.4375, -8.85546875, -8.2734375, -7.69140625, -7.109375, -6.52734375, -5.9453125, -5.36328125, -4.78125, -4.19921875, -3.6171875, -3.03515625, -2.453125, -1.87109375, -1.2890625, -0.70703125, -0.125, 0.45703125, 1.0390625, 1.62109375, 2.203125, 2.78515625, 3.3671875, 3.94921875, 4.53125, 5.11328125, 5.6953125, 6.27734375, 6.859375, 7.44140625, 8.0234375, 8.60546875, 9.1875, 9.76953125, 10.3515625, 10.93359375, 11.515625, 12.09765625, 12.6796875, 13.26171875, 13.84375, 14.42578125, 15.0078125, 15.58984375, 16.171875, 16.75390625, 17.3359375, 17.91796875, 18.5, 19.08203125, 19.6640625, 20.24609375, 20.828125, 21.41015625, 21.9921875, 22.57421875, 23.15625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 5.0, 7.0, 18.0, 20.0, 17.0, 29.0, 39.0, 44.0, 54.0, 68.0, 75.0, 84.0, 88.0, 68.0, 78.0, 65.0, 51.0, 36.0, 56.0, 29.0, 18.0, 5.0, 13.0, 7.0, 4.0, 5.0, 4.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.705078125, -1.655426025390625, -1.60577392578125, -1.556121826171875, -1.5064697265625, -1.456817626953125, -1.40716552734375, -1.357513427734375, -1.307861328125, -1.258209228515625, -1.20855712890625, -1.158905029296875, -1.1092529296875, -1.059600830078125, -1.00994873046875, -0.960296630859375, -0.91064453125, -0.860992431640625, -0.81134033203125, -0.761688232421875, -0.7120361328125, -0.662384033203125, -0.61273193359375, -0.563079833984375, -0.513427734375, -0.463775634765625, -0.41412353515625, -0.364471435546875, -0.3148193359375, -0.265167236328125, -0.21551513671875, -0.165863037109375, -0.1162109375, -0.066558837890625, -0.01690673828125, 0.032745361328125, 0.0823974609375, 0.132049560546875, 0.18170166015625, 0.231353759765625, 0.281005859375, 0.330657958984375, 0.38031005859375, 0.429962158203125, 0.4796142578125, 0.529266357421875, 0.57891845703125, 0.628570556640625, 0.67822265625, 0.727874755859375, 0.77752685546875, 0.827178955078125, 0.8768310546875, 0.926483154296875, 0.97613525390625, 1.025787353515625, 1.075439453125, 1.125091552734375, 1.17474365234375, 1.224395751953125, 1.2740478515625, 1.323699951171875, 1.37335205078125, 1.423004150390625, 1.47265625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 11.0, 9.0, 13.0, 69.0, 135.0, 163.0, 50.0, 16.0, 9.0, 7.0, 2.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.818909645080566, -8.232321739196777, -7.6457343101501465, -7.059146881103516, -6.472558975219727, -5.885971546173096, -5.299384117126465, -4.712796211242676, -4.126208782196045, -3.539621114730835, -2.953033447265625, -2.366446018218994, -1.7798583507537842, -1.1932706832885742, -0.6066832542419434, -0.020095348358154297, 0.5664920806884766, 1.1530797481536865, 1.739667296409607, 2.3262548446655273, 2.9128425121307373, 3.4994301795959473, 4.086017608642578, 4.672605514526367, 5.259192943572998, 5.845780372619629, 6.432368278503418, 7.018955707550049, 7.60554313659668, 8.192131042480469, 8.778718948364258, 9.365306854248047, 9.951892852783203, 10.538480758666992, 11.125067710876465, 11.711655616760254, 12.298243522644043, 12.884830474853516, 13.471418380737305, 14.058006286621094, 14.644594192504883, 15.231182098388672, 15.817769050598145, 16.40435791015625, 16.990943908691406, 17.577531814575195, 18.164119720458984, 18.750707626342773, 19.337295532226562, 19.92388343811035, 20.51047134399414, 21.097057342529297, 21.683645248413086, 22.270233154296875, 22.856821060180664, 23.443408966064453, 24.02999496459961, 24.6165828704834, 25.203170776367188, 25.789756774902344, 26.376344680786133, 26.962932586669922, 27.54952049255371, 28.1361083984375, 28.72269630432129]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 10.0, 6.0, 6.0, 8.0, 39.0, 82.0, 121.0, 99.0, 46.0, 11.0, 12.0, 8.0, 7.0, 9.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.361876487731934, -8.096219062805176, -7.830562114715576, -7.564904689788818, -7.299247741699219, -7.033590316772461, -6.767932891845703, -6.502275466918945, -6.236618518829346, -5.970961093902588, -5.705304145812988, -5.4396467208862305, -5.173989295959473, -4.908332347869873, -4.642674922943115, -4.377017974853516, -4.111360549926758, -3.845703363418579, -3.5800461769104004, -3.3143887519836426, -3.048731565475464, -2.783074378967285, -2.5174169540405273, -2.2517597675323486, -1.98610258102417, -1.7204453945159912, -1.454788088798523, -1.1891307830810547, -0.923473596572876, -0.6578164100646973, -0.392159104347229, -0.12650179862976074, 0.13915634155273438, 0.40481358766555786, 0.6704708337783813, 0.9361280798912048, 1.2017853260040283, 1.467442512512207, 1.7330998182296753, 1.9987571239471436, 2.2644143104553223, 2.530071496963501, 2.7957286834716797, 3.0613861083984375, 3.327043294906616, 3.592700481414795, 3.8583579063415527, 4.124014854431152, 4.38967227935791, 4.655329704284668, 4.920986652374268, 5.186644077301025, 5.452301025390625, 5.717958450317383, 5.983615875244141, 6.249273300170898, 6.514930248260498, 6.780587673187256, 7.0462446212768555, 7.311902046203613, 7.577559471130371, 7.843216419219971, 8.10887336730957, 8.374530792236328, 8.640188217163086]}, "eval/loss": 4.305517673492432, "eval/wer": 1.9549980166600556, "eval/runtime": 784.9234, "eval/samples_per_second": 3.366, "eval/steps_per_second": 0.282, "train/train_runtime": 6633.4843, "train/train_samples_per_second": 4.302, "train/train_steps_per_second": 0.179, "train/total_flos": 0.0, "train/train_loss": 4.355411059521546} \ No newline at end of file