diff --git "a/wandb/run-20220324_170220-1u8cita3/files/wandb-summary.json" "b/wandb/run-20220324_170220-1u8cita3/files/wandb-summary.json" --- "a/wandb/run-20220324_170220-1u8cita3/files/wandb-summary.json" +++ "b/wandb/run-20220324_170220-1u8cita3/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.4226, "train/learning_rate": 1.267605633802817e-08, "train/epoch": 25.0, "train/global_step": 22300, "_runtime": 35320, "_timestamp": 1648176660, "_step": 5803, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 5.0, 6.0, 7.0, 11.0, 11.0, 20.0, 11.0, 14.0, 23.0, 26.0, 38.0, 45.0, 46.0, 65.0, 51.0, 60.0, 89.0, 87.0, 60.0, 64.0, 45.0, 40.0, 34.0, 22.0, 25.0, 14.0, 13.0, 11.0, 11.0, 8.0, 3.0, 5.0, 7.0, 6.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.9212875366211, -70.6487808227539, -68.37626647949219, -66.103759765625, -63.83124542236328, -61.558738708496094, -59.28622817993164, -57.01371765136719, -54.741207122802734, -52.46869659423828, -50.19618606567383, -47.923675537109375, -45.65116882324219, -43.37865447998047, -41.10614776611328, -38.83363723754883, -36.561126708984375, -34.28861618041992, -32.01610565185547, -29.74359703063965, -27.471086502075195, -25.198575973510742, -22.926067352294922, -20.65355682373047, -18.381046295166016, -16.108535766601562, -13.836026191711426, -11.563516616821289, -9.291006088256836, -7.018495559692383, -4.745985984802246, -2.4734764099121094, -0.200958251953125, 2.07155179977417, 4.344061851501465, 6.61657190322876, 8.889081954956055, 11.161592483520508, 13.434102058410645, 15.706611633300781, 17.979122161865234, 20.251632690429688, 22.52414321899414, 24.79665184020996, 27.069162368774414, 29.341672897338867, 31.614181518554688, 33.88669204711914, 36.159202575683594, 38.43171310424805, 40.7042236328125, 42.97673416137695, 45.249244689941406, 47.521751403808594, 49.79426193237305, 52.0667724609375, 54.33928298950195, 56.611793518066406, 58.88430404663086, 61.15681457519531, 63.4293212890625, 65.70183563232422, 67.9743423461914, 70.24685668945312, 72.51936340332031]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 7.0, 5.0, 10.0, 12.0, 19.0, 19.0, 23.0, 12.0, 26.0, 25.0, 37.0, 27.0, 17.0, 37.0, 38.0, 45.0, 38.0, 52.0, 47.0, 29.0, 52.0, 38.0, 43.0, 46.0, 35.0, 37.0, 25.0, 26.0, 29.0, 22.0, 33.0, 14.0, 17.0, 18.0, 12.0, 4.0, 6.0, 6.0, 5.0, 5.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.53594207763672, -54.687095642089844, -52.8382453918457, -50.98939895629883, -49.14055252075195, -47.29170227050781, -45.44285583496094, -43.59400939941406, -41.74516296386719, -39.89631652832031, -38.04746627807617, -36.1986198425293, -34.34977340698242, -32.50092315673828, -30.652076721191406, -28.80323028564453, -26.954381942749023, -25.105533599853516, -23.25668716430664, -21.407838821411133, -19.558992385864258, -17.71014404296875, -15.861296653747559, -14.012449264526367, -12.163601875305176, -10.314754486083984, -8.465907096862793, -6.617059230804443, -4.768211841583252, -2.9193639755249023, -1.070516586303711, 0.7783308029174805, 2.627178192138672, 4.476025581359863, 6.324872970581055, 8.173721313476562, 10.022567749023438, 11.871416091918945, 13.720263481140137, 15.569110870361328, 17.417957305908203, 19.26680564880371, 21.115652084350586, 22.964500427246094, 24.81334686279297, 26.662195205688477, 28.511043548583984, 30.35988998413086, 32.208740234375, 34.057586669921875, 35.906436920166016, 37.75528335571289, 39.604129791259766, 41.452980041503906, 43.30182647705078, 45.150672912597656, 46.99951934814453, 48.848365783691406, 50.69721603393555, 52.54606246948242, 54.3949089050293, 56.24375915527344, 58.09260559082031, 59.94145202636719, 61.79029846191406]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 10.0, 10.0, 21.0, 26.0, 44.0, 83.0, 134.0, 211.0, 327.0, 586.0, 931.0, 1394.0, 2381.0, 3782.0, 6175.0, 10901.0, 18717.0, 34611.0, 67966.0, 161762.0, 685990.0, 2363443.0, 548131.0, 146489.0, 64826.0, 32758.0, 17488.0, 9830.0, 5845.0, 3556.0, 2130.0, 1248.0, 867.0, 542.0, 362.0, 241.0, 149.0, 93.0, 73.0, 40.0, 38.0, 33.0, 15.0, 11.0, 8.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-158.25, -152.685546875, -147.12109375, -141.556640625, -135.9921875, -130.427734375, -124.86328125, -119.298828125, -113.734375, -108.169921875, -102.60546875, -97.041015625, -91.4765625, -85.912109375, -80.34765625, -74.783203125, -69.21875, -63.654296875, -58.08984375, -52.525390625, -46.9609375, -41.396484375, -35.83203125, -30.267578125, -24.703125, -19.138671875, -13.57421875, -8.009765625, -2.4453125, 3.119140625, 8.68359375, 14.248046875, 19.8125, 25.376953125, 30.94140625, 36.505859375, 42.0703125, 47.634765625, 53.19921875, 58.763671875, 64.328125, 69.892578125, 75.45703125, 81.021484375, 86.5859375, 92.150390625, 97.71484375, 103.279296875, 108.84375, 114.408203125, 119.97265625, 125.537109375, 131.1015625, 136.666015625, 142.23046875, 147.794921875, 153.359375, 158.923828125, 164.48828125, 170.052734375, 175.6171875, 181.181640625, 186.74609375, 192.310546875, 197.875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 8.0, 4.0, 10.0, 9.0, 13.0, 15.0, 20.0, 23.0, 15.0, 19.0, 24.0, 29.0, 28.0, 38.0, 39.0, 47.0, 41.0, 45.0, 41.0, 34.0, 49.0, 34.0, 40.0, 46.0, 35.0, 36.0, 35.0, 44.0, 21.0, 18.0, 35.0, 22.0, 16.0, 10.0, 6.0, 7.0, 10.0, 8.0, 6.0, 7.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-63.4375, -61.49560546875, -59.5537109375, -57.61181640625, -55.669921875, -53.72802734375, -51.7861328125, -49.84423828125, -47.90234375, -45.96044921875, -44.0185546875, -42.07666015625, -40.134765625, -38.19287109375, -36.2509765625, -34.30908203125, -32.3671875, -30.42529296875, -28.4833984375, -26.54150390625, -24.599609375, -22.65771484375, -20.7158203125, -18.77392578125, -16.83203125, -14.89013671875, -12.9482421875, -11.00634765625, -9.064453125, -7.12255859375, -5.1806640625, -3.23876953125, -1.296875, 0.64501953125, 2.5869140625, 4.52880859375, 6.470703125, 8.41259765625, 10.3544921875, 12.29638671875, 14.23828125, 16.18017578125, 18.1220703125, 20.06396484375, 22.005859375, 23.94775390625, 25.8896484375, 27.83154296875, 29.7734375, 31.71533203125, 33.6572265625, 35.59912109375, 37.541015625, 39.48291015625, 41.4248046875, 43.36669921875, 45.30859375, 47.25048828125, 49.1923828125, 51.13427734375, 53.076171875, 55.01806640625, 56.9599609375, 58.90185546875, 60.84375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 8.0, 18.0, 12.0, 27.0, 40.0, 59.0, 61.0, 123.0, 172.0, 219.0, 378.0, 518.0, 799.0, 1188.0, 1920.0, 2780.0, 4217.0, 6438.0, 10368.0, 17425.0, 29950.0, 54812.0, 111080.0, 264698.0, 961221.0, 1966680.0, 431117.0, 157512.0, 73304.0, 39152.0, 21986.0, 13041.0, 8045.0, 5078.0, 3254.0, 2147.0, 1441.0, 980.0, 662.0, 416.0, 313.0, 210.0, 133.0, 101.0, 55.0, 43.0, 30.0, 21.0, 10.0, 13.0, 8.0, 5.0, 2.0, 2.0, 2.0], "bins": [-144.5, -140.27734375, -136.0546875, -131.83203125, -127.609375, -123.38671875, -119.1640625, -114.94140625, -110.71875, -106.49609375, -102.2734375, -98.05078125, -93.828125, -89.60546875, -85.3828125, -81.16015625, -76.9375, -72.71484375, -68.4921875, -64.26953125, -60.046875, -55.82421875, -51.6015625, -47.37890625, -43.15625, -38.93359375, -34.7109375, -30.48828125, -26.265625, -22.04296875, -17.8203125, -13.59765625, -9.375, -5.15234375, -0.9296875, 3.29296875, 7.515625, 11.73828125, 15.9609375, 20.18359375, 24.40625, 28.62890625, 32.8515625, 37.07421875, 41.296875, 45.51953125, 49.7421875, 53.96484375, 58.1875, 62.41015625, 66.6328125, 70.85546875, 75.078125, 79.30078125, 83.5234375, 87.74609375, 91.96875, 96.19140625, 100.4140625, 104.63671875, 108.859375, 113.08203125, 117.3046875, 121.52734375, 125.75]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 4.0, 13.0, 10.0, 9.0, 24.0, 25.0, 23.0, 27.0, 39.0, 34.0, 58.0, 85.0, 121.0, 139.0, 177.0, 279.0, 392.0, 639.0, 571.0, 368.0, 270.0, 182.0, 125.0, 92.0, 82.0, 67.0, 38.0, 33.0, 21.0, 28.0, 15.0, 11.0, 12.0, 10.0, 9.0, 9.0, 6.0, 5.0, 2.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-45.4375, -44.05517578125, -42.6728515625, -41.29052734375, -39.908203125, -38.52587890625, -37.1435546875, -35.76123046875, -34.37890625, -32.99658203125, -31.6142578125, -30.23193359375, -28.849609375, -27.46728515625, -26.0849609375, -24.70263671875, -23.3203125, -21.93798828125, -20.5556640625, -19.17333984375, -17.791015625, -16.40869140625, -15.0263671875, -13.64404296875, -12.26171875, -10.87939453125, -9.4970703125, -8.11474609375, -6.732421875, -5.35009765625, -3.9677734375, -2.58544921875, -1.203125, 0.17919921875, 1.5615234375, 2.94384765625, 4.326171875, 5.70849609375, 7.0908203125, 8.47314453125, 9.85546875, 11.23779296875, 12.6201171875, 14.00244140625, 15.384765625, 16.76708984375, 18.1494140625, 19.53173828125, 20.9140625, 22.29638671875, 23.6787109375, 25.06103515625, 26.443359375, 27.82568359375, 29.2080078125, 30.59033203125, 31.97265625, 33.35498046875, 34.7373046875, 36.11962890625, 37.501953125, 38.88427734375, 40.2666015625, 41.64892578125, 43.03125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 10.0, 8.0, 7.0, 16.0, 8.0, 20.0, 26.0, 29.0, 43.0, 62.0, 83.0, 100.0, 122.0, 107.0, 85.0, 76.0, 42.0, 34.0, 32.0, 24.0, 19.0, 6.0, 11.0, 12.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.39942932128906, -132.21673583984375, -128.0340576171875, -123.85136413574219, -119.66867065429688, -115.4859848022461, -111.30329895019531, -107.12060546875, -102.93791961669922, -98.75523376464844, -94.57254028320312, -90.38985443115234, -86.20716857910156, -82.02447509765625, -77.84178924560547, -73.65910339355469, -69.47640991210938, -65.2937240600586, -61.11103057861328, -56.9283447265625, -52.74565505981445, -48.562965393066406, -44.380279541015625, -40.19758987426758, -36.01490020751953, -31.832210540771484, -27.64952278137207, -23.466835021972656, -19.28414535522461, -15.101455688476562, -10.918767929077148, -6.736080169677734, -2.55340576171875, 1.6292829513549805, 5.811971664428711, 9.994660377502441, 14.177349090576172, 18.36003875732422, 22.542726516723633, 26.725414276123047, 30.908103942871094, 35.09079360961914, 39.27348327636719, 43.45616912841797, 47.638858795166016, 51.82154846191406, 56.004234313964844, 60.18692398071289, 64.36961364746094, 68.55229949951172, 72.73499298095703, 76.91767883300781, 81.10037231445312, 85.2830581665039, 89.46574401855469, 93.6484375, 97.83112335205078, 102.01380920410156, 106.19650268554688, 110.37918853759766, 114.56187438964844, 118.74456787109375, 122.92725372314453, 127.10993957519531, 131.29263305664062]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 4.0, 7.0, 7.0, 13.0, 7.0, 15.0, 11.0, 20.0, 22.0, 25.0, 22.0, 38.0, 24.0, 36.0, 46.0, 43.0, 41.0, 46.0, 53.0, 46.0, 52.0, 39.0, 45.0, 42.0, 40.0, 20.0, 33.0, 29.0, 28.0, 20.0, 21.0, 16.0, 15.0, 12.0, 12.0, 8.0, 10.0, 10.0, 9.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-74.71490478515625, -72.24452209472656, -69.7741470336914, -67.30377197265625, -64.83338928222656, -62.36301040649414, -59.89263153076172, -57.4222526550293, -54.951873779296875, -52.48149490356445, -50.01111602783203, -47.54073715209961, -45.07035827636719, -42.599979400634766, -40.129600524902344, -37.65922164916992, -35.1888427734375, -32.71846389770508, -30.248085021972656, -27.777706146240234, -25.307327270507812, -22.83694839477539, -20.36656951904297, -17.896190643310547, -15.425811767578125, -12.955432891845703, -10.485054016113281, -8.01467514038086, -5.5442962646484375, -3.0739173889160156, -0.6035385131835938, 1.8668403625488281, 4.337226867675781, 6.807605743408203, 9.277984619140625, 11.748363494873047, 14.218742370605469, 16.68912124633789, 19.159500122070312, 21.629878997802734, 24.100257873535156, 26.570636749267578, 29.041015625, 31.511394500732422, 33.981773376464844, 36.452152252197266, 38.92253112792969, 41.39291000366211, 43.86328887939453, 46.33366775512695, 48.804046630859375, 51.2744255065918, 53.74480438232422, 56.21518325805664, 58.68556213378906, 61.155941009521484, 63.626319885253906, 66.09669494628906, 68.56707763671875, 71.03746032714844, 73.5078353881836, 75.97821044921875, 78.44859313964844, 80.91897583007812, 83.38935089111328]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 8.0, 8.0, 8.0, 19.0, 26.0, 35.0, 52.0, 72.0, 118.0, 150.0, 238.0, 300.0, 445.0, 676.0, 925.0, 1418.0, 2052.0, 3065.0, 4531.0, 6650.0, 10002.0, 15085.0, 23352.0, 37639.0, 62513.0, 109378.0, 212042.0, 244831.0, 125036.0, 69905.0, 41915.0, 26019.0, 16541.0, 10825.0, 7336.0, 4831.0, 3302.0, 2227.0, 1539.0, 1116.0, 706.0, 496.0, 325.0, 240.0, 180.0, 118.0, 93.0, 54.0, 35.0, 26.0, 21.0, 17.0, 4.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0], "bins": [-36.90625, -35.7568359375, -34.607421875, -33.4580078125, -32.30859375, -31.1591796875, -30.009765625, -28.8603515625, -27.7109375, -26.5615234375, -25.412109375, -24.2626953125, -23.11328125, -21.9638671875, -20.814453125, -19.6650390625, -18.515625, -17.3662109375, -16.216796875, -15.0673828125, -13.91796875, -12.7685546875, -11.619140625, -10.4697265625, -9.3203125, -8.1708984375, -7.021484375, -5.8720703125, -4.72265625, -3.5732421875, -2.423828125, -1.2744140625, -0.125, 1.0244140625, 2.173828125, 3.3232421875, 4.47265625, 5.6220703125, 6.771484375, 7.9208984375, 9.0703125, 10.2197265625, 11.369140625, 12.5185546875, 13.66796875, 14.8173828125, 15.966796875, 17.1162109375, 18.265625, 19.4150390625, 20.564453125, 21.7138671875, 22.86328125, 24.0126953125, 25.162109375, 26.3115234375, 27.4609375, 28.6103515625, 29.759765625, 30.9091796875, 32.05859375, 33.2080078125, 34.357421875, 35.5068359375, 36.65625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 7.0, 10.0, 9.0, 12.0, 11.0, 15.0, 14.0, 22.0, 26.0, 31.0, 27.0, 31.0, 37.0, 43.0, 46.0, 40.0, 60.0, 61.0, 54.0, 51.0, 54.0, 39.0, 34.0, 39.0, 23.0, 29.0, 25.0, 22.0, 11.0, 21.0, 15.0, 15.0, 12.0, 8.0, 10.0, 8.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.875, -79.2421875, -76.609375, -73.9765625, -71.34375, -68.7109375, -66.078125, -63.4453125, -60.8125, -58.1796875, -55.546875, -52.9140625, -50.28125, -47.6484375, -45.015625, -42.3828125, -39.75, -37.1171875, -34.484375, -31.8515625, -29.21875, -26.5859375, -23.953125, -21.3203125, -18.6875, -16.0546875, -13.421875, -10.7890625, -8.15625, -5.5234375, -2.890625, -0.2578125, 2.375, 5.0078125, 7.640625, 10.2734375, 12.90625, 15.5390625, 18.171875, 20.8046875, 23.4375, 26.0703125, 28.703125, 31.3359375, 33.96875, 36.6015625, 39.234375, 41.8671875, 44.5, 47.1328125, 49.765625, 52.3984375, 55.03125, 57.6640625, 60.296875, 62.9296875, 65.5625, 68.1953125, 70.828125, 73.4609375, 76.09375, 78.7265625, 81.359375, 83.9921875, 86.625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 16.0, 12.0, 21.0, 26.0, 45.0, 75.0, 131.0, 225.0, 492.0, 1114.0, 2880.0, 8596.0, 33849.0, 919540.0, 62954.0, 11954.0, 3874.0, 1440.0, 627.0, 265.0, 146.0, 87.0, 48.0, 29.0, 26.0, 13.0, 17.0, 10.0, 6.0, 9.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.75, -107.84765625, -103.9453125, -100.04296875, -96.140625, -92.23828125, -88.3359375, -84.43359375, -80.53125, -76.62890625, -72.7265625, -68.82421875, -64.921875, -61.01953125, -57.1171875, -53.21484375, -49.3125, -45.41015625, -41.5078125, -37.60546875, -33.703125, -29.80078125, -25.8984375, -21.99609375, -18.09375, -14.19140625, -10.2890625, -6.38671875, -2.484375, 1.41796875, 5.3203125, 9.22265625, 13.125, 17.02734375, 20.9296875, 24.83203125, 28.734375, 32.63671875, 36.5390625, 40.44140625, 44.34375, 48.24609375, 52.1484375, 56.05078125, 59.953125, 63.85546875, 67.7578125, 71.66015625, 75.5625, 79.46484375, 83.3671875, 87.26953125, 91.171875, 95.07421875, 98.9765625, 102.87890625, 106.78125, 110.68359375, 114.5859375, 118.48828125, 122.390625, 126.29296875, 130.1953125, 134.09765625, 138.0]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 7.0, 6.0, 11.0, 17.0, 13.0, 15.0, 23.0, 29.0, 22.0, 20.0, 23.0, 17.0, 31.0, 35.0, 43.0, 37.0, 34.0, 36.0, 47.0, 35.0, 40.0, 44.0, 33.0, 30.0, 41.0, 49.0, 24.0, 28.0, 34.0, 27.0, 28.0, 13.0, 15.0, 12.0, 18.0, 12.0, 9.0, 5.0, 8.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.53125, -48.93505859375, -47.3388671875, -45.74267578125, -44.146484375, -42.55029296875, -40.9541015625, -39.35791015625, -37.76171875, -36.16552734375, -34.5693359375, -32.97314453125, -31.376953125, -29.78076171875, -28.1845703125, -26.58837890625, -24.9921875, -23.39599609375, -21.7998046875, -20.20361328125, -18.607421875, -17.01123046875, -15.4150390625, -13.81884765625, -12.22265625, -10.62646484375, -9.0302734375, -7.43408203125, -5.837890625, -4.24169921875, -2.6455078125, -1.04931640625, 0.546875, 2.14306640625, 3.7392578125, 5.33544921875, 6.931640625, 8.52783203125, 10.1240234375, 11.72021484375, 13.31640625, 14.91259765625, 16.5087890625, 18.10498046875, 19.701171875, 21.29736328125, 22.8935546875, 24.48974609375, 26.0859375, 27.68212890625, 29.2783203125, 30.87451171875, 32.470703125, 34.06689453125, 35.6630859375, 37.25927734375, 38.85546875, 40.45166015625, 42.0478515625, 43.64404296875, 45.240234375, 46.83642578125, 48.4326171875, 50.02880859375, 51.625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 12.0, 11.0, 15.0, 21.0, 30.0, 33.0, 43.0, 59.0, 83.0, 126.0, 208.0, 435.0, 794.0, 1796.0, 5140.0, 21582.0, 946542.0, 57893.0, 8498.0, 2769.0, 1117.0, 524.0, 268.0, 146.0, 107.0, 76.0, 49.0, 30.0, 29.0, 30.0, 15.0, 12.0, 10.0, 5.0, 8.0, 2.0, 7.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-26.3125, -25.5078125, -24.703125, -23.8984375, -23.09375, -22.2890625, -21.484375, -20.6796875, -19.875, -19.0703125, -18.265625, -17.4609375, -16.65625, -15.8515625, -15.046875, -14.2421875, -13.4375, -12.6328125, -11.828125, -11.0234375, -10.21875, -9.4140625, -8.609375, -7.8046875, -7.0, -6.1953125, -5.390625, -4.5859375, -3.78125, -2.9765625, -2.171875, -1.3671875, -0.5625, 0.2421875, 1.046875, 1.8515625, 2.65625, 3.4609375, 4.265625, 5.0703125, 5.875, 6.6796875, 7.484375, 8.2890625, 9.09375, 9.8984375, 10.703125, 11.5078125, 12.3125, 13.1171875, 13.921875, 14.7265625, 15.53125, 16.3359375, 17.140625, 17.9453125, 18.75, 19.5546875, 20.359375, 21.1640625, 21.96875, 22.7734375, 23.578125, 24.3828125, 25.1875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 10.0, 7.0, 16.0, 22.0, 27.0, 39.0, 49.0, 70.0, 83.0, 108.0, 101.0, 105.0, 96.0, 77.0, 44.0, 32.0, 31.0, 24.0, 13.0, 13.0, 11.0, 6.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014286041259765625, -0.0013845711946487427, -0.0013405382633209229, -0.001296505331993103, -0.0012524724006652832, -0.0012084394693374634, -0.0011644065380096436, -0.0011203736066818237, -0.001076340675354004, -0.001032307744026184, -0.0009882748126983643, -0.0009442418813705444, -0.0009002089500427246, -0.0008561760187149048, -0.000812143087387085, -0.0007681101560592651, -0.0007240772247314453, -0.0006800442934036255, -0.0006360113620758057, -0.0005919784307479858, -0.000547945499420166, -0.0005039125680923462, -0.00045987963676452637, -0.00041584670543670654, -0.0003718137741088867, -0.0003277808427810669, -0.00028374791145324707, -0.00023971498012542725, -0.00019568204879760742, -0.0001516491174697876, -0.00010761618614196777, -6.358325481414795e-05, -1.9550323486328125e-05, 2.44826078414917e-05, 6.851553916931152e-05, 0.00011254847049713135, 0.00015658140182495117, 0.000200614333152771, 0.0002446472644805908, 0.00028868019580841064, 0.00033271312713623047, 0.0003767460584640503, 0.0004207789897918701, 0.00046481192111968994, 0.0005088448524475098, 0.0005528777837753296, 0.0005969107151031494, 0.0006409436464309692, 0.0006849765777587891, 0.0007290095090866089, 0.0007730424404144287, 0.0008170753717422485, 0.0008611083030700684, 0.0009051412343978882, 0.000949174165725708, 0.0009932070970535278, 0.0010372400283813477, 0.0010812729597091675, 0.0011253058910369873, 0.0011693388223648071, 0.001213371753692627, 0.0012574046850204468, 0.0013014376163482666, 0.0013454705476760864, 0.0013895034790039062]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 11.0, 11.0, 10.0, 20.0, 33.0, 49.0, 44.0, 76.0, 108.0, 146.0, 217.0, 306.0, 352.0, 492.0, 681.0, 911.0, 1266.0, 1732.0, 2524.0, 3726.0, 6371.0, 12084.0, 28814.0, 88302.0, 439730.0, 333502.0, 73171.0, 25142.0, 10758.0, 5804.0, 3628.0, 2362.0, 1669.0, 1200.0, 856.0, 671.0, 457.0, 315.0, 284.0, 207.0, 162.0, 98.0, 58.0, 56.0, 45.0, 37.0, 27.0, 14.0, 5.0, 6.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.171875, -18.589599609375, -18.00732421875, -17.425048828125, -16.8427734375, -16.260498046875, -15.67822265625, -15.095947265625, -14.513671875, -13.931396484375, -13.34912109375, -12.766845703125, -12.1845703125, -11.602294921875, -11.02001953125, -10.437744140625, -9.85546875, -9.273193359375, -8.69091796875, -8.108642578125, -7.5263671875, -6.944091796875, -6.36181640625, -5.779541015625, -5.197265625, -4.614990234375, -4.03271484375, -3.450439453125, -2.8681640625, -2.285888671875, -1.70361328125, -1.121337890625, -0.5390625, 0.043212890625, 0.62548828125, 1.207763671875, 1.7900390625, 2.372314453125, 2.95458984375, 3.536865234375, 4.119140625, 4.701416015625, 5.28369140625, 5.865966796875, 6.4482421875, 7.030517578125, 7.61279296875, 8.195068359375, 8.77734375, 9.359619140625, 9.94189453125, 10.524169921875, 11.1064453125, 11.688720703125, 12.27099609375, 12.853271484375, 13.435546875, 14.017822265625, 14.60009765625, 15.182373046875, 15.7646484375, 16.346923828125, 16.92919921875, 17.511474609375, 18.09375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 3.0, 5.0, 7.0, 6.0, 12.0, 16.0, 18.0, 28.0, 24.0, 32.0, 61.0, 59.0, 70.0, 64.0, 81.0, 69.0, 77.0, 64.0, 57.0, 44.0, 43.0, 32.0, 42.0, 20.0, 9.0, 15.0, 8.0, 6.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.880859375, -2.770904541015625, -2.66094970703125, -2.550994873046875, -2.4410400390625, -2.331085205078125, -2.22113037109375, -2.111175537109375, -2.001220703125, -1.891265869140625, -1.78131103515625, -1.671356201171875, -1.5614013671875, -1.451446533203125, -1.34149169921875, -1.231536865234375, -1.12158203125, -1.011627197265625, -0.90167236328125, -0.791717529296875, -0.6817626953125, -0.571807861328125, -0.46185302734375, -0.351898193359375, -0.241943359375, -0.131988525390625, -0.02203369140625, 0.087921142578125, 0.1978759765625, 0.307830810546875, 0.41778564453125, 0.527740478515625, 0.6376953125, 0.747650146484375, 0.85760498046875, 0.967559814453125, 1.0775146484375, 1.187469482421875, 1.29742431640625, 1.407379150390625, 1.517333984375, 1.627288818359375, 1.73724365234375, 1.847198486328125, 1.9571533203125, 2.067108154296875, 2.17706298828125, 2.287017822265625, 2.39697265625, 2.506927490234375, 2.61688232421875, 2.726837158203125, 2.8367919921875, 2.946746826171875, 3.05670166015625, 3.166656494140625, 3.276611328125, 3.386566162109375, 3.49652099609375, 3.606475830078125, 3.7164306640625, 3.826385498046875, 3.93634033203125, 4.046295166015625, 4.15625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 11.0, 10.0, 13.0, 17.0, 13.0, 31.0, 45.0, 43.0, 69.0, 103.0, 116.0, 124.0, 102.0, 72.0, 56.0, 34.0, 42.0, 23.0, 22.0, 9.0, 13.0, 9.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.05120849609375, -131.8037872314453, -127.55636596679688, -123.30895233154297, -119.06153106689453, -114.8141098022461, -110.56669616699219, -106.31927490234375, -102.07185363769531, -97.82443237304688, -93.57701110839844, -89.32959747314453, -85.0821762084961, -80.83475494384766, -76.58734130859375, -72.33992004394531, -68.09249877929688, -63.84507751464844, -59.597660064697266, -55.350242614746094, -51.102821350097656, -46.85540008544922, -42.60798263549805, -38.360565185546875, -34.11314392089844, -29.865724563598633, -25.618305206298828, -21.370885848999023, -17.12346649169922, -12.876047134399414, -8.62862777709961, -4.381208419799805, -0.1337738037109375, 4.113645553588867, 8.361064910888672, 12.608484268188477, 16.85590362548828, 21.103322982788086, 25.35074234008789, 29.598161697387695, 33.8455810546875, 38.09300231933594, 42.34041976928711, 46.58783721923828, 50.83525848388672, 55.082679748535156, 59.33009719848633, 63.5775146484375, 67.82493591308594, 72.07235717773438, 76.31977844238281, 80.56719207763672, 84.81461334228516, 89.0620346069336, 93.3094482421875, 97.55686950683594, 101.80429077148438, 106.05171203613281, 110.29913330078125, 114.54654693603516, 118.7939682006836, 123.04138946533203, 127.28880310058594, 131.53622436523438, 135.7836456298828]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 7.0, 7.0, 10.0, 10.0, 10.0, 14.0, 15.0, 18.0, 21.0, 34.0, 28.0, 30.0, 25.0, 35.0, 50.0, 41.0, 44.0, 41.0, 57.0, 45.0, 47.0, 43.0, 39.0, 48.0, 24.0, 25.0, 35.0, 29.0, 26.0, 18.0, 20.0, 15.0, 16.0, 11.0, 10.0, 11.0, 10.0, 7.0, 8.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-72.27301788330078, -69.8780288696289, -67.48304748535156, -65.08805847167969, -62.693077087402344, -60.298091888427734, -57.903106689453125, -55.50811767578125, -53.113136291503906, -50.7181510925293, -48.32316589355469, -45.92818069458008, -43.53319549560547, -41.13821029663086, -38.74322509765625, -36.348236083984375, -33.953250885009766, -31.558265686035156, -29.163280487060547, -26.768295288085938, -24.373310089111328, -21.97832489013672, -19.583337783813477, -17.188352584838867, -14.793367385864258, -12.398382186889648, -10.003396987915039, -7.608410835266113, -5.213425636291504, -2.8184404373168945, -0.42345428466796875, 1.9715309143066406, 4.36651611328125, 6.761501312255859, 9.156486511230469, 11.551472663879395, 13.946457862854004, 16.341442108154297, 18.73642921447754, 21.13141441345215, 23.526399612426758, 25.921384811401367, 28.316370010375977, 30.71135711669922, 33.10634231567383, 35.50132751464844, 37.89631271362305, 40.291297912597656, 42.686283111572266, 45.081268310546875, 47.476253509521484, 49.871238708496094, 52.2662239074707, 54.66120910644531, 57.05619812011719, 59.45117950439453, 61.846168518066406, 64.24115753173828, 66.63613891601562, 69.0311279296875, 71.42610931396484, 73.82109832763672, 76.21607971191406, 78.61106872558594, 81.00605010986328]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 0.0, 7.0, 9.0, 9.0, 23.0, 35.0, 40.0, 64.0, 83.0, 136.0, 194.0, 277.0, 430.0, 640.0, 981.0, 1567.0, 2528.0, 3755.0, 6369.0, 11011.0, 19240.0, 36117.0, 71115.0, 146939.0, 287531.0, 228464.0, 110071.0, 54486.0, 27885.0, 15306.0, 8896.0, 5282.0, 3225.0, 1959.0, 1356.0, 830.0, 549.0, 357.0, 283.0, 166.0, 97.0, 80.0, 57.0, 39.0, 17.0, 18.0, 6.0, 6.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-132.625, -128.455078125, -124.28515625, -120.115234375, -115.9453125, -111.775390625, -107.60546875, -103.435546875, -99.265625, -95.095703125, -90.92578125, -86.755859375, -82.5859375, -78.416015625, -74.24609375, -70.076171875, -65.90625, -61.736328125, -57.56640625, -53.396484375, -49.2265625, -45.056640625, -40.88671875, -36.716796875, -32.546875, -28.376953125, -24.20703125, -20.037109375, -15.8671875, -11.697265625, -7.52734375, -3.357421875, 0.8125, 4.982421875, 9.15234375, 13.322265625, 17.4921875, 21.662109375, 25.83203125, 30.001953125, 34.171875, 38.341796875, 42.51171875, 46.681640625, 50.8515625, 55.021484375, 59.19140625, 63.361328125, 67.53125, 71.701171875, 75.87109375, 80.041015625, 84.2109375, 88.380859375, 92.55078125, 96.720703125, 100.890625, 105.060546875, 109.23046875, 113.400390625, 117.5703125, 121.740234375, 125.91015625, 130.080078125, 134.25]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 8.0, 11.0, 9.0, 11.0, 9.0, 22.0, 18.0, 28.0, 20.0, 33.0, 29.0, 41.0, 49.0, 44.0, 50.0, 51.0, 56.0, 51.0, 55.0, 50.0, 38.0, 44.0, 30.0, 29.0, 34.0, 26.0, 18.0, 18.0, 15.0, 17.0, 17.0, 8.0, 12.0, 9.0, 7.0, 9.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-76.0, -73.4814453125, -70.962890625, -68.4443359375, -65.92578125, -63.4072265625, -60.888671875, -58.3701171875, -55.8515625, -53.3330078125, -50.814453125, -48.2958984375, -45.77734375, -43.2587890625, -40.740234375, -38.2216796875, -35.703125, -33.1845703125, -30.666015625, -28.1474609375, -25.62890625, -23.1103515625, -20.591796875, -18.0732421875, -15.5546875, -13.0361328125, -10.517578125, -7.9990234375, -5.48046875, -2.9619140625, -0.443359375, 2.0751953125, 4.59375, 7.1123046875, 9.630859375, 12.1494140625, 14.66796875, 17.1865234375, 19.705078125, 22.2236328125, 24.7421875, 27.2607421875, 29.779296875, 32.2978515625, 34.81640625, 37.3349609375, 39.853515625, 42.3720703125, 44.890625, 47.4091796875, 49.927734375, 52.4462890625, 54.96484375, 57.4833984375, 60.001953125, 62.5205078125, 65.0390625, 67.5576171875, 70.076171875, 72.5947265625, 75.11328125, 77.6318359375, 80.150390625, 82.6689453125, 85.1875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 9.0, 6.0, 3.0, 8.0, 14.0, 17.0, 27.0, 40.0, 58.0, 91.0, 149.0, 217.0, 354.0, 521.0, 878.0, 1416.0, 2378.0, 3933.0, 6984.0, 12526.0, 22547.0, 43374.0, 86977.0, 176099.0, 293109.0, 195071.0, 96162.0, 48461.0, 25005.0, 13551.0, 7573.0, 4424.0, 2537.0, 1547.0, 925.0, 533.0, 357.0, 215.0, 148.0, 102.0, 62.0, 47.0, 40.0, 19.0, 18.0, 6.0, 9.0, 2.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-167.125, -161.83203125, -156.5390625, -151.24609375, -145.953125, -140.66015625, -135.3671875, -130.07421875, -124.78125, -119.48828125, -114.1953125, -108.90234375, -103.609375, -98.31640625, -93.0234375, -87.73046875, -82.4375, -77.14453125, -71.8515625, -66.55859375, -61.265625, -55.97265625, -50.6796875, -45.38671875, -40.09375, -34.80078125, -29.5078125, -24.21484375, -18.921875, -13.62890625, -8.3359375, -3.04296875, 2.25, 7.54296875, 12.8359375, 18.12890625, 23.421875, 28.71484375, 34.0078125, 39.30078125, 44.59375, 49.88671875, 55.1796875, 60.47265625, 65.765625, 71.05859375, 76.3515625, 81.64453125, 86.9375, 92.23046875, 97.5234375, 102.81640625, 108.109375, 113.40234375, 118.6953125, 123.98828125, 129.28125, 134.57421875, 139.8671875, 145.16015625, 150.453125, 155.74609375, 161.0390625, 166.33203125, 171.625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 11.0, 11.0, 13.0, 16.0, 11.0, 17.0, 26.0, 28.0, 34.0, 29.0, 30.0, 34.0, 42.0, 50.0, 39.0, 53.0, 55.0, 47.0, 45.0, 46.0, 37.0, 31.0, 44.0, 40.0, 29.0, 17.0, 13.0, 20.0, 20.0, 16.0, 15.0, 14.0, 16.0, 4.0, 14.0, 6.0, 8.0, 4.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-51.0, -49.294921875, -47.58984375, -45.884765625, -44.1796875, -42.474609375, -40.76953125, -39.064453125, -37.359375, -35.654296875, -33.94921875, -32.244140625, -30.5390625, -28.833984375, -27.12890625, -25.423828125, -23.71875, -22.013671875, -20.30859375, -18.603515625, -16.8984375, -15.193359375, -13.48828125, -11.783203125, -10.078125, -8.373046875, -6.66796875, -4.962890625, -3.2578125, -1.552734375, 0.15234375, 1.857421875, 3.5625, 5.267578125, 6.97265625, 8.677734375, 10.3828125, 12.087890625, 13.79296875, 15.498046875, 17.203125, 18.908203125, 20.61328125, 22.318359375, 24.0234375, 25.728515625, 27.43359375, 29.138671875, 30.84375, 32.548828125, 34.25390625, 35.958984375, 37.6640625, 39.369140625, 41.07421875, 42.779296875, 44.484375, 46.189453125, 47.89453125, 49.599609375, 51.3046875, 53.009765625, 54.71484375, 56.419921875, 58.125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 4.0, 5.0, 7.0, 7.0, 17.0, 19.0, 20.0, 45.0, 53.0, 57.0, 100.0, 137.0, 202.0, 312.0, 404.0, 590.0, 820.0, 1241.0, 2002.0, 3255.0, 5975.0, 11291.0, 23167.0, 55385.0, 187198.0, 545706.0, 126151.0, 42782.0, 19098.0, 9268.0, 4970.0, 2920.0, 1735.0, 1072.0, 742.0, 506.0, 376.0, 240.0, 214.0, 133.0, 109.0, 62.0, 39.0, 46.0, 19.0, 19.0, 10.0, 11.0, 10.0, 3.0, 1.0, 3.0, 3.0, 1.0], "bins": [-69.3125, -67.3525390625, -65.392578125, -63.4326171875, -61.47265625, -59.5126953125, -57.552734375, -55.5927734375, -53.6328125, -51.6728515625, -49.712890625, -47.7529296875, -45.79296875, -43.8330078125, -41.873046875, -39.9130859375, -37.953125, -35.9931640625, -34.033203125, -32.0732421875, -30.11328125, -28.1533203125, -26.193359375, -24.2333984375, -22.2734375, -20.3134765625, -18.353515625, -16.3935546875, -14.43359375, -12.4736328125, -10.513671875, -8.5537109375, -6.59375, -4.6337890625, -2.673828125, -0.7138671875, 1.24609375, 3.2060546875, 5.166015625, 7.1259765625, 9.0859375, 11.0458984375, 13.005859375, 14.9658203125, 16.92578125, 18.8857421875, 20.845703125, 22.8056640625, 24.765625, 26.7255859375, 28.685546875, 30.6455078125, 32.60546875, 34.5654296875, 36.525390625, 38.4853515625, 40.4453125, 42.4052734375, 44.365234375, 46.3251953125, 48.28515625, 50.2451171875, 52.205078125, 54.1650390625, 56.125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 4.0, 9.0, 15.0, 11.0, 15.0, 29.0, 45.0, 84.0, 195.0, 240.0, 131.0, 59.0, 55.0, 26.0, 21.0, 13.0, 10.0, 9.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00860595703125, -0.008380889892578125, -0.00815582275390625, -0.007930755615234375, -0.0077056884765625, -0.007480621337890625, -0.00725555419921875, -0.007030487060546875, -0.006805419921875, -0.006580352783203125, -0.00635528564453125, -0.006130218505859375, -0.0059051513671875, -0.005680084228515625, -0.00545501708984375, -0.005229949951171875, -0.0050048828125, -0.004779815673828125, -0.00455474853515625, -0.004329681396484375, -0.0041046142578125, -0.003879547119140625, -0.00365447998046875, -0.003429412841796875, -0.003204345703125, -0.002979278564453125, -0.00275421142578125, -0.002529144287109375, -0.0023040771484375, -0.002079010009765625, -0.00185394287109375, -0.001628875732421875, -0.00140380859375, -0.001178741455078125, -0.00095367431640625, -0.000728607177734375, -0.0005035400390625, -0.000278472900390625, -5.340576171875e-05, 0.000171661376953125, 0.000396728515625, 0.000621795654296875, 0.00084686279296875, 0.001071929931640625, 0.0012969970703125, 0.001522064208984375, 0.00174713134765625, 0.001972198486328125, 0.002197265625, 0.002422332763671875, 0.00264739990234375, 0.002872467041015625, 0.0030975341796875, 0.003322601318359375, 0.00354766845703125, 0.003772735595703125, 0.003997802734375, 0.004222869873046875, 0.00444793701171875, 0.004673004150390625, 0.0048980712890625, 0.005123138427734375, 0.00534820556640625, 0.005573272705078125, 0.00579833984375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 0.0, 4.0, 2.0, 1.0, 4.0, 10.0, 3.0, 16.0, 10.0, 12.0, 27.0, 23.0, 40.0, 56.0, 50.0, 83.0, 129.0, 176.0, 254.0, 419.0, 660.0, 1048.0, 1755.0, 3284.0, 6307.0, 13183.0, 36162.0, 165814.0, 655669.0, 111946.0, 27938.0, 10890.0, 5448.0, 2752.0, 1637.0, 918.0, 583.0, 396.0, 260.0, 158.0, 112.0, 71.0, 63.0, 47.0, 44.0, 20.0, 19.0, 19.0, 14.0, 8.0, 5.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-79.625, -77.0048828125, -74.384765625, -71.7646484375, -69.14453125, -66.5244140625, -63.904296875, -61.2841796875, -58.6640625, -56.0439453125, -53.423828125, -50.8037109375, -48.18359375, -45.5634765625, -42.943359375, -40.3232421875, -37.703125, -35.0830078125, -32.462890625, -29.8427734375, -27.22265625, -24.6025390625, -21.982421875, -19.3623046875, -16.7421875, -14.1220703125, -11.501953125, -8.8818359375, -6.26171875, -3.6416015625, -1.021484375, 1.5986328125, 4.21875, 6.8388671875, 9.458984375, 12.0791015625, 14.69921875, 17.3193359375, 19.939453125, 22.5595703125, 25.1796875, 27.7998046875, 30.419921875, 33.0400390625, 35.66015625, 38.2802734375, 40.900390625, 43.5205078125, 46.140625, 48.7607421875, 51.380859375, 54.0009765625, 56.62109375, 59.2412109375, 61.861328125, 64.4814453125, 67.1015625, 69.7216796875, 72.341796875, 74.9619140625, 77.58203125, 80.2021484375, 82.822265625, 85.4423828125, 88.0625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 7.0, 5.0, 14.0, 8.0, 13.0, 20.0, 33.0, 48.0, 59.0, 104.0, 169.0, 164.0, 126.0, 67.0, 49.0, 24.0, 17.0, 16.0, 13.0, 7.0, 13.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-27.734375, -27.02783203125, -26.3212890625, -25.61474609375, -24.908203125, -24.20166015625, -23.4951171875, -22.78857421875, -22.08203125, -21.37548828125, -20.6689453125, -19.96240234375, -19.255859375, -18.54931640625, -17.8427734375, -17.13623046875, -16.4296875, -15.72314453125, -15.0166015625, -14.31005859375, -13.603515625, -12.89697265625, -12.1904296875, -11.48388671875, -10.77734375, -10.07080078125, -9.3642578125, -8.65771484375, -7.951171875, -7.24462890625, -6.5380859375, -5.83154296875, -5.125, -4.41845703125, -3.7119140625, -3.00537109375, -2.298828125, -1.59228515625, -0.8857421875, -0.17919921875, 0.52734375, 1.23388671875, 1.9404296875, 2.64697265625, 3.353515625, 4.06005859375, 4.7666015625, 5.47314453125, 6.1796875, 6.88623046875, 7.5927734375, 8.29931640625, 9.005859375, 9.71240234375, 10.4189453125, 11.12548828125, 11.83203125, 12.53857421875, 13.2451171875, 13.95166015625, 14.658203125, 15.36474609375, 16.0712890625, 16.77783203125, 17.484375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 9.0, 4.0, 4.0, 2.0, 16.0, 13.0, 18.0, 21.0, 33.0, 44.0, 58.0, 86.0, 88.0, 124.0, 107.0, 96.0, 73.0, 51.0, 55.0, 30.0, 17.0, 16.0, 9.0, 12.0, 3.0, 11.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.9215850830078, -139.4133758544922, -134.90516662597656, -130.39697265625, -125.88876342773438, -121.38055419921875, -116.87234497070312, -112.36414337158203, -107.85594177246094, -103.34773254394531, -98.83953094482422, -94.3313217163086, -89.8231201171875, -85.31491088867188, -80.80670166015625, -76.29850006103516, -71.79029083251953, -67.2820816040039, -62.77388000488281, -58.26567077636719, -53.757469177246094, -49.24925994873047, -44.74105453491211, -40.23284912109375, -35.72464370727539, -31.21643829345703, -26.708232879638672, -22.20002555847168, -17.69182014465332, -13.183614730834961, -8.675407409667969, -4.167201995849609, 0.34100341796875, 4.849209308624268, 9.357415199279785, 13.865621566772461, 18.37382698059082, 22.88203239440918, 27.390239715576172, 31.89844512939453, 36.40665054321289, 40.91485595703125, 45.42306137084961, 49.93126678466797, 54.439476013183594, 58.94767761230469, 63.45588684082031, 67.96409606933594, 72.47229766845703, 76.98050689697266, 81.48870849609375, 85.99691772460938, 90.50511932373047, 95.0133285522461, 99.52153015136719, 104.02973937988281, 108.53794860839844, 113.04615783691406, 117.55435943603516, 122.06256866455078, 126.57077026367188, 131.0789794921875, 135.58718872070312, 140.09539794921875, 144.6035919189453]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 7.0, 4.0, 7.0, 6.0, 8.0, 19.0, 16.0, 12.0, 18.0, 13.0, 18.0, 39.0, 35.0, 39.0, 37.0, 58.0, 38.0, 45.0, 41.0, 45.0, 37.0, 52.0, 42.0, 39.0, 41.0, 39.0, 35.0, 31.0, 32.0, 24.0, 21.0, 18.0, 18.0, 13.0, 13.0, 9.0, 9.0, 9.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-82.38619995117188, -79.71418762207031, -77.04216766357422, -74.37014770507812, -71.69813537597656, -69.026123046875, -66.3541030883789, -63.68208694458008, -61.01007080078125, -58.33805465698242, -55.666038513183594, -52.994022369384766, -50.32200622558594, -47.64999008178711, -44.97797393798828, -42.30595779418945, -39.633941650390625, -36.9619255065918, -34.28990936279297, -31.61789321899414, -28.945877075195312, -26.273860931396484, -23.601844787597656, -20.929828643798828, -18.2578125, -15.585796356201172, -12.913780212402344, -10.241764068603516, -7.5697479248046875, -4.897731781005859, -2.2257156372070312, 0.4463005065917969, 3.1183090209960938, 5.790325164794922, 8.46234130859375, 11.134357452392578, 13.806373596191406, 16.478389739990234, 19.150405883789062, 21.82242202758789, 24.49443817138672, 27.166454315185547, 29.838470458984375, 32.5104866027832, 35.18250274658203, 37.85451889038086, 40.52653503417969, 43.198551177978516, 45.870567321777344, 48.54258346557617, 51.214599609375, 53.88661575317383, 56.558631896972656, 59.230648040771484, 61.90266418457031, 64.57467651367188, 67.24669647216797, 69.91871643066406, 72.59072875976562, 75.26274108886719, 77.93476104736328, 80.60678100585938, 83.27879333496094, 85.9508056640625, 88.6228256225586]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 8.0, 13.0, 23.0, 24.0, 36.0, 59.0, 76.0, 117.0, 171.0, 235.0, 328.0, 456.0, 715.0, 1101.0, 1630.0, 2577.0, 4263.0, 7237.0, 14243.0, 32081.0, 103856.0, 642103.0, 2644515.0, 576792.0, 96305.0, 31504.0, 14129.0, 7367.0, 4394.0, 2699.0, 1740.0, 1144.0, 770.0, 510.0, 368.0, 216.0, 147.0, 109.0, 65.0, 45.0, 31.0, 25.0, 12.0, 14.0, 8.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-181.0, -175.59375, -170.1875, -164.78125, -159.375, -153.96875, -148.5625, -143.15625, -137.75, -132.34375, -126.9375, -121.53125, -116.125, -110.71875, -105.3125, -99.90625, -94.5, -89.09375, -83.6875, -78.28125, -72.875, -67.46875, -62.0625, -56.65625, -51.25, -45.84375, -40.4375, -35.03125, -29.625, -24.21875, -18.8125, -13.40625, -8.0, -2.59375, 2.8125, 8.21875, 13.625, 19.03125, 24.4375, 29.84375, 35.25, 40.65625, 46.0625, 51.46875, 56.875, 62.28125, 67.6875, 73.09375, 78.5, 83.90625, 89.3125, 94.71875, 100.125, 105.53125, 110.9375, 116.34375, 121.75, 127.15625, 132.5625, 137.96875, 143.375, 148.78125, 154.1875, 159.59375, 165.0]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 3.0, 6.0, 14.0, 10.0, 14.0, 13.0, 13.0, 22.0, 19.0, 37.0, 37.0, 38.0, 46.0, 54.0, 47.0, 49.0, 43.0, 59.0, 50.0, 47.0, 38.0, 47.0, 44.0, 38.0, 38.0, 28.0, 17.0, 22.0, 14.0, 22.0, 11.0, 15.0, 10.0, 10.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-81.4375, -78.85546875, -76.2734375, -73.69140625, -71.109375, -68.52734375, -65.9453125, -63.36328125, -60.78125, -58.19921875, -55.6171875, -53.03515625, -50.453125, -47.87109375, -45.2890625, -42.70703125, -40.125, -37.54296875, -34.9609375, -32.37890625, -29.796875, -27.21484375, -24.6328125, -22.05078125, -19.46875, -16.88671875, -14.3046875, -11.72265625, -9.140625, -6.55859375, -3.9765625, -1.39453125, 1.1875, 3.76953125, 6.3515625, 8.93359375, 11.515625, 14.09765625, 16.6796875, 19.26171875, 21.84375, 24.42578125, 27.0078125, 29.58984375, 32.171875, 34.75390625, 37.3359375, 39.91796875, 42.5, 45.08203125, 47.6640625, 50.24609375, 52.828125, 55.41015625, 57.9921875, 60.57421875, 63.15625, 65.73828125, 68.3203125, 70.90234375, 73.484375, 76.06640625, 78.6484375, 81.23046875, 83.8125]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 9.0, 8.0, 15.0, 13.0, 19.0, 47.0, 49.0, 71.0, 82.0, 136.0, 206.0, 279.0, 389.0, 604.0, 880.0, 1234.0, 1931.0, 2954.0, 4645.0, 7504.0, 13340.0, 25530.0, 57206.0, 167293.0, 958999.0, 2459002.0, 323767.0, 88667.0, 35786.0, 17611.0, 9619.0, 5692.0, 3546.0, 2339.0, 1509.0, 1038.0, 655.0, 500.0, 333.0, 237.0, 166.0, 114.0, 72.0, 63.0, 42.0, 26.0, 17.0, 14.0, 14.0, 6.0, 9.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-163.875, -158.453125, -153.03125, -147.609375, -142.1875, -136.765625, -131.34375, -125.921875, -120.5, -115.078125, -109.65625, -104.234375, -98.8125, -93.390625, -87.96875, -82.546875, -77.125, -71.703125, -66.28125, -60.859375, -55.4375, -50.015625, -44.59375, -39.171875, -33.75, -28.328125, -22.90625, -17.484375, -12.0625, -6.640625, -1.21875, 4.203125, 9.625, 15.046875, 20.46875, 25.890625, 31.3125, 36.734375, 42.15625, 47.578125, 53.0, 58.421875, 63.84375, 69.265625, 74.6875, 80.109375, 85.53125, 90.953125, 96.375, 101.796875, 107.21875, 112.640625, 118.0625, 123.484375, 128.90625, 134.328125, 139.75, 145.171875, 150.59375, 156.015625, 161.4375, 166.859375, 172.28125, 177.703125, 183.125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 7.0, 8.0, 9.0, 7.0, 23.0, 19.0, 25.0, 38.0, 54.0, 77.0, 113.0, 194.0, 265.0, 528.0, 889.0, 689.0, 407.0, 236.0, 145.0, 97.0, 54.0, 40.0, 25.0, 23.0, 18.0, 12.0, 14.0, 7.0, 2.0, 13.0, 4.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.5, -45.8486328125, -44.197265625, -42.5458984375, -40.89453125, -39.2431640625, -37.591796875, -35.9404296875, -34.2890625, -32.6376953125, -30.986328125, -29.3349609375, -27.68359375, -26.0322265625, -24.380859375, -22.7294921875, -21.078125, -19.4267578125, -17.775390625, -16.1240234375, -14.47265625, -12.8212890625, -11.169921875, -9.5185546875, -7.8671875, -6.2158203125, -4.564453125, -2.9130859375, -1.26171875, 0.3896484375, 2.041015625, 3.6923828125, 5.34375, 6.9951171875, 8.646484375, 10.2978515625, 11.94921875, 13.6005859375, 15.251953125, 16.9033203125, 18.5546875, 20.2060546875, 21.857421875, 23.5087890625, 25.16015625, 26.8115234375, 28.462890625, 30.1142578125, 31.765625, 33.4169921875, 35.068359375, 36.7197265625, 38.37109375, 40.0224609375, 41.673828125, 43.3251953125, 44.9765625, 46.6279296875, 48.279296875, 49.9306640625, 51.58203125, 53.2333984375, 54.884765625, 56.5361328125, 58.1875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 6.0, 4.0, 3.0, 5.0, 6.0, 8.0, 11.0, 14.0, 15.0, 18.0, 26.0, 31.0, 34.0, 54.0, 46.0, 76.0, 105.0, 98.0, 117.0, 69.0, 54.0, 49.0, 38.0, 30.0, 23.0, 20.0, 8.0, 3.0, 8.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-119.2146987915039, -115.4179916381836, -111.62127685546875, -107.82456970214844, -104.02786254882812, -100.23114776611328, -96.43444061279297, -92.63772583007812, -88.84101867675781, -85.0443115234375, -81.24759674072266, -77.45088958740234, -73.6541748046875, -69.85746765136719, -66.06076049804688, -62.2640495300293, -58.46733856201172, -54.67062759399414, -50.87391662597656, -47.07720947265625, -43.28049850463867, -39.483787536621094, -35.68708038330078, -31.890369415283203, -28.093658447265625, -24.296947479248047, -20.5002384185791, -16.703529357910156, -12.906818389892578, -9.110107421875, -5.313398361206055, -1.5166893005371094, 2.2800140380859375, 6.076724052429199, 9.873434066772461, 13.670144081115723, 17.466854095458984, 21.263565063476562, 25.060274124145508, 28.856983184814453, 32.65369415283203, 36.45040512084961, 40.24711608886719, 44.0438232421875, 47.84053421020508, 51.637245178222656, 55.43395233154297, 59.23066329956055, 63.027374267578125, 66.82408142089844, 70.62079620361328, 74.4175033569336, 78.21421813964844, 82.01092529296875, 85.80763244628906, 89.60433959960938, 93.40105438232422, 97.19776153564453, 100.99447631835938, 104.79118347167969, 108.587890625, 112.38460540771484, 116.18131256103516, 119.97802734375, 123.77473449707031]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 10.0, 11.0, 7.0, 9.0, 7.0, 16.0, 24.0, 21.0, 30.0, 34.0, 25.0, 25.0, 28.0, 35.0, 47.0, 44.0, 39.0, 38.0, 40.0, 46.0, 50.0, 35.0, 43.0, 34.0, 33.0, 33.0, 28.0, 39.0, 24.0, 21.0, 20.0, 20.0, 21.0, 12.0, 7.0, 4.0, 5.0, 4.0, 8.0, 5.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.59225463867188, -78.9365234375, -76.2807846069336, -73.62505340576172, -70.96931457519531, -68.31358337402344, -65.65784454345703, -63.002113342285156, -60.346378326416016, -57.690643310546875, -55.034908294677734, -52.379173278808594, -49.72344207763672, -47.06770324707031, -44.41197204589844, -41.7562370300293, -39.100502014160156, -36.444766998291016, -33.789031982421875, -31.133298873901367, -28.477563858032227, -25.821828842163086, -23.166095733642578, -20.510360717773438, -17.854625701904297, -15.198890686035156, -12.543156623840332, -9.887422561645508, -7.231687545776367, -4.575952529907227, -1.9202184677124023, 0.7355155944824219, 3.3912429809570312, 6.046977519989014, 8.702712059020996, 11.35844612121582, 14.014181137084961, 16.6699161529541, 19.32564926147461, 21.98138427734375, 24.63711929321289, 27.29285430908203, 29.948589324951172, 32.60432434082031, 35.26005554199219, 37.915794372558594, 40.57152557373047, 43.22726058959961, 45.88299560546875, 48.53873062133789, 51.19446563720703, 53.85020065307617, 56.50593566894531, 59.16166687011719, 61.81740188598633, 64.47313690185547, 67.12887573242188, 69.78460693359375, 72.44034576416016, 75.09607696533203, 77.75181579589844, 80.40754699707031, 83.06328582763672, 85.7190170288086, 88.37474822998047]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 9.0, 15.0, 20.0, 34.0, 49.0, 74.0, 92.0, 130.0, 206.0, 277.0, 380.0, 596.0, 814.0, 1203.0, 1755.0, 2631.0, 3865.0, 5701.0, 8843.0, 13345.0, 21413.0, 34253.0, 56061.0, 91811.0, 151941.0, 210332.0, 169125.0, 103901.0, 63122.0, 38450.0, 23787.0, 15039.0, 9606.0, 6315.0, 4204.0, 2931.0, 1892.0, 1385.0, 918.0, 636.0, 431.0, 278.0, 216.0, 153.0, 80.0, 78.0, 51.0, 36.0, 26.0, 19.0, 11.0, 4.0, 7.0, 5.0, 0.0, 1.0, 2.0, 2.0], "bins": [-46.75, -45.271484375, -43.79296875, -42.314453125, -40.8359375, -39.357421875, -37.87890625, -36.400390625, -34.921875, -33.443359375, -31.96484375, -30.486328125, -29.0078125, -27.529296875, -26.05078125, -24.572265625, -23.09375, -21.615234375, -20.13671875, -18.658203125, -17.1796875, -15.701171875, -14.22265625, -12.744140625, -11.265625, -9.787109375, -8.30859375, -6.830078125, -5.3515625, -3.873046875, -2.39453125, -0.916015625, 0.5625, 2.041015625, 3.51953125, 4.998046875, 6.4765625, 7.955078125, 9.43359375, 10.912109375, 12.390625, 13.869140625, 15.34765625, 16.826171875, 18.3046875, 19.783203125, 21.26171875, 22.740234375, 24.21875, 25.697265625, 27.17578125, 28.654296875, 30.1328125, 31.611328125, 33.08984375, 34.568359375, 36.046875, 37.525390625, 39.00390625, 40.482421875, 41.9609375, 43.439453125, 44.91796875, 46.396484375, 47.875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 7.0, 10.0, 9.0, 4.0, 6.0, 10.0, 23.0, 16.0, 22.0, 30.0, 31.0, 18.0, 31.0, 37.0, 38.0, 45.0, 51.0, 39.0, 49.0, 52.0, 49.0, 53.0, 43.0, 29.0, 39.0, 42.0, 31.0, 28.0, 32.0, 16.0, 17.0, 23.0, 16.0, 11.0, 8.0, 7.0, 4.0, 3.0, 2.0, 8.0, 3.0, 0.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-76.3125, -73.8701171875, -71.427734375, -68.9853515625, -66.54296875, -64.1005859375, -61.658203125, -59.2158203125, -56.7734375, -54.3310546875, -51.888671875, -49.4462890625, -47.00390625, -44.5615234375, -42.119140625, -39.6767578125, -37.234375, -34.7919921875, -32.349609375, -29.9072265625, -27.46484375, -25.0224609375, -22.580078125, -20.1376953125, -17.6953125, -15.2529296875, -12.810546875, -10.3681640625, -7.92578125, -5.4833984375, -3.041015625, -0.5986328125, 1.84375, 4.2861328125, 6.728515625, 9.1708984375, 11.61328125, 14.0556640625, 16.498046875, 18.9404296875, 21.3828125, 23.8251953125, 26.267578125, 28.7099609375, 31.15234375, 33.5947265625, 36.037109375, 38.4794921875, 40.921875, 43.3642578125, 45.806640625, 48.2490234375, 50.69140625, 53.1337890625, 55.576171875, 58.0185546875, 60.4609375, 62.9033203125, 65.345703125, 67.7880859375, 70.23046875, 72.6728515625, 75.115234375, 77.5576171875, 80.0]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 6.0, 3.0, 10.0, 6.0, 15.0, 23.0, 36.0, 46.0, 76.0, 102.0, 159.0, 237.0, 315.0, 526.0, 838.0, 1217.0, 2032.0, 3343.0, 5691.0, 10545.0, 24046.0, 159398.0, 761680.0, 44644.0, 14880.0, 7445.0, 4291.0, 2548.0, 1576.0, 982.0, 642.0, 400.0, 265.0, 183.0, 116.0, 73.0, 65.0, 31.0, 28.0, 11.0, 10.0, 7.0, 8.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.3125, -110.2646484375, -106.216796875, -102.1689453125, -98.12109375, -94.0732421875, -90.025390625, -85.9775390625, -81.9296875, -77.8818359375, -73.833984375, -69.7861328125, -65.73828125, -61.6904296875, -57.642578125, -53.5947265625, -49.546875, -45.4990234375, -41.451171875, -37.4033203125, -33.35546875, -29.3076171875, -25.259765625, -21.2119140625, -17.1640625, -13.1162109375, -9.068359375, -5.0205078125, -0.97265625, 3.0751953125, 7.123046875, 11.1708984375, 15.21875, 19.2666015625, 23.314453125, 27.3623046875, 31.41015625, 35.4580078125, 39.505859375, 43.5537109375, 47.6015625, 51.6494140625, 55.697265625, 59.7451171875, 63.79296875, 67.8408203125, 71.888671875, 75.9365234375, 79.984375, 84.0322265625, 88.080078125, 92.1279296875, 96.17578125, 100.2236328125, 104.271484375, 108.3193359375, 112.3671875, 116.4150390625, 120.462890625, 124.5107421875, 128.55859375, 132.6064453125, 136.654296875, 140.7021484375, 144.75]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 9.0, 5.0, 5.0, 9.0, 25.0, 14.0, 18.0, 19.0, 25.0, 22.0, 37.0, 25.0, 40.0, 43.0, 46.0, 46.0, 46.0, 46.0, 58.0, 42.0, 54.0, 57.0, 49.0, 35.0, 34.0, 31.0, 23.0, 20.0, 17.0, 16.0, 19.0, 17.0, 8.0, 11.0, 8.0, 6.0, 4.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-96.375, -93.3330078125, -90.291015625, -87.2490234375, -84.20703125, -81.1650390625, -78.123046875, -75.0810546875, -72.0390625, -68.9970703125, -65.955078125, -62.9130859375, -59.87109375, -56.8291015625, -53.787109375, -50.7451171875, -47.703125, -44.6611328125, -41.619140625, -38.5771484375, -35.53515625, -32.4931640625, -29.451171875, -26.4091796875, -23.3671875, -20.3251953125, -17.283203125, -14.2412109375, -11.19921875, -8.1572265625, -5.115234375, -2.0732421875, 0.96875, 4.0107421875, 7.052734375, 10.0947265625, 13.13671875, 16.1787109375, 19.220703125, 22.2626953125, 25.3046875, 28.3466796875, 31.388671875, 34.4306640625, 37.47265625, 40.5146484375, 43.556640625, 46.5986328125, 49.640625, 52.6826171875, 55.724609375, 58.7666015625, 61.80859375, 64.8505859375, 67.892578125, 70.9345703125, 73.9765625, 77.0185546875, 80.060546875, 83.1025390625, 86.14453125, 89.1865234375, 92.228515625, 95.2705078125, 98.3125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 8.0, 2.0, 5.0, 5.0, 12.0, 6.0, 15.0, 14.0, 24.0, 26.0, 35.0, 50.0, 75.0, 96.0, 138.0, 205.0, 310.0, 523.0, 1063.0, 3121.0, 23556.0, 985493.0, 27788.0, 3314.0, 1097.0, 566.0, 306.0, 197.0, 148.0, 97.0, 78.0, 47.0, 26.0, 23.0, 27.0, 14.0, 10.0, 11.0, 8.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.84375, -49.3271484375, -47.810546875, -46.2939453125, -44.77734375, -43.2607421875, -41.744140625, -40.2275390625, -38.7109375, -37.1943359375, -35.677734375, -34.1611328125, -32.64453125, -31.1279296875, -29.611328125, -28.0947265625, -26.578125, -25.0615234375, -23.544921875, -22.0283203125, -20.51171875, -18.9951171875, -17.478515625, -15.9619140625, -14.4453125, -12.9287109375, -11.412109375, -9.8955078125, -8.37890625, -6.8623046875, -5.345703125, -3.8291015625, -2.3125, -0.7958984375, 0.720703125, 2.2373046875, 3.75390625, 5.2705078125, 6.787109375, 8.3037109375, 9.8203125, 11.3369140625, 12.853515625, 14.3701171875, 15.88671875, 17.4033203125, 18.919921875, 20.4365234375, 21.953125, 23.4697265625, 24.986328125, 26.5029296875, 28.01953125, 29.5361328125, 31.052734375, 32.5693359375, 34.0859375, 35.6025390625, 37.119140625, 38.6357421875, 40.15234375, 41.6689453125, 43.185546875, 44.7021484375, 46.21875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 2.0, 3.0, 4.0, 9.0, 12.0, 23.0, 41.0, 47.0, 75.0, 124.0, 257.0, 150.0, 74.0, 51.0, 32.0, 23.0, 14.0, 13.0, 13.0, 7.0, 6.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008209228515625, -0.007932066917419434, -0.007654905319213867, -0.007377743721008301, -0.007100582122802734, -0.006823420524597168, -0.0065462589263916016, -0.006269097328186035, -0.005991935729980469, -0.005714774131774902, -0.005437612533569336, -0.0051604509353637695, -0.004883289337158203, -0.004606127738952637, -0.00432896614074707, -0.004051804542541504, -0.0037746429443359375, -0.003497481346130371, -0.0032203197479248047, -0.0029431581497192383, -0.002665996551513672, -0.0023888349533081055, -0.002111673355102539, -0.0018345117568969727, -0.0015573501586914062, -0.0012801885604858398, -0.0010030269622802734, -0.000725865364074707, -0.0004487037658691406, -0.00017154216766357422, 0.00010561943054199219, 0.0003827810287475586, 0.000659942626953125, 0.0009371042251586914, 0.0012142658233642578, 0.0014914274215698242, 0.0017685890197753906, 0.002045750617980957, 0.0023229122161865234, 0.00260007381439209, 0.0028772354125976562, 0.0031543970108032227, 0.003431558609008789, 0.0037087202072143555, 0.003985881805419922, 0.004263043403625488, 0.004540205001831055, 0.004817366600036621, 0.0050945281982421875, 0.005371689796447754, 0.00564885139465332, 0.005926012992858887, 0.006203174591064453, 0.0064803361892700195, 0.006757497787475586, 0.007034659385681152, 0.007311820983886719, 0.007588982582092285, 0.007866144180297852, 0.008143305778503418, 0.008420467376708984, 0.00869762897491455, 0.008974790573120117, 0.009251952171325684, 0.00952911376953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 9.0, 7.0, 11.0, 11.0, 7.0, 14.0, 17.0, 34.0, 34.0, 69.0, 79.0, 106.0, 145.0, 207.0, 330.0, 403.0, 586.0, 855.0, 1199.0, 1746.0, 2423.0, 3593.0, 6543.0, 34229.0, 857977.0, 114131.0, 10087.0, 4229.0, 2767.0, 1996.0, 1345.0, 982.0, 706.0, 461.0, 323.0, 250.0, 170.0, 124.0, 89.0, 60.0, 54.0, 32.0, 33.0, 24.0, 17.0, 14.0, 10.0, 6.0, 6.0, 3.0, 1.0, 3.0, 4.0], "bins": [-41.28125, -40.12451171875, -38.9677734375, -37.81103515625, -36.654296875, -35.49755859375, -34.3408203125, -33.18408203125, -32.02734375, -30.87060546875, -29.7138671875, -28.55712890625, -27.400390625, -26.24365234375, -25.0869140625, -23.93017578125, -22.7734375, -21.61669921875, -20.4599609375, -19.30322265625, -18.146484375, -16.98974609375, -15.8330078125, -14.67626953125, -13.51953125, -12.36279296875, -11.2060546875, -10.04931640625, -8.892578125, -7.73583984375, -6.5791015625, -5.42236328125, -4.265625, -3.10888671875, -1.9521484375, -0.79541015625, 0.361328125, 1.51806640625, 2.6748046875, 3.83154296875, 4.98828125, 6.14501953125, 7.3017578125, 8.45849609375, 9.615234375, 10.77197265625, 11.9287109375, 13.08544921875, 14.2421875, 15.39892578125, 16.5556640625, 17.71240234375, 18.869140625, 20.02587890625, 21.1826171875, 22.33935546875, 23.49609375, 24.65283203125, 25.8095703125, 26.96630859375, 28.123046875, 29.27978515625, 30.4365234375, 31.59326171875, 32.75]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 4.0, 5.0, 18.0, 44.0, 167.0, 367.0, 242.0, 85.0, 29.0, 7.0, 6.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.78125, -11.45166015625, -11.1220703125, -10.79248046875, -10.462890625, -10.13330078125, -9.8037109375, -9.47412109375, -9.14453125, -8.81494140625, -8.4853515625, -8.15576171875, -7.826171875, -7.49658203125, -7.1669921875, -6.83740234375, -6.5078125, -6.17822265625, -5.8486328125, -5.51904296875, -5.189453125, -4.85986328125, -4.5302734375, -4.20068359375, -3.87109375, -3.54150390625, -3.2119140625, -2.88232421875, -2.552734375, -2.22314453125, -1.8935546875, -1.56396484375, -1.234375, -0.90478515625, -0.5751953125, -0.24560546875, 0.083984375, 0.41357421875, 0.7431640625, 1.07275390625, 1.40234375, 1.73193359375, 2.0615234375, 2.39111328125, 2.720703125, 3.05029296875, 3.3798828125, 3.70947265625, 4.0390625, 4.36865234375, 4.6982421875, 5.02783203125, 5.357421875, 5.68701171875, 6.0166015625, 6.34619140625, 6.67578125, 7.00537109375, 7.3349609375, 7.66455078125, 7.994140625, 8.32373046875, 8.6533203125, 8.98291015625, 9.3125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 10.0, 5.0, 7.0, 15.0, 15.0, 20.0, 25.0, 22.0, 49.0, 37.0, 72.0, 83.0, 110.0, 112.0, 93.0, 65.0, 67.0, 37.0, 35.0, 27.0, 19.0, 14.0, 8.0, 11.0, 7.0, 4.0, 7.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-91.28695678710938, -88.04277801513672, -84.79859924316406, -81.5544204711914, -78.31024169921875, -75.06607055664062, -71.82189178466797, -68.57771301269531, -65.33353424072266, -62.08935546875, -58.845176696777344, -55.60100173950195, -52.3568229675293, -49.11264419555664, -45.86846923828125, -42.624290466308594, -39.38011169433594, -36.13593292236328, -32.891754150390625, -29.647579193115234, -26.403400421142578, -23.159221649169922, -19.9150447845459, -16.670867919921875, -13.426689147949219, -10.182511329650879, -6.938333511352539, -3.694155693054199, -0.4499778747558594, 2.794200897216797, 6.03837776184082, 9.282554626464844, 12.526741027832031, 15.770918846130371, 19.01509666442871, 22.259273529052734, 25.50345230102539, 28.747631072998047, 31.99180793762207, 35.235984802246094, 38.48016357421875, 41.724342346191406, 44.96852111816406, 48.21269607543945, 51.45687484741211, 54.701053619384766, 57.945228576660156, 61.18940734863281, 64.43358612060547, 67.67776489257812, 70.92194366455078, 74.16612243652344, 77.41029357910156, 80.65447998046875, 83.89865112304688, 87.14282989501953, 90.38700866699219, 93.63118743896484, 96.8753662109375, 100.11954498291016, 103.36372375488281, 106.60789489746094, 109.8520736694336, 113.09625244140625, 116.3404312133789]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 8.0, 5.0, 5.0, 8.0, 10.0, 13.0, 13.0, 13.0, 24.0, 27.0, 31.0, 29.0, 27.0, 31.0, 37.0, 37.0, 45.0, 49.0, 43.0, 44.0, 36.0, 43.0, 48.0, 30.0, 50.0, 39.0, 32.0, 22.0, 31.0, 30.0, 31.0, 19.0, 22.0, 15.0, 12.0, 6.0, 6.0, 5.0, 4.0, 5.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-72.8456039428711, -70.57373809814453, -68.30186462402344, -66.02999877929688, -63.75812530517578, -61.48625946044922, -59.21438980102539, -56.94252014160156, -54.670650482177734, -52.398780822753906, -50.12691116333008, -47.85504150390625, -45.58317565917969, -43.311302185058594, -41.03943634033203, -38.7675666809082, -36.495697021484375, -34.22382736206055, -31.95195770263672, -29.680089950561523, -27.408220291137695, -25.136350631713867, -22.864482879638672, -20.592613220214844, -18.320743560791016, -16.048873901367188, -13.777005195617676, -11.505136489868164, -9.233266830444336, -6.961397171020508, -4.689528465270996, -2.4176597595214844, -0.1457977294921875, 2.1260714530944824, 4.397940635681152, 6.669809818267822, 8.941679000854492, 11.21354866027832, 13.485417366027832, 15.757286071777344, 18.029155731201172, 20.301025390625, 22.572895050048828, 24.844762802124023, 27.11663246154785, 29.38850212097168, 31.660369873046875, 33.9322395324707, 36.20410919189453, 38.47597885131836, 40.74784851074219, 43.019718170166016, 45.291587829589844, 47.563453674316406, 49.835323333740234, 52.10719299316406, 54.37906265258789, 56.65093231201172, 58.92280197143555, 61.194671630859375, 63.46653747558594, 65.73841094970703, 68.0102767944336, 70.28215026855469, 72.55401611328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 12.0, 17.0, 12.0, 16.0, 45.0, 57.0, 60.0, 74.0, 107.0, 174.0, 220.0, 307.0, 387.0, 561.0, 720.0, 1052.0, 1650.0, 2321.0, 3428.0, 5235.0, 8205.0, 13795.0, 24568.0, 46528.0, 94904.0, 197038.0, 299615.0, 168472.0, 81753.0, 40703.0, 21725.0, 12154.0, 7455.0, 4795.0, 3154.0, 2101.0, 1442.0, 1046.0, 760.0, 520.0, 364.0, 255.0, 218.0, 144.0, 113.0, 81.0, 60.0, 39.0, 26.0, 27.0, 19.0, 5.0, 8.0, 4.0, 6.0, 4.0, 0.0, 2.0], "bins": [-102.5625, -99.396484375, -96.23046875, -93.064453125, -89.8984375, -86.732421875, -83.56640625, -80.400390625, -77.234375, -74.068359375, -70.90234375, -67.736328125, -64.5703125, -61.404296875, -58.23828125, -55.072265625, -51.90625, -48.740234375, -45.57421875, -42.408203125, -39.2421875, -36.076171875, -32.91015625, -29.744140625, -26.578125, -23.412109375, -20.24609375, -17.080078125, -13.9140625, -10.748046875, -7.58203125, -4.416015625, -1.25, 1.916015625, 5.08203125, 8.248046875, 11.4140625, 14.580078125, 17.74609375, 20.912109375, 24.078125, 27.244140625, 30.41015625, 33.576171875, 36.7421875, 39.908203125, 43.07421875, 46.240234375, 49.40625, 52.572265625, 55.73828125, 58.904296875, 62.0703125, 65.236328125, 68.40234375, 71.568359375, 74.734375, 77.900390625, 81.06640625, 84.232421875, 87.3984375, 90.564453125, 93.73046875, 96.896484375, 100.0625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 1.0, 12.0, 9.0, 5.0, 14.0, 11.0, 20.0, 16.0, 25.0, 23.0, 32.0, 35.0, 27.0, 40.0, 47.0, 40.0, 65.0, 46.0, 45.0, 49.0, 40.0, 46.0, 46.0, 45.0, 41.0, 30.0, 20.0, 33.0, 31.0, 15.0, 19.0, 11.0, 12.0, 9.0, 6.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-75.375, -73.0029296875, -70.630859375, -68.2587890625, -65.88671875, -63.5146484375, -61.142578125, -58.7705078125, -56.3984375, -54.0263671875, -51.654296875, -49.2822265625, -46.91015625, -44.5380859375, -42.166015625, -39.7939453125, -37.421875, -35.0498046875, -32.677734375, -30.3056640625, -27.93359375, -25.5615234375, -23.189453125, -20.8173828125, -18.4453125, -16.0732421875, -13.701171875, -11.3291015625, -8.95703125, -6.5849609375, -4.212890625, -1.8408203125, 0.53125, 2.9033203125, 5.275390625, 7.6474609375, 10.01953125, 12.3916015625, 14.763671875, 17.1357421875, 19.5078125, 21.8798828125, 24.251953125, 26.6240234375, 28.99609375, 31.3681640625, 33.740234375, 36.1123046875, 38.484375, 40.8564453125, 43.228515625, 45.6005859375, 47.97265625, 50.3447265625, 52.716796875, 55.0888671875, 57.4609375, 59.8330078125, 62.205078125, 64.5771484375, 66.94921875, 69.3212890625, 71.693359375, 74.0654296875, 76.4375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 7.0, 3.0, 7.0, 16.0, 15.0, 23.0, 34.0, 41.0, 67.0, 101.0, 136.0, 199.0, 271.0, 390.0, 559.0, 877.0, 1241.0, 1888.0, 2949.0, 4544.0, 7184.0, 11756.0, 19451.0, 33787.0, 60047.0, 113745.0, 211251.0, 249728.0, 146605.0, 76940.0, 42174.0, 23823.0, 14193.0, 8636.0, 5484.0, 3411.0, 2258.0, 1544.0, 971.0, 670.0, 484.0, 323.0, 231.0, 154.0, 105.0, 68.0, 48.0, 49.0, 25.0, 25.0, 8.0, 8.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-109.125, -105.626953125, -102.12890625, -98.630859375, -95.1328125, -91.634765625, -88.13671875, -84.638671875, -81.140625, -77.642578125, -74.14453125, -70.646484375, -67.1484375, -63.650390625, -60.15234375, -56.654296875, -53.15625, -49.658203125, -46.16015625, -42.662109375, -39.1640625, -35.666015625, -32.16796875, -28.669921875, -25.171875, -21.673828125, -18.17578125, -14.677734375, -11.1796875, -7.681640625, -4.18359375, -0.685546875, 2.8125, 6.310546875, 9.80859375, 13.306640625, 16.8046875, 20.302734375, 23.80078125, 27.298828125, 30.796875, 34.294921875, 37.79296875, 41.291015625, 44.7890625, 48.287109375, 51.78515625, 55.283203125, 58.78125, 62.279296875, 65.77734375, 69.275390625, 72.7734375, 76.271484375, 79.76953125, 83.267578125, 86.765625, 90.263671875, 93.76171875, 97.259765625, 100.7578125, 104.255859375, 107.75390625, 111.251953125, 114.75]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 13.0, 6.0, 11.0, 11.0, 15.0, 11.0, 22.0, 27.0, 29.0, 29.0, 20.0, 36.0, 32.0, 39.0, 34.0, 51.0, 40.0, 44.0, 52.0, 31.0, 45.0, 49.0, 47.0, 42.0, 31.0, 27.0, 26.0, 23.0, 20.0, 21.0, 18.0, 13.0, 14.0, 7.0, 6.0, 11.0, 8.0, 7.0, 4.0, 6.0, 6.0, 1.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0], "bins": [-47.875, -46.46728515625, -45.0595703125, -43.65185546875, -42.244140625, -40.83642578125, -39.4287109375, -38.02099609375, -36.61328125, -35.20556640625, -33.7978515625, -32.39013671875, -30.982421875, -29.57470703125, -28.1669921875, -26.75927734375, -25.3515625, -23.94384765625, -22.5361328125, -21.12841796875, -19.720703125, -18.31298828125, -16.9052734375, -15.49755859375, -14.08984375, -12.68212890625, -11.2744140625, -9.86669921875, -8.458984375, -7.05126953125, -5.6435546875, -4.23583984375, -2.828125, -1.42041015625, -0.0126953125, 1.39501953125, 2.802734375, 4.21044921875, 5.6181640625, 7.02587890625, 8.43359375, 9.84130859375, 11.2490234375, 12.65673828125, 14.064453125, 15.47216796875, 16.8798828125, 18.28759765625, 19.6953125, 21.10302734375, 22.5107421875, 23.91845703125, 25.326171875, 26.73388671875, 28.1416015625, 29.54931640625, 30.95703125, 32.36474609375, 33.7724609375, 35.18017578125, 36.587890625, 37.99560546875, 39.4033203125, 40.81103515625, 42.21875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 3.0, 9.0, 7.0, 10.0, 9.0, 20.0, 18.0, 40.0, 41.0, 77.0, 79.0, 129.0, 178.0, 243.0, 324.0, 547.0, 855.0, 1118.0, 1674.0, 2496.0, 3813.0, 5671.0, 8954.0, 14596.0, 25014.0, 46461.0, 99405.0, 271165.0, 324018.0, 116227.0, 52997.0, 27832.0, 15975.0, 9834.0, 6291.0, 3961.0, 2738.0, 1715.0, 1267.0, 843.0, 567.0, 391.0, 294.0, 178.0, 132.0, 100.0, 74.0, 51.0, 31.0, 24.0, 11.0, 14.0, 10.0, 9.0, 4.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0], "bins": [-27.28125, -26.40380859375, -25.5263671875, -24.64892578125, -23.771484375, -22.89404296875, -22.0166015625, -21.13916015625, -20.26171875, -19.38427734375, -18.5068359375, -17.62939453125, -16.751953125, -15.87451171875, -14.9970703125, -14.11962890625, -13.2421875, -12.36474609375, -11.4873046875, -10.60986328125, -9.732421875, -8.85498046875, -7.9775390625, -7.10009765625, -6.22265625, -5.34521484375, -4.4677734375, -3.59033203125, -2.712890625, -1.83544921875, -0.9580078125, -0.08056640625, 0.796875, 1.67431640625, 2.5517578125, 3.42919921875, 4.306640625, 5.18408203125, 6.0615234375, 6.93896484375, 7.81640625, 8.69384765625, 9.5712890625, 10.44873046875, 11.326171875, 12.20361328125, 13.0810546875, 13.95849609375, 14.8359375, 15.71337890625, 16.5908203125, 17.46826171875, 18.345703125, 19.22314453125, 20.1005859375, 20.97802734375, 21.85546875, 22.73291015625, 23.6103515625, 24.48779296875, 25.365234375, 26.24267578125, 27.1201171875, 27.99755859375, 28.875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 5.0, 8.0, 8.0, 10.0, 15.0, 24.0, 23.0, 35.0, 38.0, 47.0, 98.0, 123.0, 143.0, 110.0, 82.0, 52.0, 29.0, 25.0, 21.0, 20.0, 21.0, 9.0, 8.0, 4.0, 10.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003299713134765625, -0.0031915903091430664, -0.003083467483520508, -0.0029753446578979492, -0.0028672218322753906, -0.002759099006652832, -0.0026509761810302734, -0.002542853355407715, -0.0024347305297851562, -0.0023266077041625977, -0.002218484878540039, -0.0021103620529174805, -0.002002239227294922, -0.0018941164016723633, -0.0017859935760498047, -0.001677870750427246, -0.0015697479248046875, -0.001461625099182129, -0.0013535022735595703, -0.0012453794479370117, -0.0011372566223144531, -0.0010291337966918945, -0.0009210109710693359, -0.0008128881454467773, -0.0007047653198242188, -0.0005966424942016602, -0.0004885196685791016, -0.00038039684295654297, -0.0002722740173339844, -0.00016415119171142578, -5.602836608886719e-05, 5.2094459533691406e-05, 0.00016021728515625, 0.0002683401107788086, 0.0003764629364013672, 0.0004845857620239258, 0.0005927085876464844, 0.000700831413269043, 0.0008089542388916016, 0.0009170770645141602, 0.0010251998901367188, 0.0011333227157592773, 0.001241445541381836, 0.0013495683670043945, 0.0014576911926269531, 0.0015658140182495117, 0.0016739368438720703, 0.001782059669494629, 0.0018901824951171875, 0.001998305320739746, 0.0021064281463623047, 0.0022145509719848633, 0.002322673797607422, 0.0024307966232299805, 0.002538919448852539, 0.0026470422744750977, 0.0027551651000976562, 0.002863287925720215, 0.0029714107513427734, 0.003079533576965332, 0.0031876564025878906, 0.0032957792282104492, 0.003403902053833008, 0.0035120248794555664, 0.003620147705078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 3.0, 9.0, 7.0, 14.0, 24.0, 36.0, 44.0, 70.0, 94.0, 131.0, 180.0, 272.0, 357.0, 562.0, 782.0, 1032.0, 1514.0, 2173.0, 3234.0, 4971.0, 7552.0, 12484.0, 21635.0, 41535.0, 90180.0, 236375.0, 350754.0, 139604.0, 58968.0, 29456.0, 16032.0, 9657.0, 5995.0, 4087.0, 2716.0, 1796.0, 1276.0, 872.0, 619.0, 424.0, 315.0, 206.0, 154.0, 107.0, 68.0, 62.0, 38.0, 28.0, 19.0, 9.0, 14.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-28.890625, -28.021484375, -27.15234375, -26.283203125, -25.4140625, -24.544921875, -23.67578125, -22.806640625, -21.9375, -21.068359375, -20.19921875, -19.330078125, -18.4609375, -17.591796875, -16.72265625, -15.853515625, -14.984375, -14.115234375, -13.24609375, -12.376953125, -11.5078125, -10.638671875, -9.76953125, -8.900390625, -8.03125, -7.162109375, -6.29296875, -5.423828125, -4.5546875, -3.685546875, -2.81640625, -1.947265625, -1.078125, -0.208984375, 0.66015625, 1.529296875, 2.3984375, 3.267578125, 4.13671875, 5.005859375, 5.875, 6.744140625, 7.61328125, 8.482421875, 9.3515625, 10.220703125, 11.08984375, 11.958984375, 12.828125, 13.697265625, 14.56640625, 15.435546875, 16.3046875, 17.173828125, 18.04296875, 18.912109375, 19.78125, 20.650390625, 21.51953125, 22.388671875, 23.2578125, 24.126953125, 24.99609375, 25.865234375, 26.734375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 6.0, 2.0, 3.0, 4.0, 5.0, 11.0, 11.0, 5.0, 12.0, 16.0, 18.0, 17.0, 27.0, 45.0, 38.0, 46.0, 69.0, 87.0, 90.0, 84.0, 74.0, 58.0, 52.0, 49.0, 45.0, 18.0, 18.0, 17.0, 14.0, 10.0, 11.0, 6.0, 3.0, 4.0, 2.0, 5.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.4375, -9.15966796875, -8.8818359375, -8.60400390625, -8.326171875, -8.04833984375, -7.7705078125, -7.49267578125, -7.21484375, -6.93701171875, -6.6591796875, -6.38134765625, -6.103515625, -5.82568359375, -5.5478515625, -5.27001953125, -4.9921875, -4.71435546875, -4.4365234375, -4.15869140625, -3.880859375, -3.60302734375, -3.3251953125, -3.04736328125, -2.76953125, -2.49169921875, -2.2138671875, -1.93603515625, -1.658203125, -1.38037109375, -1.1025390625, -0.82470703125, -0.546875, -0.26904296875, 0.0087890625, 0.28662109375, 0.564453125, 0.84228515625, 1.1201171875, 1.39794921875, 1.67578125, 1.95361328125, 2.2314453125, 2.50927734375, 2.787109375, 3.06494140625, 3.3427734375, 3.62060546875, 3.8984375, 4.17626953125, 4.4541015625, 4.73193359375, 5.009765625, 5.28759765625, 5.5654296875, 5.84326171875, 6.12109375, 6.39892578125, 6.6767578125, 6.95458984375, 7.232421875, 7.51025390625, 7.7880859375, 8.06591796875, 8.34375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 10.0, 7.0, 13.0, 11.0, 14.0, 21.0, 27.0, 35.0, 54.0, 72.0, 92.0, 104.0, 114.0, 97.0, 70.0, 63.0, 40.0, 33.0, 32.0, 20.0, 9.0, 14.0, 10.0, 8.0, 4.0, 7.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.12782287597656, -90.66825103759766, -87.20867919921875, -83.74910736083984, -80.28953552246094, -76.82996368408203, -73.37039184570312, -69.91082000732422, -66.45124816894531, -62.991676330566406, -59.5321044921875, -56.072532653808594, -52.61296081542969, -49.15338897705078, -45.693817138671875, -42.23424530029297, -38.7746696472168, -35.31509780883789, -31.855525970458984, -28.395954132080078, -24.936382293701172, -21.476808547973633, -18.017236709594727, -14.55766487121582, -11.098093032836914, -7.638521194458008, -4.178948879241943, -0.7193765640258789, 2.7401952743530273, 6.19976806640625, 9.659339904785156, 13.118911743164062, 16.57848358154297, 20.038055419921875, 23.49762725830078, 26.957199096679688, 30.416770935058594, 33.8763427734375, 37.335914611816406, 40.79548645019531, 44.25505828857422, 47.714630126953125, 51.17420196533203, 54.63377380371094, 58.093345642089844, 61.55291748046875, 65.01248931884766, 68.47206115722656, 71.931640625, 75.3912124633789, 78.85078430175781, 82.31035614013672, 85.76992797851562, 89.22949981689453, 92.68907165527344, 96.14864349365234, 99.60821533203125, 103.06778717041016, 106.52735900878906, 109.98693084716797, 113.44650268554688, 116.90607452392578, 120.36564636230469, 123.8252182006836, 127.2847900390625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 11.0, 8.0, 9.0, 11.0, 6.0, 12.0, 9.0, 11.0, 19.0, 24.0, 21.0, 27.0, 36.0, 39.0, 40.0, 26.0, 37.0, 45.0, 42.0, 35.0, 38.0, 39.0, 48.0, 33.0, 40.0, 29.0, 34.0, 29.0, 34.0, 27.0, 23.0, 19.0, 24.0, 15.0, 19.0, 14.0, 11.0, 5.0, 13.0, 6.0, 8.0, 6.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-65.30443572998047, -63.186561584472656, -61.068687438964844, -58.9508171081543, -56.832942962646484, -54.71506881713867, -52.597198486328125, -50.47932434082031, -48.3614501953125, -46.24357604980469, -44.125701904296875, -42.00783157348633, -39.889957427978516, -37.7720832824707, -35.654212951660156, -33.536338806152344, -31.41846466064453, -29.30059051513672, -27.18271827697754, -25.06484603881836, -22.946971893310547, -20.829097747802734, -18.711225509643555, -16.593353271484375, -14.475479125976562, -12.357605934143066, -10.23973274230957, -8.121859550476074, -6.003986358642578, -3.886113166809082, -1.768239974975586, 0.34963321685791016, 2.4675140380859375, 4.585387229919434, 6.70326042175293, 8.821133613586426, 10.939006805419922, 13.056879997253418, 15.174753189086914, 17.292625427246094, 19.410499572753906, 21.52837371826172, 23.6462459564209, 25.764118194580078, 27.88199234008789, 29.999866485595703, 32.11773681640625, 34.23561096191406, 36.353485107421875, 38.47135925292969, 40.5892333984375, 42.70710372924805, 44.82497787475586, 46.94285202026367, 49.06072235107422, 51.17859649658203, 53.296470642089844, 55.414344787597656, 57.53221893310547, 59.650089263916016, 61.76796340942383, 63.88583755493164, 66.00370788574219, 68.12158203125, 70.23945617675781]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 7.0, 3.0, 17.0, 21.0, 12.0, 36.0, 43.0, 63.0, 73.0, 113.0, 164.0, 233.0, 357.0, 489.0, 767.0, 1070.0, 1631.0, 2544.0, 3880.0, 6081.0, 10112.0, 18614.0, 45417.0, 161411.0, 749467.0, 2216903.0, 734247.0, 153075.0, 41293.0, 18124.0, 10063.0, 6150.0, 3793.0, 2489.0, 1710.0, 1181.0, 771.0, 549.0, 351.0, 295.0, 201.0, 142.0, 88.0, 71.0, 49.0, 37.0, 23.0, 18.0, 12.0, 11.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0], "bins": [-120.0625, -116.4775390625, -112.892578125, -109.3076171875, -105.72265625, -102.1376953125, -98.552734375, -94.9677734375, -91.3828125, -87.7978515625, -84.212890625, -80.6279296875, -77.04296875, -73.4580078125, -69.873046875, -66.2880859375, -62.703125, -59.1181640625, -55.533203125, -51.9482421875, -48.36328125, -44.7783203125, -41.193359375, -37.6083984375, -34.0234375, -30.4384765625, -26.853515625, -23.2685546875, -19.68359375, -16.0986328125, -12.513671875, -8.9287109375, -5.34375, -1.7587890625, 1.826171875, 5.4111328125, 8.99609375, 12.5810546875, 16.166015625, 19.7509765625, 23.3359375, 26.9208984375, 30.505859375, 34.0908203125, 37.67578125, 41.2607421875, 44.845703125, 48.4306640625, 52.015625, 55.6005859375, 59.185546875, 62.7705078125, 66.35546875, 69.9404296875, 73.525390625, 77.1103515625, 80.6953125, 84.2802734375, 87.865234375, 91.4501953125, 95.03515625, 98.6201171875, 102.205078125, 105.7900390625, 109.375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 7.0, 12.0, 9.0, 9.0, 9.0, 9.0, 11.0, 15.0, 20.0, 27.0, 21.0, 40.0, 36.0, 28.0, 41.0, 37.0, 55.0, 46.0, 57.0, 43.0, 54.0, 42.0, 32.0, 35.0, 39.0, 24.0, 35.0, 35.0, 31.0, 20.0, 17.0, 18.0, 11.0, 14.0, 13.0, 10.0, 6.0, 9.0, 5.0, 2.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.4375, -59.421875, -57.40625, -55.390625, -53.375, -51.359375, -49.34375, -47.328125, -45.3125, -43.296875, -41.28125, -39.265625, -37.25, -35.234375, -33.21875, -31.203125, -29.1875, -27.171875, -25.15625, -23.140625, -21.125, -19.109375, -17.09375, -15.078125, -13.0625, -11.046875, -9.03125, -7.015625, -5.0, -2.984375, -0.96875, 1.046875, 3.0625, 5.078125, 7.09375, 9.109375, 11.125, 13.140625, 15.15625, 17.171875, 19.1875, 21.203125, 23.21875, 25.234375, 27.25, 29.265625, 31.28125, 33.296875, 35.3125, 37.328125, 39.34375, 41.359375, 43.375, 45.390625, 47.40625, 49.421875, 51.4375, 53.453125, 55.46875, 57.484375, 59.5, 61.515625, 63.53125, 65.546875, 67.5625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 6.0, 6.0, 11.0, 12.0, 15.0, 26.0, 35.0, 53.0, 86.0, 84.0, 153.0, 167.0, 296.0, 392.0, 575.0, 796.0, 1136.0, 1634.0, 2451.0, 3782.0, 5765.0, 9065.0, 15447.0, 27695.0, 55778.0, 144545.0, 592342.0, 2443917.0, 613597.0, 147094.0, 56999.0, 27776.0, 15623.0, 9236.0, 5954.0, 3765.0, 2586.0, 1632.0, 1130.0, 787.0, 527.0, 390.0, 258.0, 172.0, 139.0, 106.0, 60.0, 56.0, 37.0, 36.0, 11.0, 21.0, 14.0, 6.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-118.6875, -114.5244140625, -110.361328125, -106.1982421875, -102.03515625, -97.8720703125, -93.708984375, -89.5458984375, -85.3828125, -81.2197265625, -77.056640625, -72.8935546875, -68.73046875, -64.5673828125, -60.404296875, -56.2412109375, -52.078125, -47.9150390625, -43.751953125, -39.5888671875, -35.42578125, -31.2626953125, -27.099609375, -22.9365234375, -18.7734375, -14.6103515625, -10.447265625, -6.2841796875, -2.12109375, 2.0419921875, 6.205078125, 10.3681640625, 14.53125, 18.6943359375, 22.857421875, 27.0205078125, 31.18359375, 35.3466796875, 39.509765625, 43.6728515625, 47.8359375, 51.9990234375, 56.162109375, 60.3251953125, 64.48828125, 68.6513671875, 72.814453125, 76.9775390625, 81.140625, 85.3037109375, 89.466796875, 93.6298828125, 97.79296875, 101.9560546875, 106.119140625, 110.2822265625, 114.4453125, 118.6083984375, 122.771484375, 126.9345703125, 131.09765625, 135.2607421875, 139.423828125, 143.5869140625, 147.75]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 5.0, 9.0, 8.0, 13.0, 11.0, 21.0, 27.0, 23.0, 27.0, 38.0, 56.0, 74.0, 92.0, 154.0, 241.0, 329.0, 524.0, 692.0, 564.0, 355.0, 253.0, 145.0, 96.0, 64.0, 49.0, 35.0, 39.0, 28.0, 13.0, 7.0, 12.0, 11.0, 14.0, 6.0, 6.0, 8.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-36.40625, -35.17578125, -33.9453125, -32.71484375, -31.484375, -30.25390625, -29.0234375, -27.79296875, -26.5625, -25.33203125, -24.1015625, -22.87109375, -21.640625, -20.41015625, -19.1796875, -17.94921875, -16.71875, -15.48828125, -14.2578125, -13.02734375, -11.796875, -10.56640625, -9.3359375, -8.10546875, -6.875, -5.64453125, -4.4140625, -3.18359375, -1.953125, -0.72265625, 0.5078125, 1.73828125, 2.96875, 4.19921875, 5.4296875, 6.66015625, 7.890625, 9.12109375, 10.3515625, 11.58203125, 12.8125, 14.04296875, 15.2734375, 16.50390625, 17.734375, 18.96484375, 20.1953125, 21.42578125, 22.65625, 23.88671875, 25.1171875, 26.34765625, 27.578125, 28.80859375, 30.0390625, 31.26953125, 32.5, 33.73046875, 34.9609375, 36.19140625, 37.421875, 38.65234375, 39.8828125, 41.11328125, 42.34375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 3.0, 6.0, 7.0, 7.0, 10.0, 8.0, 8.0, 12.0, 22.0, 19.0, 29.0, 29.0, 36.0, 61.0, 70.0, 82.0, 103.0, 102.0, 77.0, 63.0, 53.0, 35.0, 27.0, 36.0, 20.0, 10.0, 10.0, 12.0, 12.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-92.34141540527344, -89.34625244140625, -86.35108947753906, -83.35592651367188, -80.36076354980469, -77.36560821533203, -74.37044525146484, -71.37528228759766, -68.38011932373047, -65.38495635986328, -62.389793395996094, -59.39463424682617, -56.399471282958984, -53.4043083190918, -50.409149169921875, -47.41398620605469, -44.4188232421875, -41.42366027832031, -38.428497314453125, -35.4333381652832, -32.438175201416016, -29.443012237548828, -26.447851181030273, -23.45269012451172, -20.45752716064453, -17.462364196777344, -14.467203140258789, -11.472041130065918, -8.476879119873047, -5.481717109680176, -2.4865550994873047, 0.50860595703125, 3.5037689208984375, 6.498930931091309, 9.49409294128418, 12.48925495147705, 15.484416961669922, 18.47957992553711, 21.474740982055664, 24.46990203857422, 27.465065002441406, 30.460227966308594, 33.45539093017578, 36.4505500793457, 39.44571304321289, 42.44087600708008, 45.43603515625, 48.43119812011719, 51.426361083984375, 54.42152404785156, 57.41668701171875, 60.41184616088867, 63.40700912475586, 66.40216827392578, 69.39733123779297, 72.39249420166016, 75.38765716552734, 78.38282012939453, 81.37798309326172, 84.3731460571289, 87.36830139160156, 90.36346435546875, 93.35862731933594, 96.35379028320312, 99.34895324707031]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 3.0, 7.0, 14.0, 13.0, 7.0, 11.0, 11.0, 13.0, 10.0, 25.0, 23.0, 35.0, 29.0, 22.0, 41.0, 45.0, 42.0, 39.0, 55.0, 40.0, 37.0, 40.0, 35.0, 44.0, 34.0, 38.0, 30.0, 38.0, 33.0, 28.0, 19.0, 19.0, 19.0, 18.0, 13.0, 11.0, 8.0, 12.0, 7.0, 7.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-76.96728515625, -74.66474914550781, -72.36222076416016, -70.05968475341797, -67.75715637207031, -65.45462036132812, -63.15208435058594, -60.849552154541016, -58.547019958496094, -56.24448776245117, -53.94195556640625, -51.63941955566406, -49.33688735961914, -47.03435516357422, -44.73181915283203, -42.42928695678711, -40.12675476074219, -37.824222564697266, -35.521690368652344, -33.219154357910156, -30.916622161865234, -28.614089965820312, -26.311555862426758, -24.009021759033203, -21.70648956298828, -19.40395736694336, -17.101423263549805, -14.798890113830566, -12.496356964111328, -10.19382381439209, -7.891290664672852, -5.588756561279297, -3.2862319946289062, -0.983698844909668, 1.3188343048095703, 3.6213674545288086, 5.923900604248047, 8.226433753967285, 10.528966903686523, 12.831501007080078, 15.134033203125, 17.436565399169922, 19.739099502563477, 22.04163360595703, 24.344165802001953, 26.646697998046875, 28.94923210144043, 31.251766204833984, 33.554298400878906, 35.85683059692383, 38.15936279296875, 40.46189880371094, 42.76443099975586, 45.06696319580078, 47.36949920654297, 49.67203140258789, 51.97456359863281, 54.277095794677734, 56.579627990722656, 58.882164001464844, 61.184696197509766, 63.48722839355469, 65.78976440429688, 68.09230041503906, 70.39482879638672]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 3.0, 8.0, 11.0, 13.0, 24.0, 21.0, 43.0, 40.0, 83.0, 136.0, 185.0, 232.0, 332.0, 467.0, 690.0, 1081.0, 1592.0, 2219.0, 3195.0, 4603.0, 6663.0, 9962.0, 15354.0, 24012.0, 38506.0, 67407.0, 121743.0, 207951.0, 219141.0, 132586.0, 73632.0, 41731.0, 24984.0, 16176.0, 10742.0, 7151.0, 4883.0, 3388.0, 2266.0, 1664.0, 1102.0, 753.0, 535.0, 387.0, 275.0, 197.0, 110.0, 96.0, 54.0, 53.0, 31.0, 20.0, 12.0, 9.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-42.9375, -41.5556640625, -40.173828125, -38.7919921875, -37.41015625, -36.0283203125, -34.646484375, -33.2646484375, -31.8828125, -30.5009765625, -29.119140625, -27.7373046875, -26.35546875, -24.9736328125, -23.591796875, -22.2099609375, -20.828125, -19.4462890625, -18.064453125, -16.6826171875, -15.30078125, -13.9189453125, -12.537109375, -11.1552734375, -9.7734375, -8.3916015625, -7.009765625, -5.6279296875, -4.24609375, -2.8642578125, -1.482421875, -0.1005859375, 1.28125, 2.6630859375, 4.044921875, 5.4267578125, 6.80859375, 8.1904296875, 9.572265625, 10.9541015625, 12.3359375, 13.7177734375, 15.099609375, 16.4814453125, 17.86328125, 19.2451171875, 20.626953125, 22.0087890625, 23.390625, 24.7724609375, 26.154296875, 27.5361328125, 28.91796875, 30.2998046875, 31.681640625, 33.0634765625, 34.4453125, 35.8271484375, 37.208984375, 38.5908203125, 39.97265625, 41.3544921875, 42.736328125, 44.1181640625, 45.5]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 5.0, 5.0, 13.0, 8.0, 8.0, 6.0, 9.0, 11.0, 15.0, 6.0, 17.0, 26.0, 25.0, 24.0, 30.0, 31.0, 34.0, 39.0, 43.0, 46.0, 40.0, 48.0, 44.0, 44.0, 47.0, 38.0, 34.0, 39.0, 25.0, 33.0, 28.0, 24.0, 22.0, 14.0, 17.0, 14.0, 17.0, 11.0, 9.0, 7.0, 13.0, 8.0, 4.0, 5.0, 4.0, 4.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-62.96875, -61.078125, -59.1875, -57.296875, -55.40625, -53.515625, -51.625, -49.734375, -47.84375, -45.953125, -44.0625, -42.171875, -40.28125, -38.390625, -36.5, -34.609375, -32.71875, -30.828125, -28.9375, -27.046875, -25.15625, -23.265625, -21.375, -19.484375, -17.59375, -15.703125, -13.8125, -11.921875, -10.03125, -8.140625, -6.25, -4.359375, -2.46875, -0.578125, 1.3125, 3.203125, 5.09375, 6.984375, 8.875, 10.765625, 12.65625, 14.546875, 16.4375, 18.328125, 20.21875, 22.109375, 24.0, 25.890625, 27.78125, 29.671875, 31.5625, 33.453125, 35.34375, 37.234375, 39.125, 41.015625, 42.90625, 44.796875, 46.6875, 48.578125, 50.46875, 52.359375, 54.25, 56.140625, 58.03125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 4.0, 10.0, 6.0, 9.0, 20.0, 17.0, 35.0, 33.0, 49.0, 90.0, 97.0, 157.0, 225.0, 334.0, 458.0, 646.0, 959.0, 1376.0, 2119.0, 3473.0, 5545.0, 9245.0, 18258.0, 62497.0, 778120.0, 113903.0, 22633.0, 10939.0, 6113.0, 3891.0, 2457.0, 1563.0, 1044.0, 679.0, 439.0, 336.0, 228.0, 156.0, 94.0, 84.0, 60.0, 44.0, 27.0, 22.0, 20.0, 10.0, 9.0, 6.0, 8.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-120.375, -116.169921875, -111.96484375, -107.759765625, -103.5546875, -99.349609375, -95.14453125, -90.939453125, -86.734375, -82.529296875, -78.32421875, -74.119140625, -69.9140625, -65.708984375, -61.50390625, -57.298828125, -53.09375, -48.888671875, -44.68359375, -40.478515625, -36.2734375, -32.068359375, -27.86328125, -23.658203125, -19.453125, -15.248046875, -11.04296875, -6.837890625, -2.6328125, 1.572265625, 5.77734375, 9.982421875, 14.1875, 18.392578125, 22.59765625, 26.802734375, 31.0078125, 35.212890625, 39.41796875, 43.623046875, 47.828125, 52.033203125, 56.23828125, 60.443359375, 64.6484375, 68.853515625, 73.05859375, 77.263671875, 81.46875, 85.673828125, 89.87890625, 94.083984375, 98.2890625, 102.494140625, 106.69921875, 110.904296875, 115.109375, 119.314453125, 123.51953125, 127.724609375, 131.9296875, 136.134765625, 140.33984375, 144.544921875, 148.75]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 3.0, 3.0, 7.0, 7.0, 16.0, 10.0, 13.0, 22.0, 22.0, 15.0, 35.0, 31.0, 29.0, 38.0, 35.0, 41.0, 36.0, 36.0, 51.0, 45.0, 42.0, 41.0, 43.0, 35.0, 45.0, 28.0, 38.0, 43.0, 36.0, 23.0, 21.0, 19.0, 22.0, 18.0, 10.0, 13.0, 8.0, 8.0, 9.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-121.375, -118.064453125, -114.75390625, -111.443359375, -108.1328125, -104.822265625, -101.51171875, -98.201171875, -94.890625, -91.580078125, -88.26953125, -84.958984375, -81.6484375, -78.337890625, -75.02734375, -71.716796875, -68.40625, -65.095703125, -61.78515625, -58.474609375, -55.1640625, -51.853515625, -48.54296875, -45.232421875, -41.921875, -38.611328125, -35.30078125, -31.990234375, -28.6796875, -25.369140625, -22.05859375, -18.748046875, -15.4375, -12.126953125, -8.81640625, -5.505859375, -2.1953125, 1.115234375, 4.42578125, 7.736328125, 11.046875, 14.357421875, 17.66796875, 20.978515625, 24.2890625, 27.599609375, 30.91015625, 34.220703125, 37.53125, 40.841796875, 44.15234375, 47.462890625, 50.7734375, 54.083984375, 57.39453125, 60.705078125, 64.015625, 67.326171875, 70.63671875, 73.947265625, 77.2578125, 80.568359375, 83.87890625, 87.189453125, 90.5]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 4.0, 5.0, 6.0, 14.0, 15.0, 14.0, 23.0, 32.0, 52.0, 75.0, 106.0, 145.0, 194.0, 344.0, 521.0, 829.0, 1396.0, 2421.0, 4610.0, 9688.0, 29265.0, 394399.0, 550328.0, 32458.0, 10268.0, 4793.0, 2495.0, 1491.0, 909.0, 555.0, 313.0, 228.0, 182.0, 114.0, 89.0, 50.0, 37.0, 25.0, 12.0, 10.0, 15.0, 5.0, 8.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.375, -16.776611328125, -16.17822265625, -15.579833984375, -14.9814453125, -14.383056640625, -13.78466796875, -13.186279296875, -12.587890625, -11.989501953125, -11.39111328125, -10.792724609375, -10.1943359375, -9.595947265625, -8.99755859375, -8.399169921875, -7.80078125, -7.202392578125, -6.60400390625, -6.005615234375, -5.4072265625, -4.808837890625, -4.21044921875, -3.612060546875, -3.013671875, -2.415283203125, -1.81689453125, -1.218505859375, -0.6201171875, -0.021728515625, 0.57666015625, 1.175048828125, 1.7734375, 2.371826171875, 2.97021484375, 3.568603515625, 4.1669921875, 4.765380859375, 5.36376953125, 5.962158203125, 6.560546875, 7.158935546875, 7.75732421875, 8.355712890625, 8.9541015625, 9.552490234375, 10.15087890625, 10.749267578125, 11.34765625, 11.946044921875, 12.54443359375, 13.142822265625, 13.7412109375, 14.339599609375, 14.93798828125, 15.536376953125, 16.134765625, 16.733154296875, 17.33154296875, 17.929931640625, 18.5283203125, 19.126708984375, 19.72509765625, 20.323486328125, 20.921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 10.0, 11.0, 19.0, 21.0, 43.0, 51.0, 106.0, 167.0, 193.0, 138.0, 80.0, 49.0, 25.0, 20.0, 22.0, 9.0, 11.0, 5.0, 2.0, 6.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0109100341796875, -0.010509371757507324, -0.010108709335327148, -0.009708046913146973, -0.009307384490966797, -0.008906722068786621, -0.008506059646606445, -0.00810539722442627, -0.007704734802246094, -0.007304072380065918, -0.006903409957885742, -0.006502747535705566, -0.006102085113525391, -0.005701422691345215, -0.005300760269165039, -0.004900097846984863, -0.0044994354248046875, -0.004098773002624512, -0.003698110580444336, -0.00329744815826416, -0.0028967857360839844, -0.0024961233139038086, -0.002095460891723633, -0.001694798469543457, -0.0012941360473632812, -0.0008934736251831055, -0.0004928112030029297, -9.21487808227539e-05, 0.0003085136413574219, 0.0007091760635375977, 0.0011098384857177734, 0.0015105009078979492, 0.001911163330078125, 0.0023118257522583008, 0.0027124881744384766, 0.0031131505966186523, 0.003513813018798828, 0.003914475440979004, 0.00431513786315918, 0.0047158002853393555, 0.005116462707519531, 0.005517125129699707, 0.005917787551879883, 0.006318449974060059, 0.006719112396240234, 0.00711977481842041, 0.007520437240600586, 0.007921099662780762, 0.008321762084960938, 0.008722424507141113, 0.009123086929321289, 0.009523749351501465, 0.00992441177368164, 0.010325074195861816, 0.010725736618041992, 0.011126399040222168, 0.011527061462402344, 0.01192772388458252, 0.012328386306762695, 0.012729048728942871, 0.013129711151123047, 0.013530373573303223, 0.013931035995483398, 0.014331698417663574, 0.01473236083984375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 7.0, 2.0, 8.0, 6.0, 14.0, 23.0, 32.0, 47.0, 57.0, 99.0, 126.0, 139.0, 214.0, 294.0, 447.0, 635.0, 961.0, 1454.0, 2228.0, 3488.0, 5456.0, 8998.0, 15452.0, 28021.0, 53898.0, 122910.0, 323168.0, 270496.0, 101860.0, 47224.0, 24509.0, 13869.0, 8089.0, 4999.0, 3096.0, 2011.0, 1334.0, 862.0, 609.0, 445.0, 300.0, 192.0, 129.0, 98.0, 69.0, 61.0, 29.0, 26.0, 26.0, 11.0, 7.0, 14.0, 5.0, 7.0, 3.0, 3.0, 2.0], "bins": [-7.60546875, -7.381103515625, -7.15673828125, -6.932373046875, -6.7080078125, -6.483642578125, -6.25927734375, -6.034912109375, -5.810546875, -5.586181640625, -5.36181640625, -5.137451171875, -4.9130859375, -4.688720703125, -4.46435546875, -4.239990234375, -4.015625, -3.791259765625, -3.56689453125, -3.342529296875, -3.1181640625, -2.893798828125, -2.66943359375, -2.445068359375, -2.220703125, -1.996337890625, -1.77197265625, -1.547607421875, -1.3232421875, -1.098876953125, -0.87451171875, -0.650146484375, -0.42578125, -0.201416015625, 0.02294921875, 0.247314453125, 0.4716796875, 0.696044921875, 0.92041015625, 1.144775390625, 1.369140625, 1.593505859375, 1.81787109375, 2.042236328125, 2.2666015625, 2.490966796875, 2.71533203125, 2.939697265625, 3.1640625, 3.388427734375, 3.61279296875, 3.837158203125, 4.0615234375, 4.285888671875, 4.51025390625, 4.734619140625, 4.958984375, 5.183349609375, 5.40771484375, 5.632080078125, 5.8564453125, 6.080810546875, 6.30517578125, 6.529541015625, 6.75390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 4.0, 5.0, 7.0, 5.0, 12.0, 13.0, 12.0, 22.0, 20.0, 24.0, 34.0, 47.0, 46.0, 48.0, 57.0, 60.0, 82.0, 62.0, 60.0, 62.0, 64.0, 42.0, 29.0, 27.0, 39.0, 15.0, 19.0, 17.0, 15.0, 11.0, 10.0, 8.0, 2.0, 4.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.33984375, -2.274261474609375, -2.20867919921875, -2.143096923828125, -2.0775146484375, -2.011932373046875, -1.94635009765625, -1.880767822265625, -1.815185546875, -1.749603271484375, -1.68402099609375, -1.618438720703125, -1.5528564453125, -1.487274169921875, -1.42169189453125, -1.356109619140625, -1.29052734375, -1.224945068359375, -1.15936279296875, -1.093780517578125, -1.0281982421875, -0.962615966796875, -0.89703369140625, -0.831451416015625, -0.765869140625, -0.700286865234375, -0.63470458984375, -0.569122314453125, -0.5035400390625, -0.437957763671875, -0.37237548828125, -0.306793212890625, -0.2412109375, -0.175628662109375, -0.11004638671875, -0.044464111328125, 0.0211181640625, 0.086700439453125, 0.15228271484375, 0.217864990234375, 0.283447265625, 0.349029541015625, 0.41461181640625, 0.480194091796875, 0.5457763671875, 0.611358642578125, 0.67694091796875, 0.742523193359375, 0.80810546875, 0.873687744140625, 0.93927001953125, 1.004852294921875, 1.0704345703125, 1.136016845703125, 1.20159912109375, 1.267181396484375, 1.332763671875, 1.398345947265625, 1.46392822265625, 1.529510498046875, 1.5950927734375, 1.660675048828125, 1.72625732421875, 1.791839599609375, 1.857421875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 10.0, 8.0, 11.0, 12.0, 11.0, 18.0, 22.0, 24.0, 36.0, 52.0, 74.0, 85.0, 104.0, 107.0, 110.0, 76.0, 63.0, 42.0, 39.0, 28.0, 11.0, 8.0, 15.0, 11.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-90.31333923339844, -87.32707214355469, -84.3407974243164, -81.35453033447266, -78.36825561523438, -75.38198852539062, -72.39572143554688, -69.40945434570312, -66.42317962646484, -63.43690872192383, -60.45063781738281, -57.46437072753906, -54.47809982299805, -51.49182891845703, -48.50556182861328, -45.519290924072266, -42.53302001953125, -39.546749114990234, -36.56047821044922, -33.57421112060547, -30.587940216064453, -27.601669311523438, -24.615400314331055, -21.629131317138672, -18.642860412597656, -15.656590461730957, -12.670320510864258, -9.684050559997559, -6.697780609130859, -3.71151065826416, -0.7252407073974609, 2.261028289794922, 5.247291564941406, 8.233561515808105, 11.219831466674805, 14.206101417541504, 17.192371368408203, 20.17864227294922, 23.1649112701416, 26.151180267333984, 29.137451171875, 32.123722076416016, 35.10999298095703, 38.09626007080078, 41.0825309753418, 44.06880187988281, 47.05506896972656, 50.04133987426758, 53.027610778808594, 56.01388168334961, 59.000152587890625, 61.986419677734375, 64.97268676757812, 67.9589614868164, 70.94522857666016, 73.93150329589844, 76.91777038574219, 79.90403747558594, 82.89031219482422, 85.87657928466797, 88.86285400390625, 91.84912109375, 94.83538818359375, 97.8216552734375, 100.80792999267578]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 6.0, 8.0, 14.0, 9.0, 3.0, 11.0, 13.0, 14.0, 13.0, 21.0, 22.0, 23.0, 34.0, 35.0, 34.0, 30.0, 44.0, 42.0, 43.0, 43.0, 39.0, 39.0, 41.0, 42.0, 46.0, 30.0, 28.0, 42.0, 24.0, 34.0, 22.0, 21.0, 19.0, 17.0, 16.0, 18.0, 11.0, 8.0, 8.0, 8.0, 10.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-61.97907257080078, -60.09901809692383, -58.21896743774414, -56.33891296386719, -54.4588623046875, -52.57880783081055, -50.698753356933594, -48.818702697753906, -46.93865203857422, -45.058597564697266, -43.17854690551758, -41.298492431640625, -39.41844177246094, -37.538387298583984, -35.65833282470703, -33.778282165527344, -31.89822769165039, -30.01817512512207, -28.13812255859375, -26.258068084716797, -24.37801742553711, -22.497962951660156, -20.617910385131836, -18.737857818603516, -16.857805252075195, -14.977752685546875, -13.097700119018555, -11.217646598815918, -9.337594032287598, -7.457541465759277, -5.577487945556641, -3.6974353790283203, -1.8173866271972656, 0.06266617774963379, 1.9427189826965332, 3.8227720260620117, 5.702824592590332, 7.582877159118652, 9.462930679321289, 11.34298324584961, 13.22303581237793, 15.10308837890625, 16.98314094543457, 18.86319351196289, 20.743247985839844, 22.62329864501953, 24.503353118896484, 26.383405685424805, 28.263458251953125, 30.143510818481445, 32.023563385009766, 33.90361785888672, 35.783668518066406, 37.66372299194336, 39.54377746582031, 41.423828125, 43.30387878417969, 45.18393325805664, 47.06398391723633, 48.94403839111328, 50.82408905029297, 52.70414352416992, 54.584197998046875, 56.46424865722656, 58.344303131103516]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 11.0, 7.0, 8.0, 13.0, 17.0, 23.0, 29.0, 35.0, 67.0, 88.0, 115.0, 171.0, 192.0, 332.0, 449.0, 619.0, 839.0, 1197.0, 1637.0, 2352.0, 3245.0, 4653.0, 6610.0, 9804.0, 14832.0, 23296.0, 36802.0, 62077.0, 107403.0, 189793.0, 230199.0, 140221.0, 79113.0, 46716.0, 28566.0, 18159.0, 11967.0, 8089.0, 5464.0, 3868.0, 2590.0, 1944.0, 1401.0, 1018.0, 728.0, 521.0, 373.0, 258.0, 184.0, 134.0, 104.0, 74.0, 51.0, 35.0, 37.0, 18.0, 8.0, 4.0, 7.0, 1.0, 2.0, 2.0], "bins": [-56.125, -54.3837890625, -52.642578125, -50.9013671875, -49.16015625, -47.4189453125, -45.677734375, -43.9365234375, -42.1953125, -40.4541015625, -38.712890625, -36.9716796875, -35.23046875, -33.4892578125, -31.748046875, -30.0068359375, -28.265625, -26.5244140625, -24.783203125, -23.0419921875, -21.30078125, -19.5595703125, -17.818359375, -16.0771484375, -14.3359375, -12.5947265625, -10.853515625, -9.1123046875, -7.37109375, -5.6298828125, -3.888671875, -2.1474609375, -0.40625, 1.3349609375, 3.076171875, 4.8173828125, 6.55859375, 8.2998046875, 10.041015625, 11.7822265625, 13.5234375, 15.2646484375, 17.005859375, 18.7470703125, 20.48828125, 22.2294921875, 23.970703125, 25.7119140625, 27.453125, 29.1943359375, 30.935546875, 32.6767578125, 34.41796875, 36.1591796875, 37.900390625, 39.6416015625, 41.3828125, 43.1240234375, 44.865234375, 46.6064453125, 48.34765625, 50.0888671875, 51.830078125, 53.5712890625, 55.3125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 0.0, 9.0, 14.0, 10.0, 4.0, 8.0, 11.0, 13.0, 17.0, 11.0, 23.0, 22.0, 29.0, 28.0, 30.0, 33.0, 45.0, 45.0, 44.0, 52.0, 39.0, 60.0, 46.0, 46.0, 47.0, 37.0, 31.0, 36.0, 28.0, 20.0, 24.0, 22.0, 18.0, 14.0, 20.0, 13.0, 11.0, 6.0, 10.0, 7.0, 6.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-64.625, -62.67578125, -60.7265625, -58.77734375, -56.828125, -54.87890625, -52.9296875, -50.98046875, -49.03125, -47.08203125, -45.1328125, -43.18359375, -41.234375, -39.28515625, -37.3359375, -35.38671875, -33.4375, -31.48828125, -29.5390625, -27.58984375, -25.640625, -23.69140625, -21.7421875, -19.79296875, -17.84375, -15.89453125, -13.9453125, -11.99609375, -10.046875, -8.09765625, -6.1484375, -4.19921875, -2.25, -0.30078125, 1.6484375, 3.59765625, 5.546875, 7.49609375, 9.4453125, 11.39453125, 13.34375, 15.29296875, 17.2421875, 19.19140625, 21.140625, 23.08984375, 25.0390625, 26.98828125, 28.9375, 30.88671875, 32.8359375, 34.78515625, 36.734375, 38.68359375, 40.6328125, 42.58203125, 44.53125, 46.48046875, 48.4296875, 50.37890625, 52.328125, 54.27734375, 56.2265625, 58.17578125, 60.125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 10.0, 8.0, 21.0, 36.0, 30.0, 70.0, 95.0, 129.0, 188.0, 293.0, 378.0, 613.0, 964.0, 1368.0, 2149.0, 3299.0, 4962.0, 7663.0, 12243.0, 19353.0, 31074.0, 52935.0, 93617.0, 176373.0, 259329.0, 164268.0, 87096.0, 49309.0, 29634.0, 18439.0, 11450.0, 7314.0, 4662.0, 3155.0, 1983.0, 1338.0, 866.0, 581.0, 422.0, 269.0, 184.0, 128.0, 83.0, 51.0, 47.0, 33.0, 12.0, 13.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-73.875, -71.525390625, -69.17578125, -66.826171875, -64.4765625, -62.126953125, -59.77734375, -57.427734375, -55.078125, -52.728515625, -50.37890625, -48.029296875, -45.6796875, -43.330078125, -40.98046875, -38.630859375, -36.28125, -33.931640625, -31.58203125, -29.232421875, -26.8828125, -24.533203125, -22.18359375, -19.833984375, -17.484375, -15.134765625, -12.78515625, -10.435546875, -8.0859375, -5.736328125, -3.38671875, -1.037109375, 1.3125, 3.662109375, 6.01171875, 8.361328125, 10.7109375, 13.060546875, 15.41015625, 17.759765625, 20.109375, 22.458984375, 24.80859375, 27.158203125, 29.5078125, 31.857421875, 34.20703125, 36.556640625, 38.90625, 41.255859375, 43.60546875, 45.955078125, 48.3046875, 50.654296875, 53.00390625, 55.353515625, 57.703125, 60.052734375, 62.40234375, 64.751953125, 67.1015625, 69.451171875, 71.80078125, 74.150390625, 76.5]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 7.0, 7.0, 10.0, 16.0, 20.0, 11.0, 17.0, 20.0, 17.0, 29.0, 16.0, 28.0, 49.0, 36.0, 41.0, 40.0, 39.0, 41.0, 32.0, 33.0, 53.0, 43.0, 42.0, 49.0, 44.0, 28.0, 25.0, 27.0, 36.0, 20.0, 18.0, 18.0, 16.0, 13.0, 17.0, 9.0, 9.0, 4.0, 3.0, 3.0, 6.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.6875, -39.47216796875, -38.2568359375, -37.04150390625, -35.826171875, -34.61083984375, -33.3955078125, -32.18017578125, -30.96484375, -29.74951171875, -28.5341796875, -27.31884765625, -26.103515625, -24.88818359375, -23.6728515625, -22.45751953125, -21.2421875, -20.02685546875, -18.8115234375, -17.59619140625, -16.380859375, -15.16552734375, -13.9501953125, -12.73486328125, -11.51953125, -10.30419921875, -9.0888671875, -7.87353515625, -6.658203125, -5.44287109375, -4.2275390625, -3.01220703125, -1.796875, -0.58154296875, 0.6337890625, 1.84912109375, 3.064453125, 4.27978515625, 5.4951171875, 6.71044921875, 7.92578125, 9.14111328125, 10.3564453125, 11.57177734375, 12.787109375, 14.00244140625, 15.2177734375, 16.43310546875, 17.6484375, 18.86376953125, 20.0791015625, 21.29443359375, 22.509765625, 23.72509765625, 24.9404296875, 26.15576171875, 27.37109375, 28.58642578125, 29.8017578125, 31.01708984375, 32.232421875, 33.44775390625, 34.6630859375, 35.87841796875, 37.09375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 11.0, 13.0, 28.0, 31.0, 50.0, 62.0, 115.0, 169.0, 230.0, 337.0, 494.0, 853.0, 1206.0, 1815.0, 2819.0, 4538.0, 7407.0, 12567.0, 22327.0, 41592.0, 85897.0, 204944.0, 349283.0, 159600.0, 69540.0, 35007.0, 18955.0, 10650.0, 6570.0, 3948.0, 2575.0, 1621.0, 1074.0, 723.0, 486.0, 350.0, 212.0, 142.0, 102.0, 68.0, 42.0, 34.0, 22.0, 10.0, 12.0, 7.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.109375, -24.308837890625, -23.50830078125, -22.707763671875, -21.9072265625, -21.106689453125, -20.30615234375, -19.505615234375, -18.705078125, -17.904541015625, -17.10400390625, -16.303466796875, -15.5029296875, -14.702392578125, -13.90185546875, -13.101318359375, -12.30078125, -11.500244140625, -10.69970703125, -9.899169921875, -9.0986328125, -8.298095703125, -7.49755859375, -6.697021484375, -5.896484375, -5.095947265625, -4.29541015625, -3.494873046875, -2.6943359375, -1.893798828125, -1.09326171875, -0.292724609375, 0.5078125, 1.308349609375, 2.10888671875, 2.909423828125, 3.7099609375, 4.510498046875, 5.31103515625, 6.111572265625, 6.912109375, 7.712646484375, 8.51318359375, 9.313720703125, 10.1142578125, 10.914794921875, 11.71533203125, 12.515869140625, 13.31640625, 14.116943359375, 14.91748046875, 15.718017578125, 16.5185546875, 17.319091796875, 18.11962890625, 18.920166015625, 19.720703125, 20.521240234375, 21.32177734375, 22.122314453125, 22.9228515625, 23.723388671875, 24.52392578125, 25.324462890625, 26.125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 8.0, 7.0, 4.0, 6.0, 9.0, 10.0, 14.0, 20.0, 18.0, 19.0, 27.0, 47.0, 56.0, 84.0, 121.0, 127.0, 107.0, 68.0, 60.0, 46.0, 30.0, 18.0, 20.0, 14.0, 11.0, 9.0, 13.0, 4.0, 4.0, 9.0, 4.0, 0.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00307464599609375, -0.0029824376106262207, -0.0028902292251586914, -0.002798020839691162, -0.002705812454223633, -0.0026136040687561035, -0.0025213956832885742, -0.002429187297821045, -0.0023369789123535156, -0.0022447705268859863, -0.002152562141418457, -0.0020603537559509277, -0.0019681453704833984, -0.0018759369850158691, -0.0017837285995483398, -0.0016915202140808105, -0.0015993118286132812, -0.001507103443145752, -0.0014148950576782227, -0.0013226866722106934, -0.001230478286743164, -0.0011382699012756348, -0.0010460615158081055, -0.0009538531303405762, -0.0008616447448730469, -0.0007694363594055176, -0.0006772279739379883, -0.000585019588470459, -0.0004928112030029297, -0.0004006028175354004, -0.0003083944320678711, -0.0002161860466003418, -0.0001239776611328125, -3.17692756652832e-05, 6.0439109802246094e-05, 0.0001526474952697754, 0.0002448558807373047, 0.000337064266204834, 0.0004292726516723633, 0.0005214810371398926, 0.0006136894226074219, 0.0007058978080749512, 0.0007981061935424805, 0.0008903145790100098, 0.000982522964477539, 0.0010747313499450684, 0.0011669397354125977, 0.001259148120880127, 0.0013513565063476562, 0.0014435648918151855, 0.0015357732772827148, 0.0016279816627502441, 0.0017201900482177734, 0.0018123984336853027, 0.001904606819152832, 0.0019968152046203613, 0.0020890235900878906, 0.00218123197555542, 0.0022734403610229492, 0.0023656487464904785, 0.002457857131958008, 0.002550065517425537, 0.0026422739028930664, 0.0027344822883605957, 0.002826690673828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 1.0, 2.0, 4.0, 14.0, 14.0, 24.0, 35.0, 29.0, 55.0, 75.0, 110.0, 156.0, 261.0, 346.0, 460.0, 736.0, 1108.0, 1740.0, 2711.0, 4487.0, 7552.0, 13167.0, 23971.0, 47476.0, 102829.0, 249473.0, 321777.0, 138656.0, 61541.0, 30030.0, 15892.0, 9004.0, 5419.0, 3294.0, 2072.0, 1373.0, 824.0, 566.0, 361.0, 276.0, 158.0, 149.0, 85.0, 75.0, 36.0, 40.0, 35.0, 25.0, 12.0, 5.0, 2.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-24.421875, -23.662841796875, -22.90380859375, -22.144775390625, -21.3857421875, -20.626708984375, -19.86767578125, -19.108642578125, -18.349609375, -17.590576171875, -16.83154296875, -16.072509765625, -15.3134765625, -14.554443359375, -13.79541015625, -13.036376953125, -12.27734375, -11.518310546875, -10.75927734375, -10.000244140625, -9.2412109375, -8.482177734375, -7.72314453125, -6.964111328125, -6.205078125, -5.446044921875, -4.68701171875, -3.927978515625, -3.1689453125, -2.409912109375, -1.65087890625, -0.891845703125, -0.1328125, 0.626220703125, 1.38525390625, 2.144287109375, 2.9033203125, 3.662353515625, 4.42138671875, 5.180419921875, 5.939453125, 6.698486328125, 7.45751953125, 8.216552734375, 8.9755859375, 9.734619140625, 10.49365234375, 11.252685546875, 12.01171875, 12.770751953125, 13.52978515625, 14.288818359375, 15.0478515625, 15.806884765625, 16.56591796875, 17.324951171875, 18.083984375, 18.843017578125, 19.60205078125, 20.361083984375, 21.1201171875, 21.879150390625, 22.63818359375, 23.397216796875, 24.15625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 10.0, 10.0, 9.0, 10.0, 8.0, 20.0, 20.0, 15.0, 28.0, 40.0, 41.0, 40.0, 46.0, 61.0, 62.0, 58.0, 64.0, 71.0, 59.0, 48.0, 46.0, 42.0, 33.0, 24.0, 37.0, 25.0, 18.0, 11.0, 9.0, 10.0, 6.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1484375, -7.9169921875, -7.685546875, -7.4541015625, -7.22265625, -6.9912109375, -6.759765625, -6.5283203125, -6.296875, -6.0654296875, -5.833984375, -5.6025390625, -5.37109375, -5.1396484375, -4.908203125, -4.6767578125, -4.4453125, -4.2138671875, -3.982421875, -3.7509765625, -3.51953125, -3.2880859375, -3.056640625, -2.8251953125, -2.59375, -2.3623046875, -2.130859375, -1.8994140625, -1.66796875, -1.4365234375, -1.205078125, -0.9736328125, -0.7421875, -0.5107421875, -0.279296875, -0.0478515625, 0.18359375, 0.4150390625, 0.646484375, 0.8779296875, 1.109375, 1.3408203125, 1.572265625, 1.8037109375, 2.03515625, 2.2666015625, 2.498046875, 2.7294921875, 2.9609375, 3.1923828125, 3.423828125, 3.6552734375, 3.88671875, 4.1181640625, 4.349609375, 4.5810546875, 4.8125, 5.0439453125, 5.275390625, 5.5068359375, 5.73828125, 5.9697265625, 6.201171875, 6.4326171875, 6.6640625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 7.0, 11.0, 14.0, 13.0, 14.0, 21.0, 38.0, 39.0, 48.0, 62.0, 94.0, 112.0, 109.0, 101.0, 77.0, 56.0, 47.0, 29.0, 23.0, 17.0, 17.0, 11.0, 8.0, 5.0, 11.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.94277954101562, -82.0176773071289, -79.09258270263672, -76.16748046875, -73.24238586425781, -70.3172836303711, -67.39218139648438, -64.46708679199219, -61.541988372802734, -58.61688995361328, -55.69179153442383, -52.766693115234375, -49.841590881347656, -46.91649627685547, -43.99139404296875, -41.0662956237793, -38.141197204589844, -35.21609878540039, -32.29100036621094, -29.36590003967285, -26.4408016204834, -23.515703201293945, -20.59060287475586, -17.665504455566406, -14.740406036376953, -11.8153076171875, -8.89020824432373, -5.965108871459961, -3.040010452270508, -0.11491203308105469, 2.8101882934570312, 5.735286712646484, 8.660385131835938, 11.58548355102539, 14.51058292388916, 17.43568229675293, 20.360780715942383, 23.285879135131836, 26.210979461669922, 29.136077880859375, 32.06117630004883, 34.98627471923828, 37.911373138427734, 40.83647155761719, 43.761573791503906, 46.686668395996094, 49.61177062988281, 52.536869049072266, 55.46196746826172, 58.38706588745117, 61.312164306640625, 64.23726654052734, 67.16236114501953, 70.08746337890625, 73.01255798339844, 75.93766021728516, 78.86276245117188, 81.7878646850586, 84.71295928955078, 87.6380615234375, 90.56315612792969, 93.4882583618164, 96.41336059570312, 99.33845520019531, 102.2635498046875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 6.0, 9.0, 4.0, 9.0, 4.0, 9.0, 11.0, 18.0, 22.0, 13.0, 21.0, 20.0, 30.0, 41.0, 40.0, 36.0, 43.0, 34.0, 39.0, 46.0, 35.0, 26.0, 42.0, 31.0, 41.0, 37.0, 32.0, 29.0, 39.0, 27.0, 23.0, 24.0, 22.0, 23.0, 13.0, 24.0, 12.0, 13.0, 11.0, 11.0, 9.0, 3.0, 3.0, 1.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-62.063899993896484, -60.25804138183594, -58.452186584472656, -56.646331787109375, -54.84047317504883, -53.03461456298828, -51.228759765625, -49.42290496826172, -47.61704635620117, -45.811187744140625, -44.005332946777344, -42.19947814941406, -40.393619537353516, -38.58776092529297, -36.78190612792969, -34.976051330566406, -33.17019271850586, -31.364336013793945, -29.55847930908203, -27.752622604370117, -25.946765899658203, -24.14090919494629, -22.335052490234375, -20.52919578552246, -18.723339080810547, -16.917482376098633, -15.111625671386719, -13.305768966674805, -11.49991226196289, -9.694055557250977, -7.8881988525390625, -6.082342147827148, -4.276485443115234, -2.4706287384033203, -0.6647720336914062, 1.1410846710205078, 2.946941375732422, 4.752798080444336, 6.55865478515625, 8.364511489868164, 10.170368194580078, 11.976224899291992, 13.782081604003906, 15.58793830871582, 17.393795013427734, 19.19965171813965, 21.005508422851562, 22.811365127563477, 24.61722183227539, 26.423078536987305, 28.22893524169922, 30.034791946411133, 31.840648651123047, 33.646507263183594, 35.452362060546875, 37.258216857910156, 39.0640754699707, 40.86993408203125, 42.67578887939453, 44.48164367675781, 46.28750228881836, 48.093360900878906, 49.89921569824219, 51.70507049560547, 53.510929107666016]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 7.0, 21.0, 12.0, 18.0, 21.0, 40.0, 50.0, 84.0, 84.0, 136.0, 185.0, 268.0, 399.0, 595.0, 862.0, 1369.0, 2142.0, 3378.0, 5803.0, 10013.0, 20067.0, 56019.0, 285590.0, 1523091.0, 1841127.0, 328792.0, 66079.0, 21586.0, 10408.0, 5894.0, 3518.0, 2325.0, 1398.0, 951.0, 618.0, 392.0, 290.0, 206.0, 119.0, 73.0, 68.0, 45.0, 40.0, 34.0, 15.0, 5.0, 8.0, 9.0, 6.0, 4.0, 6.0, 5.0, 1.0], "bins": [-120.875, -117.4267578125, -113.978515625, -110.5302734375, -107.08203125, -103.6337890625, -100.185546875, -96.7373046875, -93.2890625, -89.8408203125, -86.392578125, -82.9443359375, -79.49609375, -76.0478515625, -72.599609375, -69.1513671875, -65.703125, -62.2548828125, -58.806640625, -55.3583984375, -51.91015625, -48.4619140625, -45.013671875, -41.5654296875, -38.1171875, -34.6689453125, -31.220703125, -27.7724609375, -24.32421875, -20.8759765625, -17.427734375, -13.9794921875, -10.53125, -7.0830078125, -3.634765625, -0.1865234375, 3.26171875, 6.7099609375, 10.158203125, 13.6064453125, 17.0546875, 20.5029296875, 23.951171875, 27.3994140625, 30.84765625, 34.2958984375, 37.744140625, 41.1923828125, 44.640625, 48.0888671875, 51.537109375, 54.9853515625, 58.43359375, 61.8818359375, 65.330078125, 68.7783203125, 72.2265625, 75.6748046875, 79.123046875, 82.5712890625, 86.01953125, 89.4677734375, 92.916015625, 96.3642578125, 99.8125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 5.0, 6.0, 7.0, 5.0, 7.0, 14.0, 15.0, 10.0, 23.0, 16.0, 18.0, 19.0, 30.0, 39.0, 29.0, 42.0, 56.0, 40.0, 46.0, 47.0, 32.0, 40.0, 36.0, 42.0, 44.0, 31.0, 35.0, 38.0, 28.0, 31.0, 28.0, 13.0, 17.0, 17.0, 20.0, 9.0, 17.0, 5.0, 12.0, 13.0, 6.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-57.3125, -55.6328125, -53.953125, -52.2734375, -50.59375, -48.9140625, -47.234375, -45.5546875, -43.875, -42.1953125, -40.515625, -38.8359375, -37.15625, -35.4765625, -33.796875, -32.1171875, -30.4375, -28.7578125, -27.078125, -25.3984375, -23.71875, -22.0390625, -20.359375, -18.6796875, -17.0, -15.3203125, -13.640625, -11.9609375, -10.28125, -8.6015625, -6.921875, -5.2421875, -3.5625, -1.8828125, -0.203125, 1.4765625, 3.15625, 4.8359375, 6.515625, 8.1953125, 9.875, 11.5546875, 13.234375, 14.9140625, 16.59375, 18.2734375, 19.953125, 21.6328125, 23.3125, 24.9921875, 26.671875, 28.3515625, 30.03125, 31.7109375, 33.390625, 35.0703125, 36.75, 38.4296875, 40.109375, 41.7890625, 43.46875, 45.1484375, 46.828125, 48.5078125, 50.1875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 11.0, 9.0, 17.0, 34.0, 36.0, 48.0, 51.0, 93.0, 108.0, 205.0, 275.0, 430.0, 596.0, 1048.0, 1497.0, 2428.0, 3990.0, 6548.0, 11268.0, 20502.0, 40339.0, 93729.0, 315349.0, 2183670.0, 1163809.0, 203724.0, 70404.0, 32446.0, 17036.0, 9339.0, 5665.0, 3438.0, 2184.0, 1436.0, 849.0, 542.0, 358.0, 235.0, 159.0, 114.0, 82.0, 49.0, 42.0, 16.0, 25.0, 16.0, 14.0, 8.0, 3.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0], "bins": [-123.8125, -120.04296875, -116.2734375, -112.50390625, -108.734375, -104.96484375, -101.1953125, -97.42578125, -93.65625, -89.88671875, -86.1171875, -82.34765625, -78.578125, -74.80859375, -71.0390625, -67.26953125, -63.5, -59.73046875, -55.9609375, -52.19140625, -48.421875, -44.65234375, -40.8828125, -37.11328125, -33.34375, -29.57421875, -25.8046875, -22.03515625, -18.265625, -14.49609375, -10.7265625, -6.95703125, -3.1875, 0.58203125, 4.3515625, 8.12109375, 11.890625, 15.66015625, 19.4296875, 23.19921875, 26.96875, 30.73828125, 34.5078125, 38.27734375, 42.046875, 45.81640625, 49.5859375, 53.35546875, 57.125, 60.89453125, 64.6640625, 68.43359375, 72.203125, 75.97265625, 79.7421875, 83.51171875, 87.28125, 91.05078125, 94.8203125, 98.58984375, 102.359375, 106.12890625, 109.8984375, 113.66796875, 117.4375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 10.0, 14.0, 13.0, 12.0, 18.0, 24.0, 17.0, 28.0, 45.0, 69.0, 87.0, 96.0, 163.0, 294.0, 423.0, 656.0, 717.0, 471.0, 298.0, 187.0, 100.0, 73.0, 58.0, 54.0, 26.0, 37.0, 16.0, 11.0, 17.0, 10.0, 6.0, 9.0, 7.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.125, -37.97802734375, -36.8310546875, -35.68408203125, -34.537109375, -33.39013671875, -32.2431640625, -31.09619140625, -29.94921875, -28.80224609375, -27.6552734375, -26.50830078125, -25.361328125, -24.21435546875, -23.0673828125, -21.92041015625, -20.7734375, -19.62646484375, -18.4794921875, -17.33251953125, -16.185546875, -15.03857421875, -13.8916015625, -12.74462890625, -11.59765625, -10.45068359375, -9.3037109375, -8.15673828125, -7.009765625, -5.86279296875, -4.7158203125, -3.56884765625, -2.421875, -1.27490234375, -0.1279296875, 1.01904296875, 2.166015625, 3.31298828125, 4.4599609375, 5.60693359375, 6.75390625, 7.90087890625, 9.0478515625, 10.19482421875, 11.341796875, 12.48876953125, 13.6357421875, 14.78271484375, 15.9296875, 17.07666015625, 18.2236328125, 19.37060546875, 20.517578125, 21.66455078125, 22.8115234375, 23.95849609375, 25.10546875, 26.25244140625, 27.3994140625, 28.54638671875, 29.693359375, 30.84033203125, 31.9873046875, 33.13427734375, 34.28125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 7.0, 7.0, 6.0, 4.0, 8.0, 14.0, 23.0, 22.0, 32.0, 31.0, 51.0, 70.0, 82.0, 112.0, 96.0, 100.0, 74.0, 61.0, 37.0, 41.0, 28.0, 21.0, 12.0, 14.0, 13.0, 9.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.39539337158203, -62.81571960449219, -60.236045837402344, -57.656368255615234, -55.07669448852539, -52.49702072143555, -49.91734313964844, -47.337669372558594, -44.75799560546875, -42.178321838378906, -39.59864807128906, -37.01897048950195, -34.43929672241211, -31.859622955322266, -29.27994728088379, -26.700271606445312, -24.12059783935547, -21.540924072265625, -18.96124839782715, -16.381572723388672, -13.801898956298828, -11.222224235534668, -8.642549514770508, -6.062873840332031, -3.4832000732421875, -0.9035253524780273, 1.6761493682861328, 4.255824089050293, 6.835498809814453, 9.415173530578613, 11.994848251342773, 14.57452392578125, 17.154205322265625, 19.73387908935547, 22.313554763793945, 24.893230438232422, 27.472904205322266, 30.05257797241211, 32.63225555419922, 35.21192932128906, 37.791603088378906, 40.37127685546875, 42.950950622558594, 45.5306282043457, 48.11030197143555, 50.68997573852539, 53.2696533203125, 55.849327087402344, 58.42900085449219, 61.00867462158203, 63.588348388671875, 66.16802215576172, 68.74769592285156, 71.32737731933594, 73.90705108642578, 76.48672485351562, 79.06639862060547, 81.64607238769531, 84.22574615478516, 86.805419921875, 89.38510131835938, 91.96477508544922, 94.54444885253906, 97.1241226196289, 99.70379638671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 6.0, 7.0, 11.0, 14.0, 17.0, 14.0, 16.0, 14.0, 21.0, 30.0, 41.0, 37.0, 40.0, 44.0, 43.0, 37.0, 52.0, 37.0, 41.0, 36.0, 42.0, 52.0, 36.0, 37.0, 27.0, 26.0, 29.0, 20.0, 23.0, 17.0, 20.0, 17.0, 21.0, 15.0, 8.0, 8.0, 9.0, 7.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.66313934326172, -53.819252014160156, -51.97536087036133, -50.131473541259766, -48.28758239746094, -46.443695068359375, -44.59980773925781, -42.755916595458984, -40.91202926635742, -39.06814193725586, -37.22425079345703, -35.38036346435547, -33.53647232055664, -31.692584991455078, -29.848695755004883, -28.004806518554688, -26.160917282104492, -24.317028045654297, -22.4731388092041, -20.629249572753906, -18.785362243652344, -16.94147300720215, -15.097583770751953, -13.253695487976074, -11.409806251525879, -9.565917015075684, -7.722028732299805, -5.878139495849609, -4.034250736236572, -2.190361976623535, -0.34647274017333984, 1.497415542602539, 3.3413047790527344, 5.1851935386657715, 7.029082298278809, 8.872971534729004, 10.716859817504883, 12.560749053955078, 14.404638290405273, 16.24852752685547, 18.09241485595703, 19.936304092407227, 21.780193328857422, 23.624080657958984, 25.46796989440918, 27.311859130859375, 29.15574836730957, 30.999637603759766, 32.843528747558594, 34.687416076660156, 36.531307220458984, 38.37519454956055, 40.219085693359375, 42.06297302246094, 43.9068603515625, 45.75075149536133, 47.59463882446289, 49.43852615356445, 51.28241729736328, 53.126304626464844, 54.97019577026367, 56.814083099365234, 58.65797424316406, 60.501861572265625, 62.34574890136719]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 10.0, 15.0, 18.0, 28.0, 29.0, 50.0, 69.0, 93.0, 149.0, 191.0, 268.0, 387.0, 624.0, 931.0, 1403.0, 2199.0, 3430.0, 5581.0, 9211.0, 15981.0, 27662.0, 51669.0, 105641.0, 226523.0, 287755.0, 150110.0, 70745.0, 36370.0, 20332.0, 11906.0, 7000.0, 4414.0, 2655.0, 1765.0, 1104.0, 722.0, 481.0, 320.0, 204.0, 159.0, 97.0, 74.0, 54.0, 41.0, 27.0, 13.0, 18.0, 7.0, 12.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.5, -39.16015625, -37.8203125, -36.48046875, -35.140625, -33.80078125, -32.4609375, -31.12109375, -29.78125, -28.44140625, -27.1015625, -25.76171875, -24.421875, -23.08203125, -21.7421875, -20.40234375, -19.0625, -17.72265625, -16.3828125, -15.04296875, -13.703125, -12.36328125, -11.0234375, -9.68359375, -8.34375, -7.00390625, -5.6640625, -4.32421875, -2.984375, -1.64453125, -0.3046875, 1.03515625, 2.375, 3.71484375, 5.0546875, 6.39453125, 7.734375, 9.07421875, 10.4140625, 11.75390625, 13.09375, 14.43359375, 15.7734375, 17.11328125, 18.453125, 19.79296875, 21.1328125, 22.47265625, 23.8125, 25.15234375, 26.4921875, 27.83203125, 29.171875, 30.51171875, 31.8515625, 33.19140625, 34.53125, 35.87109375, 37.2109375, 38.55078125, 39.890625, 41.23046875, 42.5703125, 43.91015625, 45.25]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 0.0, 4.0, 4.0, 6.0, 3.0, 3.0, 5.0, 13.0, 15.0, 10.0, 10.0, 11.0, 17.0, 24.0, 27.0, 39.0, 37.0, 37.0, 42.0, 38.0, 58.0, 35.0, 43.0, 45.0, 50.0, 56.0, 52.0, 42.0, 37.0, 34.0, 23.0, 21.0, 20.0, 18.0, 21.0, 17.0, 17.0, 15.0, 11.0, 12.0, 3.0, 6.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.21875, -55.3896484375, -53.560546875, -51.7314453125, -49.90234375, -48.0732421875, -46.244140625, -44.4150390625, -42.5859375, -40.7568359375, -38.927734375, -37.0986328125, -35.26953125, -33.4404296875, -31.611328125, -29.7822265625, -27.953125, -26.1240234375, -24.294921875, -22.4658203125, -20.63671875, -18.8076171875, -16.978515625, -15.1494140625, -13.3203125, -11.4912109375, -9.662109375, -7.8330078125, -6.00390625, -4.1748046875, -2.345703125, -0.5166015625, 1.3125, 3.1416015625, 4.970703125, 6.7998046875, 8.62890625, 10.4580078125, 12.287109375, 14.1162109375, 15.9453125, 17.7744140625, 19.603515625, 21.4326171875, 23.26171875, 25.0908203125, 26.919921875, 28.7490234375, 30.578125, 32.4072265625, 34.236328125, 36.0654296875, 37.89453125, 39.7236328125, 41.552734375, 43.3818359375, 45.2109375, 47.0400390625, 48.869140625, 50.6982421875, 52.52734375, 54.3564453125, 56.185546875, 58.0146484375, 59.84375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 9.0, 8.0, 20.0, 26.0, 20.0, 37.0, 52.0, 62.0, 90.0, 121.0, 194.0, 287.0, 409.0, 585.0, 888.0, 1365.0, 2045.0, 3108.0, 5291.0, 9013.0, 17725.0, 57607.0, 772324.0, 125551.0, 23524.0, 10947.0, 6253.0, 3898.0, 2355.0, 1559.0, 962.0, 674.0, 442.0, 317.0, 216.0, 159.0, 122.0, 81.0, 57.0, 39.0, 27.0, 18.0, 16.0, 17.0, 9.0, 9.0, 5.0, 1.0, 4.0, 1.0, 0.0, 3.0], "bins": [-80.9375, -78.6025390625, -76.267578125, -73.9326171875, -71.59765625, -69.2626953125, -66.927734375, -64.5927734375, -62.2578125, -59.9228515625, -57.587890625, -55.2529296875, -52.91796875, -50.5830078125, -48.248046875, -45.9130859375, -43.578125, -41.2431640625, -38.908203125, -36.5732421875, -34.23828125, -31.9033203125, -29.568359375, -27.2333984375, -24.8984375, -22.5634765625, -20.228515625, -17.8935546875, -15.55859375, -13.2236328125, -10.888671875, -8.5537109375, -6.21875, -3.8837890625, -1.548828125, 0.7861328125, 3.12109375, 5.4560546875, 7.791015625, 10.1259765625, 12.4609375, 14.7958984375, 17.130859375, 19.4658203125, 21.80078125, 24.1357421875, 26.470703125, 28.8056640625, 31.140625, 33.4755859375, 35.810546875, 38.1455078125, 40.48046875, 42.8154296875, 45.150390625, 47.4853515625, 49.8203125, 52.1552734375, 54.490234375, 56.8251953125, 59.16015625, 61.4951171875, 63.830078125, 66.1650390625, 68.5]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 9.0, 3.0, 11.0, 7.0, 7.0, 11.0, 14.0, 14.0, 25.0, 18.0, 21.0, 34.0, 37.0, 49.0, 32.0, 39.0, 51.0, 35.0, 42.0, 45.0, 58.0, 35.0, 23.0, 39.0, 39.0, 39.0, 31.0, 39.0, 25.0, 26.0, 27.0, 18.0, 23.0, 11.0, 16.0, 16.0, 6.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-51.46875, -49.71044921875, -47.9521484375, -46.19384765625, -44.435546875, -42.67724609375, -40.9189453125, -39.16064453125, -37.40234375, -35.64404296875, -33.8857421875, -32.12744140625, -30.369140625, -28.61083984375, -26.8525390625, -25.09423828125, -23.3359375, -21.57763671875, -19.8193359375, -18.06103515625, -16.302734375, -14.54443359375, -12.7861328125, -11.02783203125, -9.26953125, -7.51123046875, -5.7529296875, -3.99462890625, -2.236328125, -0.47802734375, 1.2802734375, 3.03857421875, 4.796875, 6.55517578125, 8.3134765625, 10.07177734375, 11.830078125, 13.58837890625, 15.3466796875, 17.10498046875, 18.86328125, 20.62158203125, 22.3798828125, 24.13818359375, 25.896484375, 27.65478515625, 29.4130859375, 31.17138671875, 32.9296875, 34.68798828125, 36.4462890625, 38.20458984375, 39.962890625, 41.72119140625, 43.4794921875, 45.23779296875, 46.99609375, 48.75439453125, 50.5126953125, 52.27099609375, 54.029296875, 55.78759765625, 57.5458984375, 59.30419921875, 61.0625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 10.0, 7.0, 8.0, 13.0, 14.0, 22.0, 35.0, 40.0, 65.0, 83.0, 122.0, 161.0, 224.0, 358.0, 544.0, 891.0, 1513.0, 2936.0, 6597.0, 18550.0, 106298.0, 834851.0, 51279.0, 12980.0, 5021.0, 2317.0, 1290.0, 790.0, 489.0, 314.0, 203.0, 147.0, 106.0, 68.0, 44.0, 47.0, 28.0, 22.0, 15.0, 15.0, 10.0, 10.0, 8.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.20703125, -5.988037109375, -5.76904296875, -5.550048828125, -5.3310546875, -5.112060546875, -4.89306640625, -4.674072265625, -4.455078125, -4.236083984375, -4.01708984375, -3.798095703125, -3.5791015625, -3.360107421875, -3.14111328125, -2.922119140625, -2.703125, -2.484130859375, -2.26513671875, -2.046142578125, -1.8271484375, -1.608154296875, -1.38916015625, -1.170166015625, -0.951171875, -0.732177734375, -0.51318359375, -0.294189453125, -0.0751953125, 0.143798828125, 0.36279296875, 0.581787109375, 0.80078125, 1.019775390625, 1.23876953125, 1.457763671875, 1.6767578125, 1.895751953125, 2.11474609375, 2.333740234375, 2.552734375, 2.771728515625, 2.99072265625, 3.209716796875, 3.4287109375, 3.647705078125, 3.86669921875, 4.085693359375, 4.3046875, 4.523681640625, 4.74267578125, 4.961669921875, 5.1806640625, 5.399658203125, 5.61865234375, 5.837646484375, 6.056640625, 6.275634765625, 6.49462890625, 6.713623046875, 6.9326171875, 7.151611328125, 7.37060546875, 7.589599609375, 7.80859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 1.0, 5.0, 8.0, 4.0, 8.0, 12.0, 12.0, 14.0, 29.0, 35.0, 48.0, 68.0, 82.0, 99.0, 135.0, 112.0, 79.0, 52.0, 45.0, 30.0, 28.0, 12.0, 22.0, 14.0, 8.0, 8.0, 6.0, 8.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0030670166015625, -0.0029805004596710205, -0.002893984317779541, -0.0028074681758880615, -0.002720952033996582, -0.0026344358921051025, -0.002547919750213623, -0.0024614036083221436, -0.002374887466430664, -0.0022883713245391846, -0.002201855182647705, -0.0021153390407562256, -0.002028822898864746, -0.0019423067569732666, -0.0018557906150817871, -0.0017692744731903076, -0.0016827583312988281, -0.0015962421894073486, -0.0015097260475158691, -0.0014232099056243896, -0.0013366937637329102, -0.0012501776218414307, -0.0011636614799499512, -0.0010771453380584717, -0.0009906291961669922, -0.0009041130542755127, -0.0008175969123840332, -0.0007310807704925537, -0.0006445646286010742, -0.0005580484867095947, -0.00047153234481811523, -0.00038501620292663574, -0.00029850006103515625, -0.00021198391914367676, -0.00012546777725219727, -3.8951635360717773e-05, 4.756450653076172e-05, 0.0001340806484222412, 0.0002205967903137207, 0.0003071129322052002, 0.0003936290740966797, 0.0004801452159881592, 0.0005666613578796387, 0.0006531774997711182, 0.0007396936416625977, 0.0008262097835540771, 0.0009127259254455566, 0.0009992420673370361, 0.0010857582092285156, 0.0011722743511199951, 0.0012587904930114746, 0.001345306634902954, 0.0014318227767944336, 0.001518338918685913, 0.0016048550605773926, 0.001691371202468872, 0.0017778873443603516, 0.001864403486251831, 0.0019509196281433105, 0.00203743577003479, 0.0021239519119262695, 0.002210468053817749, 0.0022969841957092285, 0.002383500337600708, 0.0024700164794921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 6.0, 5.0, 8.0, 13.0, 22.0, 32.0, 38.0, 56.0, 85.0, 120.0, 175.0, 231.0, 337.0, 538.0, 709.0, 1204.0, 1912.0, 3128.0, 5291.0, 9407.0, 18284.0, 37906.0, 92937.0, 284961.0, 368469.0, 125288.0, 47848.0, 22115.0, 11466.0, 6249.0, 3480.0, 2174.0, 1318.0, 882.0, 548.0, 377.0, 296.0, 196.0, 123.0, 96.0, 60.0, 47.0, 34.0, 28.0, 19.0, 14.0, 6.0, 10.0, 3.0, 5.0, 1.0, 1.0, 1.0], "bins": [-3.146484375, -3.05694580078125, -2.9674072265625, -2.87786865234375, -2.788330078125, -2.69879150390625, -2.6092529296875, -2.51971435546875, -2.43017578125, -2.34063720703125, -2.2510986328125, -2.16156005859375, -2.072021484375, -1.98248291015625, -1.8929443359375, -1.80340576171875, -1.7138671875, -1.62432861328125, -1.5347900390625, -1.44525146484375, -1.355712890625, -1.26617431640625, -1.1766357421875, -1.08709716796875, -0.99755859375, -0.90802001953125, -0.8184814453125, -0.72894287109375, -0.639404296875, -0.54986572265625, -0.4603271484375, -0.37078857421875, -0.28125, -0.19171142578125, -0.1021728515625, -0.01263427734375, 0.076904296875, 0.16644287109375, 0.2559814453125, 0.34552001953125, 0.43505859375, 0.52459716796875, 0.6141357421875, 0.70367431640625, 0.793212890625, 0.88275146484375, 0.9722900390625, 1.06182861328125, 1.1513671875, 1.24090576171875, 1.3304443359375, 1.41998291015625, 1.509521484375, 1.59906005859375, 1.6885986328125, 1.77813720703125, 1.86767578125, 1.95721435546875, 2.0467529296875, 2.13629150390625, 2.225830078125, 2.31536865234375, 2.4049072265625, 2.49444580078125, 2.583984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 4.0, 4.0, 3.0, 4.0, 9.0, 15.0, 17.0, 18.0, 12.0, 28.0, 33.0, 30.0, 60.0, 69.0, 101.0, 90.0, 85.0, 79.0, 81.0, 49.0, 40.0, 35.0, 22.0, 14.0, 13.0, 18.0, 22.0, 11.0, 8.0, 5.0, 4.0, 2.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9072265625, -0.8797149658203125, -0.852203369140625, -0.8246917724609375, -0.79718017578125, -0.7696685791015625, -0.742156982421875, -0.7146453857421875, -0.6871337890625, -0.6596221923828125, -0.632110595703125, -0.6045989990234375, -0.57708740234375, -0.5495758056640625, -0.522064208984375, -0.4945526123046875, -0.467041015625, -0.4395294189453125, -0.412017822265625, -0.3845062255859375, -0.35699462890625, -0.3294830322265625, -0.301971435546875, -0.2744598388671875, -0.2469482421875, -0.2194366455078125, -0.191925048828125, -0.1644134521484375, -0.13690185546875, -0.1093902587890625, -0.081878662109375, -0.0543670654296875, -0.02685546875, 0.0006561279296875, 0.028167724609375, 0.0556793212890625, 0.08319091796875, 0.1107025146484375, 0.138214111328125, 0.1657257080078125, 0.1932373046875, 0.2207489013671875, 0.248260498046875, 0.2757720947265625, 0.30328369140625, 0.3307952880859375, 0.358306884765625, 0.3858184814453125, 0.413330078125, 0.4408416748046875, 0.468353271484375, 0.4958648681640625, 0.52337646484375, 0.5508880615234375, 0.578399658203125, 0.6059112548828125, 0.6334228515625, 0.6609344482421875, 0.688446044921875, 0.7159576416015625, 0.74346923828125, 0.7709808349609375, 0.798492431640625, 0.8260040283203125, 0.853515625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 8.0, 3.0, 4.0, 14.0, 14.0, 24.0, 20.0, 36.0, 34.0, 55.0, 78.0, 97.0, 98.0, 113.0, 105.0, 68.0, 55.0, 37.0, 37.0, 19.0, 19.0, 15.0, 14.0, 6.0, 7.0, 5.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.0177001953125, -71.4654769897461, -68.91324615478516, -66.36102294921875, -63.80879592895508, -61.256568908691406, -58.704341888427734, -56.15211486816406, -53.599891662597656, -51.047664642333984, -48.49543762207031, -45.943214416503906, -43.390987396240234, -40.83876037597656, -38.28653335571289, -35.73430633544922, -33.18207931518555, -30.629852294921875, -28.077627182006836, -25.525400161743164, -22.973175048828125, -20.420948028564453, -17.86872100830078, -15.316495895385742, -12.76426887512207, -10.212042808532715, -7.659816265106201, -5.1075897216796875, -2.555363655090332, -0.0031375885009765625, 2.5490894317626953, 5.101314544677734, 7.653541564941406, 10.205767631530762, 12.757993698120117, 15.310220718383789, 17.862445831298828, 20.4146728515625, 22.966899871826172, 25.51912498474121, 28.071352005004883, 30.623579025268555, 33.175804138183594, 35.728031158447266, 38.28025817871094, 40.832481384277344, 43.38471221923828, 45.93693542480469, 48.48916244506836, 51.04138946533203, 53.5936164855957, 56.145843505859375, 58.69806671142578, 61.25029373168945, 63.802520751953125, 66.35474395751953, 68.90697479248047, 71.45919799804688, 74.01142883300781, 76.56365203857422, 79.11588287353516, 81.66810607910156, 84.2203369140625, 86.7725601196289, 89.32478332519531]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 0.0, 6.0, 2.0, 6.0, 5.0, 5.0, 7.0, 11.0, 14.0, 19.0, 15.0, 17.0, 14.0, 18.0, 33.0, 42.0, 37.0, 45.0, 33.0, 51.0, 39.0, 46.0, 42.0, 36.0, 39.0, 52.0, 43.0, 37.0, 33.0, 28.0, 27.0, 24.0, 22.0, 23.0, 22.0, 17.0, 16.0, 21.0, 15.0, 6.0, 8.0, 5.0, 11.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.7095947265625, -49.992801666259766, -48.27600860595703, -46.5592155456543, -44.84242248535156, -43.12562942504883, -41.408836364746094, -39.69204330444336, -37.975250244140625, -36.25845718383789, -34.541664123535156, -32.82487106323242, -31.108078002929688, -29.391284942626953, -27.67449188232422, -25.957698822021484, -24.24090576171875, -22.524112701416016, -20.80731964111328, -19.090526580810547, -17.373733520507812, -15.656940460205078, -13.940147399902344, -12.22335433959961, -10.506561279296875, -8.78976821899414, -7.072975158691406, -5.356182098388672, -3.6393890380859375, -1.9225959777832031, -0.20580291748046875, 1.5109901428222656, 3.2277870178222656, 4.944580078125, 6.661373138427734, 8.378166198730469, 10.094959259033203, 11.811752319335938, 13.528545379638672, 15.245338439941406, 16.96213150024414, 18.678924560546875, 20.39571762084961, 22.112510681152344, 23.829303741455078, 25.546096801757812, 27.262889862060547, 28.97968292236328, 30.696475982666016, 32.41326904296875, 34.130062103271484, 35.84685516357422, 37.56364822387695, 39.28044128417969, 40.99723434448242, 42.714027404785156, 44.43082046508789, 46.147613525390625, 47.86440658569336, 49.581199645996094, 51.29799270629883, 53.01478576660156, 54.7315788269043, 56.44837188720703, 58.165164947509766]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 10.0, 9.0, 7.0, 14.0, 24.0, 41.0, 40.0, 72.0, 110.0, 146.0, 197.0, 302.0, 519.0, 841.0, 1245.0, 2151.0, 3449.0, 6096.0, 10942.0, 20134.0, 40966.0, 90703.0, 230498.0, 350087.0, 156873.0, 65342.0, 30976.0, 15804.0, 8525.0, 4897.0, 2757.0, 1731.0, 1065.0, 630.0, 435.0, 307.0, 190.0, 122.0, 86.0, 69.0, 39.0, 30.0, 27.0, 12.0, 18.0, 7.0, 2.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-89.875, -87.2548828125, -84.634765625, -82.0146484375, -79.39453125, -76.7744140625, -74.154296875, -71.5341796875, -68.9140625, -66.2939453125, -63.673828125, -61.0537109375, -58.43359375, -55.8134765625, -53.193359375, -50.5732421875, -47.953125, -45.3330078125, -42.712890625, -40.0927734375, -37.47265625, -34.8525390625, -32.232421875, -29.6123046875, -26.9921875, -24.3720703125, -21.751953125, -19.1318359375, -16.51171875, -13.8916015625, -11.271484375, -8.6513671875, -6.03125, -3.4111328125, -0.791015625, 1.8291015625, 4.44921875, 7.0693359375, 9.689453125, 12.3095703125, 14.9296875, 17.5498046875, 20.169921875, 22.7900390625, 25.41015625, 28.0302734375, 30.650390625, 33.2705078125, 35.890625, 38.5107421875, 41.130859375, 43.7509765625, 46.37109375, 48.9912109375, 51.611328125, 54.2314453125, 56.8515625, 59.4716796875, 62.091796875, 64.7119140625, 67.33203125, 69.9521484375, 72.572265625, 75.1923828125, 77.8125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 5.0, 5.0, 3.0, 3.0, 7.0, 7.0, 10.0, 10.0, 12.0, 15.0, 17.0, 15.0, 22.0, 24.0, 40.0, 33.0, 28.0, 43.0, 46.0, 45.0, 51.0, 44.0, 42.0, 40.0, 50.0, 47.0, 42.0, 33.0, 40.0, 24.0, 24.0, 17.0, 24.0, 14.0, 26.0, 16.0, 18.0, 16.0, 7.0, 7.0, 10.0, 5.0, 6.0, 4.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-54.90625, -53.15966796875, -51.4130859375, -49.66650390625, -47.919921875, -46.17333984375, -44.4267578125, -42.68017578125, -40.93359375, -39.18701171875, -37.4404296875, -35.69384765625, -33.947265625, -32.20068359375, -30.4541015625, -28.70751953125, -26.9609375, -25.21435546875, -23.4677734375, -21.72119140625, -19.974609375, -18.22802734375, -16.4814453125, -14.73486328125, -12.98828125, -11.24169921875, -9.4951171875, -7.74853515625, -6.001953125, -4.25537109375, -2.5087890625, -0.76220703125, 0.984375, 2.73095703125, 4.4775390625, 6.22412109375, 7.970703125, 9.71728515625, 11.4638671875, 13.21044921875, 14.95703125, 16.70361328125, 18.4501953125, 20.19677734375, 21.943359375, 23.68994140625, 25.4365234375, 27.18310546875, 28.9296875, 30.67626953125, 32.4228515625, 34.16943359375, 35.916015625, 37.66259765625, 39.4091796875, 41.15576171875, 42.90234375, 44.64892578125, 46.3955078125, 48.14208984375, 49.888671875, 51.63525390625, 53.3818359375, 55.12841796875, 56.875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 16.0, 18.0, 24.0, 43.0, 54.0, 67.0, 101.0, 153.0, 213.0, 313.0, 429.0, 582.0, 797.0, 1205.0, 1765.0, 2599.0, 3822.0, 6030.0, 9499.0, 14855.0, 24829.0, 42357.0, 75776.0, 148133.0, 270766.0, 204209.0, 101660.0, 54464.0, 31501.0, 18802.0, 11559.0, 7316.0, 4664.0, 3089.0, 2060.0, 1444.0, 992.0, 687.0, 482.0, 335.0, 259.0, 171.0, 121.0, 95.0, 62.0, 41.0, 40.0, 22.0, 13.0, 7.0, 7.0, 4.0, 3.0, 1.0, 4.0, 2.0], "bins": [-69.0, -66.8916015625, -64.783203125, -62.6748046875, -60.56640625, -58.4580078125, -56.349609375, -54.2412109375, -52.1328125, -50.0244140625, -47.916015625, -45.8076171875, -43.69921875, -41.5908203125, -39.482421875, -37.3740234375, -35.265625, -33.1572265625, -31.048828125, -28.9404296875, -26.83203125, -24.7236328125, -22.615234375, -20.5068359375, -18.3984375, -16.2900390625, -14.181640625, -12.0732421875, -9.96484375, -7.8564453125, -5.748046875, -3.6396484375, -1.53125, 0.5771484375, 2.685546875, 4.7939453125, 6.90234375, 9.0107421875, 11.119140625, 13.2275390625, 15.3359375, 17.4443359375, 19.552734375, 21.6611328125, 23.76953125, 25.8779296875, 27.986328125, 30.0947265625, 32.203125, 34.3115234375, 36.419921875, 38.5283203125, 40.63671875, 42.7451171875, 44.853515625, 46.9619140625, 49.0703125, 51.1787109375, 53.287109375, 55.3955078125, 57.50390625, 59.6123046875, 61.720703125, 63.8291015625, 65.9375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 1.0, 9.0, 3.0, 11.0, 17.0, 13.0, 15.0, 30.0, 21.0, 24.0, 20.0, 37.0, 34.0, 43.0, 38.0, 46.0, 32.0, 43.0, 51.0, 45.0, 42.0, 43.0, 39.0, 39.0, 35.0, 31.0, 27.0, 24.0, 26.0, 29.0, 23.0, 19.0, 13.0, 14.0, 7.0, 8.0, 8.0, 4.0, 5.0, 3.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-31.296875, -30.258056640625, -29.21923828125, -28.180419921875, -27.1416015625, -26.102783203125, -25.06396484375, -24.025146484375, -22.986328125, -21.947509765625, -20.90869140625, -19.869873046875, -18.8310546875, -17.792236328125, -16.75341796875, -15.714599609375, -14.67578125, -13.636962890625, -12.59814453125, -11.559326171875, -10.5205078125, -9.481689453125, -8.44287109375, -7.404052734375, -6.365234375, -5.326416015625, -4.28759765625, -3.248779296875, -2.2099609375, -1.171142578125, -0.13232421875, 0.906494140625, 1.9453125, 2.984130859375, 4.02294921875, 5.061767578125, 6.1005859375, 7.139404296875, 8.17822265625, 9.217041015625, 10.255859375, 11.294677734375, 12.33349609375, 13.372314453125, 14.4111328125, 15.449951171875, 16.48876953125, 17.527587890625, 18.56640625, 19.605224609375, 20.64404296875, 21.682861328125, 22.7216796875, 23.760498046875, 24.79931640625, 25.838134765625, 26.876953125, 27.915771484375, 28.95458984375, 29.993408203125, 31.0322265625, 32.071044921875, 33.10986328125, 34.148681640625, 35.1875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 6.0, 8.0, 13.0, 18.0, 27.0, 39.0, 75.0, 110.0, 142.0, 186.0, 289.0, 472.0, 644.0, 1091.0, 1557.0, 2546.0, 4299.0, 7424.0, 13200.0, 24625.0, 48574.0, 103069.0, 231129.0, 311932.0, 151716.0, 69418.0, 33698.0, 17848.0, 9842.0, 5394.0, 3314.0, 2096.0, 1295.0, 818.0, 551.0, 346.0, 242.0, 166.0, 111.0, 71.0, 49.0, 34.0, 24.0, 16.0, 12.0, 6.0, 7.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.953125, -22.2412109375, -21.529296875, -20.8173828125, -20.10546875, -19.3935546875, -18.681640625, -17.9697265625, -17.2578125, -16.5458984375, -15.833984375, -15.1220703125, -14.41015625, -13.6982421875, -12.986328125, -12.2744140625, -11.5625, -10.8505859375, -10.138671875, -9.4267578125, -8.71484375, -8.0029296875, -7.291015625, -6.5791015625, -5.8671875, -5.1552734375, -4.443359375, -3.7314453125, -3.01953125, -2.3076171875, -1.595703125, -0.8837890625, -0.171875, 0.5400390625, 1.251953125, 1.9638671875, 2.67578125, 3.3876953125, 4.099609375, 4.8115234375, 5.5234375, 6.2353515625, 6.947265625, 7.6591796875, 8.37109375, 9.0830078125, 9.794921875, 10.5068359375, 11.21875, 11.9306640625, 12.642578125, 13.3544921875, 14.06640625, 14.7783203125, 15.490234375, 16.2021484375, 16.9140625, 17.6259765625, 18.337890625, 19.0498046875, 19.76171875, 20.4736328125, 21.185546875, 21.8974609375, 22.609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 6.0, 2.0, 5.0, 7.0, 8.0, 13.0, 13.0, 17.0, 19.0, 23.0, 36.0, 66.0, 58.0, 92.0, 90.0, 126.0, 76.0, 61.0, 66.0, 52.0, 31.0, 19.0, 27.0, 19.0, 15.0, 11.0, 6.0, 9.0, 3.0, 4.0, 5.0, 1.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002597808837890625, -0.0025197267532348633, -0.0024416446685791016, -0.00236356258392334, -0.002285480499267578, -0.0022073984146118164, -0.0021293163299560547, -0.002051234245300293, -0.0019731521606445312, -0.0018950700759887695, -0.0018169879913330078, -0.001738905906677246, -0.0016608238220214844, -0.0015827417373657227, -0.001504659652709961, -0.0014265775680541992, -0.0013484954833984375, -0.0012704133987426758, -0.001192331314086914, -0.0011142492294311523, -0.0010361671447753906, -0.0009580850601196289, -0.0008800029754638672, -0.0008019208908081055, -0.0007238388061523438, -0.000645756721496582, -0.0005676746368408203, -0.0004895925521850586, -0.0004115104675292969, -0.00033342838287353516, -0.00025534629821777344, -0.00017726421356201172, -9.918212890625e-05, -2.110004425048828e-05, 5.698204040527344e-05, 0.00013506412506103516, 0.00021314620971679688, 0.0002912282943725586, 0.0003693103790283203, 0.00044739246368408203, 0.0005254745483398438, 0.0006035566329956055, 0.0006816387176513672, 0.0007597208023071289, 0.0008378028869628906, 0.0009158849716186523, 0.000993967056274414, 0.0010720491409301758, 0.0011501312255859375, 0.0012282133102416992, 0.001306295394897461, 0.0013843774795532227, 0.0014624595642089844, 0.001540541648864746, 0.0016186237335205078, 0.0016967058181762695, 0.0017747879028320312, 0.001852869987487793, 0.0019309520721435547, 0.0020090341567993164, 0.002087116241455078, 0.00216519832611084, 0.0022432804107666016, 0.0023213624954223633, 0.002399444580078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 1.0, 5.0, 6.0, 6.0, 4.0, 14.0, 15.0, 32.0, 32.0, 40.0, 48.0, 95.0, 90.0, 152.0, 222.0, 295.0, 413.0, 589.0, 933.0, 1524.0, 2370.0, 3967.0, 6747.0, 12311.0, 22781.0, 44619.0, 91834.0, 197118.0, 307393.0, 180473.0, 84442.0, 40751.0, 21095.0, 11157.0, 6588.0, 3805.0, 2301.0, 1464.0, 859.0, 584.0, 404.0, 272.0, 180.0, 153.0, 100.0, 67.0, 59.0, 48.0, 29.0, 25.0, 14.0, 10.0, 10.0, 5.0, 9.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-19.53125, -18.92919921875, -18.3271484375, -17.72509765625, -17.123046875, -16.52099609375, -15.9189453125, -15.31689453125, -14.71484375, -14.11279296875, -13.5107421875, -12.90869140625, -12.306640625, -11.70458984375, -11.1025390625, -10.50048828125, -9.8984375, -9.29638671875, -8.6943359375, -8.09228515625, -7.490234375, -6.88818359375, -6.2861328125, -5.68408203125, -5.08203125, -4.47998046875, -3.8779296875, -3.27587890625, -2.673828125, -2.07177734375, -1.4697265625, -0.86767578125, -0.265625, 0.33642578125, 0.9384765625, 1.54052734375, 2.142578125, 2.74462890625, 3.3466796875, 3.94873046875, 4.55078125, 5.15283203125, 5.7548828125, 6.35693359375, 6.958984375, 7.56103515625, 8.1630859375, 8.76513671875, 9.3671875, 9.96923828125, 10.5712890625, 11.17333984375, 11.775390625, 12.37744140625, 12.9794921875, 13.58154296875, 14.18359375, 14.78564453125, 15.3876953125, 15.98974609375, 16.591796875, 17.19384765625, 17.7958984375, 18.39794921875, 19.0]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 7.0, 11.0, 9.0, 11.0, 16.0, 20.0, 30.0, 29.0, 34.0, 43.0, 47.0, 70.0, 76.0, 84.0, 70.0, 73.0, 82.0, 59.0, 58.0, 37.0, 27.0, 23.0, 16.0, 14.0, 19.0, 12.0, 8.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.6640625, -6.45135498046875, -6.2386474609375, -6.02593994140625, -5.813232421875, -5.60052490234375, -5.3878173828125, -5.17510986328125, -4.96240234375, -4.74969482421875, -4.5369873046875, -4.32427978515625, -4.111572265625, -3.89886474609375, -3.6861572265625, -3.47344970703125, -3.2607421875, -3.04803466796875, -2.8353271484375, -2.62261962890625, -2.409912109375, -2.19720458984375, -1.9844970703125, -1.77178955078125, -1.55908203125, -1.34637451171875, -1.1336669921875, -0.92095947265625, -0.708251953125, -0.49554443359375, -0.2828369140625, -0.07012939453125, 0.142578125, 0.35528564453125, 0.5679931640625, 0.78070068359375, 0.993408203125, 1.20611572265625, 1.4188232421875, 1.63153076171875, 1.84423828125, 2.05694580078125, 2.2696533203125, 2.48236083984375, 2.695068359375, 2.90777587890625, 3.1204833984375, 3.33319091796875, 3.5458984375, 3.75860595703125, 3.9713134765625, 4.18402099609375, 4.396728515625, 4.60943603515625, 4.8221435546875, 5.03485107421875, 5.24755859375, 5.46026611328125, 5.6729736328125, 5.88568115234375, 6.098388671875, 6.31109619140625, 6.5238037109375, 6.73651123046875, 6.94921875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 0.0, 2.0, 5.0, 8.0, 9.0, 13.0, 13.0, 18.0, 24.0, 50.0, 40.0, 78.0, 103.0, 115.0, 109.0, 104.0, 85.0, 58.0, 40.0, 26.0, 31.0, 24.0, 14.0, 12.0, 11.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.49870300292969, -74.7408676147461, -71.9830322265625, -69.2251968383789, -66.46736145019531, -63.70952224731445, -60.951683044433594, -58.19384765625, -55.436012268066406, -52.67817687988281, -49.92034149169922, -47.16250228881836, -44.404666900634766, -41.64683151245117, -38.88899230957031, -36.13115692138672, -33.373321533203125, -30.61548614501953, -27.857648849487305, -25.099811553955078, -22.341976165771484, -19.58414077758789, -16.826303482055664, -14.068466186523438, -11.310630798339844, -8.552794456481934, -5.794958114624023, -3.0371217727661133, -0.2792854309082031, 2.478550910949707, 5.236387252807617, 7.994224548339844, 10.752067565917969, 13.509903907775879, 16.26774024963379, 19.025577545166016, 21.78341293334961, 24.541248321533203, 27.29908561706543, 30.056922912597656, 32.81475830078125, 35.572593688964844, 38.33042907714844, 41.0882682800293, 43.84610366821289, 46.603939056396484, 49.361778259277344, 52.11961364746094, 54.87744903564453, 57.635284423828125, 60.39311981201172, 63.15095901489258, 65.90879821777344, 68.66663360595703, 71.42446899414062, 74.18230438232422, 76.94013977050781, 79.6979751586914, 82.455810546875, 85.2136459350586, 87.97148132324219, 90.72932434082031, 93.4871597290039, 96.2449951171875, 99.0028305053711]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 5.0, 8.0, 6.0, 6.0, 6.0, 11.0, 10.0, 18.0, 14.0, 13.0, 15.0, 16.0, 25.0, 23.0, 34.0, 44.0, 42.0, 30.0, 42.0, 45.0, 42.0, 45.0, 45.0, 36.0, 43.0, 39.0, 35.0, 34.0, 28.0, 32.0, 24.0, 27.0, 17.0, 22.0, 21.0, 20.0, 15.0, 11.0, 11.0, 6.0, 3.0, 9.0, 7.0, 3.0, 2.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-53.536766052246094, -51.87102127075195, -50.20528030395508, -48.53953552246094, -46.87379455566406, -45.20804977416992, -43.54230499267578, -41.876564025878906, -40.21082305908203, -38.54507827758789, -36.879337310791016, -35.213592529296875, -33.5478515625, -31.88210678100586, -30.21636390686035, -28.550621032714844, -26.884876251220703, -25.219133377075195, -23.553390502929688, -21.887645721435547, -20.221904754638672, -18.55615997314453, -16.890417098999023, -15.224674224853516, -13.558931350708008, -11.8931884765625, -10.227445602416992, -8.561701774597168, -6.89595890045166, -5.230216026306152, -3.564472198486328, -1.8987293243408203, -0.23298263549804688, 1.43276047706604, 3.098503589630127, 4.764246940612793, 6.429989814758301, 8.095732688903809, 9.761476516723633, 11.42721939086914, 13.092962265014648, 14.758705139160156, 16.424448013305664, 18.090190887451172, 19.755935668945312, 21.421676635742188, 23.087421417236328, 24.753164291381836, 26.418907165527344, 28.08465003967285, 29.75039291381836, 31.4161376953125, 33.081878662109375, 34.747623443603516, 36.413368225097656, 38.07910919189453, 39.744850158691406, 41.41059494018555, 43.07633590698242, 44.74208068847656, 46.40782165527344, 48.07356643676758, 49.73931121826172, 51.405052185058594, 53.070796966552734]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 5.0, 11.0, 5.0, 15.0, 29.0, 23.0, 35.0, 70.0, 87.0, 119.0, 151.0, 236.0, 289.0, 440.0, 629.0, 904.0, 1241.0, 1882.0, 2686.0, 3940.0, 6084.0, 9984.0, 17171.0, 38349.0, 119400.0, 459895.0, 1670667.0, 1357458.0, 343094.0, 85731.0, 30357.0, 15307.0, 8928.0, 5921.0, 3915.0, 2643.0, 1902.0, 1328.0, 987.0, 663.0, 474.0, 342.0, 251.0, 183.0, 127.0, 98.0, 65.0, 47.0, 41.0, 24.0, 16.0, 12.0, 7.0, 6.0, 4.0, 6.0, 4.0], "bins": [-79.9375, -77.5791015625, -75.220703125, -72.8623046875, -70.50390625, -68.1455078125, -65.787109375, -63.4287109375, -61.0703125, -58.7119140625, -56.353515625, -53.9951171875, -51.63671875, -49.2783203125, -46.919921875, -44.5615234375, -42.203125, -39.8447265625, -37.486328125, -35.1279296875, -32.76953125, -30.4111328125, -28.052734375, -25.6943359375, -23.3359375, -20.9775390625, -18.619140625, -16.2607421875, -13.90234375, -11.5439453125, -9.185546875, -6.8271484375, -4.46875, -2.1103515625, 0.248046875, 2.6064453125, 4.96484375, 7.3232421875, 9.681640625, 12.0400390625, 14.3984375, 16.7568359375, 19.115234375, 21.4736328125, 23.83203125, 26.1904296875, 28.548828125, 30.9072265625, 33.265625, 35.6240234375, 37.982421875, 40.3408203125, 42.69921875, 45.0576171875, 47.416015625, 49.7744140625, 52.1328125, 54.4912109375, 56.849609375, 59.2080078125, 61.56640625, 63.9248046875, 66.283203125, 68.6416015625, 71.0]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 9.0, 8.0, 8.0, 5.0, 8.0, 7.0, 15.0, 13.0, 12.0, 17.0, 15.0, 27.0, 22.0, 23.0, 51.0, 34.0, 46.0, 33.0, 47.0, 38.0, 49.0, 52.0, 44.0, 39.0, 48.0, 41.0, 30.0, 33.0, 39.0, 25.0, 21.0, 17.0, 19.0, 18.0, 16.0, 15.0, 12.0, 10.0, 7.0, 6.0, 5.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-48.25, -46.75732421875, -45.2646484375, -43.77197265625, -42.279296875, -40.78662109375, -39.2939453125, -37.80126953125, -36.30859375, -34.81591796875, -33.3232421875, -31.83056640625, -30.337890625, -28.84521484375, -27.3525390625, -25.85986328125, -24.3671875, -22.87451171875, -21.3818359375, -19.88916015625, -18.396484375, -16.90380859375, -15.4111328125, -13.91845703125, -12.42578125, -10.93310546875, -9.4404296875, -7.94775390625, -6.455078125, -4.96240234375, -3.4697265625, -1.97705078125, -0.484375, 1.00830078125, 2.5009765625, 3.99365234375, 5.486328125, 6.97900390625, 8.4716796875, 9.96435546875, 11.45703125, 12.94970703125, 14.4423828125, 15.93505859375, 17.427734375, 18.92041015625, 20.4130859375, 21.90576171875, 23.3984375, 24.89111328125, 26.3837890625, 27.87646484375, 29.369140625, 30.86181640625, 32.3544921875, 33.84716796875, 35.33984375, 36.83251953125, 38.3251953125, 39.81787109375, 41.310546875, 42.80322265625, 44.2958984375, 45.78857421875, 47.28125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 8.0, 17.0, 22.0, 31.0, 26.0, 35.0, 81.0, 99.0, 158.0, 254.0, 341.0, 547.0, 834.0, 1227.0, 2133.0, 3408.0, 5598.0, 9726.0, 18011.0, 36415.0, 86317.0, 293724.0, 2051764.0, 1328752.0, 215736.0, 70236.0, 30996.0, 15668.0, 8924.0, 4976.0, 2950.0, 1865.0, 1169.0, 737.0, 471.0, 341.0, 208.0, 144.0, 114.0, 92.0, 38.0, 36.0, 21.0, 10.0, 8.0, 7.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.4375, -100.1943359375, -96.951171875, -93.7080078125, -90.46484375, -87.2216796875, -83.978515625, -80.7353515625, -77.4921875, -74.2490234375, -71.005859375, -67.7626953125, -64.51953125, -61.2763671875, -58.033203125, -54.7900390625, -51.546875, -48.3037109375, -45.060546875, -41.8173828125, -38.57421875, -35.3310546875, -32.087890625, -28.8447265625, -25.6015625, -22.3583984375, -19.115234375, -15.8720703125, -12.62890625, -9.3857421875, -6.142578125, -2.8994140625, 0.34375, 3.5869140625, 6.830078125, 10.0732421875, 13.31640625, 16.5595703125, 19.802734375, 23.0458984375, 26.2890625, 29.5322265625, 32.775390625, 36.0185546875, 39.26171875, 42.5048828125, 45.748046875, 48.9912109375, 52.234375, 55.4775390625, 58.720703125, 61.9638671875, 65.20703125, 68.4501953125, 71.693359375, 74.9365234375, 78.1796875, 81.4228515625, 84.666015625, 87.9091796875, 91.15234375, 94.3955078125, 97.638671875, 100.8818359375, 104.125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 9.0, 5.0, 14.0, 10.0, 15.0, 23.0, 19.0, 29.0, 45.0, 48.0, 65.0, 97.0, 118.0, 200.0, 311.0, 477.0, 681.0, 593.0, 437.0, 251.0, 176.0, 83.0, 84.0, 56.0, 56.0, 32.0, 36.0, 27.0, 12.0, 10.0, 8.0, 12.0, 7.0, 8.0, 2.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.9375, -25.037353515625, -24.13720703125, -23.237060546875, -22.3369140625, -21.436767578125, -20.53662109375, -19.636474609375, -18.736328125, -17.836181640625, -16.93603515625, -16.035888671875, -15.1357421875, -14.235595703125, -13.33544921875, -12.435302734375, -11.53515625, -10.635009765625, -9.73486328125, -8.834716796875, -7.9345703125, -7.034423828125, -6.13427734375, -5.234130859375, -4.333984375, -3.433837890625, -2.53369140625, -1.633544921875, -0.7333984375, 0.166748046875, 1.06689453125, 1.967041015625, 2.8671875, 3.767333984375, 4.66748046875, 5.567626953125, 6.4677734375, 7.367919921875, 8.26806640625, 9.168212890625, 10.068359375, 10.968505859375, 11.86865234375, 12.768798828125, 13.6689453125, 14.569091796875, 15.46923828125, 16.369384765625, 17.26953125, 18.169677734375, 19.06982421875, 19.969970703125, 20.8701171875, 21.770263671875, 22.67041015625, 23.570556640625, 24.470703125, 25.370849609375, 26.27099609375, 27.171142578125, 28.0712890625, 28.971435546875, 29.87158203125, 30.771728515625, 31.671875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 6.0, 7.0, 6.0, 7.0, 11.0, 16.0, 21.0, 29.0, 38.0, 58.0, 47.0, 78.0, 72.0, 105.0, 88.0, 106.0, 63.0, 47.0, 46.0, 36.0, 22.0, 18.0, 15.0, 7.0, 9.0, 7.0, 6.0, 11.0, 4.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.113773345947266, -49.06436538696289, -47.014957427978516, -44.96554946899414, -42.9161376953125, -40.866729736328125, -38.81732177734375, -36.767913818359375, -34.718505859375, -32.669097900390625, -30.61968994140625, -28.570280075073242, -26.520872116088867, -24.471464157104492, -22.422054290771484, -20.37264633178711, -18.323238372802734, -16.27383041381836, -14.224421501159668, -12.175012588500977, -10.125604629516602, -8.076196670532227, -6.026787757873535, -3.9773788452148438, -1.9279708862304688, 0.12143754959106445, 2.1708459854125977, 4.220254421234131, 6.269662857055664, 8.319070816040039, 10.36847972869873, 12.417888641357422, 14.467292785644531, 16.516700744628906, 18.56610870361328, 20.61551856994629, 22.664926528930664, 24.71433448791504, 26.763744354248047, 28.813152313232422, 30.862560272216797, 32.91196823120117, 34.96137619018555, 37.01078414916992, 39.06019592285156, 41.10960388183594, 43.15901184082031, 45.20841979980469, 47.25782775878906, 49.30723571777344, 51.35664367675781, 53.40605163574219, 55.45545959472656, 57.50486755371094, 59.55427932739258, 61.60368728637695, 63.65309524536133, 65.70250701904297, 67.75191497802734, 69.80132293701172, 71.8507308959961, 73.90013885498047, 75.94954681396484, 77.99895477294922, 80.0483627319336]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 5.0, 4.0, 7.0, 7.0, 10.0, 12.0, 11.0, 14.0, 13.0, 15.0, 18.0, 25.0, 32.0, 22.0, 25.0, 30.0, 41.0, 39.0, 48.0, 28.0, 41.0, 37.0, 38.0, 35.0, 41.0, 48.0, 46.0, 36.0, 23.0, 28.0, 22.0, 28.0, 25.0, 25.0, 15.0, 21.0, 9.0, 13.0, 12.0, 11.0, 4.0, 4.0, 8.0, 5.0, 5.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-46.545711517333984, -45.09880447387695, -43.65189743041992, -42.204986572265625, -40.758079528808594, -39.31117248535156, -37.86426544189453, -36.4173583984375, -34.97045135498047, -33.52354431152344, -32.076637268066406, -30.629728317260742, -29.18282127380371, -27.735912322998047, -26.289005279541016, -24.842098236083984, -23.39518928527832, -21.94828224182129, -20.501373291015625, -19.054466247558594, -17.607559204101562, -16.16065216064453, -14.713743209838867, -13.266836166381836, -11.819928169250488, -10.37302017211914, -8.92611312866211, -7.479205131530762, -6.032297611236572, -4.585390090942383, -3.138482093811035, -1.691575050354004, -0.24466705322265625, 1.2022405862808228, 2.6491482257843018, 4.09605598449707, 5.54296350479126, 6.989871025085449, 8.436779022216797, 9.883686065673828, 11.330594062805176, 12.777502059936523, 14.224409103393555, 15.671317100524902, 17.11822509765625, 18.56513214111328, 20.012039184570312, 21.458946228027344, 22.905855178833008, 24.35276222229004, 25.799671173095703, 27.246578216552734, 28.693485260009766, 30.140392303466797, 31.58730125427246, 33.034210205078125, 34.481117248535156, 35.92802429199219, 37.37493133544922, 38.82183837890625, 40.26874923706055, 41.71565628051758, 43.16256332397461, 44.60947036743164, 46.05637741088867]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 8.0, 21.0, 25.0, 38.0, 64.0, 103.0, 146.0, 224.0, 267.0, 438.0, 598.0, 873.0, 1366.0, 1955.0, 3010.0, 4458.0, 6704.0, 10614.0, 16668.0, 27408.0, 48098.0, 89532.0, 181472.0, 286326.0, 167579.0, 83517.0, 45485.0, 26361.0, 15884.0, 9951.0, 6469.0, 4164.0, 2863.0, 1889.0, 1273.0, 882.0, 566.0, 427.0, 258.0, 159.0, 137.0, 95.0, 63.0, 42.0, 22.0, 21.0, 10.0, 12.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.34375, -29.34716796875, -28.3505859375, -27.35400390625, -26.357421875, -25.36083984375, -24.3642578125, -23.36767578125, -22.37109375, -21.37451171875, -20.3779296875, -19.38134765625, -18.384765625, -17.38818359375, -16.3916015625, -15.39501953125, -14.3984375, -13.40185546875, -12.4052734375, -11.40869140625, -10.412109375, -9.41552734375, -8.4189453125, -7.42236328125, -6.42578125, -5.42919921875, -4.4326171875, -3.43603515625, -2.439453125, -1.44287109375, -0.4462890625, 0.55029296875, 1.546875, 2.54345703125, 3.5400390625, 4.53662109375, 5.533203125, 6.52978515625, 7.5263671875, 8.52294921875, 9.51953125, 10.51611328125, 11.5126953125, 12.50927734375, 13.505859375, 14.50244140625, 15.4990234375, 16.49560546875, 17.4921875, 18.48876953125, 19.4853515625, 20.48193359375, 21.478515625, 22.47509765625, 23.4716796875, 24.46826171875, 25.46484375, 26.46142578125, 27.4580078125, 28.45458984375, 29.451171875, 30.44775390625, 31.4443359375, 32.44091796875, 33.4375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 7.0, 3.0, 7.0, 8.0, 10.0, 14.0, 14.0, 16.0, 14.0, 26.0, 20.0, 22.0, 31.0, 22.0, 34.0, 33.0, 41.0, 48.0, 39.0, 42.0, 41.0, 51.0, 51.0, 52.0, 45.0, 28.0, 38.0, 20.0, 32.0, 19.0, 24.0, 23.0, 15.0, 21.0, 19.0, 4.0, 9.0, 11.0, 12.0, 0.0, 7.0, 5.0, 7.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-50.15625, -48.62353515625, -47.0908203125, -45.55810546875, -44.025390625, -42.49267578125, -40.9599609375, -39.42724609375, -37.89453125, -36.36181640625, -34.8291015625, -33.29638671875, -31.763671875, -30.23095703125, -28.6982421875, -27.16552734375, -25.6328125, -24.10009765625, -22.5673828125, -21.03466796875, -19.501953125, -17.96923828125, -16.4365234375, -14.90380859375, -13.37109375, -11.83837890625, -10.3056640625, -8.77294921875, -7.240234375, -5.70751953125, -4.1748046875, -2.64208984375, -1.109375, 0.42333984375, 1.9560546875, 3.48876953125, 5.021484375, 6.55419921875, 8.0869140625, 9.61962890625, 11.15234375, 12.68505859375, 14.2177734375, 15.75048828125, 17.283203125, 18.81591796875, 20.3486328125, 21.88134765625, 23.4140625, 24.94677734375, 26.4794921875, 28.01220703125, 29.544921875, 31.07763671875, 32.6103515625, 34.14306640625, 35.67578125, 37.20849609375, 38.7412109375, 40.27392578125, 41.806640625, 43.33935546875, 44.8720703125, 46.40478515625, 47.9375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 12.0, 6.0, 8.0, 12.0, 26.0, 36.0, 47.0, 47.0, 75.0, 92.0, 156.0, 224.0, 310.0, 439.0, 660.0, 979.0, 1412.0, 2182.0, 3259.0, 5399.0, 8749.0, 15760.0, 40602.0, 598207.0, 302423.0, 31726.0, 13823.0, 7839.0, 4822.0, 3073.0, 2022.0, 1310.0, 914.0, 596.0, 385.0, 276.0, 188.0, 152.0, 93.0, 60.0, 53.0, 32.0, 17.0, 9.0, 20.0, 11.0, 7.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.8125, -47.23291015625, -45.6533203125, -44.07373046875, -42.494140625, -40.91455078125, -39.3349609375, -37.75537109375, -36.17578125, -34.59619140625, -33.0166015625, -31.43701171875, -29.857421875, -28.27783203125, -26.6982421875, -25.11865234375, -23.5390625, -21.95947265625, -20.3798828125, -18.80029296875, -17.220703125, -15.64111328125, -14.0615234375, -12.48193359375, -10.90234375, -9.32275390625, -7.7431640625, -6.16357421875, -4.583984375, -3.00439453125, -1.4248046875, 0.15478515625, 1.734375, 3.31396484375, 4.8935546875, 6.47314453125, 8.052734375, 9.63232421875, 11.2119140625, 12.79150390625, 14.37109375, 15.95068359375, 17.5302734375, 19.10986328125, 20.689453125, 22.26904296875, 23.8486328125, 25.42822265625, 27.0078125, 28.58740234375, 30.1669921875, 31.74658203125, 33.326171875, 34.90576171875, 36.4853515625, 38.06494140625, 39.64453125, 41.22412109375, 42.8037109375, 44.38330078125, 45.962890625, 47.54248046875, 49.1220703125, 50.70166015625, 52.28125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 4.0, 5.0, 0.0, 6.0, 8.0, 9.0, 14.0, 7.0, 24.0, 17.0, 17.0, 13.0, 20.0, 24.0, 29.0, 29.0, 27.0, 37.0, 36.0, 24.0, 36.0, 39.0, 43.0, 41.0, 46.0, 43.0, 39.0, 37.0, 33.0, 29.0, 37.0, 30.0, 18.0, 24.0, 19.0, 18.0, 18.0, 11.0, 21.0, 14.0, 8.0, 11.0, 5.0, 7.0, 7.0, 6.0, 2.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-36.34375, -35.21142578125, -34.0791015625, -32.94677734375, -31.814453125, -30.68212890625, -29.5498046875, -28.41748046875, -27.28515625, -26.15283203125, -25.0205078125, -23.88818359375, -22.755859375, -21.62353515625, -20.4912109375, -19.35888671875, -18.2265625, -17.09423828125, -15.9619140625, -14.82958984375, -13.697265625, -12.56494140625, -11.4326171875, -10.30029296875, -9.16796875, -8.03564453125, -6.9033203125, -5.77099609375, -4.638671875, -3.50634765625, -2.3740234375, -1.24169921875, -0.109375, 1.02294921875, 2.1552734375, 3.28759765625, 4.419921875, 5.55224609375, 6.6845703125, 7.81689453125, 8.94921875, 10.08154296875, 11.2138671875, 12.34619140625, 13.478515625, 14.61083984375, 15.7431640625, 16.87548828125, 18.0078125, 19.14013671875, 20.2724609375, 21.40478515625, 22.537109375, 23.66943359375, 24.8017578125, 25.93408203125, 27.06640625, 28.19873046875, 29.3310546875, 30.46337890625, 31.595703125, 32.72802734375, 33.8603515625, 34.99267578125, 36.125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 5.0, 10.0, 10.0, 13.0, 19.0, 45.0, 59.0, 76.0, 139.0, 207.0, 344.0, 510.0, 883.0, 1723.0, 3089.0, 6628.0, 17092.0, 90258.0, 847303.0, 54581.0, 13704.0, 5571.0, 2687.0, 1476.0, 801.0, 480.0, 291.0, 170.0, 114.0, 91.0, 52.0, 41.0, 24.0, 15.0, 15.0, 8.0, 5.0, 3.0, 9.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.9453125, -3.830596923828125, -3.71588134765625, -3.601165771484375, -3.4864501953125, -3.371734619140625, -3.25701904296875, -3.142303466796875, -3.027587890625, -2.912872314453125, -2.79815673828125, -2.683441162109375, -2.5687255859375, -2.454010009765625, -2.33929443359375, -2.224578857421875, -2.10986328125, -1.995147705078125, -1.88043212890625, -1.765716552734375, -1.6510009765625, -1.536285400390625, -1.42156982421875, -1.306854248046875, -1.192138671875, -1.077423095703125, -0.96270751953125, -0.847991943359375, -0.7332763671875, -0.618560791015625, -0.50384521484375, -0.389129638671875, -0.2744140625, -0.159698486328125, -0.04498291015625, 0.069732666015625, 0.1844482421875, 0.299163818359375, 0.41387939453125, 0.528594970703125, 0.643310546875, 0.758026123046875, 0.87274169921875, 0.987457275390625, 1.1021728515625, 1.216888427734375, 1.33160400390625, 1.446319580078125, 1.56103515625, 1.675750732421875, 1.79046630859375, 1.905181884765625, 2.0198974609375, 2.134613037109375, 2.24932861328125, 2.364044189453125, 2.478759765625, 2.593475341796875, 2.70819091796875, 2.822906494140625, 2.9376220703125, 3.052337646484375, 3.16705322265625, 3.281768798828125, 3.396484375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 6.0, 4.0, 7.0, 6.0, 12.0, 4.0, 15.0, 22.0, 23.0, 44.0, 47.0, 83.0, 135.0, 184.0, 119.0, 72.0, 52.0, 32.0, 41.0, 26.0, 3.0, 11.0, 10.0, 15.0, 4.0, 1.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001567840576171875, -0.001516297459602356, -0.001464754343032837, -0.0014132112264633179, -0.0013616681098937988, -0.0013101249933242798, -0.0012585818767547607, -0.0012070387601852417, -0.0011554956436157227, -0.0011039525270462036, -0.0010524094104766846, -0.0010008662939071655, -0.0009493231773376465, -0.0008977800607681274, -0.0008462369441986084, -0.0007946938276290894, -0.0007431507110595703, -0.0006916075944900513, -0.0006400644779205322, -0.0005885213613510132, -0.0005369782447814941, -0.0004854351282119751, -0.00043389201164245605, -0.000382348895072937, -0.00033080577850341797, -0.0002792626619338989, -0.00022771954536437988, -0.00017617642879486084, -0.0001246333122253418, -7.309019565582275e-05, -2.154707908630371e-05, 2.9996037483215332e-05, 8.153915405273438e-05, 0.00013308227062225342, 0.00018462538719177246, 0.0002361685037612915, 0.00028771162033081055, 0.0003392547369003296, 0.00039079785346984863, 0.0004423409700393677, 0.0004938840866088867, 0.0005454272031784058, 0.0005969703197479248, 0.0006485134363174438, 0.0007000565528869629, 0.0007515996694564819, 0.000803142786026001, 0.00085468590259552, 0.0009062290191650391, 0.0009577721357345581, 0.0010093152523040771, 0.0010608583688735962, 0.0011124014854431152, 0.0011639446020126343, 0.0012154877185821533, 0.0012670308351516724, 0.0013185739517211914, 0.0013701170682907104, 0.0014216601848602295, 0.0014732033014297485, 0.0015247464179992676, 0.0015762895345687866, 0.0016278326511383057, 0.0016793757677078247, 0.0017309188842773438]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 9.0, 11.0, 13.0, 24.0, 33.0, 62.0, 90.0, 147.0, 217.0, 324.0, 485.0, 737.0, 1085.0, 1663.0, 2684.0, 4147.0, 7056.0, 12425.0, 22024.0, 43134.0, 94126.0, 241105.0, 342000.0, 143488.0, 61374.0, 30199.0, 16103.0, 9192.0, 5347.0, 3325.0, 2090.0, 1294.0, 844.0, 553.0, 393.0, 268.0, 178.0, 122.0, 79.0, 46.0, 23.0, 11.0, 18.0, 10.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.951171875, -1.8957977294921875, -1.840423583984375, -1.7850494384765625, -1.72967529296875, -1.6743011474609375, -1.618927001953125, -1.5635528564453125, -1.5081787109375, -1.4528045654296875, -1.397430419921875, -1.3420562744140625, -1.28668212890625, -1.2313079833984375, -1.175933837890625, -1.1205596923828125, -1.065185546875, -1.0098114013671875, -0.954437255859375, -0.8990631103515625, -0.84368896484375, -0.7883148193359375, -0.732940673828125, -0.6775665283203125, -0.6221923828125, -0.5668182373046875, -0.511444091796875, -0.4560699462890625, -0.40069580078125, -0.3453216552734375, -0.289947509765625, -0.2345733642578125, -0.17919921875, -0.1238250732421875, -0.068450927734375, -0.0130767822265625, 0.04229736328125, 0.0976715087890625, 0.153045654296875, 0.2084197998046875, 0.2637939453125, 0.3191680908203125, 0.374542236328125, 0.4299163818359375, 0.48529052734375, 0.5406646728515625, 0.596038818359375, 0.6514129638671875, 0.706787109375, 0.7621612548828125, 0.817535400390625, 0.8729095458984375, 0.92828369140625, 0.9836578369140625, 1.039031982421875, 1.0944061279296875, 1.1497802734375, 1.2051544189453125, 1.260528564453125, 1.3159027099609375, 1.37127685546875, 1.4266510009765625, 1.482025146484375, 1.5373992919921875, 1.5927734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 9.0, 9.0, 11.0, 14.0, 17.0, 25.0, 29.0, 21.0, 32.0, 26.0, 55.0, 69.0, 64.0, 77.0, 67.0, 76.0, 62.0, 60.0, 41.0, 55.0, 28.0, 28.0, 17.0, 14.0, 11.0, 11.0, 7.0, 8.0, 7.0, 5.0, 2.0, 7.0, 3.0, 3.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.470703125, -0.4547576904296875, -0.438812255859375, -0.4228668212890625, -0.40692138671875, -0.3909759521484375, -0.375030517578125, -0.3590850830078125, -0.3431396484375, -0.3271942138671875, -0.311248779296875, -0.2953033447265625, -0.27935791015625, -0.2634124755859375, -0.247467041015625, -0.2315216064453125, -0.215576171875, -0.1996307373046875, -0.183685302734375, -0.1677398681640625, -0.15179443359375, -0.1358489990234375, -0.119903564453125, -0.1039581298828125, -0.0880126953125, -0.0720672607421875, -0.056121826171875, -0.0401763916015625, -0.02423095703125, -0.0082855224609375, 0.007659912109375, 0.0236053466796875, 0.03955078125, 0.0554962158203125, 0.071441650390625, 0.0873870849609375, 0.10333251953125, 0.1192779541015625, 0.135223388671875, 0.1511688232421875, 0.1671142578125, 0.1830596923828125, 0.199005126953125, 0.2149505615234375, 0.23089599609375, 0.2468414306640625, 0.262786865234375, 0.2787322998046875, 0.294677734375, 0.3106231689453125, 0.326568603515625, 0.3425140380859375, 0.35845947265625, 0.3744049072265625, 0.390350341796875, 0.4062957763671875, 0.4222412109375, 0.4381866455078125, 0.454132080078125, 0.4700775146484375, 0.48602294921875, 0.5019683837890625, 0.517913818359375, 0.5338592529296875, 0.5498046875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 4.0, 6.0, 16.0, 13.0, 17.0, 25.0, 41.0, 43.0, 53.0, 49.0, 71.0, 85.0, 101.0, 85.0, 85.0, 77.0, 47.0, 41.0, 19.0, 20.0, 21.0, 12.0, 11.0, 7.0, 7.0, 8.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.05890655517578, -47.134620666503906, -45.21033477783203, -43.286048889160156, -41.361759185791016, -39.43747329711914, -37.513187408447266, -35.58890151977539, -33.66461181640625, -31.740325927734375, -29.816038131713867, -27.891752243041992, -25.967464447021484, -24.04317855834961, -22.118892669677734, -20.19460678100586, -18.270320892333984, -16.34603500366211, -14.421747207641602, -12.497461318969727, -10.573174476623535, -8.648887634277344, -6.724601745605469, -4.800314903259277, -2.876028060913086, -0.9517414569854736, 0.9725451469421387, 2.896831512451172, 4.821118354797363, 6.745405197143555, 8.66969108581543, 10.593977928161621, 12.518264770507812, 14.442551612854004, 16.366838455200195, 18.29112434387207, 20.215412139892578, 22.139698028564453, 24.063983917236328, 25.988269805908203, 27.91255760192871, 29.836843490600586, 31.761131286621094, 33.68541717529297, 35.609703063964844, 37.53398895263672, 39.458274841308594, 41.382564544677734, 43.30685043334961, 45.231136322021484, 47.15542221069336, 49.0797119140625, 51.003997802734375, 52.92828369140625, 54.852569580078125, 56.77685546875, 58.701141357421875, 60.62542724609375, 62.549713134765625, 64.4739990234375, 66.39828491210938, 68.32257080078125, 70.24685668945312, 72.17115020751953, 74.0954360961914]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 5.0, 4.0, 6.0, 9.0, 9.0, 11.0, 14.0, 15.0, 9.0, 16.0, 19.0, 25.0, 32.0, 24.0, 22.0, 32.0, 45.0, 35.0, 50.0, 27.0, 38.0, 35.0, 49.0, 33.0, 39.0, 50.0, 42.0, 32.0, 25.0, 31.0, 21.0, 31.0, 23.0, 22.0, 17.0, 18.0, 10.0, 14.0, 10.0, 13.0, 2.0, 7.0, 5.0, 6.0, 4.0, 4.0, 6.0, 3.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0], "bins": [-45.38300323486328, -43.97460174560547, -42.56620407104492, -41.15780258178711, -39.74940490722656, -38.34100341796875, -36.93260192871094, -35.52420425415039, -34.115806579589844, -32.70740509033203, -31.299007415771484, -29.890605926513672, -28.482208251953125, -27.073806762695312, -25.665407180786133, -24.257007598876953, -22.84860610961914, -21.44020652770996, -20.03180694580078, -18.62340545654297, -17.215007781982422, -15.806607246398926, -14.39820671081543, -12.98980712890625, -11.58140754699707, -10.17300796508789, -8.764608383178711, -7.356207847595215, -5.947808265686035, -4.5394086837768555, -3.1310081481933594, -1.7226085662841797, -0.314208984375, 1.0941908359527588, 2.5025906562805176, 3.9109907150268555, 5.319390296936035, 6.727789878845215, 8.136190414428711, 9.54458999633789, 10.95298957824707, 12.36138916015625, 13.76978874206543, 15.178189277648926, 16.586589813232422, 17.99498748779297, 19.40338897705078, 20.81178855895996, 22.22018814086914, 23.62858772277832, 25.0369873046875, 26.445388793945312, 27.85378646850586, 29.262187957763672, 30.67058753967285, 32.07898712158203, 33.487388610839844, 34.895790100097656, 36.3041877746582, 37.712589263916016, 39.12098693847656, 40.529388427734375, 41.93778991699219, 43.346187591552734, 44.75458526611328]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 13.0, 14.0, 22.0, 23.0, 29.0, 49.0, 73.0, 121.0, 161.0, 257.0, 369.0, 520.0, 763.0, 1171.0, 1785.0, 2876.0, 4437.0, 7131.0, 11923.0, 20813.0, 38368.0, 76848.0, 169996.0, 314269.0, 202439.0, 90743.0, 44412.0, 23646.0, 13419.0, 7987.0, 4952.0, 3019.0, 1987.0, 1273.0, 868.0, 551.0, 408.0, 240.0, 172.0, 128.0, 87.0, 61.0, 43.0, 30.0, 18.0, 20.0, 9.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.6875, -63.609375, -61.53125, -59.453125, -57.375, -55.296875, -53.21875, -51.140625, -49.0625, -46.984375, -44.90625, -42.828125, -40.75, -38.671875, -36.59375, -34.515625, -32.4375, -30.359375, -28.28125, -26.203125, -24.125, -22.046875, -19.96875, -17.890625, -15.8125, -13.734375, -11.65625, -9.578125, -7.5, -5.421875, -3.34375, -1.265625, 0.8125, 2.890625, 4.96875, 7.046875, 9.125, 11.203125, 13.28125, 15.359375, 17.4375, 19.515625, 21.59375, 23.671875, 25.75, 27.828125, 29.90625, 31.984375, 34.0625, 36.140625, 38.21875, 40.296875, 42.375, 44.453125, 46.53125, 48.609375, 50.6875, 52.765625, 54.84375, 56.921875, 59.0, 61.078125, 63.15625, 65.234375, 67.3125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 5.0, 6.0, 8.0, 9.0, 14.0, 14.0, 12.0, 15.0, 13.0, 30.0, 29.0, 19.0, 25.0, 40.0, 40.0, 41.0, 48.0, 38.0, 34.0, 50.0, 43.0, 45.0, 39.0, 60.0, 37.0, 40.0, 22.0, 27.0, 26.0, 21.0, 20.0, 19.0, 16.0, 17.0, 15.0, 7.0, 7.0, 7.0, 3.0, 5.0, 4.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-47.90625, -46.44677734375, -44.9873046875, -43.52783203125, -42.068359375, -40.60888671875, -39.1494140625, -37.68994140625, -36.23046875, -34.77099609375, -33.3115234375, -31.85205078125, -30.392578125, -28.93310546875, -27.4736328125, -26.01416015625, -24.5546875, -23.09521484375, -21.6357421875, -20.17626953125, -18.716796875, -17.25732421875, -15.7978515625, -14.33837890625, -12.87890625, -11.41943359375, -9.9599609375, -8.50048828125, -7.041015625, -5.58154296875, -4.1220703125, -2.66259765625, -1.203125, 0.25634765625, 1.7158203125, 3.17529296875, 4.634765625, 6.09423828125, 7.5537109375, 9.01318359375, 10.47265625, 11.93212890625, 13.3916015625, 14.85107421875, 16.310546875, 17.77001953125, 19.2294921875, 20.68896484375, 22.1484375, 23.60791015625, 25.0673828125, 26.52685546875, 27.986328125, 29.44580078125, 30.9052734375, 32.36474609375, 33.82421875, 35.28369140625, 36.7431640625, 38.20263671875, 39.662109375, 41.12158203125, 42.5810546875, 44.04052734375, 45.5]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 8.0, 5.0, 19.0, 31.0, 38.0, 60.0, 82.0, 144.0, 215.0, 302.0, 436.0, 628.0, 1019.0, 1491.0, 2362.0, 3954.0, 6219.0, 10073.0, 17239.0, 29389.0, 53034.0, 98802.0, 194391.0, 270292.0, 163985.0, 84473.0, 45533.0, 25556.0, 14862.0, 8885.0, 5315.0, 3459.0, 2128.0, 1378.0, 931.0, 629.0, 405.0, 264.0, 190.0, 101.0, 83.0, 44.0, 25.0, 29.0, 19.0, 12.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-64.0625, -62.0205078125, -59.978515625, -57.9365234375, -55.89453125, -53.8525390625, -51.810546875, -49.7685546875, -47.7265625, -45.6845703125, -43.642578125, -41.6005859375, -39.55859375, -37.5166015625, -35.474609375, -33.4326171875, -31.390625, -29.3486328125, -27.306640625, -25.2646484375, -23.22265625, -21.1806640625, -19.138671875, -17.0966796875, -15.0546875, -13.0126953125, -10.970703125, -8.9287109375, -6.88671875, -4.8447265625, -2.802734375, -0.7607421875, 1.28125, 3.3232421875, 5.365234375, 7.4072265625, 9.44921875, 11.4912109375, 13.533203125, 15.5751953125, 17.6171875, 19.6591796875, 21.701171875, 23.7431640625, 25.78515625, 27.8271484375, 29.869140625, 31.9111328125, 33.953125, 35.9951171875, 38.037109375, 40.0791015625, 42.12109375, 44.1630859375, 46.205078125, 48.2470703125, 50.2890625, 52.3310546875, 54.373046875, 56.4150390625, 58.45703125, 60.4990234375, 62.541015625, 64.5830078125, 66.625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 4.0, 9.0, 9.0, 10.0, 10.0, 19.0, 16.0, 25.0, 21.0, 38.0, 32.0, 36.0, 34.0, 28.0, 47.0, 41.0, 47.0, 34.0, 44.0, 52.0, 45.0, 29.0, 40.0, 40.0, 33.0, 37.0, 35.0, 24.0, 26.0, 27.0, 16.0, 17.0, 12.0, 9.0, 8.0, 7.0, 6.0, 5.0, 2.0, 3.0, 4.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.90625, -29.94970703125, -28.9931640625, -28.03662109375, -27.080078125, -26.12353515625, -25.1669921875, -24.21044921875, -23.25390625, -22.29736328125, -21.3408203125, -20.38427734375, -19.427734375, -18.47119140625, -17.5146484375, -16.55810546875, -15.6015625, -14.64501953125, -13.6884765625, -12.73193359375, -11.775390625, -10.81884765625, -9.8623046875, -8.90576171875, -7.94921875, -6.99267578125, -6.0361328125, -5.07958984375, -4.123046875, -3.16650390625, -2.2099609375, -1.25341796875, -0.296875, 0.65966796875, 1.6162109375, 2.57275390625, 3.529296875, 4.48583984375, 5.4423828125, 6.39892578125, 7.35546875, 8.31201171875, 9.2685546875, 10.22509765625, 11.181640625, 12.13818359375, 13.0947265625, 14.05126953125, 15.0078125, 15.96435546875, 16.9208984375, 17.87744140625, 18.833984375, 19.79052734375, 20.7470703125, 21.70361328125, 22.66015625, 23.61669921875, 24.5732421875, 25.52978515625, 26.486328125, 27.44287109375, 28.3994140625, 29.35595703125, 30.3125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 6.0, 5.0, 6.0, 18.0, 26.0, 25.0, 57.0, 94.0, 122.0, 183.0, 276.0, 541.0, 851.0, 1485.0, 2746.0, 5031.0, 9630.0, 19718.0, 45165.0, 116411.0, 338007.0, 318268.0, 108346.0, 42627.0, 18830.0, 9125.0, 4763.0, 2507.0, 1455.0, 843.0, 542.0, 311.0, 207.0, 106.0, 81.0, 50.0, 36.0, 24.0, 15.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-29.546875, -28.62255859375, -27.6982421875, -26.77392578125, -25.849609375, -24.92529296875, -24.0009765625, -23.07666015625, -22.15234375, -21.22802734375, -20.3037109375, -19.37939453125, -18.455078125, -17.53076171875, -16.6064453125, -15.68212890625, -14.7578125, -13.83349609375, -12.9091796875, -11.98486328125, -11.060546875, -10.13623046875, -9.2119140625, -8.28759765625, -7.36328125, -6.43896484375, -5.5146484375, -4.59033203125, -3.666015625, -2.74169921875, -1.8173828125, -0.89306640625, 0.03125, 0.95556640625, 1.8798828125, 2.80419921875, 3.728515625, 4.65283203125, 5.5771484375, 6.50146484375, 7.42578125, 8.35009765625, 9.2744140625, 10.19873046875, 11.123046875, 12.04736328125, 12.9716796875, 13.89599609375, 14.8203125, 15.74462890625, 16.6689453125, 17.59326171875, 18.517578125, 19.44189453125, 20.3662109375, 21.29052734375, 22.21484375, 23.13916015625, 24.0634765625, 24.98779296875, 25.912109375, 26.83642578125, 27.7607421875, 28.68505859375, 29.609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 9.0, 1.0, 10.0, 12.0, 7.0, 12.0, 15.0, 19.0, 22.0, 33.0, 53.0, 60.0, 106.0, 125.0, 114.0, 105.0, 81.0, 52.0, 52.0, 37.0, 16.0, 14.0, 5.0, 10.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028018951416015625, -0.0027174949645996094, -0.0026330947875976562, -0.002548694610595703, -0.00246429443359375, -0.002379894256591797, -0.0022954940795898438, -0.0022110939025878906, -0.0021266937255859375, -0.0020422935485839844, -0.0019578933715820312, -0.0018734931945800781, -0.001789093017578125, -0.0017046928405761719, -0.0016202926635742188, -0.0015358924865722656, -0.0014514923095703125, -0.0013670921325683594, -0.0012826919555664062, -0.0011982917785644531, -0.0011138916015625, -0.0010294914245605469, -0.0009450912475585938, -0.0008606910705566406, -0.0007762908935546875, -0.0006918907165527344, -0.0006074905395507812, -0.0005230903625488281, -0.000438690185546875, -0.0003542900085449219, -0.00026988983154296875, -0.00018548965454101562, -0.0001010894775390625, -1.6689300537109375e-05, 6.771087646484375e-05, 0.00015211105346679688, 0.00023651123046875, 0.0003209114074707031, 0.00040531158447265625, 0.0004897117614746094, 0.0005741119384765625, 0.0006585121154785156, 0.0007429122924804688, 0.0008273124694824219, 0.000911712646484375, 0.0009961128234863281, 0.0010805130004882812, 0.0011649131774902344, 0.0012493133544921875, 0.0013337135314941406, 0.0014181137084960938, 0.0015025138854980469, 0.0015869140625, 0.0016713142395019531, 0.0017557144165039062, 0.0018401145935058594, 0.0019245147705078125, 0.0020089149475097656, 0.0020933151245117188, 0.002177715301513672, 0.002262115478515625, 0.002346515655517578, 0.0024309158325195312, 0.0025153160095214844, 0.0025997161865234375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 10.0, 20.0, 25.0, 22.0, 32.0, 54.0, 73.0, 110.0, 180.0, 255.0, 391.0, 585.0, 909.0, 1467.0, 2336.0, 3798.0, 6491.0, 11101.0, 19807.0, 37407.0, 74294.0, 157066.0, 287984.0, 223804.0, 105806.0, 51425.0, 26989.0, 14645.0, 8559.0, 4814.0, 2953.0, 1865.0, 1163.0, 701.0, 463.0, 285.0, 219.0, 145.0, 101.0, 65.0, 41.0, 36.0, 18.0, 13.0, 7.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 3.0], "bins": [-21.28125, -20.668701171875, -20.05615234375, -19.443603515625, -18.8310546875, -18.218505859375, -17.60595703125, -16.993408203125, -16.380859375, -15.768310546875, -15.15576171875, -14.543212890625, -13.9306640625, -13.318115234375, -12.70556640625, -12.093017578125, -11.48046875, -10.867919921875, -10.25537109375, -9.642822265625, -9.0302734375, -8.417724609375, -7.80517578125, -7.192626953125, -6.580078125, -5.967529296875, -5.35498046875, -4.742431640625, -4.1298828125, -3.517333984375, -2.90478515625, -2.292236328125, -1.6796875, -1.067138671875, -0.45458984375, 0.157958984375, 0.7705078125, 1.383056640625, 1.99560546875, 2.608154296875, 3.220703125, 3.833251953125, 4.44580078125, 5.058349609375, 5.6708984375, 6.283447265625, 6.89599609375, 7.508544921875, 8.12109375, 8.733642578125, 9.34619140625, 9.958740234375, 10.5712890625, 11.183837890625, 11.79638671875, 12.408935546875, 13.021484375, 13.634033203125, 14.24658203125, 14.859130859375, 15.4716796875, 16.084228515625, 16.69677734375, 17.309326171875, 17.921875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 6.0, 7.0, 9.0, 12.0, 19.0, 19.0, 41.0, 23.0, 37.0, 49.0, 39.0, 50.0, 56.0, 69.0, 74.0, 62.0, 60.0, 58.0, 47.0, 51.0, 35.0, 26.0, 35.0, 23.0, 21.0, 18.0, 9.0, 14.0, 10.0, 5.0, 4.0, 5.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.22265625, -6.0164794921875, -5.810302734375, -5.6041259765625, -5.39794921875, -5.1917724609375, -4.985595703125, -4.7794189453125, -4.5732421875, -4.3670654296875, -4.160888671875, -3.9547119140625, -3.74853515625, -3.5423583984375, -3.336181640625, -3.1300048828125, -2.923828125, -2.7176513671875, -2.511474609375, -2.3052978515625, -2.09912109375, -1.8929443359375, -1.686767578125, -1.4805908203125, -1.2744140625, -1.0682373046875, -0.862060546875, -0.6558837890625, -0.44970703125, -0.2435302734375, -0.037353515625, 0.1688232421875, 0.375, 0.5811767578125, 0.787353515625, 0.9935302734375, 1.19970703125, 1.4058837890625, 1.612060546875, 1.8182373046875, 2.0244140625, 2.2305908203125, 2.436767578125, 2.6429443359375, 2.84912109375, 3.0552978515625, 3.261474609375, 3.4676513671875, 3.673828125, 3.8800048828125, 4.086181640625, 4.2923583984375, 4.49853515625, 4.7047119140625, 4.910888671875, 5.1170654296875, 5.3232421875, 5.5294189453125, 5.735595703125, 5.9417724609375, 6.14794921875, 6.3541259765625, 6.560302734375, 6.7664794921875, 6.97265625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 7.0, 13.0, 14.0, 19.0, 23.0, 31.0, 30.0, 43.0, 47.0, 70.0, 61.0, 76.0, 80.0, 80.0, 78.0, 66.0, 48.0, 46.0, 34.0, 20.0, 18.0, 22.0, 12.0, 10.0, 9.0, 2.0, 5.0, 6.0, 7.0, 6.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-46.28619384765625, -44.47490310668945, -42.663612365722656, -40.85232162475586, -39.04103088378906, -37.229740142822266, -35.41844940185547, -33.60715866088867, -31.795867919921875, -29.984577178955078, -28.17328643798828, -26.361995697021484, -24.550704956054688, -22.73941421508789, -20.928123474121094, -19.116832733154297, -17.305543899536133, -15.494253158569336, -13.682962417602539, -11.871671676635742, -10.060380935668945, -8.249091148376465, -6.437800407409668, -4.626509666442871, -2.815218925476074, -1.003928303718567, 0.8073623180389404, 2.618652820587158, 4.429943561553955, 6.241233825683594, 8.05252456665039, 9.863815307617188, 11.675106048583984, 13.486396789550781, 15.297687530517578, 17.108978271484375, 18.920269012451172, 20.73155975341797, 22.542850494384766, 24.354141235351562, 26.16543197631836, 27.976722717285156, 29.788013458251953, 31.59930419921875, 33.41059494018555, 35.221885681152344, 37.03317642211914, 38.84446716308594, 40.65575408935547, 42.467044830322266, 44.27833557128906, 46.08962631225586, 47.900917053222656, 49.71220779418945, 51.52349853515625, 53.33478927612305, 55.146080017089844, 56.95737075805664, 58.76866149902344, 60.579952239990234, 62.39124298095703, 64.20252990722656, 66.01382446289062, 67.82511138916016, 69.63640594482422]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 4.0, 10.0, 11.0, 12.0, 14.0, 22.0, 16.0, 21.0, 24.0, 23.0, 22.0, 26.0, 31.0, 38.0, 41.0, 37.0, 31.0, 33.0, 47.0, 30.0, 50.0, 28.0, 41.0, 50.0, 36.0, 38.0, 32.0, 31.0, 21.0, 20.0, 25.0, 17.0, 19.0, 11.0, 7.0, 18.0, 9.0, 6.0, 11.0, 6.0, 9.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-45.57964324951172, -44.09043502807617, -42.601226806640625, -41.11201858520508, -39.62281036376953, -38.133602142333984, -36.64439392089844, -35.15518569946289, -33.665977478027344, -32.1767692565918, -30.68756103515625, -29.198352813720703, -27.709144592285156, -26.21993637084961, -24.730728149414062, -23.241519927978516, -21.75231170654297, -20.263103485107422, -18.773895263671875, -17.284687042236328, -15.795478820800781, -14.306270599365234, -12.817062377929688, -11.32785415649414, -9.838645935058594, -8.349437713623047, -6.8602294921875, -5.371021270751953, -3.8818130493164062, -2.3926048278808594, -0.9033966064453125, 0.5858116149902344, 2.0750198364257812, 3.564228057861328, 5.053436279296875, 6.542644500732422, 8.031852722167969, 9.521060943603516, 11.010269165039062, 12.49947738647461, 13.988685607910156, 15.477893829345703, 16.96710205078125, 18.456310272216797, 19.945518493652344, 21.43472671508789, 22.923934936523438, 24.413143157958984, 25.90235137939453, 27.391559600830078, 28.880767822265625, 30.369976043701172, 31.85918426513672, 33.348392486572266, 34.83760070800781, 36.32680892944336, 37.816017150878906, 39.30522537231445, 40.79443359375, 42.28364181518555, 43.772850036621094, 45.26205825805664, 46.75126647949219, 48.240474700927734, 49.72968292236328]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 3.0, 9.0, 16.0, 22.0, 29.0, 45.0, 53.0, 84.0, 96.0, 172.0, 284.0, 414.0, 585.0, 897.0, 1299.0, 2154.0, 3219.0, 5348.0, 9672.0, 19459.0, 54626.0, 259882.0, 1364810.0, 1924529.0, 418698.0, 76868.0, 23226.0, 10986.0, 6048.0, 3631.0, 2318.0, 1558.0, 1061.0, 670.0, 467.0, 300.0, 232.0, 172.0, 103.0, 70.0, 46.0, 34.0, 27.0, 24.0, 11.0, 4.0, 13.0, 7.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-82.875, -80.3740234375, -77.873046875, -75.3720703125, -72.87109375, -70.3701171875, -67.869140625, -65.3681640625, -62.8671875, -60.3662109375, -57.865234375, -55.3642578125, -52.86328125, -50.3623046875, -47.861328125, -45.3603515625, -42.859375, -40.3583984375, -37.857421875, -35.3564453125, -32.85546875, -30.3544921875, -27.853515625, -25.3525390625, -22.8515625, -20.3505859375, -17.849609375, -15.3486328125, -12.84765625, -10.3466796875, -7.845703125, -5.3447265625, -2.84375, -0.3427734375, 2.158203125, 4.6591796875, 7.16015625, 9.6611328125, 12.162109375, 14.6630859375, 17.1640625, 19.6650390625, 22.166015625, 24.6669921875, 27.16796875, 29.6689453125, 32.169921875, 34.6708984375, 37.171875, 39.6728515625, 42.173828125, 44.6748046875, 47.17578125, 49.6767578125, 52.177734375, 54.6787109375, 57.1796875, 59.6806640625, 62.181640625, 64.6826171875, 67.18359375, 69.6845703125, 72.185546875, 74.6865234375, 77.1875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 5.0, 7.0, 5.0, 10.0, 13.0, 20.0, 14.0, 9.0, 23.0, 23.0, 18.0, 19.0, 18.0, 28.0, 46.0, 29.0, 32.0, 43.0, 31.0, 50.0, 46.0, 28.0, 41.0, 51.0, 40.0, 49.0, 32.0, 37.0, 29.0, 35.0, 26.0, 19.0, 20.0, 14.0, 14.0, 12.0, 7.0, 14.0, 7.0, 9.0, 7.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.71875, -36.4296875, -35.140625, -33.8515625, -32.5625, -31.2734375, -29.984375, -28.6953125, -27.40625, -26.1171875, -24.828125, -23.5390625, -22.25, -20.9609375, -19.671875, -18.3828125, -17.09375, -15.8046875, -14.515625, -13.2265625, -11.9375, -10.6484375, -9.359375, -8.0703125, -6.78125, -5.4921875, -4.203125, -2.9140625, -1.625, -0.3359375, 0.953125, 2.2421875, 3.53125, 4.8203125, 6.109375, 7.3984375, 8.6875, 9.9765625, 11.265625, 12.5546875, 13.84375, 15.1328125, 16.421875, 17.7109375, 19.0, 20.2890625, 21.578125, 22.8671875, 24.15625, 25.4453125, 26.734375, 28.0234375, 29.3125, 30.6015625, 31.890625, 33.1796875, 34.46875, 35.7578125, 37.046875, 38.3359375, 39.625, 40.9140625, 42.203125, 43.4921875, 44.78125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 10.0, 13.0, 13.0, 20.0, 32.0, 29.0, 53.0, 80.0, 109.0, 139.0, 247.0, 319.0, 528.0, 723.0, 1200.0, 1995.0, 3363.0, 5920.0, 11272.0, 23008.0, 53835.0, 158527.0, 787917.0, 2525035.0, 431163.0, 108627.0, 40480.0, 18090.0, 9063.0, 4876.0, 2872.0, 1669.0, 1021.0, 655.0, 425.0, 303.0, 197.0, 123.0, 104.0, 76.0, 31.0, 39.0, 21.0, 16.0, 9.0, 13.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-92.0, -88.9677734375, -85.935546875, -82.9033203125, -79.87109375, -76.8388671875, -73.806640625, -70.7744140625, -67.7421875, -64.7099609375, -61.677734375, -58.6455078125, -55.61328125, -52.5810546875, -49.548828125, -46.5166015625, -43.484375, -40.4521484375, -37.419921875, -34.3876953125, -31.35546875, -28.3232421875, -25.291015625, -22.2587890625, -19.2265625, -16.1943359375, -13.162109375, -10.1298828125, -7.09765625, -4.0654296875, -1.033203125, 1.9990234375, 5.03125, 8.0634765625, 11.095703125, 14.1279296875, 17.16015625, 20.1923828125, 23.224609375, 26.2568359375, 29.2890625, 32.3212890625, 35.353515625, 38.3857421875, 41.41796875, 44.4501953125, 47.482421875, 50.5146484375, 53.546875, 56.5791015625, 59.611328125, 62.6435546875, 65.67578125, 68.7080078125, 71.740234375, 74.7724609375, 77.8046875, 80.8369140625, 83.869140625, 86.9013671875, 89.93359375, 92.9658203125, 95.998046875, 99.0302734375, 102.0625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 6.0, 8.0, 13.0, 11.0, 13.0, 21.0, 32.0, 58.0, 50.0, 89.0, 111.0, 185.0, 293.0, 470.0, 688.0, 672.0, 457.0, 269.0, 161.0, 139.0, 81.0, 66.0, 48.0, 34.0, 19.0, 20.0, 10.0, 14.0, 7.0, 9.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.28125, -20.3935546875, -19.505859375, -18.6181640625, -17.73046875, -16.8427734375, -15.955078125, -15.0673828125, -14.1796875, -13.2919921875, -12.404296875, -11.5166015625, -10.62890625, -9.7412109375, -8.853515625, -7.9658203125, -7.078125, -6.1904296875, -5.302734375, -4.4150390625, -3.52734375, -2.6396484375, -1.751953125, -0.8642578125, 0.0234375, 0.9111328125, 1.798828125, 2.6865234375, 3.57421875, 4.4619140625, 5.349609375, 6.2373046875, 7.125, 8.0126953125, 8.900390625, 9.7880859375, 10.67578125, 11.5634765625, 12.451171875, 13.3388671875, 14.2265625, 15.1142578125, 16.001953125, 16.8896484375, 17.77734375, 18.6650390625, 19.552734375, 20.4404296875, 21.328125, 22.2158203125, 23.103515625, 23.9912109375, 24.87890625, 25.7666015625, 26.654296875, 27.5419921875, 28.4296875, 29.3173828125, 30.205078125, 31.0927734375, 31.98046875, 32.8681640625, 33.755859375, 34.6435546875, 35.53125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 6.0, 6.0, 4.0, 7.0, 4.0, 14.0, 12.0, 16.0, 24.0, 25.0, 35.0, 41.0, 49.0, 69.0, 82.0, 94.0, 82.0, 80.0, 70.0, 70.0, 34.0, 34.0, 44.0, 16.0, 11.0, 21.0, 12.0, 8.0, 9.0, 6.0, 8.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-54.37342071533203, -52.585872650146484, -50.7983283996582, -49.010780334472656, -47.223236083984375, -45.43568801879883, -43.64813995361328, -41.860595703125, -40.07304763793945, -38.285499572753906, -36.497955322265625, -34.71040725708008, -32.9228630065918, -31.13531494140625, -29.347768783569336, -27.560222625732422, -25.772676467895508, -23.985130310058594, -22.19758415222168, -20.410037994384766, -18.62248992919922, -16.834943771362305, -15.04739761352539, -13.25985050201416, -11.472304344177246, -9.684758186340332, -7.897211074829102, -6.1096649169921875, -4.322118282318115, -2.534571647644043, -0.7470254898071289, 1.0405216217041016, 2.8280677795410156, 4.615614414215088, 6.40316104888916, 8.190707206726074, 9.978254318237305, 11.765800476074219, 13.553346633911133, 15.340893745422363, 17.128440856933594, 18.915987014770508, 20.703533172607422, 22.49108123779297, 24.278627395629883, 26.066173553466797, 27.85371971130371, 29.641265869140625, 31.42881202697754, 33.21635818481445, 35.00390625, 36.79145050048828, 38.57899856567383, 40.366546630859375, 42.154090881347656, 43.9416389465332, 45.729183197021484, 47.51673126220703, 49.30427551269531, 51.09182357788086, 52.87936782836914, 54.66691589355469, 56.45446014404297, 58.242008209228516, 60.02955627441406]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 8.0, 3.0, 2.0, 5.0, 12.0, 16.0, 8.0, 12.0, 18.0, 14.0, 37.0, 30.0, 26.0, 28.0, 29.0, 38.0, 40.0, 39.0, 43.0, 44.0, 48.0, 53.0, 37.0, 50.0, 50.0, 32.0, 34.0, 29.0, 32.0, 23.0, 29.0, 26.0, 16.0, 20.0, 15.0, 11.0, 10.0, 13.0, 8.0, 6.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.65070724487305, -41.14067459106445, -39.630645751953125, -38.12061309814453, -36.6105842590332, -35.10055160522461, -33.59052276611328, -32.08049011230469, -30.570457458496094, -29.060426712036133, -27.550395965576172, -26.040363311767578, -24.530332565307617, -23.020301818847656, -21.510271072387695, -20.000240325927734, -18.490209579467773, -16.980178833007812, -15.470147132873535, -13.960116386413574, -12.450084686279297, -10.940053939819336, -9.430023193359375, -7.919991493225098, -6.409960746765137, -4.899929523468018, -3.3898985385894775, -1.8798675537109375, -0.36983633041381836, 1.1401948928833008, 2.6502256393432617, 4.160257339477539, 5.6702880859375, 7.180319309234619, 8.690350532531738, 10.2003812789917, 11.710412979125977, 13.220443725585938, 14.730474472045898, 16.24050521850586, 17.750537872314453, 19.260568618774414, 20.770599365234375, 22.28063201904297, 23.79066276550293, 25.30069351196289, 26.81072425842285, 28.320755004882812, 29.830785751342773, 31.340816497802734, 32.85084915161133, 34.360877990722656, 35.87091064453125, 37.380943298339844, 38.89097213745117, 40.401004791259766, 41.911033630371094, 43.42106628417969, 44.931095123291016, 46.44112777709961, 47.95115661621094, 49.46118927001953, 50.971221923828125, 52.48125076293945, 53.99128341674805]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 7.0, 9.0, 7.0, 27.0, 28.0, 54.0, 66.0, 72.0, 134.0, 194.0, 286.0, 390.0, 541.0, 725.0, 1064.0, 1450.0, 2105.0, 3069.0, 4193.0, 5958.0, 8662.0, 12837.0, 19312.0, 29646.0, 46993.0, 77466.0, 132686.0, 215853.0, 187610.0, 111730.0, 65657.0, 40066.0, 25483.0, 16950.0, 11420.0, 7660.0, 5381.0, 3735.0, 2707.0, 1896.0, 1288.0, 893.0, 708.0, 459.0, 340.0, 217.0, 163.0, 124.0, 83.0, 54.0, 41.0, 28.0, 11.0, 11.0, 7.0, 5.0, 3.0, 3.0, 0.0, 2.0], "bins": [-18.25, -17.6767578125, -17.103515625, -16.5302734375, -15.95703125, -15.3837890625, -14.810546875, -14.2373046875, -13.6640625, -13.0908203125, -12.517578125, -11.9443359375, -11.37109375, -10.7978515625, -10.224609375, -9.6513671875, -9.078125, -8.5048828125, -7.931640625, -7.3583984375, -6.78515625, -6.2119140625, -5.638671875, -5.0654296875, -4.4921875, -3.9189453125, -3.345703125, -2.7724609375, -2.19921875, -1.6259765625, -1.052734375, -0.4794921875, 0.09375, 0.6669921875, 1.240234375, 1.8134765625, 2.38671875, 2.9599609375, 3.533203125, 4.1064453125, 4.6796875, 5.2529296875, 5.826171875, 6.3994140625, 6.97265625, 7.5458984375, 8.119140625, 8.6923828125, 9.265625, 9.8388671875, 10.412109375, 10.9853515625, 11.55859375, 12.1318359375, 12.705078125, 13.2783203125, 13.8515625, 14.4248046875, 14.998046875, 15.5712890625, 16.14453125, 16.7177734375, 17.291015625, 17.8642578125, 18.4375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 4.0, 4.0, 4.0, 9.0, 4.0, 14.0, 18.0, 13.0, 10.0, 21.0, 25.0, 29.0, 26.0, 23.0, 28.0, 43.0, 36.0, 46.0, 52.0, 39.0, 46.0, 44.0, 42.0, 48.0, 45.0, 34.0, 30.0, 31.0, 29.0, 23.0, 29.0, 28.0, 21.0, 19.0, 9.0, 22.0, 7.0, 10.0, 7.0, 10.0, 2.0, 7.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.8125, -40.3369140625, -38.861328125, -37.3857421875, -35.91015625, -34.4345703125, -32.958984375, -31.4833984375, -30.0078125, -28.5322265625, -27.056640625, -25.5810546875, -24.10546875, -22.6298828125, -21.154296875, -19.6787109375, -18.203125, -16.7275390625, -15.251953125, -13.7763671875, -12.30078125, -10.8251953125, -9.349609375, -7.8740234375, -6.3984375, -4.9228515625, -3.447265625, -1.9716796875, -0.49609375, 0.9794921875, 2.455078125, 3.9306640625, 5.40625, 6.8818359375, 8.357421875, 9.8330078125, 11.30859375, 12.7841796875, 14.259765625, 15.7353515625, 17.2109375, 18.6865234375, 20.162109375, 21.6376953125, 23.11328125, 24.5888671875, 26.064453125, 27.5400390625, 29.015625, 30.4912109375, 31.966796875, 33.4423828125, 34.91796875, 36.3935546875, 37.869140625, 39.3447265625, 40.8203125, 42.2958984375, 43.771484375, 45.2470703125, 46.72265625, 48.1982421875, 49.673828125, 51.1494140625, 52.625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 7.0, 8.0, 13.0, 18.0, 34.0, 25.0, 44.0, 60.0, 82.0, 112.0, 154.0, 222.0, 313.0, 436.0, 663.0, 952.0, 1460.0, 2140.0, 3464.0, 5492.0, 9665.0, 19171.0, 60702.0, 760320.0, 127792.0, 25056.0, 11909.0, 6716.0, 4035.0, 2507.0, 1568.0, 1069.0, 688.0, 492.0, 343.0, 234.0, 161.0, 121.0, 101.0, 51.0, 52.0, 30.0, 22.0, 15.0, 11.0, 5.0, 14.0, 3.0, 3.0, 0.0, 2.0, 2.0], "bins": [-42.5, -41.30810546875, -40.1162109375, -38.92431640625, -37.732421875, -36.54052734375, -35.3486328125, -34.15673828125, -32.96484375, -31.77294921875, -30.5810546875, -29.38916015625, -28.197265625, -27.00537109375, -25.8134765625, -24.62158203125, -23.4296875, -22.23779296875, -21.0458984375, -19.85400390625, -18.662109375, -17.47021484375, -16.2783203125, -15.08642578125, -13.89453125, -12.70263671875, -11.5107421875, -10.31884765625, -9.126953125, -7.93505859375, -6.7431640625, -5.55126953125, -4.359375, -3.16748046875, -1.9755859375, -0.78369140625, 0.408203125, 1.60009765625, 2.7919921875, 3.98388671875, 5.17578125, 6.36767578125, 7.5595703125, 8.75146484375, 9.943359375, 11.13525390625, 12.3271484375, 13.51904296875, 14.7109375, 15.90283203125, 17.0947265625, 18.28662109375, 19.478515625, 20.67041015625, 21.8623046875, 23.05419921875, 24.24609375, 25.43798828125, 26.6298828125, 27.82177734375, 29.013671875, 30.20556640625, 31.3974609375, 32.58935546875, 33.78125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 11.0, 11.0, 10.0, 10.0, 13.0, 13.0, 20.0, 23.0, 23.0, 23.0, 24.0, 25.0, 33.0, 27.0, 47.0, 38.0, 45.0, 42.0, 34.0, 38.0, 46.0, 39.0, 36.0, 41.0, 46.0, 27.0, 46.0, 26.0, 35.0, 20.0, 15.0, 18.0, 15.0, 10.0, 13.0, 3.0, 5.0, 9.0, 10.0, 8.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-30.484375, -29.447021484375, -28.40966796875, -27.372314453125, -26.3349609375, -25.297607421875, -24.26025390625, -23.222900390625, -22.185546875, -21.148193359375, -20.11083984375, -19.073486328125, -18.0361328125, -16.998779296875, -15.96142578125, -14.924072265625, -13.88671875, -12.849365234375, -11.81201171875, -10.774658203125, -9.7373046875, -8.699951171875, -7.66259765625, -6.625244140625, -5.587890625, -4.550537109375, -3.51318359375, -2.475830078125, -1.4384765625, -0.401123046875, 0.63623046875, 1.673583984375, 2.7109375, 3.748291015625, 4.78564453125, 5.822998046875, 6.8603515625, 7.897705078125, 8.93505859375, 9.972412109375, 11.009765625, 12.047119140625, 13.08447265625, 14.121826171875, 15.1591796875, 16.196533203125, 17.23388671875, 18.271240234375, 19.30859375, 20.345947265625, 21.38330078125, 22.420654296875, 23.4580078125, 24.495361328125, 25.53271484375, 26.570068359375, 27.607421875, 28.644775390625, 29.68212890625, 30.719482421875, 31.7568359375, 32.794189453125, 33.83154296875, 34.868896484375, 35.90625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 8.0, 9.0, 21.0, 34.0, 45.0, 88.0, 178.0, 330.0, 596.0, 1518.0, 4573.0, 21986.0, 929529.0, 76471.0, 8848.0, 2417.0, 1007.0, 403.0, 204.0, 98.0, 59.0, 48.0, 27.0, 13.0, 8.0, 8.0, 7.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1796875, -6.9208984375, -6.662109375, -6.4033203125, -6.14453125, -5.8857421875, -5.626953125, -5.3681640625, -5.109375, -4.8505859375, -4.591796875, -4.3330078125, -4.07421875, -3.8154296875, -3.556640625, -3.2978515625, -3.0390625, -2.7802734375, -2.521484375, -2.2626953125, -2.00390625, -1.7451171875, -1.486328125, -1.2275390625, -0.96875, -0.7099609375, -0.451171875, -0.1923828125, 0.06640625, 0.3251953125, 0.583984375, 0.8427734375, 1.1015625, 1.3603515625, 1.619140625, 1.8779296875, 2.13671875, 2.3955078125, 2.654296875, 2.9130859375, 3.171875, 3.4306640625, 3.689453125, 3.9482421875, 4.20703125, 4.4658203125, 4.724609375, 4.9833984375, 5.2421875, 5.5009765625, 5.759765625, 6.0185546875, 6.27734375, 6.5361328125, 6.794921875, 7.0537109375, 7.3125, 7.5712890625, 7.830078125, 8.0888671875, 8.34765625, 8.6064453125, 8.865234375, 9.1240234375, 9.3828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 10.0, 11.0, 25.0, 27.0, 36.0, 59.0, 77.0, 140.0, 147.0, 148.0, 89.0, 62.0, 44.0, 34.0, 17.0, 13.0, 11.0, 7.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000743865966796875, -0.0007168799638748169, -0.0006898939609527588, -0.0006629079580307007, -0.0006359219551086426, -0.0006089359521865845, -0.0005819499492645264, -0.0005549639463424683, -0.0005279779434204102, -0.000500991940498352, -0.00047400593757629395, -0.00044701993465423584, -0.00042003393173217773, -0.00039304792881011963, -0.0003660619258880615, -0.0003390759229660034, -0.0003120899200439453, -0.0002851039171218872, -0.0002581179141998291, -0.000231131911277771, -0.0002041459083557129, -0.00017715990543365479, -0.00015017390251159668, -0.00012318789958953857, -9.620189666748047e-05, -6.921589374542236e-05, -4.222989082336426e-05, -1.5243887901306152e-05, 1.1742115020751953e-05, 3.872811794281006e-05, 6.571412086486816e-05, 9.270012378692627e-05, 0.00011968612670898438, 0.00014667212963104248, 0.00017365813255310059, 0.0002006441354751587, 0.0002276301383972168, 0.0002546161413192749, 0.000281602144241333, 0.0003085881471633911, 0.0003355741500854492, 0.0003625601530075073, 0.00038954615592956543, 0.00041653215885162354, 0.00044351816177368164, 0.00047050416469573975, 0.0004974901676177979, 0.000524476170539856, 0.0005514621734619141, 0.0005784481763839722, 0.0006054341793060303, 0.0006324201822280884, 0.0006594061851501465, 0.0006863921880722046, 0.0007133781909942627, 0.0007403641939163208, 0.0007673501968383789, 0.000794336199760437, 0.0008213222026824951, 0.0008483082056045532, 0.0008752942085266113, 0.0009022802114486694, 0.0009292662143707275, 0.0009562522172927856, 0.0009832382202148438]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 9.0, 8.0, 11.0, 8.0, 22.0, 18.0, 36.0, 50.0, 55.0, 99.0, 144.0, 166.0, 258.0, 386.0, 587.0, 912.0, 1456.0, 2508.0, 4546.0, 9346.0, 22490.0, 69919.0, 330441.0, 457919.0, 95073.0, 28121.0, 11159.0, 5315.0, 2871.0, 1615.0, 1047.0, 636.0, 410.0, 275.0, 167.0, 136.0, 97.0, 69.0, 51.0, 27.0, 24.0, 18.0, 11.0, 15.0, 12.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.15625, -5.9583740234375, -5.760498046875, -5.5626220703125, -5.36474609375, -5.1668701171875, -4.968994140625, -4.7711181640625, -4.5732421875, -4.3753662109375, -4.177490234375, -3.9796142578125, -3.78173828125, -3.5838623046875, -3.385986328125, -3.1881103515625, -2.990234375, -2.7923583984375, -2.594482421875, -2.3966064453125, -2.19873046875, -2.0008544921875, -1.802978515625, -1.6051025390625, -1.4072265625, -1.2093505859375, -1.011474609375, -0.8135986328125, -0.61572265625, -0.4178466796875, -0.219970703125, -0.0220947265625, 0.17578125, 0.3736572265625, 0.571533203125, 0.7694091796875, 0.96728515625, 1.1651611328125, 1.363037109375, 1.5609130859375, 1.7587890625, 1.9566650390625, 2.154541015625, 2.3524169921875, 2.55029296875, 2.7481689453125, 2.946044921875, 3.1439208984375, 3.341796875, 3.5396728515625, 3.737548828125, 3.9354248046875, 4.13330078125, 4.3311767578125, 4.529052734375, 4.7269287109375, 4.9248046875, 5.1226806640625, 5.320556640625, 5.5184326171875, 5.71630859375, 5.9141845703125, 6.112060546875, 6.3099365234375, 6.5078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 2.0, 9.0, 5.0, 11.0, 17.0, 25.0, 36.0, 53.0, 95.0, 116.0, 174.0, 144.0, 114.0, 52.0, 38.0, 20.0, 20.0, 19.0, 7.0, 9.0, 6.0, 6.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6865234375, -1.629425048828125, -1.57232666015625, -1.515228271484375, -1.4581298828125, -1.401031494140625, -1.34393310546875, -1.286834716796875, -1.229736328125, -1.172637939453125, -1.11553955078125, -1.058441162109375, -1.0013427734375, -0.944244384765625, -0.88714599609375, -0.830047607421875, -0.77294921875, -0.715850830078125, -0.65875244140625, -0.601654052734375, -0.5445556640625, -0.487457275390625, -0.43035888671875, -0.373260498046875, -0.316162109375, -0.259063720703125, -0.20196533203125, -0.144866943359375, -0.0877685546875, -0.030670166015625, 0.02642822265625, 0.083526611328125, 0.140625, 0.197723388671875, 0.25482177734375, 0.311920166015625, 0.3690185546875, 0.426116943359375, 0.48321533203125, 0.540313720703125, 0.597412109375, 0.654510498046875, 0.71160888671875, 0.768707275390625, 0.8258056640625, 0.882904052734375, 0.94000244140625, 0.997100830078125, 1.05419921875, 1.111297607421875, 1.16839599609375, 1.225494384765625, 1.2825927734375, 1.339691162109375, 1.39678955078125, 1.453887939453125, 1.510986328125, 1.568084716796875, 1.62518310546875, 1.682281494140625, 1.7393798828125, 1.796478271484375, 1.85357666015625, 1.910675048828125, 1.9677734375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 1.0, 7.0, 3.0, 8.0, 11.0, 10.0, 7.0, 21.0, 19.0, 23.0, 43.0, 41.0, 61.0, 58.0, 84.0, 90.0, 85.0, 77.0, 77.0, 58.0, 40.0, 41.0, 33.0, 21.0, 17.0, 10.0, 11.0, 10.0, 10.0, 8.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.22563552856445, -45.49348449707031, -43.76133346557617, -42.02918243408203, -40.297035217285156, -38.564884185791016, -36.832733154296875, -35.100582122802734, -33.368431091308594, -31.636280059814453, -29.904130935668945, -28.171979904174805, -26.439828872680664, -24.707679748535156, -22.975528717041016, -21.243377685546875, -19.511228561401367, -17.779077529907227, -16.04692840576172, -14.314777374267578, -12.582626342773438, -10.850476264953613, -9.118326187133789, -7.386175155639648, -5.654025077819824, -3.921874523162842, -2.1897242069244385, -0.45757389068603516, 1.2745766639709473, 3.0067272186279297, 4.738877296447754, 6.4710283279418945, 8.203178405761719, 9.935328483581543, 11.667479515075684, 13.399629592895508, 15.131780624389648, 16.863929748535156, 18.596080780029297, 20.328231811523438, 22.060382843017578, 23.79253387451172, 25.524682998657227, 27.256834030151367, 28.988985061645508, 30.721134185791016, 32.453285217285156, 34.1854362487793, 35.91758728027344, 37.64973831176758, 39.38188934326172, 41.114036560058594, 42.846187591552734, 44.578338623046875, 46.310489654541016, 48.042640686035156, 49.77478790283203, 51.50693893432617, 53.23908996582031, 54.97123718261719, 56.70338821411133, 58.43553924560547, 60.16769027709961, 61.89984130859375, 63.63199234008789]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 7.0, 5.0, 2.0, 4.0, 10.0, 17.0, 8.0, 12.0, 16.0, 13.0, 39.0, 28.0, 32.0, 25.0, 28.0, 36.0, 41.0, 42.0, 42.0, 46.0, 47.0, 50.0, 39.0, 51.0, 47.0, 33.0, 36.0, 29.0, 33.0, 24.0, 26.0, 26.0, 21.0, 19.0, 14.0, 9.0, 12.0, 11.0, 8.0, 6.0, 7.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.657379150390625, -40.182823181152344, -38.70826721191406, -37.23371505737305, -35.759159088134766, -34.284603118896484, -32.81005096435547, -31.335494995117188, -29.860939025878906, -28.386383056640625, -26.911828994750977, -25.437274932861328, -23.962718963623047, -22.488162994384766, -21.013608932495117, -19.53905487060547, -18.064498901367188, -16.589942932128906, -15.115388870239258, -13.640833854675293, -12.166278839111328, -10.691723823547363, -9.217168807983398, -7.742613792419434, -6.268058776855469, -4.793503761291504, -3.318948745727539, -1.8443937301635742, -0.3698387145996094, 1.1047163009643555, 2.5792713165283203, 4.053826332092285, 5.528385162353516, 7.0029401779174805, 8.477495193481445, 9.95205020904541, 11.426605224609375, 12.90116024017334, 14.375715255737305, 15.85027027130127, 17.324825286865234, 18.799381256103516, 20.273935317993164, 21.748489379882812, 23.223045349121094, 24.697601318359375, 26.172155380249023, 27.646709442138672, 29.121265411376953, 30.595821380615234, 32.07037353515625, 33.54492950439453, 35.01948547363281, 36.494041442871094, 37.968597412109375, 39.44314956665039, 40.91770553588867, 42.39226150512695, 43.86681365966797, 45.34136962890625, 46.81592559814453, 48.29048156738281, 49.765037536621094, 51.23958969116211, 52.71414566040039]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 12.0, 16.0, 34.0, 19.0, 38.0, 64.0, 96.0, 150.0, 211.0, 330.0, 438.0, 719.0, 1004.0, 1617.0, 2487.0, 3842.0, 5950.0, 9954.0, 16658.0, 28735.0, 53169.0, 105241.0, 218391.0, 282525.0, 149215.0, 73524.0, 38526.0, 21692.0, 12624.0, 7650.0, 4796.0, 3107.0, 1872.0, 1276.0, 822.0, 568.0, 368.0, 263.0, 175.0, 113.0, 88.0, 54.0, 35.0, 28.0, 21.0, 16.0, 3.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-56.0, -54.20751953125, -52.4150390625, -50.62255859375, -48.830078125, -47.03759765625, -45.2451171875, -43.45263671875, -41.66015625, -39.86767578125, -38.0751953125, -36.28271484375, -34.490234375, -32.69775390625, -30.9052734375, -29.11279296875, -27.3203125, -25.52783203125, -23.7353515625, -21.94287109375, -20.150390625, -18.35791015625, -16.5654296875, -14.77294921875, -12.98046875, -11.18798828125, -9.3955078125, -7.60302734375, -5.810546875, -4.01806640625, -2.2255859375, -0.43310546875, 1.359375, 3.15185546875, 4.9443359375, 6.73681640625, 8.529296875, 10.32177734375, 12.1142578125, 13.90673828125, 15.69921875, 17.49169921875, 19.2841796875, 21.07666015625, 22.869140625, 24.66162109375, 26.4541015625, 28.24658203125, 30.0390625, 31.83154296875, 33.6240234375, 35.41650390625, 37.208984375, 39.00146484375, 40.7939453125, 42.58642578125, 44.37890625, 46.17138671875, 47.9638671875, 49.75634765625, 51.548828125, 53.34130859375, 55.1337890625, 56.92626953125, 58.71875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 3.0, 7.0, 13.0, 7.0, 10.0, 14.0, 18.0, 27.0, 30.0, 24.0, 24.0, 32.0, 36.0, 40.0, 49.0, 45.0, 54.0, 53.0, 48.0, 55.0, 61.0, 50.0, 38.0, 31.0, 33.0, 26.0, 29.0, 25.0, 23.0, 19.0, 16.0, 11.0, 8.0, 10.0, 8.0, 7.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.03125, -42.470703125, -40.91015625, -39.349609375, -37.7890625, -36.228515625, -34.66796875, -33.107421875, -31.546875, -29.986328125, -28.42578125, -26.865234375, -25.3046875, -23.744140625, -22.18359375, -20.623046875, -19.0625, -17.501953125, -15.94140625, -14.380859375, -12.8203125, -11.259765625, -9.69921875, -8.138671875, -6.578125, -5.017578125, -3.45703125, -1.896484375, -0.3359375, 1.224609375, 2.78515625, 4.345703125, 5.90625, 7.466796875, 9.02734375, 10.587890625, 12.1484375, 13.708984375, 15.26953125, 16.830078125, 18.390625, 19.951171875, 21.51171875, 23.072265625, 24.6328125, 26.193359375, 27.75390625, 29.314453125, 30.875, 32.435546875, 33.99609375, 35.556640625, 37.1171875, 38.677734375, 40.23828125, 41.798828125, 43.359375, 44.919921875, 46.48046875, 48.041015625, 49.6015625, 51.162109375, 52.72265625, 54.283203125, 55.84375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 5.0, 5.0, 9.0, 15.0, 20.0, 23.0, 36.0, 70.0, 87.0, 149.0, 235.0, 352.0, 532.0, 740.0, 1168.0, 1754.0, 2792.0, 4189.0, 6369.0, 10309.0, 16229.0, 26510.0, 44146.0, 77424.0, 140489.0, 235193.0, 204504.0, 114224.0, 63065.0, 37174.0, 22100.0, 13894.0, 8586.0, 5684.0, 3523.0, 2368.0, 1614.0, 966.0, 673.0, 476.0, 291.0, 207.0, 115.0, 94.0, 59.0, 34.0, 23.0, 23.0, 5.0, 8.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-58.90625, -57.21484375, -55.5234375, -53.83203125, -52.140625, -50.44921875, -48.7578125, -47.06640625, -45.375, -43.68359375, -41.9921875, -40.30078125, -38.609375, -36.91796875, -35.2265625, -33.53515625, -31.84375, -30.15234375, -28.4609375, -26.76953125, -25.078125, -23.38671875, -21.6953125, -20.00390625, -18.3125, -16.62109375, -14.9296875, -13.23828125, -11.546875, -9.85546875, -8.1640625, -6.47265625, -4.78125, -3.08984375, -1.3984375, 0.29296875, 1.984375, 3.67578125, 5.3671875, 7.05859375, 8.75, 10.44140625, 12.1328125, 13.82421875, 15.515625, 17.20703125, 18.8984375, 20.58984375, 22.28125, 23.97265625, 25.6640625, 27.35546875, 29.046875, 30.73828125, 32.4296875, 34.12109375, 35.8125, 37.50390625, 39.1953125, 40.88671875, 42.578125, 44.26953125, 45.9609375, 47.65234375, 49.34375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 13.0, 11.0, 12.0, 10.0, 13.0, 18.0, 19.0, 29.0, 25.0, 22.0, 27.0, 30.0, 40.0, 30.0, 39.0, 23.0, 36.0, 45.0, 39.0, 53.0, 41.0, 38.0, 43.0, 37.0, 35.0, 32.0, 28.0, 26.0, 16.0, 24.0, 19.0, 20.0, 16.0, 10.0, 13.0, 4.0, 11.0, 8.0, 8.0, 7.0, 5.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-28.484375, -27.630126953125, -26.77587890625, -25.921630859375, -25.0673828125, -24.213134765625, -23.35888671875, -22.504638671875, -21.650390625, -20.796142578125, -19.94189453125, -19.087646484375, -18.2333984375, -17.379150390625, -16.52490234375, -15.670654296875, -14.81640625, -13.962158203125, -13.10791015625, -12.253662109375, -11.3994140625, -10.545166015625, -9.69091796875, -8.836669921875, -7.982421875, -7.128173828125, -6.27392578125, -5.419677734375, -4.5654296875, -3.711181640625, -2.85693359375, -2.002685546875, -1.1484375, -0.294189453125, 0.56005859375, 1.414306640625, 2.2685546875, 3.122802734375, 3.97705078125, 4.831298828125, 5.685546875, 6.539794921875, 7.39404296875, 8.248291015625, 9.1025390625, 9.956787109375, 10.81103515625, 11.665283203125, 12.51953125, 13.373779296875, 14.22802734375, 15.082275390625, 15.9365234375, 16.790771484375, 17.64501953125, 18.499267578125, 19.353515625, 20.207763671875, 21.06201171875, 21.916259765625, 22.7705078125, 23.624755859375, 24.47900390625, 25.333251953125, 26.1875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 1.0, 6.0, 12.0, 20.0, 23.0, 28.0, 48.0, 70.0, 100.0, 165.0, 248.0, 440.0, 731.0, 1199.0, 2183.0, 4312.0, 9951.0, 25476.0, 80189.0, 315661.0, 434965.0, 113867.0, 34590.0, 12793.0, 5330.0, 2576.0, 1432.0, 817.0, 493.0, 287.0, 185.0, 124.0, 59.0, 49.0, 51.0, 17.0, 18.0, 14.0, 12.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.0625, -38.77587890625, -37.4892578125, -36.20263671875, -34.916015625, -33.62939453125, -32.3427734375, -31.05615234375, -29.76953125, -28.48291015625, -27.1962890625, -25.90966796875, -24.623046875, -23.33642578125, -22.0498046875, -20.76318359375, -19.4765625, -18.18994140625, -16.9033203125, -15.61669921875, -14.330078125, -13.04345703125, -11.7568359375, -10.47021484375, -9.18359375, -7.89697265625, -6.6103515625, -5.32373046875, -4.037109375, -2.75048828125, -1.4638671875, -0.17724609375, 1.109375, 2.39599609375, 3.6826171875, 4.96923828125, 6.255859375, 7.54248046875, 8.8291015625, 10.11572265625, 11.40234375, 12.68896484375, 13.9755859375, 15.26220703125, 16.548828125, 17.83544921875, 19.1220703125, 20.40869140625, 21.6953125, 22.98193359375, 24.2685546875, 25.55517578125, 26.841796875, 28.12841796875, 29.4150390625, 30.70166015625, 31.98828125, 33.27490234375, 34.5615234375, 35.84814453125, 37.134765625, 38.42138671875, 39.7080078125, 40.99462890625, 42.28125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 2.0, 9.0, 7.0, 17.0, 18.0, 29.0, 37.0, 79.0, 141.0, 179.0, 169.0, 107.0, 76.0, 43.0, 27.0, 24.0, 16.0, 6.0, 5.0, 2.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028438568115234375, -0.0027130544185638428, -0.002582252025604248, -0.0024514496326446533, -0.0023206472396850586, -0.002189844846725464, -0.002059042453765869, -0.0019282400608062744, -0.0017974376678466797, -0.001666635274887085, -0.0015358328819274902, -0.0014050304889678955, -0.0012742280960083008, -0.001143425703048706, -0.0010126233100891113, -0.0008818209171295166, -0.0007510185241699219, -0.0006202161312103271, -0.0004894137382507324, -0.0003586113452911377, -0.00022780895233154297, -9.700655937194824e-05, 3.3795833587646484e-05, 0.0001645982265472412, 0.00029540061950683594, 0.00042620301246643066, 0.0005570054054260254, 0.0006878077983856201, 0.0008186101913452148, 0.0009494125843048096, 0.0010802149772644043, 0.001211017370223999, 0.0013418197631835938, 0.0014726221561431885, 0.0016034245491027832, 0.001734226942062378, 0.0018650293350219727, 0.0019958317279815674, 0.002126634120941162, 0.002257436513900757, 0.0023882389068603516, 0.0025190412998199463, 0.002649843692779541, 0.0027806460857391357, 0.0029114484786987305, 0.003042250871658325, 0.00317305326461792, 0.0033038556575775146, 0.0034346580505371094, 0.003565460443496704, 0.003696262836456299, 0.0038270652294158936, 0.003957867622375488, 0.004088670015335083, 0.004219472408294678, 0.0043502748012542725, 0.004481077194213867, 0.004611879587173462, 0.004742681980133057, 0.004873484373092651, 0.005004286766052246, 0.005135089159011841, 0.0052658915519714355, 0.00539669394493103, 0.005527496337890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 6.0, 4.0, 16.0, 11.0, 25.0, 21.0, 26.0, 45.0, 77.0, 93.0, 142.0, 217.0, 308.0, 467.0, 776.0, 1194.0, 2061.0, 3830.0, 7562.0, 16503.0, 40236.0, 112003.0, 328009.0, 341590.0, 116624.0, 42287.0, 17161.0, 7786.0, 3994.0, 2010.0, 1251.0, 735.0, 502.0, 285.0, 188.0, 151.0, 95.0, 81.0, 41.0, 43.0, 25.0, 23.0, 13.0, 15.0, 9.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.328125, -27.384521484375, -26.44091796875, -25.497314453125, -24.5537109375, -23.610107421875, -22.66650390625, -21.722900390625, -20.779296875, -19.835693359375, -18.89208984375, -17.948486328125, -17.0048828125, -16.061279296875, -15.11767578125, -14.174072265625, -13.23046875, -12.286865234375, -11.34326171875, -10.399658203125, -9.4560546875, -8.512451171875, -7.56884765625, -6.625244140625, -5.681640625, -4.738037109375, -3.79443359375, -2.850830078125, -1.9072265625, -0.963623046875, -0.02001953125, 0.923583984375, 1.8671875, 2.810791015625, 3.75439453125, 4.697998046875, 5.6416015625, 6.585205078125, 7.52880859375, 8.472412109375, 9.416015625, 10.359619140625, 11.30322265625, 12.246826171875, 13.1904296875, 14.134033203125, 15.07763671875, 16.021240234375, 16.96484375, 17.908447265625, 18.85205078125, 19.795654296875, 20.7392578125, 21.682861328125, 22.62646484375, 23.570068359375, 24.513671875, 25.457275390625, 26.40087890625, 27.344482421875, 28.2880859375, 29.231689453125, 30.17529296875, 31.118896484375, 32.0625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 6.0, 4.0, 8.0, 13.0, 9.0, 11.0, 22.0, 23.0, 30.0, 50.0, 50.0, 69.0, 62.0, 74.0, 83.0, 85.0, 73.0, 62.0, 51.0, 40.0, 38.0, 33.0, 25.0, 15.0, 19.0, 12.0, 4.0, 14.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.890625, -7.650634765625, -7.41064453125, -7.170654296875, -6.9306640625, -6.690673828125, -6.45068359375, -6.210693359375, -5.970703125, -5.730712890625, -5.49072265625, -5.250732421875, -5.0107421875, -4.770751953125, -4.53076171875, -4.290771484375, -4.05078125, -3.810791015625, -3.57080078125, -3.330810546875, -3.0908203125, -2.850830078125, -2.61083984375, -2.370849609375, -2.130859375, -1.890869140625, -1.65087890625, -1.410888671875, -1.1708984375, -0.930908203125, -0.69091796875, -0.450927734375, -0.2109375, 0.029052734375, 0.26904296875, 0.509033203125, 0.7490234375, 0.989013671875, 1.22900390625, 1.468994140625, 1.708984375, 1.948974609375, 2.18896484375, 2.428955078125, 2.6689453125, 2.908935546875, 3.14892578125, 3.388916015625, 3.62890625, 3.868896484375, 4.10888671875, 4.348876953125, 4.5888671875, 4.828857421875, 5.06884765625, 5.308837890625, 5.548828125, 5.788818359375, 6.02880859375, 6.268798828125, 6.5087890625, 6.748779296875, 6.98876953125, 7.228759765625, 7.46875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 7.0, 3.0, 7.0, 14.0, 15.0, 23.0, 23.0, 21.0, 36.0, 52.0, 49.0, 77.0, 66.0, 86.0, 96.0, 74.0, 77.0, 45.0, 48.0, 37.0, 38.0, 27.0, 21.0, 8.0, 11.0, 7.0, 8.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-48.10462951660156, -46.39650344848633, -44.688377380371094, -42.98025131225586, -41.272125244140625, -39.56399917602539, -37.855873107910156, -36.14774703979492, -34.43962097167969, -32.73149490356445, -31.02336883544922, -29.315242767333984, -27.60711669921875, -25.898990631103516, -24.19086456298828, -22.482738494873047, -20.774612426757812, -19.066486358642578, -17.358360290527344, -15.65023422241211, -13.942108154296875, -12.23398208618164, -10.525856018066406, -8.817729949951172, -7.1096038818359375, -5.401477813720703, -3.6933517456054688, -1.9852256774902344, -0.277099609375, 1.4310264587402344, 3.1391525268554688, 4.847278594970703, 6.555408477783203, 8.263534545898438, 9.971660614013672, 11.679786682128906, 13.38791275024414, 15.096038818359375, 16.80416488647461, 18.512290954589844, 20.220417022705078, 21.928543090820312, 23.636669158935547, 25.34479522705078, 27.052921295166016, 28.76104736328125, 30.469173431396484, 32.17729949951172, 33.88542556762695, 35.59355163574219, 37.30167770385742, 39.009803771972656, 40.71792984008789, 42.426055908203125, 44.13418197631836, 45.842308044433594, 47.55043411254883, 49.25856018066406, 50.9666862487793, 52.67481231689453, 54.382938385009766, 56.091064453125, 57.799190521240234, 59.50731658935547, 61.2154426574707]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 8.0, 7.0, 11.0, 11.0, 12.0, 10.0, 22.0, 21.0, 23.0, 39.0, 38.0, 41.0, 42.0, 42.0, 56.0, 44.0, 47.0, 48.0, 36.0, 52.0, 41.0, 43.0, 40.0, 40.0, 39.0, 24.0, 34.0, 19.0, 20.0, 24.0, 14.0, 11.0, 13.0, 11.0, 4.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.30747604370117, -44.63785934448242, -42.968238830566406, -41.298622131347656, -39.629005432128906, -37.959388732910156, -36.289772033691406, -34.62015151977539, -32.95053482055664, -31.28091812133789, -29.611299514770508, -27.941680908203125, -26.272064208984375, -24.602447509765625, -22.932828903198242, -21.26321029663086, -19.59359359741211, -17.92397689819336, -16.254358291625977, -14.58474063873291, -12.915122985839844, -11.245505332946777, -9.575887680053711, -7.9062700271606445, -6.236652374267578, -4.567034721374512, -2.8974170684814453, -1.227799415588379, 0.4418182373046875, 2.111435890197754, 3.7810535430908203, 5.450671195983887, 7.120288848876953, 8.78990650177002, 10.459524154663086, 12.129141807556152, 13.798759460449219, 15.468377113342285, 17.13799476623535, 18.807613372802734, 20.477230072021484, 22.146846771240234, 23.816465377807617, 25.486083984375, 27.15570068359375, 28.8253173828125, 30.494935989379883, 32.164554595947266, 33.834171295166016, 35.503787994384766, 37.17340850830078, 38.84302520751953, 40.51264190673828, 42.18225860595703, 43.85187530517578, 45.5214958190918, 47.19111251831055, 48.8607292175293, 50.53034973144531, 52.19996643066406, 53.86958312988281, 55.53919982910156, 57.20881652832031, 58.87843704223633, 60.54805374145508]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [3.0, 4.0, 8.0, 9.0, 16.0, 18.0, 22.0, 42.0, 49.0, 78.0, 105.0, 190.0, 232.0, 303.0, 488.0, 733.0, 1007.0, 1568.0, 2430.0, 3651.0, 6001.0, 10176.0, 19867.0, 46041.0, 143957.0, 517808.0, 1595474.0, 1303254.0, 365226.0, 97405.0, 35240.0, 16718.0, 9416.0, 5473.0, 3545.0, 2304.0, 1531.0, 1090.0, 828.0, 526.0, 422.0, 278.0, 220.0, 142.0, 117.0, 91.0, 48.0, 37.0, 33.0, 27.0, 14.0, 19.0, 9.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.71875, -47.86865234375, -46.0185546875, -44.16845703125, -42.318359375, -40.46826171875, -38.6181640625, -36.76806640625, -34.91796875, -33.06787109375, -31.2177734375, -29.36767578125, -27.517578125, -25.66748046875, -23.8173828125, -21.96728515625, -20.1171875, -18.26708984375, -16.4169921875, -14.56689453125, -12.716796875, -10.86669921875, -9.0166015625, -7.16650390625, -5.31640625, -3.46630859375, -1.6162109375, 0.23388671875, 2.083984375, 3.93408203125, 5.7841796875, 7.63427734375, 9.484375, 11.33447265625, 13.1845703125, 15.03466796875, 16.884765625, 18.73486328125, 20.5849609375, 22.43505859375, 24.28515625, 26.13525390625, 27.9853515625, 29.83544921875, 31.685546875, 33.53564453125, 35.3857421875, 37.23583984375, 39.0859375, 40.93603515625, 42.7861328125, 44.63623046875, 46.486328125, 48.33642578125, 50.1865234375, 52.03662109375, 53.88671875, 55.73681640625, 57.5869140625, 59.43701171875, 61.287109375, 63.13720703125, 64.9873046875, 66.83740234375, 68.6875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 10.0, 8.0, 10.0, 8.0, 7.0, 19.0, 17.0, 25.0, 24.0, 32.0, 31.0, 49.0, 45.0, 47.0, 57.0, 53.0, 60.0, 40.0, 51.0, 48.0, 53.0, 46.0, 36.0, 41.0, 28.0, 31.0, 29.0, 23.0, 21.0, 11.0, 9.0, 10.0, 11.0, 8.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.40625, -39.896484375, -38.38671875, -36.876953125, -35.3671875, -33.857421875, -32.34765625, -30.837890625, -29.328125, -27.818359375, -26.30859375, -24.798828125, -23.2890625, -21.779296875, -20.26953125, -18.759765625, -17.25, -15.740234375, -14.23046875, -12.720703125, -11.2109375, -9.701171875, -8.19140625, -6.681640625, -5.171875, -3.662109375, -2.15234375, -0.642578125, 0.8671875, 2.376953125, 3.88671875, 5.396484375, 6.90625, 8.416015625, 9.92578125, 11.435546875, 12.9453125, 14.455078125, 15.96484375, 17.474609375, 18.984375, 20.494140625, 22.00390625, 23.513671875, 25.0234375, 26.533203125, 28.04296875, 29.552734375, 31.0625, 32.572265625, 34.08203125, 35.591796875, 37.1015625, 38.611328125, 40.12109375, 41.630859375, 43.140625, 44.650390625, 46.16015625, 47.669921875, 49.1796875, 50.689453125, 52.19921875, 53.708984375, 55.21875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 14.0, 13.0, 13.0, 21.0, 26.0, 52.0, 90.0, 121.0, 193.0, 240.0, 385.0, 586.0, 928.0, 1359.0, 2169.0, 3688.0, 6189.0, 11245.0, 22359.0, 50400.0, 137311.0, 507643.0, 2188399.0, 912934.0, 213288.0, 71314.0, 29546.0, 14459.0, 7693.0, 4341.0, 2609.0, 1607.0, 1031.0, 648.0, 438.0, 298.0, 205.0, 143.0, 109.0, 62.0, 34.0, 30.0, 16.0, 11.0, 13.0, 2.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-75.0, -72.5556640625, -70.111328125, -67.6669921875, -65.22265625, -62.7783203125, -60.333984375, -57.8896484375, -55.4453125, -53.0009765625, -50.556640625, -48.1123046875, -45.66796875, -43.2236328125, -40.779296875, -38.3349609375, -35.890625, -33.4462890625, -31.001953125, -28.5576171875, -26.11328125, -23.6689453125, -21.224609375, -18.7802734375, -16.3359375, -13.8916015625, -11.447265625, -9.0029296875, -6.55859375, -4.1142578125, -1.669921875, 0.7744140625, 3.21875, 5.6630859375, 8.107421875, 10.5517578125, 12.99609375, 15.4404296875, 17.884765625, 20.3291015625, 22.7734375, 25.2177734375, 27.662109375, 30.1064453125, 32.55078125, 34.9951171875, 37.439453125, 39.8837890625, 42.328125, 44.7724609375, 47.216796875, 49.6611328125, 52.10546875, 54.5498046875, 56.994140625, 59.4384765625, 61.8828125, 64.3271484375, 66.771484375, 69.2158203125, 71.66015625, 74.1044921875, 76.548828125, 78.9931640625, 81.4375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 7.0, 2.0, 9.0, 5.0, 10.0, 16.0, 18.0, 20.0, 27.0, 35.0, 60.0, 87.0, 108.0, 150.0, 202.0, 274.0, 373.0, 516.0, 603.0, 421.0, 286.0, 246.0, 164.0, 116.0, 74.0, 64.0, 34.0, 34.0, 25.0, 23.0, 9.0, 8.0, 7.0, 10.0, 15.0, 6.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.921875, -22.20849609375, -21.4951171875, -20.78173828125, -20.068359375, -19.35498046875, -18.6416015625, -17.92822265625, -17.21484375, -16.50146484375, -15.7880859375, -15.07470703125, -14.361328125, -13.64794921875, -12.9345703125, -12.22119140625, -11.5078125, -10.79443359375, -10.0810546875, -9.36767578125, -8.654296875, -7.94091796875, -7.2275390625, -6.51416015625, -5.80078125, -5.08740234375, -4.3740234375, -3.66064453125, -2.947265625, -2.23388671875, -1.5205078125, -0.80712890625, -0.09375, 0.61962890625, 1.3330078125, 2.04638671875, 2.759765625, 3.47314453125, 4.1865234375, 4.89990234375, 5.61328125, 6.32666015625, 7.0400390625, 7.75341796875, 8.466796875, 9.18017578125, 9.8935546875, 10.60693359375, 11.3203125, 12.03369140625, 12.7470703125, 13.46044921875, 14.173828125, 14.88720703125, 15.6005859375, 16.31396484375, 17.02734375, 17.74072265625, 18.4541015625, 19.16748046875, 19.880859375, 20.59423828125, 21.3076171875, 22.02099609375, 22.734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 0.0, 6.0, 5.0, 8.0, 11.0, 6.0, 9.0, 16.0, 16.0, 16.0, 15.0, 23.0, 40.0, 54.0, 59.0, 55.0, 74.0, 89.0, 69.0, 72.0, 62.0, 49.0, 50.0, 40.0, 39.0, 23.0, 17.0, 22.0, 15.0, 14.0, 3.0, 7.0, 4.0, 2.0, 1.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-44.840267181396484, -43.35997772216797, -41.87968826293945, -40.39939880371094, -38.91911315917969, -37.43882369995117, -35.958534240722656, -34.47824478149414, -32.997955322265625, -31.51766586303711, -30.037378311157227, -28.55708885192871, -27.076801300048828, -25.596511840820312, -24.116222381591797, -22.63593292236328, -21.15564727783203, -19.675357818603516, -18.195070266723633, -16.714780807495117, -15.234492301940918, -13.754203796386719, -12.273914337158203, -10.793625831604004, -9.313337326049805, -7.8330488204956055, -6.352759838104248, -4.872470855712891, -3.3921823501586914, -1.9118938446044922, -0.43160438537597656, 1.0486841201782227, 2.5289764404296875, 4.009264945983887, 5.489553928375244, 6.969842910766602, 8.4501314163208, 9.930419921875, 11.410709381103516, 12.890997886657715, 14.371286392211914, 15.851574897766113, 17.331863403320312, 18.812152862548828, 20.292442321777344, 21.772729873657227, 23.253019332885742, 24.733306884765625, 26.21359634399414, 27.693885803222656, 29.17417335510254, 30.654462814331055, 32.13475036621094, 33.61503982543945, 35.09532928466797, 36.575618743896484, 38.055908203125, 39.536197662353516, 41.01648712158203, 42.49677276611328, 43.9770622253418, 45.45735168457031, 46.93764114379883, 48.417930603027344, 49.898216247558594]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 10.0, 12.0, 10.0, 15.0, 15.0, 18.0, 12.0, 26.0, 27.0, 26.0, 39.0, 34.0, 36.0, 49.0, 41.0, 41.0, 44.0, 37.0, 47.0, 45.0, 41.0, 41.0, 38.0, 32.0, 43.0, 24.0, 33.0, 25.0, 28.0, 14.0, 20.0, 12.0, 11.0, 17.0, 8.0, 5.0, 2.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.163185119628906, -39.7889404296875, -38.41469192504883, -37.04044723510742, -35.66619873046875, -34.291954040527344, -32.91770935058594, -31.543460845947266, -30.16921615600586, -28.79496955871582, -27.42072296142578, -26.046478271484375, -24.672231674194336, -23.297985076904297, -21.923738479614258, -20.54949188232422, -19.17524528503418, -17.80099868774414, -16.4267520904541, -15.052506446838379, -13.678260803222656, -12.304014205932617, -10.929767608642578, -9.555521965026855, -8.181275367736816, -6.8070292472839355, -5.432783126831055, -4.058536529541016, -2.6842904090881348, -1.310044288635254, 0.06420230865478516, 1.4384479522705078, 2.812694549560547, 4.186940670013428, 5.561186790466309, 6.935433387756348, 8.30967903137207, 9.68392562866211, 11.058172225952148, 12.432417869567871, 13.80666446685791, 15.18091106414795, 16.555156707763672, 17.92940330505371, 19.30364990234375, 20.677894592285156, 22.052143096923828, 23.426387786865234, 24.800634384155273, 26.174880981445312, 27.54912757873535, 28.92337417602539, 30.297618865966797, 31.671865463256836, 33.046112060546875, 34.42035675048828, 35.79460525512695, 37.16884994506836, 38.54309844970703, 39.91734313964844, 41.29159164428711, 42.665836334228516, 44.04008483886719, 45.414329528808594, 46.78857421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 13.0, 11.0, 21.0, 22.0, 42.0, 56.0, 60.0, 126.0, 150.0, 209.0, 306.0, 470.0, 677.0, 931.0, 1393.0, 2202.0, 3149.0, 4741.0, 6992.0, 11121.0, 17308.0, 27710.0, 47300.0, 82841.0, 151644.0, 249589.0, 188215.0, 102670.0, 56757.0, 33219.0, 20518.0, 13123.0, 8265.0, 5372.0, 3574.0, 2459.0, 1690.0, 1132.0, 787.0, 523.0, 324.0, 267.0, 172.0, 139.0, 81.0, 59.0, 48.0, 30.0, 22.0, 15.0, 2.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0], "bins": [-18.46875, -17.903564453125, -17.33837890625, -16.773193359375, -16.2080078125, -15.642822265625, -15.07763671875, -14.512451171875, -13.947265625, -13.382080078125, -12.81689453125, -12.251708984375, -11.6865234375, -11.121337890625, -10.55615234375, -9.990966796875, -9.42578125, -8.860595703125, -8.29541015625, -7.730224609375, -7.1650390625, -6.599853515625, -6.03466796875, -5.469482421875, -4.904296875, -4.339111328125, -3.77392578125, -3.208740234375, -2.6435546875, -2.078369140625, -1.51318359375, -0.947998046875, -0.3828125, 0.182373046875, 0.74755859375, 1.312744140625, 1.8779296875, 2.443115234375, 3.00830078125, 3.573486328125, 4.138671875, 4.703857421875, 5.26904296875, 5.834228515625, 6.3994140625, 6.964599609375, 7.52978515625, 8.094970703125, 8.66015625, 9.225341796875, 9.79052734375, 10.355712890625, 10.9208984375, 11.486083984375, 12.05126953125, 12.616455078125, 13.181640625, 13.746826171875, 14.31201171875, 14.877197265625, 15.4423828125, 16.007568359375, 16.57275390625, 17.137939453125, 17.703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 8.0, 7.0, 11.0, 14.0, 13.0, 10.0, 10.0, 25.0, 23.0, 24.0, 31.0, 35.0, 29.0, 38.0, 50.0, 43.0, 45.0, 39.0, 36.0, 37.0, 41.0, 47.0, 58.0, 33.0, 36.0, 37.0, 32.0, 25.0, 28.0, 21.0, 15.0, 14.0, 17.0, 10.0, 6.0, 13.0, 9.0, 5.0, 2.0, 3.0, 3.0, 5.0, 0.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.84375, -39.48291015625, -38.1220703125, -36.76123046875, -35.400390625, -34.03955078125, -32.6787109375, -31.31787109375, -29.95703125, -28.59619140625, -27.2353515625, -25.87451171875, -24.513671875, -23.15283203125, -21.7919921875, -20.43115234375, -19.0703125, -17.70947265625, -16.3486328125, -14.98779296875, -13.626953125, -12.26611328125, -10.9052734375, -9.54443359375, -8.18359375, -6.82275390625, -5.4619140625, -4.10107421875, -2.740234375, -1.37939453125, -0.0185546875, 1.34228515625, 2.703125, 4.06396484375, 5.4248046875, 6.78564453125, 8.146484375, 9.50732421875, 10.8681640625, 12.22900390625, 13.58984375, 14.95068359375, 16.3115234375, 17.67236328125, 19.033203125, 20.39404296875, 21.7548828125, 23.11572265625, 24.4765625, 25.83740234375, 27.1982421875, 28.55908203125, 29.919921875, 31.28076171875, 32.6416015625, 34.00244140625, 35.36328125, 36.72412109375, 38.0849609375, 39.44580078125, 40.806640625, 42.16748046875, 43.5283203125, 44.88916015625, 46.25]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 3.0, 14.0, 13.0, 21.0, 33.0, 46.0, 59.0, 85.0, 148.0, 214.0, 341.0, 571.0, 899.0, 1348.0, 2400.0, 3880.0, 6731.0, 12190.0, 26185.0, 158199.0, 742604.0, 52341.0, 17785.0, 9336.0, 5135.0, 2995.0, 1806.0, 1166.0, 733.0, 442.0, 303.0, 167.0, 132.0, 59.0, 50.0, 46.0, 26.0, 13.0, 10.0, 5.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.28125, -35.22265625, -34.1640625, -33.10546875, -32.046875, -30.98828125, -29.9296875, -28.87109375, -27.8125, -26.75390625, -25.6953125, -24.63671875, -23.578125, -22.51953125, -21.4609375, -20.40234375, -19.34375, -18.28515625, -17.2265625, -16.16796875, -15.109375, -14.05078125, -12.9921875, -11.93359375, -10.875, -9.81640625, -8.7578125, -7.69921875, -6.640625, -5.58203125, -4.5234375, -3.46484375, -2.40625, -1.34765625, -0.2890625, 0.76953125, 1.828125, 2.88671875, 3.9453125, 5.00390625, 6.0625, 7.12109375, 8.1796875, 9.23828125, 10.296875, 11.35546875, 12.4140625, 13.47265625, 14.53125, 15.58984375, 16.6484375, 17.70703125, 18.765625, 19.82421875, 20.8828125, 21.94140625, 23.0, 24.05859375, 25.1171875, 26.17578125, 27.234375, 28.29296875, 29.3515625, 30.41015625, 31.46875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 1.0, 6.0, 4.0, 10.0, 17.0, 10.0, 15.0, 21.0, 15.0, 22.0, 20.0, 34.0, 37.0, 26.0, 40.0, 47.0, 37.0, 36.0, 45.0, 50.0, 46.0, 38.0, 43.0, 46.0, 35.0, 28.0, 40.0, 27.0, 34.0, 31.0, 14.0, 19.0, 18.0, 19.0, 17.0, 15.0, 13.0, 6.0, 4.0, 6.0, 3.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.84375, -28.8251953125, -27.806640625, -26.7880859375, -25.76953125, -24.7509765625, -23.732421875, -22.7138671875, -21.6953125, -20.6767578125, -19.658203125, -18.6396484375, -17.62109375, -16.6025390625, -15.583984375, -14.5654296875, -13.546875, -12.5283203125, -11.509765625, -10.4912109375, -9.47265625, -8.4541015625, -7.435546875, -6.4169921875, -5.3984375, -4.3798828125, -3.361328125, -2.3427734375, -1.32421875, -0.3056640625, 0.712890625, 1.7314453125, 2.75, 3.7685546875, 4.787109375, 5.8056640625, 6.82421875, 7.8427734375, 8.861328125, 9.8798828125, 10.8984375, 11.9169921875, 12.935546875, 13.9541015625, 14.97265625, 15.9912109375, 17.009765625, 18.0283203125, 19.046875, 20.0654296875, 21.083984375, 22.1025390625, 23.12109375, 24.1396484375, 25.158203125, 26.1767578125, 27.1953125, 28.2138671875, 29.232421875, 30.2509765625, 31.26953125, 32.2880859375, 33.306640625, 34.3251953125, 35.34375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 18.0, 20.0, 37.0, 52.0, 60.0, 86.0, 125.0, 174.0, 282.0, 431.0, 728.0, 1230.0, 2253.0, 4399.0, 9206.0, 22871.0, 128126.0, 804883.0, 44743.0, 14834.0, 6411.0, 3205.0, 1740.0, 971.0, 562.0, 377.0, 198.0, 151.0, 106.0, 65.0, 63.0, 35.0, 30.0, 15.0, 15.0, 9.0, 10.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3359375, -3.232574462890625, -3.12921142578125, -3.025848388671875, -2.9224853515625, -2.819122314453125, -2.71575927734375, -2.612396240234375, -2.509033203125, -2.405670166015625, -2.30230712890625, -2.198944091796875, -2.0955810546875, -1.992218017578125, -1.88885498046875, -1.785491943359375, -1.68212890625, -1.578765869140625, -1.47540283203125, -1.372039794921875, -1.2686767578125, -1.165313720703125, -1.06195068359375, -0.958587646484375, -0.855224609375, -0.751861572265625, -0.64849853515625, -0.545135498046875, -0.4417724609375, -0.338409423828125, -0.23504638671875, -0.131683349609375, -0.0283203125, 0.075042724609375, 0.17840576171875, 0.281768798828125, 0.3851318359375, 0.488494873046875, 0.59185791015625, 0.695220947265625, 0.798583984375, 0.901947021484375, 1.00531005859375, 1.108673095703125, 1.2120361328125, 1.315399169921875, 1.41876220703125, 1.522125244140625, 1.62548828125, 1.728851318359375, 1.83221435546875, 1.935577392578125, 2.0389404296875, 2.142303466796875, 2.24566650390625, 2.349029541015625, 2.452392578125, 2.555755615234375, 2.65911865234375, 2.762481689453125, 2.8658447265625, 2.969207763671875, 3.07257080078125, 3.175933837890625, 3.279296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 9.0, 16.0, 23.0, 52.0, 70.0, 108.0, 145.0, 176.0, 124.0, 106.0, 75.0, 40.0, 18.0, 13.0, 9.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006508827209472656, -0.0006280690431594849, -0.0006052553653717041, -0.0005824416875839233, -0.0005596280097961426, -0.0005368143320083618, -0.0005140006542205811, -0.0004911869764328003, -0.00046837329864501953, -0.00044555962085723877, -0.000422745943069458, -0.00039993226528167725, -0.0003771185874938965, -0.0003543049097061157, -0.00033149123191833496, -0.0003086775541305542, -0.00028586387634277344, -0.0002630501985549927, -0.00024023652076721191, -0.00021742284297943115, -0.0001946091651916504, -0.00017179548740386963, -0.00014898180961608887, -0.0001261681318283081, -0.00010335445404052734, -8.054077625274658e-05, -5.772709846496582e-05, -3.491342067718506e-05, -1.2099742889404297e-05, 1.0713934898376465e-05, 3.3527612686157227e-05, 5.634129047393799e-05, 7.915496826171875e-05, 0.00010196864604949951, 0.00012478232383728027, 0.00014759600162506104, 0.0001704096794128418, 0.00019322335720062256, 0.00021603703498840332, 0.00023885071277618408, 0.00026166439056396484, 0.0002844780683517456, 0.00030729174613952637, 0.00033010542392730713, 0.0003529191017150879, 0.00037573277950286865, 0.0003985464572906494, 0.0004213601350784302, 0.00044417381286621094, 0.0004669874906539917, 0.0004898011684417725, 0.0005126148462295532, 0.000535428524017334, 0.0005582422018051147, 0.0005810558795928955, 0.0006038695573806763, 0.000626683235168457, 0.0006494969129562378, 0.0006723105907440186, 0.0006951242685317993, 0.0007179379463195801, 0.0007407516241073608, 0.0007635653018951416, 0.0007863789796829224, 0.0008091926574707031]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 9.0, 9.0, 9.0, 12.0, 15.0, 25.0, 40.0, 52.0, 77.0, 138.0, 151.0, 240.0, 351.0, 468.0, 696.0, 982.0, 1435.0, 2188.0, 3121.0, 4755.0, 7134.0, 10908.0, 16831.0, 27006.0, 44433.0, 75589.0, 133211.0, 211581.0, 202320.0, 121976.0, 70137.0, 40940.0, 24780.0, 15852.0, 10240.0, 6722.0, 4461.0, 3083.0, 2052.0, 1392.0, 1013.0, 659.0, 424.0, 318.0, 245.0, 121.0, 101.0, 82.0, 60.0, 37.0, 30.0, 22.0, 10.0, 9.0, 7.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.13671875, -2.067626953125, -1.99853515625, -1.929443359375, -1.8603515625, -1.791259765625, -1.72216796875, -1.653076171875, -1.583984375, -1.514892578125, -1.44580078125, -1.376708984375, -1.3076171875, -1.238525390625, -1.16943359375, -1.100341796875, -1.03125, -0.962158203125, -0.89306640625, -0.823974609375, -0.7548828125, -0.685791015625, -0.61669921875, -0.547607421875, -0.478515625, -0.409423828125, -0.34033203125, -0.271240234375, -0.2021484375, -0.133056640625, -0.06396484375, 0.005126953125, 0.07421875, 0.143310546875, 0.21240234375, 0.281494140625, 0.3505859375, 0.419677734375, 0.48876953125, 0.557861328125, 0.626953125, 0.696044921875, 0.76513671875, 0.834228515625, 0.9033203125, 0.972412109375, 1.04150390625, 1.110595703125, 1.1796875, 1.248779296875, 1.31787109375, 1.386962890625, 1.4560546875, 1.525146484375, 1.59423828125, 1.663330078125, 1.732421875, 1.801513671875, 1.87060546875, 1.939697265625, 2.0087890625, 2.077880859375, 2.14697265625, 2.216064453125, 2.28515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 2.0, 6.0, 8.0, 5.0, 10.0, 10.0, 11.0, 12.0, 12.0, 21.0, 18.0, 23.0, 28.0, 25.0, 38.0, 37.0, 44.0, 42.0, 70.0, 72.0, 72.0, 68.0, 57.0, 44.0, 41.0, 32.0, 25.0, 23.0, 24.0, 31.0, 10.0, 13.0, 12.0, 11.0, 14.0, 4.0, 2.0, 5.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74658203125, -0.72076416015625, -0.6949462890625, -0.66912841796875, -0.643310546875, -0.61749267578125, -0.5916748046875, -0.56585693359375, -0.5400390625, -0.51422119140625, -0.4884033203125, -0.46258544921875, -0.436767578125, -0.41094970703125, -0.3851318359375, -0.35931396484375, -0.33349609375, -0.30767822265625, -0.2818603515625, -0.25604248046875, -0.230224609375, -0.20440673828125, -0.1785888671875, -0.15277099609375, -0.126953125, -0.10113525390625, -0.0753173828125, -0.04949951171875, -0.023681640625, 0.00213623046875, 0.0279541015625, 0.05377197265625, 0.07958984375, 0.10540771484375, 0.1312255859375, 0.15704345703125, 0.182861328125, 0.20867919921875, 0.2344970703125, 0.26031494140625, 0.2861328125, 0.31195068359375, 0.3377685546875, 0.36358642578125, 0.389404296875, 0.41522216796875, 0.4410400390625, 0.46685791015625, 0.49267578125, 0.51849365234375, 0.5443115234375, 0.57012939453125, 0.595947265625, 0.62176513671875, 0.6475830078125, 0.67340087890625, 0.69921875, 0.72503662109375, 0.7508544921875, 0.77667236328125, 0.802490234375, 0.82830810546875, 0.8541259765625, 0.87994384765625, 0.90576171875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 0.0, 3.0, 7.0, 5.0, 8.0, 9.0, 15.0, 10.0, 11.0, 22.0, 23.0, 37.0, 52.0, 62.0, 61.0, 85.0, 95.0, 92.0, 65.0, 70.0, 54.0, 45.0, 40.0, 39.0, 14.0, 23.0, 15.0, 11.0, 5.0, 3.0, 5.0, 6.0, 1.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.892513275146484, -47.27054977416992, -45.648590087890625, -44.02662658691406, -42.4046630859375, -40.7827033996582, -39.16073989868164, -37.538780212402344, -35.91681671142578, -34.29485321044922, -32.67289352416992, -31.05093002319336, -29.42896842956543, -27.8070068359375, -26.185043334960938, -24.563081741333008, -22.941118240356445, -21.319156646728516, -19.697193145751953, -18.075231552124023, -16.453269958496094, -14.831307411193848, -13.209344863891602, -11.587383270263672, -9.965420722961426, -8.34345817565918, -6.72149658203125, -5.099534034729004, -3.477571964263916, -1.8556098937988281, -0.23364734649658203, 1.3883142471313477, 3.0102767944335938, 4.632238864898682, 6.2542009353637695, 7.876163482666016, 9.498125076293945, 11.120087623596191, 12.742050170898438, 14.364011764526367, 15.985974311828613, 17.60793685913086, 19.22989845275879, 20.85186004638672, 22.47382354736328, 24.09578514099121, 25.71774673461914, 27.339710235595703, 28.961671829223633, 30.583633422851562, 32.205596923828125, 33.82756042480469, 35.449520111083984, 37.07148361206055, 38.693443298339844, 40.315406799316406, 41.93737030029297, 43.55933380126953, 45.18129348754883, 46.80325698852539, 48.42522048950195, 50.04718017578125, 51.66914367675781, 53.291107177734375, 54.91306686401367]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 10.0, 8.0, 12.0, 11.0, 19.0, 16.0, 16.0, 23.0, 25.0, 29.0, 32.0, 34.0, 37.0, 44.0, 52.0, 45.0, 42.0, 32.0, 44.0, 47.0, 47.0, 42.0, 38.0, 37.0, 38.0, 31.0, 29.0, 27.0, 27.0, 13.0, 18.0, 13.0, 11.0, 18.0, 9.0, 3.0, 2.0, 4.0, 3.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.21173858642578, -39.8424186706543, -38.47309494018555, -37.10377502441406, -35.73445510864258, -34.365135192871094, -32.995811462402344, -31.62649154663086, -30.257169723510742, -28.887847900390625, -27.51852798461914, -26.149206161499023, -24.779884338378906, -23.410564422607422, -22.041242599487305, -20.671920776367188, -19.302600860595703, -17.933279037475586, -16.5639591217041, -15.194637298583984, -13.825316429138184, -12.455995559692383, -11.086673736572266, -9.717352867126465, -8.348031997680664, -6.978711128234863, -5.609389781951904, -4.240068435668945, -2.8707475662231445, -1.5014266967773438, -0.13210487365722656, 1.2372159957885742, 2.6065330505371094, 3.9758541584014893, 5.345175266265869, 6.714496612548828, 8.083817481994629, 9.45313835144043, 10.822460174560547, 12.191781044006348, 13.561101913452148, 14.93042278289795, 16.29974365234375, 17.669065475463867, 19.038387298583984, 20.40770721435547, 21.777029037475586, 23.146350860595703, 24.515670776367188, 25.884992599487305, 27.25431251525879, 28.623634338378906, 29.99295425415039, 31.362276077270508, 32.731597900390625, 34.10091781616211, 35.470237731933594, 36.83955764770508, 38.20888137817383, 39.57820129394531, 40.9475212097168, 42.31684112548828, 43.68616485595703, 45.055484771728516, 46.424808502197266]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 13.0, 11.0, 18.0, 34.0, 47.0, 70.0, 87.0, 172.0, 252.0, 365.0, 554.0, 787.0, 1213.0, 1881.0, 2633.0, 4179.0, 6529.0, 10543.0, 16626.0, 26977.0, 44716.0, 77811.0, 143249.0, 238386.0, 202275.0, 111432.0, 61406.0, 36234.0, 22017.0, 13596.0, 8568.0, 5426.0, 3545.0, 2252.0, 1589.0, 1012.0, 726.0, 430.0, 315.0, 208.0, 124.0, 94.0, 50.0, 32.0, 32.0, 15.0, 8.0, 5.0, 7.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.875, -44.38525390625, -42.8955078125, -41.40576171875, -39.916015625, -38.42626953125, -36.9365234375, -35.44677734375, -33.95703125, -32.46728515625, -30.9775390625, -29.48779296875, -27.998046875, -26.50830078125, -25.0185546875, -23.52880859375, -22.0390625, -20.54931640625, -19.0595703125, -17.56982421875, -16.080078125, -14.59033203125, -13.1005859375, -11.61083984375, -10.12109375, -8.63134765625, -7.1416015625, -5.65185546875, -4.162109375, -2.67236328125, -1.1826171875, 0.30712890625, 1.796875, 3.28662109375, 4.7763671875, 6.26611328125, 7.755859375, 9.24560546875, 10.7353515625, 12.22509765625, 13.71484375, 15.20458984375, 16.6943359375, 18.18408203125, 19.673828125, 21.16357421875, 22.6533203125, 24.14306640625, 25.6328125, 27.12255859375, 28.6123046875, 30.10205078125, 31.591796875, 33.08154296875, 34.5712890625, 36.06103515625, 37.55078125, 39.04052734375, 40.5302734375, 42.02001953125, 43.509765625, 44.99951171875, 46.4892578125, 47.97900390625, 49.46875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 13.0, 8.0, 12.0, 17.0, 17.0, 12.0, 21.0, 21.0, 28.0, 22.0, 32.0, 39.0, 48.0, 47.0, 50.0, 39.0, 41.0, 40.0, 40.0, 43.0, 60.0, 29.0, 36.0, 26.0, 42.0, 30.0, 26.0, 20.0, 24.0, 20.0, 20.0, 13.0, 9.0, 6.0, 9.0, 8.0, 3.0, 3.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.5, -38.203125, -36.90625, -35.609375, -34.3125, -33.015625, -31.71875, -30.421875, -29.125, -27.828125, -26.53125, -25.234375, -23.9375, -22.640625, -21.34375, -20.046875, -18.75, -17.453125, -16.15625, -14.859375, -13.5625, -12.265625, -10.96875, -9.671875, -8.375, -7.078125, -5.78125, -4.484375, -3.1875, -1.890625, -0.59375, 0.703125, 2.0, 3.296875, 4.59375, 5.890625, 7.1875, 8.484375, 9.78125, 11.078125, 12.375, 13.671875, 14.96875, 16.265625, 17.5625, 18.859375, 20.15625, 21.453125, 22.75, 24.046875, 25.34375, 26.640625, 27.9375, 29.234375, 30.53125, 31.828125, 33.125, 34.421875, 35.71875, 37.015625, 38.3125, 39.609375, 40.90625, 42.203125, 43.5]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 9.0, 15.0, 20.0, 22.0, 33.0, 51.0, 89.0, 106.0, 152.0, 213.0, 355.0, 446.0, 745.0, 1098.0, 1681.0, 2496.0, 3876.0, 6036.0, 9300.0, 14857.0, 23634.0, 39460.0, 66401.0, 113235.0, 188531.0, 216807.0, 144651.0, 84477.0, 49242.0, 29672.0, 18212.0, 11595.0, 7309.0, 4582.0, 3015.0, 2002.0, 1304.0, 933.0, 577.0, 415.0, 284.0, 181.0, 148.0, 96.0, 68.0, 38.0, 36.0, 22.0, 12.0, 9.0, 5.0, 3.0, 0.0, 1.0, 3.0], "bins": [-53.375, -51.8154296875, -50.255859375, -48.6962890625, -47.13671875, -45.5771484375, -44.017578125, -42.4580078125, -40.8984375, -39.3388671875, -37.779296875, -36.2197265625, -34.66015625, -33.1005859375, -31.541015625, -29.9814453125, -28.421875, -26.8623046875, -25.302734375, -23.7431640625, -22.18359375, -20.6240234375, -19.064453125, -17.5048828125, -15.9453125, -14.3857421875, -12.826171875, -11.2666015625, -9.70703125, -8.1474609375, -6.587890625, -5.0283203125, -3.46875, -1.9091796875, -0.349609375, 1.2099609375, 2.76953125, 4.3291015625, 5.888671875, 7.4482421875, 9.0078125, 10.5673828125, 12.126953125, 13.6865234375, 15.24609375, 16.8056640625, 18.365234375, 19.9248046875, 21.484375, 23.0439453125, 24.603515625, 26.1630859375, 27.72265625, 29.2822265625, 30.841796875, 32.4013671875, 33.9609375, 35.5205078125, 37.080078125, 38.6396484375, 40.19921875, 41.7587890625, 43.318359375, 44.8779296875, 46.4375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 2.0, 9.0, 5.0, 10.0, 11.0, 10.0, 10.0, 7.0, 13.0, 13.0, 8.0, 22.0, 16.0, 32.0, 40.0, 30.0, 27.0, 32.0, 46.0, 41.0, 48.0, 47.0, 34.0, 31.0, 40.0, 38.0, 27.0, 43.0, 39.0, 28.0, 28.0, 30.0, 16.0, 21.0, 23.0, 18.0, 16.0, 13.0, 19.0, 16.0, 8.0, 10.0, 6.0, 4.0, 4.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-25.875, -25.0791015625, -24.283203125, -23.4873046875, -22.69140625, -21.8955078125, -21.099609375, -20.3037109375, -19.5078125, -18.7119140625, -17.916015625, -17.1201171875, -16.32421875, -15.5283203125, -14.732421875, -13.9365234375, -13.140625, -12.3447265625, -11.548828125, -10.7529296875, -9.95703125, -9.1611328125, -8.365234375, -7.5693359375, -6.7734375, -5.9775390625, -5.181640625, -4.3857421875, -3.58984375, -2.7939453125, -1.998046875, -1.2021484375, -0.40625, 0.3896484375, 1.185546875, 1.9814453125, 2.77734375, 3.5732421875, 4.369140625, 5.1650390625, 5.9609375, 6.7568359375, 7.552734375, 8.3486328125, 9.14453125, 9.9404296875, 10.736328125, 11.5322265625, 12.328125, 13.1240234375, 13.919921875, 14.7158203125, 15.51171875, 16.3076171875, 17.103515625, 17.8994140625, 18.6953125, 19.4912109375, 20.287109375, 21.0830078125, 21.87890625, 22.6748046875, 23.470703125, 24.2666015625, 25.0625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 8.0, 9.0, 15.0, 21.0, 26.0, 47.0, 76.0, 61.0, 98.0, 153.0, 227.0, 346.0, 472.0, 773.0, 1094.0, 1693.0, 2703.0, 4318.0, 6887.0, 11244.0, 18874.0, 33375.0, 61340.0, 117326.0, 227908.0, 256274.0, 138319.0, 70837.0, 38361.0, 21979.0, 12616.0, 7686.0, 4654.0, 2930.0, 1881.0, 1235.0, 897.0, 581.0, 414.0, 264.0, 187.0, 104.0, 75.0, 50.0, 33.0, 32.0, 17.0, 13.0, 11.0, 5.0, 9.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-23.828125, -23.108642578125, -22.38916015625, -21.669677734375, -20.9501953125, -20.230712890625, -19.51123046875, -18.791748046875, -18.072265625, -17.352783203125, -16.63330078125, -15.913818359375, -15.1943359375, -14.474853515625, -13.75537109375, -13.035888671875, -12.31640625, -11.596923828125, -10.87744140625, -10.157958984375, -9.4384765625, -8.718994140625, -7.99951171875, -7.280029296875, -6.560546875, -5.841064453125, -5.12158203125, -4.402099609375, -3.6826171875, -2.963134765625, -2.24365234375, -1.524169921875, -0.8046875, -0.085205078125, 0.63427734375, 1.353759765625, 2.0732421875, 2.792724609375, 3.51220703125, 4.231689453125, 4.951171875, 5.670654296875, 6.39013671875, 7.109619140625, 7.8291015625, 8.548583984375, 9.26806640625, 9.987548828125, 10.70703125, 11.426513671875, 12.14599609375, 12.865478515625, 13.5849609375, 14.304443359375, 15.02392578125, 15.743408203125, 16.462890625, 17.182373046875, 17.90185546875, 18.621337890625, 19.3408203125, 20.060302734375, 20.77978515625, 21.499267578125, 22.21875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 5.0, 5.0, 4.0, 8.0, 8.0, 20.0, 18.0, 29.0, 35.0, 32.0, 54.0, 67.0, 85.0, 97.0, 98.0, 89.0, 80.0, 49.0, 54.0, 40.0, 32.0, 22.0, 19.0, 15.0, 6.0, 5.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0025501251220703125, -0.002465665340423584, -0.0023812055587768555, -0.002296745777130127, -0.0022122859954833984, -0.00212782621383667, -0.0020433664321899414, -0.001958906650543213, -0.0018744468688964844, -0.0017899870872497559, -0.0017055273056030273, -0.0016210675239562988, -0.0015366077423095703, -0.0014521479606628418, -0.0013676881790161133, -0.0012832283973693848, -0.0011987686157226562, -0.0011143088340759277, -0.0010298490524291992, -0.0009453892707824707, -0.0008609294891357422, -0.0007764697074890137, -0.0006920099258422852, -0.0006075501441955566, -0.0005230903625488281, -0.0004386305809020996, -0.0003541707992553711, -0.0002697110176086426, -0.00018525123596191406, -0.00010079145431518555, -1.633167266845703e-05, 6.812810897827148e-05, 0.000152587890625, 0.00023704767227172852, 0.00032150745391845703, 0.00040596723556518555, 0.0004904270172119141, 0.0005748867988586426, 0.0006593465805053711, 0.0007438063621520996, 0.0008282661437988281, 0.0009127259254455566, 0.0009971857070922852, 0.0010816454887390137, 0.0011661052703857422, 0.0012505650520324707, 0.0013350248336791992, 0.0014194846153259277, 0.0015039443969726562, 0.0015884041786193848, 0.0016728639602661133, 0.0017573237419128418, 0.0018417835235595703, 0.0019262433052062988, 0.0020107030868530273, 0.002095162868499756, 0.0021796226501464844, 0.002264082431793213, 0.0023485422134399414, 0.00243300199508667, 0.0025174617767333984, 0.002601921558380127, 0.0026863813400268555, 0.002770841121673584, 0.0028553009033203125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 14.0, 8.0, 13.0, 24.0, 34.0, 43.0, 77.0, 133.0, 191.0, 261.0, 430.0, 687.0, 1087.0, 1795.0, 2998.0, 5204.0, 9346.0, 17753.0, 36381.0, 79783.0, 183510.0, 326727.0, 206603.0, 90118.0, 40961.0, 20126.0, 10304.0, 5719.0, 3336.0, 1841.0, 1133.0, 670.0, 428.0, 272.0, 168.0, 113.0, 78.0, 46.0, 32.0, 31.0, 18.0, 13.0, 8.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-24.3125, -23.517333984375, -22.72216796875, -21.927001953125, -21.1318359375, -20.336669921875, -19.54150390625, -18.746337890625, -17.951171875, -17.156005859375, -16.36083984375, -15.565673828125, -14.7705078125, -13.975341796875, -13.18017578125, -12.385009765625, -11.58984375, -10.794677734375, -9.99951171875, -9.204345703125, -8.4091796875, -7.614013671875, -6.81884765625, -6.023681640625, -5.228515625, -4.433349609375, -3.63818359375, -2.843017578125, -2.0478515625, -1.252685546875, -0.45751953125, 0.337646484375, 1.1328125, 1.927978515625, 2.72314453125, 3.518310546875, 4.3134765625, 5.108642578125, 5.90380859375, 6.698974609375, 7.494140625, 8.289306640625, 9.08447265625, 9.879638671875, 10.6748046875, 11.469970703125, 12.26513671875, 13.060302734375, 13.85546875, 14.650634765625, 15.44580078125, 16.240966796875, 17.0361328125, 17.831298828125, 18.62646484375, 19.421630859375, 20.216796875, 21.011962890625, 21.80712890625, 22.602294921875, 23.3974609375, 24.192626953125, 24.98779296875, 25.782958984375, 26.578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 7.0, 10.0, 12.0, 12.0, 21.0, 22.0, 25.0, 37.0, 36.0, 49.0, 43.0, 41.0, 52.0, 60.0, 72.0, 62.0, 63.0, 61.0, 53.0, 30.0, 45.0, 33.0, 29.0, 24.0, 19.0, 18.0, 11.0, 13.0, 6.0, 4.0, 5.0, 2.0, 1.0, 4.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.5703125, -5.372802734375, -5.17529296875, -4.977783203125, -4.7802734375, -4.582763671875, -4.38525390625, -4.187744140625, -3.990234375, -3.792724609375, -3.59521484375, -3.397705078125, -3.2001953125, -3.002685546875, -2.80517578125, -2.607666015625, -2.41015625, -2.212646484375, -2.01513671875, -1.817626953125, -1.6201171875, -1.422607421875, -1.22509765625, -1.027587890625, -0.830078125, -0.632568359375, -0.43505859375, -0.237548828125, -0.0400390625, 0.157470703125, 0.35498046875, 0.552490234375, 0.75, 0.947509765625, 1.14501953125, 1.342529296875, 1.5400390625, 1.737548828125, 1.93505859375, 2.132568359375, 2.330078125, 2.527587890625, 2.72509765625, 2.922607421875, 3.1201171875, 3.317626953125, 3.51513671875, 3.712646484375, 3.91015625, 4.107666015625, 4.30517578125, 4.502685546875, 4.7001953125, 4.897705078125, 5.09521484375, 5.292724609375, 5.490234375, 5.687744140625, 5.88525390625, 6.082763671875, 6.2802734375, 6.477783203125, 6.67529296875, 6.872802734375, 7.0703125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 3.0, 8.0, 13.0, 9.0, 16.0, 17.0, 16.0, 16.0, 29.0, 40.0, 60.0, 55.0, 63.0, 71.0, 80.0, 77.0, 59.0, 65.0, 58.0, 40.0, 34.0, 27.0, 20.0, 30.0, 22.0, 9.0, 16.0, 6.0, 7.0, 5.0, 6.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-40.81684875488281, -39.41847229003906, -38.02009582519531, -36.62171936035156, -35.22334289550781, -33.82497024536133, -32.42659378051758, -31.028217315673828, -29.629840850830078, -28.231464385986328, -26.833087921142578, -25.43471336364746, -24.03633689880371, -22.63796043395996, -21.239585876464844, -19.841209411621094, -18.442832946777344, -17.044456481933594, -15.64608097076416, -14.247705459594727, -12.849328994750977, -11.450952529907227, -10.052577018737793, -8.65420150756836, -7.255825042724609, -5.857449054718018, -4.459073066711426, -3.060697078704834, -1.6623210906982422, -0.2639451026916504, 1.1344308853149414, 2.532806396484375, 3.931182861328125, 5.329558849334717, 6.727934837341309, 8.126310348510742, 9.524686813354492, 10.923063278198242, 12.321438789367676, 13.71981430053711, 15.11819076538086, 16.51656723022461, 17.91494369506836, 19.313318252563477, 20.711694717407227, 22.110071182250977, 23.508445739746094, 24.906822204589844, 26.305198669433594, 27.703575134277344, 29.101951599121094, 30.50032615661621, 31.89870262145996, 33.29707717895508, 34.69545364379883, 36.09383010864258, 37.49220657348633, 38.89058303833008, 40.28895950317383, 41.68733596801758, 43.08570861816406, 44.48408508300781, 45.88246154785156, 47.28083801269531, 48.67921447753906]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 13.0, 15.0, 14.0, 14.0, 20.0, 22.0, 29.0, 15.0, 31.0, 44.0, 28.0, 34.0, 38.0, 52.0, 53.0, 43.0, 37.0, 56.0, 38.0, 46.0, 42.0, 32.0, 33.0, 26.0, 25.0, 31.0, 27.0, 19.0, 16.0, 12.0, 17.0, 13.0, 13.0, 6.0, 6.0, 4.0, 7.0, 6.0, 2.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.6596565246582, -39.28377151489258, -37.90788650512695, -36.53200149536133, -35.1561164855957, -33.78023147583008, -32.40434646606445, -31.028461456298828, -29.652576446533203, -28.276691436767578, -26.900806427001953, -25.524921417236328, -24.149036407470703, -22.773151397705078, -21.397266387939453, -20.021381378173828, -18.64549446105957, -17.269609451293945, -15.89372444152832, -14.517839431762695, -13.14195442199707, -11.766069412231445, -10.390183448791504, -9.014298439025879, -7.638413429260254, -6.262528419494629, -4.886643409729004, -3.5107579231262207, -2.1348729133605957, -0.7589879035949707, 0.6168975830078125, 1.9927825927734375, 3.3686676025390625, 4.7445526123046875, 6.1204376220703125, 7.496323108673096, 8.872207641601562, 10.248092651367188, 11.623978614807129, 12.999863624572754, 14.375748634338379, 15.751633644104004, 17.127519607543945, 18.50340461730957, 19.879289627075195, 21.25517463684082, 22.631059646606445, 24.00694465637207, 25.382829666137695, 26.75871467590332, 28.134599685668945, 29.51048469543457, 30.886369705200195, 32.26225662231445, 33.63814163208008, 35.0140266418457, 36.38991165161133, 37.76579666137695, 39.14168167114258, 40.5175666809082, 41.89345169067383, 43.26933670043945, 44.64522171020508, 46.0211067199707, 47.39699172973633]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 3.0, 2.0, 6.0, 12.0, 15.0, 13.0, 29.0, 42.0, 61.0, 67.0, 110.0, 150.0, 204.0, 344.0, 438.0, 617.0, 947.0, 1337.0, 2026.0, 3041.0, 4918.0, 7871.0, 13667.0, 25896.0, 58326.0, 183117.0, 746151.0, 1911021.0, 885868.0, 214148.0, 65864.0, 28619.0, 15027.0, 8524.0, 5234.0, 3274.0, 2254.0, 1468.0, 1078.0, 696.0, 502.0, 378.0, 255.0, 197.0, 134.0, 93.0, 79.0, 59.0, 31.0, 24.0, 19.0, 8.0, 14.0, 8.0, 5.0, 0.0, 1.0, 3.0, 2.0, 1.0], "bins": [-58.65625, -56.7978515625, -54.939453125, -53.0810546875, -51.22265625, -49.3642578125, -47.505859375, -45.6474609375, -43.7890625, -41.9306640625, -40.072265625, -38.2138671875, -36.35546875, -34.4970703125, -32.638671875, -30.7802734375, -28.921875, -27.0634765625, -25.205078125, -23.3466796875, -21.48828125, -19.6298828125, -17.771484375, -15.9130859375, -14.0546875, -12.1962890625, -10.337890625, -8.4794921875, -6.62109375, -4.7626953125, -2.904296875, -1.0458984375, 0.8125, 2.6708984375, 4.529296875, 6.3876953125, 8.24609375, 10.1044921875, 11.962890625, 13.8212890625, 15.6796875, 17.5380859375, 19.396484375, 21.2548828125, 23.11328125, 24.9716796875, 26.830078125, 28.6884765625, 30.546875, 32.4052734375, 34.263671875, 36.1220703125, 37.98046875, 39.8388671875, 41.697265625, 43.5556640625, 45.4140625, 47.2724609375, 49.130859375, 50.9892578125, 52.84765625, 54.7060546875, 56.564453125, 58.4228515625, 60.28125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 1.0, 0.0, 8.0, 12.0, 4.0, 12.0, 14.0, 14.0, 20.0, 24.0, 21.0, 18.0, 20.0, 31.0, 36.0, 25.0, 37.0, 34.0, 43.0, 47.0, 40.0, 45.0, 46.0, 46.0, 46.0, 36.0, 32.0, 25.0, 35.0, 32.0, 24.0, 25.0, 29.0, 15.0, 20.0, 8.0, 14.0, 12.0, 13.0, 11.0, 8.0, 3.0, 3.0, 1.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-33.625, -32.53173828125, -31.4384765625, -30.34521484375, -29.251953125, -28.15869140625, -27.0654296875, -25.97216796875, -24.87890625, -23.78564453125, -22.6923828125, -21.59912109375, -20.505859375, -19.41259765625, -18.3193359375, -17.22607421875, -16.1328125, -15.03955078125, -13.9462890625, -12.85302734375, -11.759765625, -10.66650390625, -9.5732421875, -8.47998046875, -7.38671875, -6.29345703125, -5.2001953125, -4.10693359375, -3.013671875, -1.92041015625, -0.8271484375, 0.26611328125, 1.359375, 2.45263671875, 3.5458984375, 4.63916015625, 5.732421875, 6.82568359375, 7.9189453125, 9.01220703125, 10.10546875, 11.19873046875, 12.2919921875, 13.38525390625, 14.478515625, 15.57177734375, 16.6650390625, 17.75830078125, 18.8515625, 19.94482421875, 21.0380859375, 22.13134765625, 23.224609375, 24.31787109375, 25.4111328125, 26.50439453125, 27.59765625, 28.69091796875, 29.7841796875, 30.87744140625, 31.970703125, 33.06396484375, 34.1572265625, 35.25048828125, 36.34375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 14.0, 20.0, 13.0, 35.0, 53.0, 69.0, 105.0, 141.0, 203.0, 337.0, 442.0, 672.0, 1058.0, 1753.0, 2682.0, 4142.0, 7292.0, 13045.0, 24272.0, 49422.0, 111165.0, 291219.0, 1005586.0, 1829166.0, 523866.0, 177593.0, 72967.0, 34410.0, 17682.0, 9750.0, 5711.0, 3335.0, 2086.0, 1331.0, 886.0, 590.0, 372.0, 269.0, 172.0, 96.0, 77.0, 64.0, 38.0, 31.0, 13.0, 12.0, 9.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-60.40625, -58.40966796875, -56.4130859375, -54.41650390625, -52.419921875, -50.42333984375, -48.4267578125, -46.43017578125, -44.43359375, -42.43701171875, -40.4404296875, -38.44384765625, -36.447265625, -34.45068359375, -32.4541015625, -30.45751953125, -28.4609375, -26.46435546875, -24.4677734375, -22.47119140625, -20.474609375, -18.47802734375, -16.4814453125, -14.48486328125, -12.48828125, -10.49169921875, -8.4951171875, -6.49853515625, -4.501953125, -2.50537109375, -0.5087890625, 1.48779296875, 3.484375, 5.48095703125, 7.4775390625, 9.47412109375, 11.470703125, 13.46728515625, 15.4638671875, 17.46044921875, 19.45703125, 21.45361328125, 23.4501953125, 25.44677734375, 27.443359375, 29.43994140625, 31.4365234375, 33.43310546875, 35.4296875, 37.42626953125, 39.4228515625, 41.41943359375, 43.416015625, 45.41259765625, 47.4091796875, 49.40576171875, 51.40234375, 53.39892578125, 55.3955078125, 57.39208984375, 59.388671875, 61.38525390625, 63.3818359375, 65.37841796875, 67.375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 0.0, 2.0, 7.0, 6.0, 3.0, 7.0, 7.0, 10.0, 10.0, 18.0, 15.0, 10.0, 26.0, 33.0, 30.0, 50.0, 54.0, 65.0, 79.0, 108.0, 125.0, 154.0, 196.0, 241.0, 326.0, 361.0, 373.0, 346.0, 274.0, 238.0, 164.0, 142.0, 129.0, 88.0, 72.0, 69.0, 46.0, 37.0, 32.0, 16.0, 19.0, 14.0, 15.0, 7.0, 9.0, 4.0, 14.0, 8.0, 4.0, 9.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-15.3203125, -14.8148193359375, -14.309326171875, -13.8038330078125, -13.29833984375, -12.7928466796875, -12.287353515625, -11.7818603515625, -11.2763671875, -10.7708740234375, -10.265380859375, -9.7598876953125, -9.25439453125, -8.7489013671875, -8.243408203125, -7.7379150390625, -7.232421875, -6.7269287109375, -6.221435546875, -5.7159423828125, -5.21044921875, -4.7049560546875, -4.199462890625, -3.6939697265625, -3.1884765625, -2.6829833984375, -2.177490234375, -1.6719970703125, -1.16650390625, -0.6610107421875, -0.155517578125, 0.3499755859375, 0.85546875, 1.3609619140625, 1.866455078125, 2.3719482421875, 2.87744140625, 3.3829345703125, 3.888427734375, 4.3939208984375, 4.8994140625, 5.4049072265625, 5.910400390625, 6.4158935546875, 6.92138671875, 7.4268798828125, 7.932373046875, 8.4378662109375, 8.943359375, 9.4488525390625, 9.954345703125, 10.4598388671875, 10.96533203125, 11.4708251953125, 11.976318359375, 12.4818115234375, 12.9873046875, 13.4927978515625, 13.998291015625, 14.5037841796875, 15.00927734375, 15.5147705078125, 16.020263671875, 16.5257568359375, 17.03125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 6.0, 4.0, 3.0, 3.0, 7.0, 7.0, 12.0, 20.0, 19.0, 33.0, 29.0, 57.0, 59.0, 46.0, 84.0, 95.0, 81.0, 69.0, 74.0, 66.0, 43.0, 44.0, 33.0, 25.0, 17.0, 12.0, 17.0, 10.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.31568908691406, -45.760162353515625, -44.20463562011719, -42.64910888671875, -41.09358596801758, -39.53805923461914, -37.9825325012207, -36.427005767822266, -34.87147903442383, -33.31595230102539, -31.760427474975586, -30.20490074157715, -28.64937400817871, -27.093849182128906, -25.53832244873047, -23.98279571533203, -22.427270889282227, -20.87174415588379, -19.316219329833984, -17.760692596435547, -16.20516586303711, -14.649640083312988, -13.094114303588867, -11.53858757019043, -9.983061790466309, -8.427536010742188, -6.87200927734375, -5.316483497619629, -3.7609572410583496, -2.2054309844970703, -0.6499052047729492, 0.9056215286254883, 2.4611473083496094, 4.016673564910889, 5.572199821472168, 7.127725601196289, 8.683252334594727, 10.238778114318848, 11.794303894042969, 13.349830627441406, 14.905356407165527, 16.46088218688965, 18.016408920288086, 19.57193374633789, 21.127460479736328, 22.682987213134766, 24.238513946533203, 25.79404067993164, 27.349565505981445, 28.905092239379883, 30.460617065429688, 32.016143798828125, 33.57167053222656, 35.127197265625, 36.68272399902344, 38.238250732421875, 39.79377365112305, 41.349300384521484, 42.90482711791992, 44.460350036621094, 46.01587677001953, 47.57140350341797, 49.126930236816406, 50.682456970214844, 52.23798370361328]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 2.0, 6.0, 6.0, 6.0, 13.0, 9.0, 18.0, 22.0, 23.0, 22.0, 35.0, 25.0, 22.0, 31.0, 30.0, 35.0, 39.0, 59.0, 30.0, 48.0, 46.0, 49.0, 43.0, 47.0, 45.0, 36.0, 35.0, 21.0, 24.0, 25.0, 16.0, 23.0, 18.0, 21.0, 16.0, 8.0, 12.0, 7.0, 4.0, 5.0, 7.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.902496337890625, -31.659561157226562, -30.416627883911133, -29.173694610595703, -27.93075942993164, -26.687824249267578, -25.44489097595215, -24.20195770263672, -22.959022521972656, -21.716087341308594, -20.473154067993164, -19.230220794677734, -17.987285614013672, -16.74435043334961, -15.50141716003418, -14.258482933044434, -13.015548706054688, -11.772614479064941, -10.529680252075195, -9.28674602508545, -8.043811798095703, -6.800877571105957, -5.557943344116211, -4.315009117126465, -3.0720748901367188, -1.8291406631469727, -0.5862064361572266, 0.6567277908325195, 1.8996620178222656, 3.1425962448120117, 4.385530471801758, 5.628464698791504, 6.871402740478516, 8.114336967468262, 9.357271194458008, 10.600205421447754, 11.8431396484375, 13.086073875427246, 14.329008102416992, 15.571942329406738, 16.814876556396484, 18.057811737060547, 19.300745010375977, 20.543678283691406, 21.78661346435547, 23.02954864501953, 24.27248191833496, 25.51541519165039, 26.758350372314453, 28.001285552978516, 29.244218826293945, 30.487152099609375, 31.730087280273438, 32.9730224609375, 34.21595764160156, 35.45888900756836, 36.70182418823242, 37.944759368896484, 39.18769073486328, 40.430625915527344, 41.673561096191406, 42.91649627685547, 44.15943145751953, 45.40236282348633, 46.64529800415039]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 6.0, 5.0, 13.0, 16.0, 24.0, 27.0, 42.0, 60.0, 89.0, 130.0, 229.0, 317.0, 518.0, 811.0, 1314.0, 2123.0, 3712.0, 6487.0, 11176.0, 20446.0, 38820.0, 78824.0, 173637.0, 315775.0, 204345.0, 92062.0, 44404.0, 23110.0, 12541.0, 6948.0, 4132.0, 2362.0, 1452.0, 898.0, 595.0, 381.0, 249.0, 139.0, 105.0, 65.0, 42.0, 27.0, 25.0, 13.0, 14.0, 14.0, 6.0, 10.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-18.25, -17.690185546875, -17.13037109375, -16.570556640625, -16.0107421875, -15.450927734375, -14.89111328125, -14.331298828125, -13.771484375, -13.211669921875, -12.65185546875, -12.092041015625, -11.5322265625, -10.972412109375, -10.41259765625, -9.852783203125, -9.29296875, -8.733154296875, -8.17333984375, -7.613525390625, -7.0537109375, -6.493896484375, -5.93408203125, -5.374267578125, -4.814453125, -4.254638671875, -3.69482421875, -3.135009765625, -2.5751953125, -2.015380859375, -1.45556640625, -0.895751953125, -0.3359375, 0.223876953125, 0.78369140625, 1.343505859375, 1.9033203125, 2.463134765625, 3.02294921875, 3.582763671875, 4.142578125, 4.702392578125, 5.26220703125, 5.822021484375, 6.3818359375, 6.941650390625, 7.50146484375, 8.061279296875, 8.62109375, 9.180908203125, 9.74072265625, 10.300537109375, 10.8603515625, 11.420166015625, 11.97998046875, 12.539794921875, 13.099609375, 13.659423828125, 14.21923828125, 14.779052734375, 15.3388671875, 15.898681640625, 16.45849609375, 17.018310546875, 17.578125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 5.0, 5.0, 4.0, 2.0, 6.0, 9.0, 11.0, 20.0, 13.0, 19.0, 18.0, 15.0, 34.0, 20.0, 18.0, 34.0, 28.0, 31.0, 36.0, 42.0, 39.0, 44.0, 38.0, 41.0, 48.0, 40.0, 38.0, 45.0, 32.0, 34.0, 31.0, 19.0, 23.0, 24.0, 24.0, 16.0, 13.0, 17.0, 19.0, 6.0, 8.0, 5.0, 5.0, 5.0, 1.0, 9.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-35.875, -34.69775390625, -33.5205078125, -32.34326171875, -31.166015625, -29.98876953125, -28.8115234375, -27.63427734375, -26.45703125, -25.27978515625, -24.1025390625, -22.92529296875, -21.748046875, -20.57080078125, -19.3935546875, -18.21630859375, -17.0390625, -15.86181640625, -14.6845703125, -13.50732421875, -12.330078125, -11.15283203125, -9.9755859375, -8.79833984375, -7.62109375, -6.44384765625, -5.2666015625, -4.08935546875, -2.912109375, -1.73486328125, -0.5576171875, 0.61962890625, 1.796875, 2.97412109375, 4.1513671875, 5.32861328125, 6.505859375, 7.68310546875, 8.8603515625, 10.03759765625, 11.21484375, 12.39208984375, 13.5693359375, 14.74658203125, 15.923828125, 17.10107421875, 18.2783203125, 19.45556640625, 20.6328125, 21.81005859375, 22.9873046875, 24.16455078125, 25.341796875, 26.51904296875, 27.6962890625, 28.87353515625, 30.05078125, 31.22802734375, 32.4052734375, 33.58251953125, 34.759765625, 35.93701171875, 37.1142578125, 38.29150390625, 39.46875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 7.0, 3.0, 6.0, 7.0, 17.0, 14.0, 21.0, 27.0, 52.0, 74.0, 122.0, 236.0, 431.0, 826.0, 1669.0, 3635.0, 8360.0, 21701.0, 168678.0, 788722.0, 33316.0, 11337.0, 4845.0, 2171.0, 1033.0, 536.0, 279.0, 162.0, 86.0, 53.0, 43.0, 16.0, 16.0, 14.0, 10.0, 5.0, 5.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-44.15625, -42.8642578125, -41.572265625, -40.2802734375, -38.98828125, -37.6962890625, -36.404296875, -35.1123046875, -33.8203125, -32.5283203125, -31.236328125, -29.9443359375, -28.65234375, -27.3603515625, -26.068359375, -24.7763671875, -23.484375, -22.1923828125, -20.900390625, -19.6083984375, -18.31640625, -17.0244140625, -15.732421875, -14.4404296875, -13.1484375, -11.8564453125, -10.564453125, -9.2724609375, -7.98046875, -6.6884765625, -5.396484375, -4.1044921875, -2.8125, -1.5205078125, -0.228515625, 1.0634765625, 2.35546875, 3.6474609375, 4.939453125, 6.2314453125, 7.5234375, 8.8154296875, 10.107421875, 11.3994140625, 12.69140625, 13.9833984375, 15.275390625, 16.5673828125, 17.859375, 19.1513671875, 20.443359375, 21.7353515625, 23.02734375, 24.3193359375, 25.611328125, 26.9033203125, 28.1953125, 29.4873046875, 30.779296875, 32.0712890625, 33.36328125, 34.6552734375, 35.947265625, 37.2392578125, 38.53125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 4.0, 3.0, 9.0, 9.0, 7.0, 14.0, 9.0, 14.0, 11.0, 17.0, 17.0, 19.0, 11.0, 28.0, 23.0, 31.0, 26.0, 41.0, 40.0, 37.0, 36.0, 44.0, 40.0, 42.0, 38.0, 39.0, 35.0, 33.0, 34.0, 37.0, 37.0, 25.0, 23.0, 23.0, 21.0, 20.0, 11.0, 15.0, 9.0, 11.0, 13.0, 4.0, 13.0, 5.0, 6.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.140625, -23.35986328125, -22.5791015625, -21.79833984375, -21.017578125, -20.23681640625, -19.4560546875, -18.67529296875, -17.89453125, -17.11376953125, -16.3330078125, -15.55224609375, -14.771484375, -13.99072265625, -13.2099609375, -12.42919921875, -11.6484375, -10.86767578125, -10.0869140625, -9.30615234375, -8.525390625, -7.74462890625, -6.9638671875, -6.18310546875, -5.40234375, -4.62158203125, -3.8408203125, -3.06005859375, -2.279296875, -1.49853515625, -0.7177734375, 0.06298828125, 0.84375, 1.62451171875, 2.4052734375, 3.18603515625, 3.966796875, 4.74755859375, 5.5283203125, 6.30908203125, 7.08984375, 7.87060546875, 8.6513671875, 9.43212890625, 10.212890625, 10.99365234375, 11.7744140625, 12.55517578125, 13.3359375, 14.11669921875, 14.8974609375, 15.67822265625, 16.458984375, 17.23974609375, 18.0205078125, 18.80126953125, 19.58203125, 20.36279296875, 21.1435546875, 21.92431640625, 22.705078125, 23.48583984375, 24.2666015625, 25.04736328125, 25.828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 10.0, 6.0, 14.0, 23.0, 30.0, 43.0, 67.0, 89.0, 115.0, 204.0, 318.0, 532.0, 928.0, 1708.0, 3678.0, 8761.0, 26070.0, 678643.0, 290017.0, 22149.0, 7871.0, 3288.0, 1620.0, 926.0, 490.0, 312.0, 193.0, 138.0, 89.0, 64.0, 34.0, 25.0, 27.0, 23.0, 14.0, 6.0, 9.0, 5.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.751953125, -3.626617431640625, -3.50128173828125, -3.375946044921875, -3.2506103515625, -3.125274658203125, -2.99993896484375, -2.874603271484375, -2.749267578125, -2.623931884765625, -2.49859619140625, -2.373260498046875, -2.2479248046875, -2.122589111328125, -1.99725341796875, -1.871917724609375, -1.74658203125, -1.621246337890625, -1.49591064453125, -1.370574951171875, -1.2452392578125, -1.119903564453125, -0.99456787109375, -0.869232177734375, -0.743896484375, -0.618560791015625, -0.49322509765625, -0.367889404296875, -0.2425537109375, -0.117218017578125, 0.00811767578125, 0.133453369140625, 0.2587890625, 0.384124755859375, 0.50946044921875, 0.634796142578125, 0.7601318359375, 0.885467529296875, 1.01080322265625, 1.136138916015625, 1.261474609375, 1.386810302734375, 1.51214599609375, 1.637481689453125, 1.7628173828125, 1.888153076171875, 2.01348876953125, 2.138824462890625, 2.26416015625, 2.389495849609375, 2.51483154296875, 2.640167236328125, 2.7655029296875, 2.890838623046875, 3.01617431640625, 3.141510009765625, 3.266845703125, 3.392181396484375, 3.51751708984375, 3.642852783203125, 3.7681884765625, 3.893524169921875, 4.01885986328125, 4.144195556640625, 4.26953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 11.0, 13.0, 19.0, 24.0, 37.0, 41.0, 54.0, 115.0, 129.0, 139.0, 122.0, 77.0, 53.0, 51.0, 34.0, 33.0, 9.0, 13.0, 7.0, 4.0, 1.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005731582641601562, -0.0005593076348304749, -0.0005454570055007935, -0.0005316063761711121, -0.0005177557468414307, -0.0005039051175117493, -0.0004900544881820679, -0.0004762038588523865, -0.0004623532295227051, -0.0004485026001930237, -0.0004346519708633423, -0.0004208013415336609, -0.0004069507122039795, -0.0003931000828742981, -0.0003792494535446167, -0.0003653988242149353, -0.0003515481948852539, -0.0003376975655555725, -0.0003238469362258911, -0.0003099963068962097, -0.0002961456775665283, -0.0002822950482368469, -0.00026844441890716553, -0.00025459378957748413, -0.00024074316024780273, -0.00022689253091812134, -0.00021304190158843994, -0.00019919127225875854, -0.00018534064292907715, -0.00017149001359939575, -0.00015763938426971436, -0.00014378875494003296, -0.00012993812561035156, -0.00011608749628067017, -0.00010223686695098877, -8.838623762130737e-05, -7.453560829162598e-05, -6.068497896194458e-05, -4.6834349632263184e-05, -3.298372030258179e-05, -1.913309097290039e-05, -5.282461643218994e-06, 8.568167686462402e-06, 2.24187970161438e-05, 3.6269426345825195e-05, 5.012005567550659e-05, 6.397068500518799e-05, 7.782131433486938e-05, 9.167194366455078e-05, 0.00010552257299423218, 0.00011937320232391357, 0.00013322383165359497, 0.00014707446098327637, 0.00016092509031295776, 0.00017477571964263916, 0.00018862634897232056, 0.00020247697830200195, 0.00021632760763168335, 0.00023017823696136475, 0.00024402886629104614, 0.00025787949562072754, 0.00027173012495040894, 0.00028558075428009033, 0.00029943138360977173, 0.0003132820129394531]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 8.0, 12.0, 17.0, 29.0, 33.0, 44.0, 92.0, 99.0, 153.0, 217.0, 327.0, 475.0, 720.0, 1118.0, 1706.0, 2522.0, 3947.0, 6447.0, 10731.0, 18287.0, 33631.0, 67960.0, 158767.0, 338785.0, 215670.0, 88827.0, 41959.0, 22062.0, 12638.0, 7738.0, 4825.0, 2991.0, 1935.0, 1262.0, 810.0, 570.0, 347.0, 246.0, 165.0, 112.0, 80.0, 53.0, 44.0, 24.0, 20.0, 11.0, 12.0, 8.0, 6.0, 8.0, 2.0, 1.0, 2.0, 4.0], "bins": [-3.626953125, -3.51922607421875, -3.4114990234375, -3.30377197265625, -3.196044921875, -3.08831787109375, -2.9805908203125, -2.87286376953125, -2.76513671875, -2.65740966796875, -2.5496826171875, -2.44195556640625, -2.334228515625, -2.22650146484375, -2.1187744140625, -2.01104736328125, -1.9033203125, -1.79559326171875, -1.6878662109375, -1.58013916015625, -1.472412109375, -1.36468505859375, -1.2569580078125, -1.14923095703125, -1.04150390625, -0.93377685546875, -0.8260498046875, -0.71832275390625, -0.610595703125, -0.50286865234375, -0.3951416015625, -0.28741455078125, -0.1796875, -0.07196044921875, 0.0357666015625, 0.14349365234375, 0.251220703125, 0.35894775390625, 0.4666748046875, 0.57440185546875, 0.68212890625, 0.78985595703125, 0.8975830078125, 1.00531005859375, 1.113037109375, 1.22076416015625, 1.3284912109375, 1.43621826171875, 1.5439453125, 1.65167236328125, 1.7593994140625, 1.86712646484375, 1.974853515625, 2.08258056640625, 2.1903076171875, 2.29803466796875, 2.40576171875, 2.51348876953125, 2.6212158203125, 2.72894287109375, 2.836669921875, 2.94439697265625, 3.0521240234375, 3.15985107421875, 3.267578125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 11.0, 11.0, 12.0, 17.0, 10.0, 25.0, 35.0, 28.0, 28.0, 43.0, 55.0, 70.0, 59.0, 67.0, 82.0, 57.0, 59.0, 64.0, 42.0, 31.0, 42.0, 28.0, 21.0, 14.0, 13.0, 19.0, 10.0, 6.0, 9.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1142578125, -1.0807647705078125, -1.047271728515625, -1.0137786865234375, -0.98028564453125, -0.9467926025390625, -0.913299560546875, -0.8798065185546875, -0.8463134765625, -0.8128204345703125, -0.779327392578125, -0.7458343505859375, -0.71234130859375, -0.6788482666015625, -0.645355224609375, -0.6118621826171875, -0.578369140625, -0.5448760986328125, -0.511383056640625, -0.4778900146484375, -0.44439697265625, -0.4109039306640625, -0.377410888671875, -0.3439178466796875, -0.3104248046875, -0.2769317626953125, -0.243438720703125, -0.2099456787109375, -0.17645263671875, -0.1429595947265625, -0.109466552734375, -0.0759735107421875, -0.04248046875, -0.0089874267578125, 0.024505615234375, 0.0579986572265625, 0.09149169921875, 0.1249847412109375, 0.158477783203125, 0.1919708251953125, 0.2254638671875, 0.2589569091796875, 0.292449951171875, 0.3259429931640625, 0.35943603515625, 0.3929290771484375, 0.426422119140625, 0.4599151611328125, 0.493408203125, 0.5269012451171875, 0.560394287109375, 0.5938873291015625, 0.62738037109375, 0.6608734130859375, 0.694366455078125, 0.7278594970703125, 0.7613525390625, 0.7948455810546875, 0.828338623046875, 0.8618316650390625, 0.89532470703125, 0.9288177490234375, 0.962310791015625, 0.9958038330078125, 1.029296875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 7.0, 7.0, 9.0, 14.0, 22.0, 22.0, 30.0, 45.0, 43.0, 64.0, 57.0, 79.0, 86.0, 78.0, 74.0, 69.0, 61.0, 51.0, 29.0, 36.0, 19.0, 17.0, 25.0, 11.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 5.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.452972412109375, -41.96217727661133, -40.47138214111328, -38.9805908203125, -37.48979568481445, -35.999000549316406, -34.508209228515625, -33.01741409301758, -31.52661895751953, -30.035823822021484, -28.54503059387207, -27.054237365722656, -25.56344223022461, -24.072647094726562, -22.58185386657715, -21.091060638427734, -19.600265502929688, -18.10947036743164, -16.618677139282227, -15.127882957458496, -13.637088775634766, -12.146294593811035, -10.655500411987305, -9.164706230163574, -7.673912048339844, -6.183117866516113, -4.692323684692383, -3.2015295028686523, -1.7107353210449219, -0.2199411392211914, 1.270853042602539, 2.7616472244262695, 4.25244140625, 5.7432355880737305, 7.234029769897461, 8.724823951721191, 10.215618133544922, 11.706412315368652, 13.197206497192383, 14.688000679016113, 16.178794860839844, 17.66958999633789, 19.160383224487305, 20.65117645263672, 22.141971588134766, 23.632766723632812, 25.123559951782227, 26.61435317993164, 28.105148315429688, 29.595943450927734, 31.08673667907715, 32.57752990722656, 34.06832504272461, 35.559120178222656, 37.04991149902344, 38.540706634521484, 40.03150177001953, 41.52229690551758, 43.013092041015625, 44.503883361816406, 45.99467849731445, 47.4854736328125, 48.97626495361328, 50.46706008911133, 51.957855224609375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 7.0, 3.0, 1.0, 7.0, 6.0, 2.0, 13.0, 13.0, 16.0, 20.0, 23.0, 23.0, 31.0, 25.0, 28.0, 25.0, 29.0, 38.0, 40.0, 52.0, 39.0, 47.0, 42.0, 45.0, 49.0, 47.0, 45.0, 38.0, 33.0, 24.0, 21.0, 21.0, 23.0, 22.0, 16.0, 21.0, 21.0, 8.0, 9.0, 11.0, 2.0, 6.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.65187072753906, -31.42336082458496, -30.19485092163086, -28.966341018676758, -27.737831115722656, -26.509321212768555, -25.280811309814453, -24.05230140686035, -22.82379150390625, -21.59528160095215, -20.366771697998047, -19.138261795043945, -17.909751892089844, -16.681241989135742, -15.45273208618164, -14.224222183227539, -12.995712280273438, -11.767202377319336, -10.538692474365234, -9.310182571411133, -8.081672668457031, -6.85316276550293, -5.624652862548828, -4.396142959594727, -3.167633056640625, -1.9391231536865234, -0.7106132507324219, 0.5178966522216797, 1.7464065551757812, 2.974916458129883, 4.203426361083984, 5.431936264038086, 6.660442352294922, 7.888952255249023, 9.117462158203125, 10.345972061157227, 11.574481964111328, 12.80299186706543, 14.031501770019531, 15.260011672973633, 16.488521575927734, 17.717031478881836, 18.945541381835938, 20.17405128479004, 21.40256118774414, 22.631071090698242, 23.859580993652344, 25.088090896606445, 26.316600799560547, 27.54511070251465, 28.77362060546875, 30.00213050842285, 31.230640411376953, 32.45915222167969, 33.687660217285156, 34.916168212890625, 36.14468002319336, 37.373191833496094, 38.60169982910156, 39.83020782470703, 41.058719635009766, 42.2872314453125, 43.51573944091797, 44.74424743652344, 45.97275924682617]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 9.0, 10.0, 7.0, 33.0, 35.0, 64.0, 99.0, 167.0, 277.0, 435.0, 746.0, 1303.0, 2126.0, 4117.0, 7508.0, 14851.0, 30506.0, 66884.0, 154875.0, 322904.0, 243889.0, 105181.0, 46821.0, 22004.0, 10803.0, 5647.0, 3085.0, 1687.0, 1007.0, 575.0, 368.0, 197.0, 119.0, 81.0, 36.0, 26.0, 18.0, 14.0, 10.0, 6.0, 5.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-75.25, -73.20361328125, -71.1572265625, -69.11083984375, -67.064453125, -65.01806640625, -62.9716796875, -60.92529296875, -58.87890625, -56.83251953125, -54.7861328125, -52.73974609375, -50.693359375, -48.64697265625, -46.6005859375, -44.55419921875, -42.5078125, -40.46142578125, -38.4150390625, -36.36865234375, -34.322265625, -32.27587890625, -30.2294921875, -28.18310546875, -26.13671875, -24.09033203125, -22.0439453125, -19.99755859375, -17.951171875, -15.90478515625, -13.8583984375, -11.81201171875, -9.765625, -7.71923828125, -5.6728515625, -3.62646484375, -1.580078125, 0.46630859375, 2.5126953125, 4.55908203125, 6.60546875, 8.65185546875, 10.6982421875, 12.74462890625, 14.791015625, 16.83740234375, 18.8837890625, 20.93017578125, 22.9765625, 25.02294921875, 27.0693359375, 29.11572265625, 31.162109375, 33.20849609375, 35.2548828125, 37.30126953125, 39.34765625, 41.39404296875, 43.4404296875, 45.48681640625, 47.533203125, 49.57958984375, 51.6259765625, 53.67236328125, 55.71875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 5.0, 6.0, 6.0, 10.0, 15.0, 12.0, 25.0, 22.0, 36.0, 18.0, 26.0, 22.0, 34.0, 44.0, 35.0, 42.0, 47.0, 43.0, 48.0, 51.0, 55.0, 51.0, 55.0, 32.0, 27.0, 26.0, 29.0, 21.0, 21.0, 14.0, 19.0, 20.0, 16.0, 9.0, 15.0, 4.0, 7.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.8125, -33.560546875, -32.30859375, -31.056640625, -29.8046875, -28.552734375, -27.30078125, -26.048828125, -24.796875, -23.544921875, -22.29296875, -21.041015625, -19.7890625, -18.537109375, -17.28515625, -16.033203125, -14.78125, -13.529296875, -12.27734375, -11.025390625, -9.7734375, -8.521484375, -7.26953125, -6.017578125, -4.765625, -3.513671875, -2.26171875, -1.009765625, 0.2421875, 1.494140625, 2.74609375, 3.998046875, 5.25, 6.501953125, 7.75390625, 9.005859375, 10.2578125, 11.509765625, 12.76171875, 14.013671875, 15.265625, 16.517578125, 17.76953125, 19.021484375, 20.2734375, 21.525390625, 22.77734375, 24.029296875, 25.28125, 26.533203125, 27.78515625, 29.037109375, 30.2890625, 31.541015625, 32.79296875, 34.044921875, 35.296875, 36.548828125, 37.80078125, 39.052734375, 40.3046875, 41.556640625, 42.80859375, 44.060546875, 45.3125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 10.0, 2.0, 13.0, 7.0, 34.0, 30.0, 47.0, 74.0, 98.0, 166.0, 239.0, 387.0, 567.0, 890.0, 1241.0, 1929.0, 3060.0, 4689.0, 7419.0, 11180.0, 17479.0, 28533.0, 46317.0, 76366.0, 125803.0, 189591.0, 192491.0, 130976.0, 79728.0, 48235.0, 29572.0, 18356.0, 11687.0, 7439.0, 4729.0, 3115.0, 2044.0, 1422.0, 878.0, 593.0, 384.0, 266.0, 153.0, 116.0, 59.0, 51.0, 30.0, 17.0, 17.0, 15.0, 10.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-43.40625, -42.0078125, -40.609375, -39.2109375, -37.8125, -36.4140625, -35.015625, -33.6171875, -32.21875, -30.8203125, -29.421875, -28.0234375, -26.625, -25.2265625, -23.828125, -22.4296875, -21.03125, -19.6328125, -18.234375, -16.8359375, -15.4375, -14.0390625, -12.640625, -11.2421875, -9.84375, -8.4453125, -7.046875, -5.6484375, -4.25, -2.8515625, -1.453125, -0.0546875, 1.34375, 2.7421875, 4.140625, 5.5390625, 6.9375, 8.3359375, 9.734375, 11.1328125, 12.53125, 13.9296875, 15.328125, 16.7265625, 18.125, 19.5234375, 20.921875, 22.3203125, 23.71875, 25.1171875, 26.515625, 27.9140625, 29.3125, 30.7109375, 32.109375, 33.5078125, 34.90625, 36.3046875, 37.703125, 39.1015625, 40.5, 41.8984375, 43.296875, 44.6953125, 46.09375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 11.0, 8.0, 12.0, 14.0, 12.0, 19.0, 17.0, 20.0, 10.0, 25.0, 24.0, 28.0, 23.0, 33.0, 45.0, 49.0, 38.0, 32.0, 47.0, 36.0, 32.0, 46.0, 43.0, 49.0, 55.0, 35.0, 46.0, 24.0, 22.0, 27.0, 15.0, 20.0, 13.0, 15.0, 15.0, 10.0, 8.0, 10.0, 7.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.90625, -22.07373046875, -21.2412109375, -20.40869140625, -19.576171875, -18.74365234375, -17.9111328125, -17.07861328125, -16.24609375, -15.41357421875, -14.5810546875, -13.74853515625, -12.916015625, -12.08349609375, -11.2509765625, -10.41845703125, -9.5859375, -8.75341796875, -7.9208984375, -7.08837890625, -6.255859375, -5.42333984375, -4.5908203125, -3.75830078125, -2.92578125, -2.09326171875, -1.2607421875, -0.42822265625, 0.404296875, 1.23681640625, 2.0693359375, 2.90185546875, 3.734375, 4.56689453125, 5.3994140625, 6.23193359375, 7.064453125, 7.89697265625, 8.7294921875, 9.56201171875, 10.39453125, 11.22705078125, 12.0595703125, 12.89208984375, 13.724609375, 14.55712890625, 15.3896484375, 16.22216796875, 17.0546875, 17.88720703125, 18.7197265625, 19.55224609375, 20.384765625, 21.21728515625, 22.0498046875, 22.88232421875, 23.71484375, 24.54736328125, 25.3798828125, 26.21240234375, 27.044921875, 27.87744140625, 28.7099609375, 29.54248046875, 30.375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 4.0, 11.0, 12.0, 37.0, 30.0, 46.0, 78.0, 106.0, 149.0, 185.0, 279.0, 386.0, 575.0, 857.0, 1222.0, 1706.0, 2488.0, 3879.0, 5850.0, 9197.0, 14498.0, 23772.0, 40249.0, 69437.0, 124735.0, 219383.0, 222902.0, 127704.0, 70843.0, 41071.0, 24380.0, 14971.0, 9238.0, 5989.0, 3979.0, 2632.0, 1760.0, 1234.0, 846.0, 564.0, 374.0, 273.0, 186.0, 143.0, 104.0, 75.0, 34.0, 36.0, 17.0, 12.0, 8.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0], "bins": [-17.71875, -17.18212890625, -16.6455078125, -16.10888671875, -15.572265625, -15.03564453125, -14.4990234375, -13.96240234375, -13.42578125, -12.88916015625, -12.3525390625, -11.81591796875, -11.279296875, -10.74267578125, -10.2060546875, -9.66943359375, -9.1328125, -8.59619140625, -8.0595703125, -7.52294921875, -6.986328125, -6.44970703125, -5.9130859375, -5.37646484375, -4.83984375, -4.30322265625, -3.7666015625, -3.22998046875, -2.693359375, -2.15673828125, -1.6201171875, -1.08349609375, -0.546875, -0.01025390625, 0.5263671875, 1.06298828125, 1.599609375, 2.13623046875, 2.6728515625, 3.20947265625, 3.74609375, 4.28271484375, 4.8193359375, 5.35595703125, 5.892578125, 6.42919921875, 6.9658203125, 7.50244140625, 8.0390625, 8.57568359375, 9.1123046875, 9.64892578125, 10.185546875, 10.72216796875, 11.2587890625, 11.79541015625, 12.33203125, 12.86865234375, 13.4052734375, 13.94189453125, 14.478515625, 15.01513671875, 15.5517578125, 16.08837890625, 16.625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 10.0, 13.0, 17.0, 19.0, 13.0, 34.0, 44.0, 60.0, 66.0, 70.0, 87.0, 92.0, 91.0, 77.0, 58.0, 48.0, 29.0, 23.0, 18.0, 26.0, 19.0, 13.0, 8.0, 17.0, 6.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.001983642578125, -0.0019261986017227173, -0.0018687546253204346, -0.0018113106489181519, -0.0017538666725158691, -0.0016964226961135864, -0.0016389787197113037, -0.001581534743309021, -0.0015240907669067383, -0.0014666467905044556, -0.0014092028141021729, -0.0013517588376998901, -0.0012943148612976074, -0.0012368708848953247, -0.001179426908493042, -0.0011219829320907593, -0.0010645389556884766, -0.0010070949792861938, -0.0009496510028839111, -0.0008922070264816284, -0.0008347630500793457, -0.000777319073677063, -0.0007198750972747803, -0.0006624311208724976, -0.0006049871444702148, -0.0005475431680679321, -0.0004900991916656494, -0.0004326552152633667, -0.000375211238861084, -0.00031776726245880127, -0.00026032328605651855, -0.00020287930965423584, -0.00014543533325195312, -8.799135684967041e-05, -3.0547380447387695e-05, 2.689659595489502e-05, 8.434057235717773e-05, 0.00014178454875946045, 0.00019922852516174316, 0.0002566725015640259, 0.0003141164779663086, 0.0003715604543685913, 0.000429004430770874, 0.00048644840717315674, 0.0005438923835754395, 0.0006013363599777222, 0.0006587803363800049, 0.0007162243127822876, 0.0007736682891845703, 0.000831112265586853, 0.0008885562419891357, 0.0009460002183914185, 0.0010034441947937012, 0.0010608881711959839, 0.0011183321475982666, 0.0011757761240005493, 0.001233220100402832, 0.0012906640768051147, 0.0013481080532073975, 0.0014055520296096802, 0.0014629960060119629, 0.0015204399824142456, 0.0015778839588165283, 0.001635327935218811, 0.0016927719116210938]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 11.0, 9.0, 11.0, 18.0, 33.0, 40.0, 54.0, 83.0, 130.0, 198.0, 257.0, 390.0, 530.0, 745.0, 1139.0, 1624.0, 2386.0, 3608.0, 5544.0, 8858.0, 14470.0, 22705.0, 37390.0, 65170.0, 114721.0, 207505.0, 234563.0, 135806.0, 75393.0, 43949.0, 25900.0, 16053.0, 10165.0, 6343.0, 4095.0, 2758.0, 1825.0, 1352.0, 848.0, 553.0, 426.0, 269.0, 207.0, 121.0, 88.0, 72.0, 39.0, 28.0, 21.0, 18.0, 15.0, 5.0, 7.0, 2.0, 4.0, 0.0, 3.0, 2.0], "bins": [-16.328125, -15.820068359375, -15.31201171875, -14.803955078125, -14.2958984375, -13.787841796875, -13.27978515625, -12.771728515625, -12.263671875, -11.755615234375, -11.24755859375, -10.739501953125, -10.2314453125, -9.723388671875, -9.21533203125, -8.707275390625, -8.19921875, -7.691162109375, -7.18310546875, -6.675048828125, -6.1669921875, -5.658935546875, -5.15087890625, -4.642822265625, -4.134765625, -3.626708984375, -3.11865234375, -2.610595703125, -2.1025390625, -1.594482421875, -1.08642578125, -0.578369140625, -0.0703125, 0.437744140625, 0.94580078125, 1.453857421875, 1.9619140625, 2.469970703125, 2.97802734375, 3.486083984375, 3.994140625, 4.502197265625, 5.01025390625, 5.518310546875, 6.0263671875, 6.534423828125, 7.04248046875, 7.550537109375, 8.05859375, 8.566650390625, 9.07470703125, 9.582763671875, 10.0908203125, 10.598876953125, 11.10693359375, 11.614990234375, 12.123046875, 12.631103515625, 13.13916015625, 13.647216796875, 14.1552734375, 14.663330078125, 15.17138671875, 15.679443359375, 16.1875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 5.0, 12.0, 13.0, 7.0, 15.0, 15.0, 19.0, 17.0, 30.0, 33.0, 45.0, 30.0, 44.0, 38.0, 61.0, 65.0, 54.0, 63.0, 51.0, 55.0, 56.0, 39.0, 41.0, 37.0, 25.0, 21.0, 18.0, 21.0, 13.0, 12.0, 11.0, 0.0, 5.0, 2.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.90625, -6.70880126953125, -6.5113525390625, -6.31390380859375, -6.116455078125, -5.91900634765625, -5.7215576171875, -5.52410888671875, -5.32666015625, -5.12921142578125, -4.9317626953125, -4.73431396484375, -4.536865234375, -4.33941650390625, -4.1419677734375, -3.94451904296875, -3.7470703125, -3.54962158203125, -3.3521728515625, -3.15472412109375, -2.957275390625, -2.75982666015625, -2.5623779296875, -2.36492919921875, -2.16748046875, -1.97003173828125, -1.7725830078125, -1.57513427734375, -1.377685546875, -1.18023681640625, -0.9827880859375, -0.78533935546875, -0.587890625, -0.39044189453125, -0.1929931640625, 0.00445556640625, 0.201904296875, 0.39935302734375, 0.5968017578125, 0.79425048828125, 0.99169921875, 1.18914794921875, 1.3865966796875, 1.58404541015625, 1.781494140625, 1.97894287109375, 2.1763916015625, 2.37384033203125, 2.5712890625, 2.76873779296875, 2.9661865234375, 3.16363525390625, 3.361083984375, 3.55853271484375, 3.7559814453125, 3.95343017578125, 4.15087890625, 4.34832763671875, 4.5457763671875, 4.74322509765625, 4.940673828125, 5.13812255859375, 5.3355712890625, 5.53302001953125, 5.73046875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 6.0, 7.0, 12.0, 16.0, 16.0, 11.0, 27.0, 26.0, 41.0, 48.0, 54.0, 58.0, 63.0, 57.0, 72.0, 67.0, 67.0, 52.0, 61.0, 56.0, 28.0, 33.0, 29.0, 13.0, 14.0, 15.0, 10.0, 7.0, 4.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.03135299682617, -37.67646408081055, -36.32157516479492, -34.9666862487793, -33.61180114746094, -32.25691223144531, -30.902023315429688, -29.547134399414062, -28.192245483398438, -26.837356567382812, -25.482467651367188, -24.127580642700195, -22.77269172668457, -21.417802810668945, -20.062915802001953, -18.708026885986328, -17.353137969970703, -15.998249053955078, -14.64336109161377, -13.288473129272461, -11.933584213256836, -10.578695297241211, -9.223807334899902, -7.868919372558594, -6.514030456542969, -5.159142017364502, -3.804253578186035, -2.4493651390075684, -1.0944766998291016, 0.26041173934936523, 1.615300178527832, 2.9701881408691406, 4.3250732421875, 5.679961681365967, 7.034850120544434, 8.389738082885742, 9.744626998901367, 11.099515914916992, 12.4544038772583, 13.80929183959961, 15.164180755615234, 16.51906967163086, 17.873958587646484, 19.228845596313477, 20.5837345123291, 21.938623428344727, 23.29351043701172, 24.648399353027344, 26.00328826904297, 27.358177185058594, 28.71306610107422, 30.06795310974121, 31.422842025756836, 32.77772903442383, 34.13261795043945, 35.48750686645508, 36.8423957824707, 38.19728469848633, 39.55217361450195, 40.90706253051758, 42.26194763183594, 43.61683654785156, 44.97172546386719, 46.32661437988281, 47.68150329589844]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 6.0, 11.0, 8.0, 8.0, 11.0, 14.0, 20.0, 23.0, 19.0, 25.0, 24.0, 22.0, 34.0, 43.0, 46.0, 41.0, 33.0, 55.0, 44.0, 49.0, 40.0, 43.0, 41.0, 43.0, 39.0, 41.0, 30.0, 26.0, 26.0, 22.0, 14.0, 14.0, 12.0, 13.0, 14.0, 7.0, 8.0, 10.0, 7.0, 2.0, 7.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.6940803527832, -32.41613006591797, -31.138179779052734, -29.8602294921875, -28.582279205322266, -27.30432891845703, -26.026378631591797, -24.748428344726562, -23.470478057861328, -22.192527770996094, -20.91457748413086, -19.636627197265625, -18.35867691040039, -17.080726623535156, -15.802775382995605, -14.524825096130371, -13.24687385559082, -11.968923568725586, -10.690973281860352, -9.413022994995117, -8.135072708129883, -6.85712194442749, -5.579171180725098, -4.301220893859863, -3.023270606994629, -1.745320200920105, -0.46736979484558105, 0.8105807304382324, 2.088531017303467, 3.366481304168701, 4.644432067871094, 5.922382354736328, 7.2003326416015625, 8.478282928466797, 9.756233215332031, 11.034183502197266, 12.3121337890625, 13.590084075927734, 14.868035316467285, 16.145984649658203, 17.423934936523438, 18.701885223388672, 19.979835510253906, 21.25778579711914, 22.535736083984375, 23.81368637084961, 25.091636657714844, 26.369586944580078, 27.647539138793945, 28.92548942565918, 30.203439712524414, 31.48138999938965, 32.759342193603516, 34.03729248046875, 35.315242767333984, 36.59319305419922, 37.87114334106445, 39.14909362792969, 40.42704391479492, 41.704994201660156, 42.98294448852539, 44.260894775390625, 45.53884506225586, 46.816795349121094, 48.09474563598633]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 15.0, 10.0, 16.0, 30.0, 47.0, 54.0, 94.0, 118.0, 183.0, 271.0, 388.0, 546.0, 910.0, 1372.0, 2258.0, 3877.0, 6655.0, 12272.0, 24811.0, 55763.0, 170156.0, 673337.0, 1882934.0, 983074.0, 237535.0, 72358.0, 30041.0, 15019.0, 7973.0, 4540.0, 2740.0, 1664.0, 1062.0, 702.0, 467.0, 339.0, 212.0, 128.0, 100.0, 64.0, 42.0, 42.0, 20.0, 8.0, 9.0, 9.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-62.28125, -60.4296875, -58.578125, -56.7265625, -54.875, -53.0234375, -51.171875, -49.3203125, -47.46875, -45.6171875, -43.765625, -41.9140625, -40.0625, -38.2109375, -36.359375, -34.5078125, -32.65625, -30.8046875, -28.953125, -27.1015625, -25.25, -23.3984375, -21.546875, -19.6953125, -17.84375, -15.9921875, -14.140625, -12.2890625, -10.4375, -8.5859375, -6.734375, -4.8828125, -3.03125, -1.1796875, 0.671875, 2.5234375, 4.375, 6.2265625, 8.078125, 9.9296875, 11.78125, 13.6328125, 15.484375, 17.3359375, 19.1875, 21.0390625, 22.890625, 24.7421875, 26.59375, 28.4453125, 30.296875, 32.1484375, 34.0, 35.8515625, 37.703125, 39.5546875, 41.40625, 43.2578125, 45.109375, 46.9609375, 48.8125, 50.6640625, 52.515625, 54.3671875, 56.21875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 9.0, 12.0, 6.0, 12.0, 23.0, 27.0, 29.0, 24.0, 23.0, 32.0, 35.0, 40.0, 43.0, 56.0, 46.0, 57.0, 60.0, 56.0, 43.0, 39.0, 44.0, 46.0, 41.0, 35.0, 19.0, 28.0, 18.0, 17.0, 7.0, 12.0, 11.0, 11.0, 6.0, 11.0, 7.0, 0.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.359375, -30.170166015625, -28.98095703125, -27.791748046875, -26.6025390625, -25.413330078125, -24.22412109375, -23.034912109375, -21.845703125, -20.656494140625, -19.46728515625, -18.278076171875, -17.0888671875, -15.899658203125, -14.71044921875, -13.521240234375, -12.33203125, -11.142822265625, -9.95361328125, -8.764404296875, -7.5751953125, -6.385986328125, -5.19677734375, -4.007568359375, -2.818359375, -1.629150390625, -0.43994140625, 0.749267578125, 1.9384765625, 3.127685546875, 4.31689453125, 5.506103515625, 6.6953125, 7.884521484375, 9.07373046875, 10.262939453125, 11.4521484375, 12.641357421875, 13.83056640625, 15.019775390625, 16.208984375, 17.398193359375, 18.58740234375, 19.776611328125, 20.9658203125, 22.155029296875, 23.34423828125, 24.533447265625, 25.72265625, 26.911865234375, 28.10107421875, 29.290283203125, 30.4794921875, 31.668701171875, 32.85791015625, 34.047119140625, 35.236328125, 36.425537109375, 37.61474609375, 38.803955078125, 39.9931640625, 41.182373046875, 42.37158203125, 43.560791015625, 44.75]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 9.0, 12.0, 19.0, 21.0, 23.0, 46.0, 55.0, 67.0, 118.0, 155.0, 237.0, 341.0, 470.0, 807.0, 1080.0, 1692.0, 2515.0, 4055.0, 6663.0, 11179.0, 19277.0, 34181.0, 64264.0, 127191.0, 277685.0, 705874.0, 1558648.0, 780701.0, 303262.0, 137564.0, 68539.0, 36184.0, 20321.0, 11727.0, 6958.0, 4247.0, 2750.0, 1773.0, 1128.0, 760.0, 502.0, 349.0, 252.0, 165.0, 136.0, 76.0, 53.0, 54.0, 29.0, 24.0, 15.0, 15.0, 9.0, 3.0, 2.0, 2.0, 5.0], "bins": [-50.0625, -48.5703125, -47.078125, -45.5859375, -44.09375, -42.6015625, -41.109375, -39.6171875, -38.125, -36.6328125, -35.140625, -33.6484375, -32.15625, -30.6640625, -29.171875, -27.6796875, -26.1875, -24.6953125, -23.203125, -21.7109375, -20.21875, -18.7265625, -17.234375, -15.7421875, -14.25, -12.7578125, -11.265625, -9.7734375, -8.28125, -6.7890625, -5.296875, -3.8046875, -2.3125, -0.8203125, 0.671875, 2.1640625, 3.65625, 5.1484375, 6.640625, 8.1328125, 9.625, 11.1171875, 12.609375, 14.1015625, 15.59375, 17.0859375, 18.578125, 20.0703125, 21.5625, 23.0546875, 24.546875, 26.0390625, 27.53125, 29.0234375, 30.515625, 32.0078125, 33.5, 34.9921875, 36.484375, 37.9765625, 39.46875, 40.9609375, 42.453125, 43.9453125, 45.4375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 7.0, 8.0, 15.0, 16.0, 15.0, 22.0, 27.0, 35.0, 47.0, 43.0, 50.0, 58.0, 79.0, 99.0, 105.0, 150.0, 181.0, 216.0, 288.0, 351.0, 358.0, 338.0, 271.0, 236.0, 195.0, 155.0, 119.0, 107.0, 83.0, 79.0, 68.0, 45.0, 46.0, 31.0, 16.0, 30.0, 20.0, 15.0, 7.0, 10.0, 3.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.5703125, -15.1063232421875, -14.642333984375, -14.1783447265625, -13.71435546875, -13.2503662109375, -12.786376953125, -12.3223876953125, -11.8583984375, -11.3944091796875, -10.930419921875, -10.4664306640625, -10.00244140625, -9.5384521484375, -9.074462890625, -8.6104736328125, -8.146484375, -7.6824951171875, -7.218505859375, -6.7545166015625, -6.29052734375, -5.8265380859375, -5.362548828125, -4.8985595703125, -4.4345703125, -3.9705810546875, -3.506591796875, -3.0426025390625, -2.57861328125, -2.1146240234375, -1.650634765625, -1.1866455078125, -0.72265625, -0.2586669921875, 0.205322265625, 0.6693115234375, 1.13330078125, 1.5972900390625, 2.061279296875, 2.5252685546875, 2.9892578125, 3.4532470703125, 3.917236328125, 4.3812255859375, 4.84521484375, 5.3092041015625, 5.773193359375, 6.2371826171875, 6.701171875, 7.1651611328125, 7.629150390625, 8.0931396484375, 8.55712890625, 9.0211181640625, 9.485107421875, 9.9490966796875, 10.4130859375, 10.8770751953125, 11.341064453125, 11.8050537109375, 12.26904296875, 12.7330322265625, 13.197021484375, 13.6610107421875, 14.125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 8.0, 6.0, 8.0, 10.0, 5.0, 15.0, 16.0, 28.0, 25.0, 30.0, 36.0, 54.0, 49.0, 52.0, 54.0, 58.0, 68.0, 67.0, 57.0, 47.0, 48.0, 35.0, 40.0, 25.0, 21.0, 31.0, 19.0, 12.0, 16.0, 9.0, 6.0, 8.0, 7.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.71540832519531, -33.58159255981445, -32.447776794433594, -31.313961029052734, -30.180145263671875, -29.046329498291016, -27.912513732910156, -26.778697967529297, -25.644882202148438, -24.511066436767578, -23.37725067138672, -22.24343490600586, -21.109619140625, -19.97580337524414, -18.84198760986328, -17.708171844482422, -16.574356079101562, -15.440540313720703, -14.306724548339844, -13.172908782958984, -12.039093017578125, -10.905277252197266, -9.771461486816406, -8.637645721435547, -7.5038299560546875, -6.370014190673828, -5.236198425292969, -4.102382659912109, -2.96856689453125, -1.8347511291503906, -0.7009353637695312, 0.4328804016113281, 1.5666961669921875, 2.700511932373047, 3.8343276977539062, 4.968143463134766, 6.101959228515625, 7.235774993896484, 8.369590759277344, 9.503406524658203, 10.637222290039062, 11.771038055419922, 12.904853820800781, 14.03866958618164, 15.1724853515625, 16.30630111694336, 17.44011688232422, 18.573932647705078, 19.707748413085938, 20.841564178466797, 21.975379943847656, 23.109195709228516, 24.243011474609375, 25.376827239990234, 26.510643005371094, 27.644458770751953, 28.778274536132812, 29.912090301513672, 31.04590606689453, 32.17972183227539, 33.31353759765625, 34.44735336303711, 35.58116912841797, 36.71498489379883, 37.84880065917969]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 3.0, 3.0, 8.0, 14.0, 4.0, 14.0, 18.0, 13.0, 21.0, 19.0, 26.0, 27.0, 38.0, 31.0, 29.0, 39.0, 41.0, 39.0, 36.0, 48.0, 46.0, 43.0, 33.0, 41.0, 43.0, 31.0, 37.0, 28.0, 33.0, 24.0, 26.0, 20.0, 22.0, 12.0, 13.0, 14.0, 12.0, 6.0, 7.0, 3.0, 4.0, 9.0, 7.0, 6.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.75595474243164, -31.653465270996094, -30.550975799560547, -29.448486328125, -28.345996856689453, -27.243507385253906, -26.141016006469727, -25.03852653503418, -23.936037063598633, -22.833547592163086, -21.73105812072754, -20.628568649291992, -19.526077270507812, -18.423587799072266, -17.32109832763672, -16.218608856201172, -15.116119384765625, -14.013629913330078, -12.911140441894531, -11.808650016784668, -10.706160545349121, -9.603671073913574, -8.501180648803711, -7.398691177368164, -6.296201705932617, -5.19371223449707, -4.091222286224365, -2.9887325763702393, -1.8862428665161133, -0.7837533950805664, 0.31873655319213867, 1.4212265014648438, 2.5237159729003906, 3.6262056827545166, 4.728695392608643, 5.831185340881348, 6.9336748123168945, 8.036164283752441, 9.138654708862305, 10.241144180297852, 11.343633651733398, 12.446123123168945, 13.548612594604492, 14.651103019714355, 15.753592491149902, 16.856082916259766, 17.958572387695312, 19.06106185913086, 20.163551330566406, 21.266040802001953, 22.3685302734375, 23.471019744873047, 24.573509216308594, 25.67599868774414, 26.77849006652832, 27.880979537963867, 28.983469009399414, 30.08595848083496, 31.188447952270508, 32.29093933105469, 33.393428802490234, 34.49591827392578, 35.59840774536133, 36.700897216796875, 37.80338668823242]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 6.0, 6.0, 10.0, 8.0, 28.0, 27.0, 52.0, 63.0, 82.0, 139.0, 171.0, 251.0, 351.0, 451.0, 713.0, 1007.0, 1336.0, 1984.0, 2834.0, 4151.0, 5975.0, 8587.0, 13076.0, 19378.0, 29539.0, 46727.0, 75129.0, 126231.0, 211514.0, 192758.0, 113088.0, 67511.0, 42345.0, 27286.0, 17657.0, 11840.0, 8156.0, 5422.0, 3792.0, 2609.0, 1825.0, 1329.0, 889.0, 635.0, 475.0, 335.0, 242.0, 156.0, 124.0, 79.0, 42.0, 44.0, 41.0, 18.0, 19.0, 10.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-9.828125, -9.510009765625, -9.19189453125, -8.873779296875, -8.5556640625, -8.237548828125, -7.91943359375, -7.601318359375, -7.283203125, -6.965087890625, -6.64697265625, -6.328857421875, -6.0107421875, -5.692626953125, -5.37451171875, -5.056396484375, -4.73828125, -4.420166015625, -4.10205078125, -3.783935546875, -3.4658203125, -3.147705078125, -2.82958984375, -2.511474609375, -2.193359375, -1.875244140625, -1.55712890625, -1.239013671875, -0.9208984375, -0.602783203125, -0.28466796875, 0.033447265625, 0.3515625, 0.669677734375, 0.98779296875, 1.305908203125, 1.6240234375, 1.942138671875, 2.26025390625, 2.578369140625, 2.896484375, 3.214599609375, 3.53271484375, 3.850830078125, 4.1689453125, 4.487060546875, 4.80517578125, 5.123291015625, 5.44140625, 5.759521484375, 6.07763671875, 6.395751953125, 6.7138671875, 7.031982421875, 7.35009765625, 7.668212890625, 7.986328125, 8.304443359375, 8.62255859375, 8.940673828125, 9.2587890625, 9.576904296875, 9.89501953125, 10.213134765625, 10.53125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 7.0, 11.0, 8.0, 21.0, 10.0, 11.0, 19.0, 20.0, 27.0, 29.0, 31.0, 37.0, 28.0, 41.0, 29.0, 36.0, 47.0, 43.0, 47.0, 42.0, 35.0, 47.0, 27.0, 41.0, 39.0, 28.0, 40.0, 30.0, 19.0, 23.0, 15.0, 20.0, 15.0, 7.0, 12.0, 4.0, 8.0, 7.0, 6.0, 6.0, 6.0, 3.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.625, -34.5029296875, -33.380859375, -32.2587890625, -31.13671875, -30.0146484375, -28.892578125, -27.7705078125, -26.6484375, -25.5263671875, -24.404296875, -23.2822265625, -22.16015625, -21.0380859375, -19.916015625, -18.7939453125, -17.671875, -16.5498046875, -15.427734375, -14.3056640625, -13.18359375, -12.0615234375, -10.939453125, -9.8173828125, -8.6953125, -7.5732421875, -6.451171875, -5.3291015625, -4.20703125, -3.0849609375, -1.962890625, -0.8408203125, 0.28125, 1.4033203125, 2.525390625, 3.6474609375, 4.76953125, 5.8916015625, 7.013671875, 8.1357421875, 9.2578125, 10.3798828125, 11.501953125, 12.6240234375, 13.74609375, 14.8681640625, 15.990234375, 17.1123046875, 18.234375, 19.3564453125, 20.478515625, 21.6005859375, 22.72265625, 23.8447265625, 24.966796875, 26.0888671875, 27.2109375, 28.3330078125, 29.455078125, 30.5771484375, 31.69921875, 32.8212890625, 33.943359375, 35.0654296875, 36.1875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 8.0, 5.0, 6.0, 20.0, 21.0, 36.0, 40.0, 74.0, 100.0, 148.0, 193.0, 306.0, 454.0, 731.0, 1182.0, 2040.0, 3597.0, 6853.0, 13393.0, 32143.0, 527019.0, 401775.0, 30298.0, 12946.0, 6453.0, 3488.0, 1980.0, 1105.0, 699.0, 452.0, 292.0, 191.0, 135.0, 94.0, 80.0, 43.0, 29.0, 24.0, 28.0, 11.0, 9.0, 14.0, 7.0, 6.0, 2.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-26.296875, -25.474365234375, -24.65185546875, -23.829345703125, -23.0068359375, -22.184326171875, -21.36181640625, -20.539306640625, -19.716796875, -18.894287109375, -18.07177734375, -17.249267578125, -16.4267578125, -15.604248046875, -14.78173828125, -13.959228515625, -13.13671875, -12.314208984375, -11.49169921875, -10.669189453125, -9.8466796875, -9.024169921875, -8.20166015625, -7.379150390625, -6.556640625, -5.734130859375, -4.91162109375, -4.089111328125, -3.2666015625, -2.444091796875, -1.62158203125, -0.799072265625, 0.0234375, 0.845947265625, 1.66845703125, 2.490966796875, 3.3134765625, 4.135986328125, 4.95849609375, 5.781005859375, 6.603515625, 7.426025390625, 8.24853515625, 9.071044921875, 9.8935546875, 10.716064453125, 11.53857421875, 12.361083984375, 13.18359375, 14.006103515625, 14.82861328125, 15.651123046875, 16.4736328125, 17.296142578125, 18.11865234375, 18.941162109375, 19.763671875, 20.586181640625, 21.40869140625, 22.231201171875, 23.0537109375, 23.876220703125, 24.69873046875, 25.521240234375, 26.34375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 3.0, 5.0, 4.0, 5.0, 9.0, 4.0, 9.0, 10.0, 18.0, 14.0, 5.0, 27.0, 24.0, 20.0, 30.0, 22.0, 43.0, 48.0, 28.0, 45.0, 34.0, 40.0, 38.0, 39.0, 29.0, 29.0, 40.0, 35.0, 44.0, 25.0, 32.0, 28.0, 34.0, 22.0, 28.0, 19.0, 17.0, 13.0, 16.0, 18.0, 10.0, 12.0, 7.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-24.203125, -23.479248046875, -22.75537109375, -22.031494140625, -21.3076171875, -20.583740234375, -19.85986328125, -19.135986328125, -18.412109375, -17.688232421875, -16.96435546875, -16.240478515625, -15.5166015625, -14.792724609375, -14.06884765625, -13.344970703125, -12.62109375, -11.897216796875, -11.17333984375, -10.449462890625, -9.7255859375, -9.001708984375, -8.27783203125, -7.553955078125, -6.830078125, -6.106201171875, -5.38232421875, -4.658447265625, -3.9345703125, -3.210693359375, -2.48681640625, -1.762939453125, -1.0390625, -0.315185546875, 0.40869140625, 1.132568359375, 1.8564453125, 2.580322265625, 3.30419921875, 4.028076171875, 4.751953125, 5.475830078125, 6.19970703125, 6.923583984375, 7.6474609375, 8.371337890625, 9.09521484375, 9.819091796875, 10.54296875, 11.266845703125, 11.99072265625, 12.714599609375, 13.4384765625, 14.162353515625, 14.88623046875, 15.610107421875, 16.333984375, 17.057861328125, 17.78173828125, 18.505615234375, 19.2294921875, 19.953369140625, 20.67724609375, 21.401123046875, 22.125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 9.0, 6.0, 19.0, 22.0, 30.0, 44.0, 71.0, 62.0, 121.0, 146.0, 221.0, 365.0, 615.0, 1188.0, 2424.0, 5755.0, 15321.0, 67207.0, 892786.0, 40788.0, 12002.0, 4548.0, 2073.0, 1048.0, 624.0, 352.0, 248.0, 136.0, 87.0, 50.0, 43.0, 27.0, 26.0, 20.0, 15.0, 11.0, 13.0, 4.0, 4.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8046875, -2.709228515625, -2.61376953125, -2.518310546875, -2.4228515625, -2.327392578125, -2.23193359375, -2.136474609375, -2.041015625, -1.945556640625, -1.85009765625, -1.754638671875, -1.6591796875, -1.563720703125, -1.46826171875, -1.372802734375, -1.27734375, -1.181884765625, -1.08642578125, -0.990966796875, -0.8955078125, -0.800048828125, -0.70458984375, -0.609130859375, -0.513671875, -0.418212890625, -0.32275390625, -0.227294921875, -0.1318359375, -0.036376953125, 0.05908203125, 0.154541015625, 0.25, 0.345458984375, 0.44091796875, 0.536376953125, 0.6318359375, 0.727294921875, 0.82275390625, 0.918212890625, 1.013671875, 1.109130859375, 1.20458984375, 1.300048828125, 1.3955078125, 1.490966796875, 1.58642578125, 1.681884765625, 1.77734375, 1.872802734375, 1.96826171875, 2.063720703125, 2.1591796875, 2.254638671875, 2.35009765625, 2.445556640625, 2.541015625, 2.636474609375, 2.73193359375, 2.827392578125, 2.9228515625, 3.018310546875, 3.11376953125, 3.209228515625, 3.3046875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 2.0, 3.0, 5.0, 3.0, 7.0, 6.0, 2.0, 14.0, 9.0, 13.0, 13.0, 26.0, 26.0, 33.0, 41.0, 41.0, 62.0, 63.0, 83.0, 65.0, 68.0, 67.0, 66.0, 56.0, 44.0, 23.0, 32.0, 20.0, 17.0, 19.0, 13.0, 16.0, 13.0, 11.0, 8.0, 3.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016009807586669922, -0.00015516020357608795, -0.00015022233128547668, -0.00014528445899486542, -0.00014034658670425415, -0.00013540871441364288, -0.00013047084212303162, -0.00012553296983242035, -0.00012059509754180908, -0.00011565722525119781, -0.00011071935296058655, -0.00010578148066997528, -0.00010084360837936401, -9.590573608875275e-05, -9.096786379814148e-05, -8.602999150753021e-05, -8.109211921691895e-05, -7.615424692630768e-05, -7.121637463569641e-05, -6.627850234508514e-05, -6.134063005447388e-05, -5.640275776386261e-05, -5.146488547325134e-05, -4.6527013182640076e-05, -4.158914089202881e-05, -3.665126860141754e-05, -3.1713396310806274e-05, -2.6775524020195007e-05, -2.183765172958374e-05, -1.6899779438972473e-05, -1.1961907148361206e-05, -7.024034857749939e-06, -2.086162567138672e-06, 2.8517097234725952e-06, 7.789582014083862e-06, 1.272745430469513e-05, 1.7665326595306396e-05, 2.2603198885917664e-05, 2.754107117652893e-05, 3.24789434671402e-05, 3.7416815757751465e-05, 4.235468804836273e-05, 4.7292560338974e-05, 5.2230432629585266e-05, 5.716830492019653e-05, 6.21061772108078e-05, 6.704404950141907e-05, 7.198192179203033e-05, 7.69197940826416e-05, 8.185766637325287e-05, 8.679553866386414e-05, 9.17334109544754e-05, 9.667128324508667e-05, 0.00010160915553569794, 0.0001065470278263092, 0.00011148490011692047, 0.00011642277240753174, 0.000121360644698143, 0.00012629851698875427, 0.00013123638927936554, 0.0001361742615699768, 0.00014111213386058807, 0.00014605000615119934, 0.0001509878784418106, 0.00015592575073242188]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 10.0, 16.0, 32.0, 28.0, 36.0, 78.0, 101.0, 154.0, 204.0, 312.0, 414.0, 611.0, 919.0, 1348.0, 1906.0, 2783.0, 4188.0, 6459.0, 10162.0, 16405.0, 27944.0, 51127.0, 104035.0, 237867.0, 295683.0, 134853.0, 63588.0, 33994.0, 19064.0, 11764.0, 7418.0, 4847.0, 3389.0, 2160.0, 1511.0, 988.0, 624.0, 456.0, 329.0, 234.0, 163.0, 118.0, 59.0, 50.0, 49.0, 31.0, 11.0, 12.0, 2.0, 4.0, 5.0, 6.0, 0.0, 3.0], "bins": [-2.93359375, -2.84771728515625, -2.7618408203125, -2.67596435546875, -2.590087890625, -2.50421142578125, -2.4183349609375, -2.33245849609375, -2.24658203125, -2.16070556640625, -2.0748291015625, -1.98895263671875, -1.903076171875, -1.81719970703125, -1.7313232421875, -1.64544677734375, -1.5595703125, -1.47369384765625, -1.3878173828125, -1.30194091796875, -1.216064453125, -1.13018798828125, -1.0443115234375, -0.95843505859375, -0.87255859375, -0.78668212890625, -0.7008056640625, -0.61492919921875, -0.529052734375, -0.44317626953125, -0.3572998046875, -0.27142333984375, -0.185546875, -0.09967041015625, -0.0137939453125, 0.07208251953125, 0.157958984375, 0.24383544921875, 0.3297119140625, 0.41558837890625, 0.50146484375, 0.58734130859375, 0.6732177734375, 0.75909423828125, 0.844970703125, 0.93084716796875, 1.0167236328125, 1.10260009765625, 1.1884765625, 1.27435302734375, 1.3602294921875, 1.44610595703125, 1.531982421875, 1.61785888671875, 1.7037353515625, 1.78961181640625, 1.87548828125, 1.96136474609375, 2.0472412109375, 2.13311767578125, 2.218994140625, 2.30487060546875, 2.3907470703125, 2.47662353515625, 2.5625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 1.0, 4.0, 4.0, 8.0, 3.0, 4.0, 7.0, 7.0, 12.0, 12.0, 18.0, 25.0, 23.0, 37.0, 44.0, 63.0, 83.0, 111.0, 87.0, 96.0, 72.0, 47.0, 58.0, 41.0, 22.0, 27.0, 12.0, 12.0, 6.0, 9.0, 7.0, 4.0, 8.0, 6.0, 5.0, 1.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0361328125, -1.0007476806640625, -0.965362548828125, -0.9299774169921875, -0.89459228515625, -0.8592071533203125, -0.823822021484375, -0.7884368896484375, -0.7530517578125, -0.7176666259765625, -0.682281494140625, -0.6468963623046875, -0.61151123046875, -0.5761260986328125, -0.540740966796875, -0.5053558349609375, -0.469970703125, -0.4345855712890625, -0.399200439453125, -0.3638153076171875, -0.32843017578125, -0.2930450439453125, -0.257659912109375, -0.2222747802734375, -0.1868896484375, -0.1515045166015625, -0.116119384765625, -0.0807342529296875, -0.04534912109375, -0.0099639892578125, 0.025421142578125, 0.0608062744140625, 0.09619140625, 0.1315765380859375, 0.166961669921875, 0.2023468017578125, 0.23773193359375, 0.2731170654296875, 0.308502197265625, 0.3438873291015625, 0.3792724609375, 0.4146575927734375, 0.450042724609375, 0.4854278564453125, 0.52081298828125, 0.5561981201171875, 0.591583251953125, 0.6269683837890625, 0.662353515625, 0.6977386474609375, 0.733123779296875, 0.7685089111328125, 0.80389404296875, 0.8392791748046875, 0.874664306640625, 0.9100494384765625, 0.9454345703125, 0.9808197021484375, 1.016204833984375, 1.0515899658203125, 1.08697509765625, 1.1223602294921875, 1.157745361328125, 1.1931304931640625, 1.228515625]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 8.0, 8.0, 8.0, 7.0, 11.0, 17.0, 30.0, 27.0, 30.0, 38.0, 47.0, 61.0, 60.0, 62.0, 63.0, 55.0, 72.0, 68.0, 54.0, 43.0, 39.0, 29.0, 22.0, 24.0, 23.0, 17.0, 15.0, 6.0, 10.0, 12.0, 5.0, 6.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.98853302001953, -34.8026237487793, -33.61671447753906, -32.43080520629883, -31.244897842407227, -30.058988571166992, -28.87308120727539, -27.687171936035156, -26.501262664794922, -25.315353393554688, -24.129444122314453, -22.94353675842285, -21.757627487182617, -20.571718215942383, -19.38581085205078, -18.199901580810547, -17.013992309570312, -15.828083038330078, -14.64217472076416, -13.456266403198242, -12.270357131958008, -11.084447860717773, -9.898539543151855, -8.712631225585938, -7.526721954345703, -6.340813159942627, -5.154904365539551, -3.9689955711364746, -2.7830867767333984, -1.5971779823303223, -0.4112691879272461, 0.7746391296386719, 1.9605522155761719, 3.146461009979248, 4.332369804382324, 5.5182785987854, 6.704187393188477, 7.890096187591553, 9.076004981994629, 10.261913299560547, 11.447822570800781, 12.633731842041016, 13.819640159606934, 15.005548477172852, 16.191457748413086, 17.37736701965332, 18.563274383544922, 19.749183654785156, 20.93509292602539, 22.121002197265625, 23.30691146850586, 24.49281883239746, 25.678728103637695, 26.86463737487793, 28.05054473876953, 29.236454010009766, 30.42236328125, 31.608272552490234, 32.79418182373047, 33.9800910949707, 35.16600036621094, 36.351905822753906, 37.53781509399414, 38.723724365234375, 39.90963363647461]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 6.0, 4.0, 3.0, 5.0, 8.0, 12.0, 3.0, 14.0, 17.0, 18.0, 20.0, 20.0, 28.0, 26.0, 37.0, 30.0, 29.0, 37.0, 45.0, 37.0, 37.0, 45.0, 46.0, 38.0, 40.0, 41.0, 39.0, 34.0, 32.0, 30.0, 33.0, 22.0, 28.0, 21.0, 22.0, 13.0, 14.0, 13.0, 9.0, 9.0, 6.0, 4.0, 3.0, 9.0, 7.0, 4.0, 6.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.0479621887207, -30.97037124633789, -29.892780303955078, -28.815189361572266, -27.737598419189453, -26.66000747680664, -25.582416534423828, -24.504825592041016, -23.427234649658203, -22.34964370727539, -21.272052764892578, -20.194461822509766, -19.116870880126953, -18.03927993774414, -16.961688995361328, -15.884098052978516, -14.806507110595703, -13.72891616821289, -12.651325225830078, -11.573734283447266, -10.496143341064453, -9.41855239868164, -8.340961456298828, -7.263370513916016, -6.185779571533203, -5.108188629150391, -4.030597686767578, -2.9530067443847656, -1.8754158020019531, -0.7978248596191406, 0.2797660827636719, 1.3573570251464844, 2.4349517822265625, 3.512542724609375, 4.5901336669921875, 5.667724609375, 6.7453155517578125, 7.822906494140625, 8.900497436523438, 9.97808837890625, 11.055679321289062, 12.133270263671875, 13.210861206054688, 14.2884521484375, 15.366043090820312, 16.443634033203125, 17.521224975585938, 18.59881591796875, 19.676406860351562, 20.753997802734375, 21.831588745117188, 22.9091796875, 23.986770629882812, 25.064361572265625, 26.141952514648438, 27.21954345703125, 28.297134399414062, 29.374725341796875, 30.452316284179688, 31.5299072265625, 32.60749816894531, 33.685089111328125, 34.76268005371094, 35.84027099609375, 36.91786193847656]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 10.0, 14.0, 24.0, 25.0, 55.0, 78.0, 108.0, 181.0, 320.0, 542.0, 806.0, 1169.0, 1992.0, 2976.0, 4706.0, 7568.0, 12784.0, 21044.0, 36227.0, 63725.0, 112983.0, 195324.0, 231253.0, 151071.0, 85556.0, 47987.0, 27550.0, 16320.0, 9937.0, 5910.0, 3628.0, 2413.0, 1496.0, 1006.0, 643.0, 437.0, 240.0, 153.0, 97.0, 85.0, 42.0, 25.0, 21.0, 14.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-49.625, -48.21728515625, -46.8095703125, -45.40185546875, -43.994140625, -42.58642578125, -41.1787109375, -39.77099609375, -38.36328125, -36.95556640625, -35.5478515625, -34.14013671875, -32.732421875, -31.32470703125, -29.9169921875, -28.50927734375, -27.1015625, -25.69384765625, -24.2861328125, -22.87841796875, -21.470703125, -20.06298828125, -18.6552734375, -17.24755859375, -15.83984375, -14.43212890625, -13.0244140625, -11.61669921875, -10.208984375, -8.80126953125, -7.3935546875, -5.98583984375, -4.578125, -3.17041015625, -1.7626953125, -0.35498046875, 1.052734375, 2.46044921875, 3.8681640625, 5.27587890625, 6.68359375, 8.09130859375, 9.4990234375, 10.90673828125, 12.314453125, 13.72216796875, 15.1298828125, 16.53759765625, 17.9453125, 19.35302734375, 20.7607421875, 22.16845703125, 23.576171875, 24.98388671875, 26.3916015625, 27.79931640625, 29.20703125, 30.61474609375, 32.0224609375, 33.43017578125, 34.837890625, 36.24560546875, 37.6533203125, 39.06103515625, 40.46875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 6.0, 6.0, 4.0, 5.0, 9.0, 14.0, 12.0, 17.0, 14.0, 19.0, 25.0, 33.0, 31.0, 26.0, 26.0, 40.0, 33.0, 51.0, 47.0, 54.0, 38.0, 42.0, 47.0, 28.0, 51.0, 38.0, 33.0, 30.0, 30.0, 29.0, 24.0, 19.0, 23.0, 16.0, 10.0, 11.0, 10.0, 9.0, 3.0, 10.0, 2.0, 3.0, 7.0, 6.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.296875, -29.207763671875, -28.11865234375, -27.029541015625, -25.9404296875, -24.851318359375, -23.76220703125, -22.673095703125, -21.583984375, -20.494873046875, -19.40576171875, -18.316650390625, -17.2275390625, -16.138427734375, -15.04931640625, -13.960205078125, -12.87109375, -11.781982421875, -10.69287109375, -9.603759765625, -8.5146484375, -7.425537109375, -6.33642578125, -5.247314453125, -4.158203125, -3.069091796875, -1.97998046875, -0.890869140625, 0.1982421875, 1.287353515625, 2.37646484375, 3.465576171875, 4.5546875, 5.643798828125, 6.73291015625, 7.822021484375, 8.9111328125, 10.000244140625, 11.08935546875, 12.178466796875, 13.267578125, 14.356689453125, 15.44580078125, 16.534912109375, 17.6240234375, 18.713134765625, 19.80224609375, 20.891357421875, 21.98046875, 23.069580078125, 24.15869140625, 25.247802734375, 26.3369140625, 27.426025390625, 28.51513671875, 29.604248046875, 30.693359375, 31.782470703125, 32.87158203125, 33.960693359375, 35.0498046875, 36.138916015625, 37.22802734375, 38.317138671875, 39.40625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 8.0, 4.0, 5.0, 10.0, 11.0, 25.0, 27.0, 41.0, 68.0, 85.0, 142.0, 162.0, 252.0, 392.0, 595.0, 894.0, 1332.0, 2003.0, 3028.0, 4697.0, 7156.0, 11090.0, 17479.0, 28178.0, 46157.0, 76520.0, 124968.0, 185068.0, 190530.0, 133524.0, 81537.0, 49319.0, 30399.0, 18855.0, 11763.0, 7711.0, 4899.0, 3253.0, 2141.0, 1379.0, 940.0, 635.0, 402.0, 255.0, 177.0, 143.0, 92.0, 62.0, 54.0, 39.0, 16.0, 12.0, 9.0, 5.0, 4.0, 5.0, 2.0, 4.0, 5.0], "bins": [-40.59375, -39.3662109375, -38.138671875, -36.9111328125, -35.68359375, -34.4560546875, -33.228515625, -32.0009765625, -30.7734375, -29.5458984375, -28.318359375, -27.0908203125, -25.86328125, -24.6357421875, -23.408203125, -22.1806640625, -20.953125, -19.7255859375, -18.498046875, -17.2705078125, -16.04296875, -14.8154296875, -13.587890625, -12.3603515625, -11.1328125, -9.9052734375, -8.677734375, -7.4501953125, -6.22265625, -4.9951171875, -3.767578125, -2.5400390625, -1.3125, -0.0849609375, 1.142578125, 2.3701171875, 3.59765625, 4.8251953125, 6.052734375, 7.2802734375, 8.5078125, 9.7353515625, 10.962890625, 12.1904296875, 13.41796875, 14.6455078125, 15.873046875, 17.1005859375, 18.328125, 19.5556640625, 20.783203125, 22.0107421875, 23.23828125, 24.4658203125, 25.693359375, 26.9208984375, 28.1484375, 29.3759765625, 30.603515625, 31.8310546875, 33.05859375, 34.2861328125, 35.513671875, 36.7412109375, 37.96875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 5.0, 6.0, 10.0, 9.0, 11.0, 15.0, 11.0, 17.0, 21.0, 26.0, 14.0, 25.0, 32.0, 28.0, 33.0, 33.0, 33.0, 33.0, 50.0, 48.0, 35.0, 43.0, 43.0, 36.0, 37.0, 33.0, 45.0, 30.0, 31.0, 43.0, 17.0, 16.0, 13.0, 18.0, 23.0, 12.0, 9.0, 6.0, 11.0, 7.0, 9.0, 3.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-20.5, -19.858642578125, -19.21728515625, -18.575927734375, -17.9345703125, -17.293212890625, -16.65185546875, -16.010498046875, -15.369140625, -14.727783203125, -14.08642578125, -13.445068359375, -12.8037109375, -12.162353515625, -11.52099609375, -10.879638671875, -10.23828125, -9.596923828125, -8.95556640625, -8.314208984375, -7.6728515625, -7.031494140625, -6.39013671875, -5.748779296875, -5.107421875, -4.466064453125, -3.82470703125, -3.183349609375, -2.5419921875, -1.900634765625, -1.25927734375, -0.617919921875, 0.0234375, 0.664794921875, 1.30615234375, 1.947509765625, 2.5888671875, 3.230224609375, 3.87158203125, 4.512939453125, 5.154296875, 5.795654296875, 6.43701171875, 7.078369140625, 7.7197265625, 8.361083984375, 9.00244140625, 9.643798828125, 10.28515625, 10.926513671875, 11.56787109375, 12.209228515625, 12.8505859375, 13.491943359375, 14.13330078125, 14.774658203125, 15.416015625, 16.057373046875, 16.69873046875, 17.340087890625, 17.9814453125, 18.622802734375, 19.26416015625, 19.905517578125, 20.546875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 9.0, 13.0, 21.0, 29.0, 40.0, 73.0, 88.0, 120.0, 150.0, 246.0, 308.0, 486.0, 674.0, 955.0, 1317.0, 1961.0, 2640.0, 4087.0, 6266.0, 9471.0, 14908.0, 24482.0, 42440.0, 77394.0, 146513.0, 253581.0, 204876.0, 108618.0, 58063.0, 33170.0, 19460.0, 12057.0, 7731.0, 5004.0, 3416.0, 2349.0, 1635.0, 1165.0, 814.0, 550.0, 419.0, 266.0, 199.0, 139.0, 100.0, 69.0, 57.0, 48.0, 24.0, 18.0, 13.0, 9.0, 3.0, 6.0, 4.0, 1.0, 3.0, 1.0], "bins": [-14.0234375, -13.58203125, -13.140625, -12.69921875, -12.2578125, -11.81640625, -11.375, -10.93359375, -10.4921875, -10.05078125, -9.609375, -9.16796875, -8.7265625, -8.28515625, -7.84375, -7.40234375, -6.9609375, -6.51953125, -6.078125, -5.63671875, -5.1953125, -4.75390625, -4.3125, -3.87109375, -3.4296875, -2.98828125, -2.546875, -2.10546875, -1.6640625, -1.22265625, -0.78125, -0.33984375, 0.1015625, 0.54296875, 0.984375, 1.42578125, 1.8671875, 2.30859375, 2.75, 3.19140625, 3.6328125, 4.07421875, 4.515625, 4.95703125, 5.3984375, 5.83984375, 6.28125, 6.72265625, 7.1640625, 7.60546875, 8.046875, 8.48828125, 8.9296875, 9.37109375, 9.8125, 10.25390625, 10.6953125, 11.13671875, 11.578125, 12.01953125, 12.4609375, 12.90234375, 13.34375, 13.78515625, 14.2265625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 11.0, 14.0, 13.0, 26.0, 28.0, 45.0, 43.0, 70.0, 84.0, 108.0, 139.0, 105.0, 79.0, 55.0, 51.0, 32.0, 18.0, 16.0, 13.0, 9.0, 7.0, 4.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.002300262451171875, -0.002229154109954834, -0.002158045768737793, -0.002086937427520752, -0.002015829086303711, -0.00194472074508667, -0.001873612403869629, -0.0018025040626525879, -0.0017313957214355469, -0.0016602873802185059, -0.0015891790390014648, -0.0015180706977844238, -0.0014469623565673828, -0.0013758540153503418, -0.0013047456741333008, -0.0012336373329162598, -0.0011625289916992188, -0.0010914206504821777, -0.0010203123092651367, -0.0009492039680480957, -0.0008780956268310547, -0.0008069872856140137, -0.0007358789443969727, -0.0006647706031799316, -0.0005936622619628906, -0.0005225539207458496, -0.0004514455795288086, -0.0003803372383117676, -0.00030922889709472656, -0.00023812055587768555, -0.00016701221466064453, -9.590387344360352e-05, -2.47955322265625e-05, 4.6312808990478516e-05, 0.00011742115020751953, 0.00018852949142456055, 0.00025963783264160156, 0.0003307461738586426, 0.0004018545150756836, 0.0004729628562927246, 0.0005440711975097656, 0.0006151795387268066, 0.0006862878799438477, 0.0007573962211608887, 0.0008285045623779297, 0.0008996129035949707, 0.0009707212448120117, 0.0010418295860290527, 0.0011129379272460938, 0.0011840462684631348, 0.0012551546096801758, 0.0013262629508972168, 0.0013973712921142578, 0.0014684796333312988, 0.0015395879745483398, 0.0016106963157653809, 0.0016818046569824219, 0.0017529129981994629, 0.001824021339416504, 0.001895129680633545, 0.001966238021850586, 0.002037346363067627, 0.002108454704284668, 0.002179563045501709, 0.00225067138671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 0.0, 8.0, 10.0, 7.0, 9.0, 22.0, 32.0, 41.0, 63.0, 99.0, 124.0, 185.0, 285.0, 393.0, 609.0, 860.0, 1255.0, 1855.0, 2970.0, 4642.0, 7141.0, 11557.0, 18840.0, 32022.0, 57034.0, 106907.0, 207248.0, 261874.0, 148407.0, 77263.0, 42258.0, 24262.0, 14575.0, 9013.0, 5682.0, 3669.0, 2422.0, 1612.0, 1083.0, 670.0, 490.0, 344.0, 222.0, 148.0, 111.0, 83.0, 52.0, 28.0, 24.0, 16.0, 14.0, 6.0, 5.0, 5.0, 8.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-14.5703125, -14.10400390625, -13.6376953125, -13.17138671875, -12.705078125, -12.23876953125, -11.7724609375, -11.30615234375, -10.83984375, -10.37353515625, -9.9072265625, -9.44091796875, -8.974609375, -8.50830078125, -8.0419921875, -7.57568359375, -7.109375, -6.64306640625, -6.1767578125, -5.71044921875, -5.244140625, -4.77783203125, -4.3115234375, -3.84521484375, -3.37890625, -2.91259765625, -2.4462890625, -1.97998046875, -1.513671875, -1.04736328125, -0.5810546875, -0.11474609375, 0.3515625, 0.81787109375, 1.2841796875, 1.75048828125, 2.216796875, 2.68310546875, 3.1494140625, 3.61572265625, 4.08203125, 4.54833984375, 5.0146484375, 5.48095703125, 5.947265625, 6.41357421875, 6.8798828125, 7.34619140625, 7.8125, 8.27880859375, 8.7451171875, 9.21142578125, 9.677734375, 10.14404296875, 10.6103515625, 11.07666015625, 11.54296875, 12.00927734375, 12.4755859375, 12.94189453125, 13.408203125, 13.87451171875, 14.3408203125, 14.80712890625, 15.2734375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 6.0, 9.0, 8.0, 7.0, 11.0, 11.0, 16.0, 25.0, 16.0, 22.0, 31.0, 35.0, 72.0, 53.0, 80.0, 89.0, 79.0, 73.0, 55.0, 56.0, 55.0, 32.0, 18.0, 25.0, 24.0, 19.0, 17.0, 10.0, 5.0, 6.0, 10.0, 7.0, 5.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.26171875, -6.05865478515625, -5.8555908203125, -5.65252685546875, -5.449462890625, -5.24639892578125, -5.0433349609375, -4.84027099609375, -4.63720703125, -4.43414306640625, -4.2310791015625, -4.02801513671875, -3.824951171875, -3.62188720703125, -3.4188232421875, -3.21575927734375, -3.0126953125, -2.80963134765625, -2.6065673828125, -2.40350341796875, -2.200439453125, -1.99737548828125, -1.7943115234375, -1.59124755859375, -1.38818359375, -1.18511962890625, -0.9820556640625, -0.77899169921875, -0.575927734375, -0.37286376953125, -0.1697998046875, 0.03326416015625, 0.236328125, 0.43939208984375, 0.6424560546875, 0.84552001953125, 1.048583984375, 1.25164794921875, 1.4547119140625, 1.65777587890625, 1.86083984375, 2.06390380859375, 2.2669677734375, 2.47003173828125, 2.673095703125, 2.87615966796875, 3.0792236328125, 3.28228759765625, 3.4853515625, 3.68841552734375, 3.8914794921875, 4.09454345703125, 4.297607421875, 4.50067138671875, 4.7037353515625, 4.90679931640625, 5.10986328125, 5.31292724609375, 5.5159912109375, 5.71905517578125, 5.922119140625, 6.12518310546875, 6.3282470703125, 6.53131103515625, 6.734375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 12.0, 12.0, 13.0, 24.0, 23.0, 33.0, 50.0, 48.0, 69.0, 70.0, 67.0, 75.0, 96.0, 72.0, 58.0, 60.0, 49.0, 30.0, 23.0, 23.0, 22.0, 13.0, 17.0, 7.0, 7.0, 4.0, 2.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.99857711791992, -38.51227951049805, -37.02598571777344, -35.53968811035156, -34.05339431762695, -32.56709671020508, -31.080801010131836, -29.594505310058594, -28.10820770263672, -26.621912002563477, -25.135616302490234, -23.64931869506836, -22.163022994995117, -20.676727294921875, -19.190431594848633, -17.70413589477539, -16.21784019470215, -14.731544494628906, -13.245247840881348, -11.758952140808105, -10.272655487060547, -8.786359786987305, -7.3000640869140625, -5.813767433166504, -4.327471733093262, -2.8411755561828613, -1.35487961769104, 0.13141632080078125, 1.6177124977111816, 3.104008674621582, 4.590304374694824, 6.076601028442383, 7.562896728515625, 9.049192428588867, 10.535489082336426, 12.021784782409668, 13.508081436157227, 14.994377136230469, 16.48067283630371, 17.966968536376953, 19.453266143798828, 20.93956184387207, 22.425857543945312, 23.912155151367188, 25.39845085144043, 26.884746551513672, 28.371042251586914, 29.857337951660156, 31.3436336517334, 32.82992935180664, 34.316226959228516, 35.802520751953125, 37.288818359375, 38.775115966796875, 40.261409759521484, 41.74770736694336, 43.23400115966797, 44.720298767089844, 46.20659255981445, 47.69289016723633, 49.17918395996094, 50.66548156738281, 52.15177917480469, 53.6380729675293, 55.12437057495117]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 5.0, 8.0, 9.0, 12.0, 13.0, 12.0, 12.0, 17.0, 23.0, 20.0, 30.0, 24.0, 36.0, 34.0, 36.0, 29.0, 33.0, 43.0, 39.0, 47.0, 34.0, 41.0, 52.0, 46.0, 32.0, 30.0, 32.0, 32.0, 27.0, 20.0, 23.0, 21.0, 14.0, 15.0, 26.0, 12.0, 11.0, 4.0, 6.0, 6.0, 6.0, 9.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.39145851135254, -28.269893646240234, -27.14832878112793, -26.026763916015625, -24.905197143554688, -23.783632278442383, -22.662067413330078, -21.540502548217773, -20.41893768310547, -19.297372817993164, -18.17580795288086, -17.054241180419922, -15.932676315307617, -14.811111450195312, -13.689546585083008, -12.567981719970703, -11.446414947509766, -10.324850082397461, -9.20328426361084, -8.081719398498535, -6.960154056549072, -5.838588714599609, -4.717023849487305, -3.595458507537842, -2.473893165588379, -1.3523279428482056, -0.23076272010803223, 0.8908023834228516, 2.0123677253723145, 3.1339330673217773, 4.255497932434082, 5.377063274383545, 6.498630523681641, 7.6201958656311035, 8.741761207580566, 9.863326072692871, 10.984891891479492, 12.106456756591797, 13.228021621704102, 14.349586486816406, 15.471152305603027, 16.59271812438965, 17.714282989501953, 18.835847854614258, 19.957412719726562, 21.0789794921875, 22.200542449951172, 23.32210922241211, 24.443674087524414, 25.56523895263672, 26.686803817749023, 27.808368682861328, 28.929935455322266, 30.05150032043457, 31.173065185546875, 32.29463195800781, 33.416194915771484, 34.53776168823242, 35.659324645996094, 36.78089141845703, 37.9024543762207, 39.02402114868164, 40.14558410644531, 41.26715087890625, 42.38871765136719]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 9.0, 3.0, 10.0, 14.0, 17.0, 28.0, 54.0, 59.0, 111.0, 131.0, 240.0, 398.0, 649.0, 1057.0, 1780.0, 3201.0, 5966.0, 11605.0, 23979.0, 57151.0, 172535.0, 697435.0, 1882726.0, 964660.0, 232681.0, 73740.0, 30838.0, 15012.0, 7865.0, 4300.0, 2431.0, 1439.0, 829.0, 498.0, 299.0, 194.0, 107.0, 79.0, 58.0, 31.0, 23.0, 10.0, 9.0, 3.0, 7.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 3.0], "bins": [-62.90625, -61.08935546875, -59.2724609375, -57.45556640625, -55.638671875, -53.82177734375, -52.0048828125, -50.18798828125, -48.37109375, -46.55419921875, -44.7373046875, -42.92041015625, -41.103515625, -39.28662109375, -37.4697265625, -35.65283203125, -33.8359375, -32.01904296875, -30.2021484375, -28.38525390625, -26.568359375, -24.75146484375, -22.9345703125, -21.11767578125, -19.30078125, -17.48388671875, -15.6669921875, -13.85009765625, -12.033203125, -10.21630859375, -8.3994140625, -6.58251953125, -4.765625, -2.94873046875, -1.1318359375, 0.68505859375, 2.501953125, 4.31884765625, 6.1357421875, 7.95263671875, 9.76953125, 11.58642578125, 13.4033203125, 15.22021484375, 17.037109375, 18.85400390625, 20.6708984375, 22.48779296875, 24.3046875, 26.12158203125, 27.9384765625, 29.75537109375, 31.572265625, 33.38916015625, 35.2060546875, 37.02294921875, 38.83984375, 40.65673828125, 42.4736328125, 44.29052734375, 46.107421875, 47.92431640625, 49.7412109375, 51.55810546875, 53.375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 9.0, 6.0, 13.0, 9.0, 14.0, 11.0, 18.0, 15.0, 26.0, 22.0, 19.0, 30.0, 42.0, 38.0, 33.0, 35.0, 35.0, 47.0, 57.0, 47.0, 36.0, 45.0, 51.0, 36.0, 41.0, 29.0, 24.0, 33.0, 14.0, 23.0, 21.0, 18.0, 19.0, 12.0, 10.0, 15.0, 6.0, 10.0, 4.0, 3.0, 9.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.609375, -25.604736328125, -24.60009765625, -23.595458984375, -22.5908203125, -21.586181640625, -20.58154296875, -19.576904296875, -18.572265625, -17.567626953125, -16.56298828125, -15.558349609375, -14.5537109375, -13.549072265625, -12.54443359375, -11.539794921875, -10.53515625, -9.530517578125, -8.52587890625, -7.521240234375, -6.5166015625, -5.511962890625, -4.50732421875, -3.502685546875, -2.498046875, -1.493408203125, -0.48876953125, 0.515869140625, 1.5205078125, 2.525146484375, 3.52978515625, 4.534423828125, 5.5390625, 6.543701171875, 7.54833984375, 8.552978515625, 9.5576171875, 10.562255859375, 11.56689453125, 12.571533203125, 13.576171875, 14.580810546875, 15.58544921875, 16.590087890625, 17.5947265625, 18.599365234375, 19.60400390625, 20.608642578125, 21.61328125, 22.617919921875, 23.62255859375, 24.627197265625, 25.6318359375, 26.636474609375, 27.64111328125, 28.645751953125, 29.650390625, 30.655029296875, 31.65966796875, 32.664306640625, 33.6689453125, 34.673583984375, 35.67822265625, 36.682861328125, 37.6875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 9.0, 11.0, 18.0, 36.0, 37.0, 50.0, 110.0, 157.0, 239.0, 350.0, 545.0, 836.0, 1234.0, 2072.0, 3244.0, 5231.0, 8815.0, 15605.0, 27678.0, 52944.0, 108112.0, 238694.0, 588532.0, 1465872.0, 978704.0, 371943.0, 159102.0, 75622.0, 38080.0, 20755.0, 11826.0, 6758.0, 4001.0, 2492.0, 1606.0, 964.0, 678.0, 436.0, 282.0, 214.0, 132.0, 91.0, 59.0, 35.0, 33.0, 19.0, 9.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0], "bins": [-51.875, -50.38232421875, -48.8896484375, -47.39697265625, -45.904296875, -44.41162109375, -42.9189453125, -41.42626953125, -39.93359375, -38.44091796875, -36.9482421875, -35.45556640625, -33.962890625, -32.47021484375, -30.9775390625, -29.48486328125, -27.9921875, -26.49951171875, -25.0068359375, -23.51416015625, -22.021484375, -20.52880859375, -19.0361328125, -17.54345703125, -16.05078125, -14.55810546875, -13.0654296875, -11.57275390625, -10.080078125, -8.58740234375, -7.0947265625, -5.60205078125, -4.109375, -2.61669921875, -1.1240234375, 0.36865234375, 1.861328125, 3.35400390625, 4.8466796875, 6.33935546875, 7.83203125, 9.32470703125, 10.8173828125, 12.31005859375, 13.802734375, 15.29541015625, 16.7880859375, 18.28076171875, 19.7734375, 21.26611328125, 22.7587890625, 24.25146484375, 25.744140625, 27.23681640625, 28.7294921875, 30.22216796875, 31.71484375, 33.20751953125, 34.7001953125, 36.19287109375, 37.685546875, 39.17822265625, 40.6708984375, 42.16357421875, 43.65625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 3.0, 3.0, 5.0, 5.0, 13.0, 12.0, 28.0, 21.0, 26.0, 37.0, 62.0, 65.0, 97.0, 122.0, 149.0, 213.0, 248.0, 317.0, 373.0, 437.0, 376.0, 326.0, 248.0, 192.0, 147.0, 121.0, 107.0, 62.0, 60.0, 51.0, 47.0, 16.0, 23.0, 15.0, 17.0, 9.0, 5.0, 5.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-20.03125, -19.4810791015625, -18.930908203125, -18.3807373046875, -17.83056640625, -17.2803955078125, -16.730224609375, -16.1800537109375, -15.6298828125, -15.0797119140625, -14.529541015625, -13.9793701171875, -13.42919921875, -12.8790283203125, -12.328857421875, -11.7786865234375, -11.228515625, -10.6783447265625, -10.128173828125, -9.5780029296875, -9.02783203125, -8.4776611328125, -7.927490234375, -7.3773193359375, -6.8271484375, -6.2769775390625, -5.726806640625, -5.1766357421875, -4.62646484375, -4.0762939453125, -3.526123046875, -2.9759521484375, -2.42578125, -1.8756103515625, -1.325439453125, -0.7752685546875, -0.22509765625, 0.3250732421875, 0.875244140625, 1.4254150390625, 1.9755859375, 2.5257568359375, 3.075927734375, 3.6260986328125, 4.17626953125, 4.7264404296875, 5.276611328125, 5.8267822265625, 6.376953125, 6.9271240234375, 7.477294921875, 8.0274658203125, 8.57763671875, 9.1278076171875, 9.677978515625, 10.2281494140625, 10.7783203125, 11.3284912109375, 11.878662109375, 12.4288330078125, 12.97900390625, 13.5291748046875, 14.079345703125, 14.6295166015625, 15.1796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 1.0, 7.0, 8.0, 11.0, 11.0, 9.0, 26.0, 22.0, 28.0, 30.0, 32.0, 39.0, 52.0, 87.0, 66.0, 60.0, 69.0, 64.0, 63.0, 55.0, 43.0, 34.0, 34.0, 33.0, 21.0, 26.0, 12.0, 14.0, 10.0, 10.0, 7.0, 1.0, 4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.72513961791992, -40.499412536621094, -39.27368927001953, -38.0479621887207, -36.822235107421875, -35.59650802612305, -34.37078094482422, -33.145057678222656, -31.919330596923828, -30.693603515625, -29.467878341674805, -28.24215316772461, -27.01642608642578, -25.790699005126953, -24.564973831176758, -23.339248657226562, -22.113521575927734, -20.887794494628906, -19.66206932067871, -18.436344146728516, -17.210617065429688, -15.984890937805176, -14.759164810180664, -13.533438682556152, -12.30771255493164, -11.081986427307129, -9.856260299682617, -8.630534172058105, -7.404808044433594, -6.179081916809082, -4.95335578918457, -3.7276296615600586, -2.5019073486328125, -1.2761812210083008, -0.05045509338378906, 1.1752710342407227, 2.4009971618652344, 3.626723289489746, 4.852449417114258, 6.0781755447387695, 7.303901672363281, 8.529627799987793, 9.755353927612305, 10.981080055236816, 12.206806182861328, 13.43253231048584, 14.658258438110352, 15.883984565734863, 17.109710693359375, 18.335437774658203, 19.5611629486084, 20.786888122558594, 22.012615203857422, 23.23834228515625, 24.464067459106445, 25.68979263305664, 26.91551971435547, 28.141246795654297, 29.366971969604492, 30.592697143554688, 31.818424224853516, 33.044151306152344, 34.269874572753906, 35.495601654052734, 36.72132873535156]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 8.0, 2.0, 11.0, 10.0, 9.0, 9.0, 15.0, 26.0, 14.0, 19.0, 22.0, 30.0, 24.0, 21.0, 33.0, 32.0, 38.0, 44.0, 41.0, 45.0, 42.0, 51.0, 37.0, 29.0, 37.0, 45.0, 32.0, 34.0, 22.0, 23.0, 34.0, 25.0, 22.0, 21.0, 14.0, 15.0, 11.0, 10.0, 7.0, 8.0, 9.0, 4.0, 4.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.4442024230957, -32.367523193359375, -31.290842056274414, -30.214160919189453, -29.137481689453125, -28.060800552368164, -26.984119415283203, -25.907440185546875, -24.830759048461914, -23.754077911376953, -22.677398681640625, -21.600717544555664, -20.524036407470703, -19.447357177734375, -18.370676040649414, -17.293994903564453, -16.217315673828125, -15.14063549041748, -14.063955307006836, -12.987274169921875, -11.91059398651123, -10.833913803100586, -9.757232666015625, -8.68055248260498, -7.603872299194336, -6.527192115783691, -5.450511455535889, -4.373830795288086, -3.2971506118774414, -2.220470428466797, -1.1437897682189941, -0.0671091079711914, 1.0095710754394531, 2.0862514972686768, 3.1629319190979004, 4.239612579345703, 5.316292762756348, 6.392972946166992, 7.469653606414795, 8.546334266662598, 9.623014450073242, 10.699694633483887, 11.776374816894531, 12.853055953979492, 13.929736137390137, 15.006416320800781, 16.083097457885742, 17.159778594970703, 18.23645782470703, 19.313138961791992, 20.38981819152832, 21.46649932861328, 22.54317855834961, 23.61985969543457, 24.69654083251953, 25.77322006225586, 26.84990119934082, 27.92658233642578, 29.00326156616211, 30.07994270324707, 31.15662384033203, 32.23330307006836, 33.30998229980469, 34.38666534423828, 35.46334457397461]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 4.0, 5.0, 9.0, 12.0, 28.0, 43.0, 45.0, 61.0, 85.0, 146.0, 187.0, 264.0, 357.0, 563.0, 780.0, 1068.0, 1600.0, 2360.0, 3190.0, 4899.0, 6851.0, 10342.0, 15147.0, 22040.0, 33851.0, 52644.0, 89955.0, 167896.0, 259128.0, 148390.0, 80809.0, 48776.0, 31460.0, 20803.0, 14027.0, 9450.0, 6466.0, 4618.0, 3112.0, 2110.0, 1592.0, 1015.0, 736.0, 508.0, 346.0, 259.0, 166.0, 105.0, 82.0, 61.0, 41.0, 24.0, 17.0, 12.0, 6.0, 1.0, 4.0, 5.0, 4.0, 1.0], "bins": [-10.4921875, -10.16845703125, -9.8447265625, -9.52099609375, -9.197265625, -8.87353515625, -8.5498046875, -8.22607421875, -7.90234375, -7.57861328125, -7.2548828125, -6.93115234375, -6.607421875, -6.28369140625, -5.9599609375, -5.63623046875, -5.3125, -4.98876953125, -4.6650390625, -4.34130859375, -4.017578125, -3.69384765625, -3.3701171875, -3.04638671875, -2.72265625, -2.39892578125, -2.0751953125, -1.75146484375, -1.427734375, -1.10400390625, -0.7802734375, -0.45654296875, -0.1328125, 0.19091796875, 0.5146484375, 0.83837890625, 1.162109375, 1.48583984375, 1.8095703125, 2.13330078125, 2.45703125, 2.78076171875, 3.1044921875, 3.42822265625, 3.751953125, 4.07568359375, 4.3994140625, 4.72314453125, 5.046875, 5.37060546875, 5.6943359375, 6.01806640625, 6.341796875, 6.66552734375, 6.9892578125, 7.31298828125, 7.63671875, 7.96044921875, 8.2841796875, 8.60791015625, 8.931640625, 9.25537109375, 9.5791015625, 9.90283203125, 10.2265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 4.0, 1.0, 13.0, 7.0, 8.0, 14.0, 15.0, 17.0, 21.0, 25.0, 26.0, 26.0, 28.0, 32.0, 36.0, 37.0, 60.0, 32.0, 44.0, 37.0, 56.0, 48.0, 42.0, 37.0, 47.0, 27.0, 32.0, 25.0, 25.0, 39.0, 27.0, 19.0, 18.0, 7.0, 12.0, 13.0, 7.0, 7.0, 6.0, 10.0, 6.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.125, -35.939453125, -34.75390625, -33.568359375, -32.3828125, -31.197265625, -30.01171875, -28.826171875, -27.640625, -26.455078125, -25.26953125, -24.083984375, -22.8984375, -21.712890625, -20.52734375, -19.341796875, -18.15625, -16.970703125, -15.78515625, -14.599609375, -13.4140625, -12.228515625, -11.04296875, -9.857421875, -8.671875, -7.486328125, -6.30078125, -5.115234375, -3.9296875, -2.744140625, -1.55859375, -0.373046875, 0.8125, 1.998046875, 3.18359375, 4.369140625, 5.5546875, 6.740234375, 7.92578125, 9.111328125, 10.296875, 11.482421875, 12.66796875, 13.853515625, 15.0390625, 16.224609375, 17.41015625, 18.595703125, 19.78125, 20.966796875, 22.15234375, 23.337890625, 24.5234375, 25.708984375, 26.89453125, 28.080078125, 29.265625, 30.451171875, 31.63671875, 32.822265625, 34.0078125, 35.193359375, 36.37890625, 37.564453125, 38.75]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 5.0, 9.0, 12.0, 27.0, 33.0, 37.0, 59.0, 74.0, 99.0, 151.0, 214.0, 317.0, 436.0, 561.0, 893.0, 1172.0, 1701.0, 2447.0, 3698.0, 5478.0, 8944.0, 16383.0, 43908.0, 325356.0, 535731.0, 53791.0, 18494.0, 9942.0, 5951.0, 3834.0, 2616.0, 1791.0, 1267.0, 909.0, 653.0, 463.0, 296.0, 236.0, 169.0, 112.0, 86.0, 55.0, 51.0, 15.0, 35.0, 17.0, 9.0, 2.0, 4.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0], "bins": [-15.1015625, -14.64501953125, -14.1884765625, -13.73193359375, -13.275390625, -12.81884765625, -12.3623046875, -11.90576171875, -11.44921875, -10.99267578125, -10.5361328125, -10.07958984375, -9.623046875, -9.16650390625, -8.7099609375, -8.25341796875, -7.796875, -7.34033203125, -6.8837890625, -6.42724609375, -5.970703125, -5.51416015625, -5.0576171875, -4.60107421875, -4.14453125, -3.68798828125, -3.2314453125, -2.77490234375, -2.318359375, -1.86181640625, -1.4052734375, -0.94873046875, -0.4921875, -0.03564453125, 0.4208984375, 0.87744140625, 1.333984375, 1.79052734375, 2.2470703125, 2.70361328125, 3.16015625, 3.61669921875, 4.0732421875, 4.52978515625, 4.986328125, 5.44287109375, 5.8994140625, 6.35595703125, 6.8125, 7.26904296875, 7.7255859375, 8.18212890625, 8.638671875, 9.09521484375, 9.5517578125, 10.00830078125, 10.46484375, 10.92138671875, 11.3779296875, 11.83447265625, 12.291015625, 12.74755859375, 13.2041015625, 13.66064453125, 14.1171875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 6.0, 3.0, 4.0, 8.0, 9.0, 10.0, 19.0, 14.0, 26.0, 14.0, 26.0, 22.0, 20.0, 25.0, 30.0, 41.0, 40.0, 41.0, 34.0, 33.0, 42.0, 47.0, 51.0, 34.0, 33.0, 41.0, 26.0, 28.0, 39.0, 36.0, 21.0, 25.0, 25.0, 20.0, 16.0, 15.0, 12.0, 14.0, 9.0, 4.0, 5.0, 10.0, 5.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.953125, -23.225830078125, -22.49853515625, -21.771240234375, -21.0439453125, -20.316650390625, -19.58935546875, -18.862060546875, -18.134765625, -17.407470703125, -16.68017578125, -15.952880859375, -15.2255859375, -14.498291015625, -13.77099609375, -13.043701171875, -12.31640625, -11.589111328125, -10.86181640625, -10.134521484375, -9.4072265625, -8.679931640625, -7.95263671875, -7.225341796875, -6.498046875, -5.770751953125, -5.04345703125, -4.316162109375, -3.5888671875, -2.861572265625, -2.13427734375, -1.406982421875, -0.6796875, 0.047607421875, 0.77490234375, 1.502197265625, 2.2294921875, 2.956787109375, 3.68408203125, 4.411376953125, 5.138671875, 5.865966796875, 6.59326171875, 7.320556640625, 8.0478515625, 8.775146484375, 9.50244140625, 10.229736328125, 10.95703125, 11.684326171875, 12.41162109375, 13.138916015625, 13.8662109375, 14.593505859375, 15.32080078125, 16.048095703125, 16.775390625, 17.502685546875, 18.22998046875, 18.957275390625, 19.6845703125, 20.411865234375, 21.13916015625, 21.866455078125, 22.59375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 8.0, 10.0, 15.0, 20.0, 33.0, 53.0, 91.0, 112.0, 194.0, 330.0, 668.0, 1188.0, 2726.0, 6881.0, 21547.0, 314818.0, 661284.0, 24870.0, 7757.0, 3002.0, 1327.0, 645.0, 394.0, 201.0, 129.0, 72.0, 51.0, 30.0, 29.0, 18.0, 18.0, 9.0, 5.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.451171875, -2.363800048828125, -2.27642822265625, -2.189056396484375, -2.1016845703125, -2.014312744140625, -1.92694091796875, -1.839569091796875, -1.752197265625, -1.664825439453125, -1.57745361328125, -1.490081787109375, -1.4027099609375, -1.315338134765625, -1.22796630859375, -1.140594482421875, -1.05322265625, -0.965850830078125, -0.87847900390625, -0.791107177734375, -0.7037353515625, -0.616363525390625, -0.52899169921875, -0.441619873046875, -0.354248046875, -0.266876220703125, -0.17950439453125, -0.092132568359375, -0.0047607421875, 0.082611083984375, 0.16998291015625, 0.257354736328125, 0.3447265625, 0.432098388671875, 0.51947021484375, 0.606842041015625, 0.6942138671875, 0.781585693359375, 0.86895751953125, 0.956329345703125, 1.043701171875, 1.131072998046875, 1.21844482421875, 1.305816650390625, 1.3931884765625, 1.480560302734375, 1.56793212890625, 1.655303955078125, 1.74267578125, 1.830047607421875, 1.91741943359375, 2.004791259765625, 2.0921630859375, 2.179534912109375, 2.26690673828125, 2.354278564453125, 2.441650390625, 2.529022216796875, 2.61639404296875, 2.703765869140625, 2.7911376953125, 2.878509521484375, 2.96588134765625, 3.053253173828125, 3.140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 9.0, 4.0, 4.0, 7.0, 15.0, 27.0, 25.0, 23.0, 31.0, 48.0, 51.0, 68.0, 85.0, 81.0, 88.0, 92.0, 68.0, 60.0, 46.0, 35.0, 24.0, 20.0, 20.0, 14.0, 11.0, 8.0, 13.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00017261505126953125, -0.00016794726252555847, -0.0001632794737815857, -0.00015861168503761292, -0.00015394389629364014, -0.00014927610754966736, -0.00014460831880569458, -0.0001399405300617218, -0.00013527274131774902, -0.00013060495257377625, -0.00012593716382980347, -0.00012126937508583069, -0.00011660158634185791, -0.00011193379759788513, -0.00010726600885391235, -0.00010259822010993958, -9.79304313659668e-05, -9.326264262199402e-05, -8.859485387802124e-05, -8.392706513404846e-05, -7.925927639007568e-05, -7.45914876461029e-05, -6.992369890213013e-05, -6.525591015815735e-05, -6.058812141418457e-05, -5.592033267021179e-05, -5.1252543926239014e-05, -4.6584755182266235e-05, -4.191696643829346e-05, -3.724917769432068e-05, -3.25813889503479e-05, -2.7913600206375122e-05, -2.3245811462402344e-05, -1.8578022718429565e-05, -1.3910233974456787e-05, -9.242445230484009e-06, -4.5746564865112305e-06, 9.313225746154785e-08, 4.760921001434326e-06, 9.428709745407104e-06, 1.4096498489379883e-05, 1.876428723335266e-05, 2.343207597732544e-05, 2.8099864721298218e-05, 3.2767653465270996e-05, 3.7435442209243774e-05, 4.210323095321655e-05, 4.677101969718933e-05, 5.143880844116211e-05, 5.610659718513489e-05, 6.0774385929107666e-05, 6.544217467308044e-05, 7.010996341705322e-05, 7.4777752161026e-05, 7.944554090499878e-05, 8.411332964897156e-05, 8.878111839294434e-05, 9.344890713691711e-05, 9.811669588088989e-05, 0.00010278448462486267, 0.00010745227336883545, 0.00011212006211280823, 0.000116787850856781, 0.00012145563960075378, 0.00012612342834472656]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 8.0, 21.0, 26.0, 25.0, 45.0, 75.0, 101.0, 152.0, 205.0, 312.0, 547.0, 944.0, 1485.0, 2440.0, 4211.0, 7593.0, 13712.0, 26913.0, 55674.0, 121926.0, 261450.0, 286208.0, 137120.0, 62686.0, 29945.0, 15111.0, 8252.0, 4533.0, 2641.0, 1567.0, 907.0, 578.0, 386.0, 234.0, 189.0, 114.0, 66.0, 54.0, 29.0, 24.0, 12.0, 10.0, 3.0, 7.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.93359375, -1.871368408203125, -1.80914306640625, -1.746917724609375, -1.6846923828125, -1.622467041015625, -1.56024169921875, -1.498016357421875, -1.435791015625, -1.373565673828125, -1.31134033203125, -1.249114990234375, -1.1868896484375, -1.124664306640625, -1.06243896484375, -1.000213623046875, -0.93798828125, -0.875762939453125, -0.81353759765625, -0.751312255859375, -0.6890869140625, -0.626861572265625, -0.56463623046875, -0.502410888671875, -0.440185546875, -0.377960205078125, -0.31573486328125, -0.253509521484375, -0.1912841796875, -0.129058837890625, -0.06683349609375, -0.004608154296875, 0.0576171875, 0.119842529296875, 0.18206787109375, 0.244293212890625, 0.3065185546875, 0.368743896484375, 0.43096923828125, 0.493194580078125, 0.555419921875, 0.617645263671875, 0.67987060546875, 0.742095947265625, 0.8043212890625, 0.866546630859375, 0.92877197265625, 0.990997314453125, 1.05322265625, 1.115447998046875, 1.17767333984375, 1.239898681640625, 1.3021240234375, 1.364349365234375, 1.42657470703125, 1.488800048828125, 1.551025390625, 1.613250732421875, 1.67547607421875, 1.737701416015625, 1.7999267578125, 1.862152099609375, 1.92437744140625, 1.986602783203125, 2.048828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 7.0, 8.0, 6.0, 10.0, 13.0, 12.0, 13.0, 28.0, 28.0, 41.0, 43.0, 49.0, 53.0, 57.0, 60.0, 68.0, 51.0, 56.0, 61.0, 45.0, 52.0, 49.0, 41.0, 29.0, 36.0, 20.0, 16.0, 11.0, 10.0, 10.0, 4.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44873046875, -0.431121826171875, -0.41351318359375, -0.395904541015625, -0.3782958984375, -0.360687255859375, -0.34307861328125, -0.325469970703125, -0.307861328125, -0.290252685546875, -0.27264404296875, -0.255035400390625, -0.2374267578125, -0.219818115234375, -0.20220947265625, -0.184600830078125, -0.1669921875, -0.149383544921875, -0.13177490234375, -0.114166259765625, -0.0965576171875, -0.078948974609375, -0.06134033203125, -0.043731689453125, -0.026123046875, -0.008514404296875, 0.00909423828125, 0.026702880859375, 0.0443115234375, 0.061920166015625, 0.07952880859375, 0.097137451171875, 0.11474609375, 0.132354736328125, 0.14996337890625, 0.167572021484375, 0.1851806640625, 0.202789306640625, 0.22039794921875, 0.238006591796875, 0.255615234375, 0.273223876953125, 0.29083251953125, 0.308441162109375, 0.3260498046875, 0.343658447265625, 0.36126708984375, 0.378875732421875, 0.396484375, 0.414093017578125, 0.43170166015625, 0.449310302734375, 0.4669189453125, 0.484527587890625, 0.50213623046875, 0.519744873046875, 0.537353515625, 0.554962158203125, 0.57257080078125, 0.590179443359375, 0.6077880859375, 0.625396728515625, 0.64300537109375, 0.660614013671875, 0.67822265625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 5.0, 3.0, 6.0, 13.0, 10.0, 15.0, 15.0, 19.0, 34.0, 29.0, 27.0, 45.0, 44.0, 73.0, 74.0, 54.0, 73.0, 61.0, 61.0, 57.0, 53.0, 38.0, 36.0, 27.0, 24.0, 25.0, 22.0, 11.0, 11.0, 8.0, 5.0, 6.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-41.68342590332031, -40.505332946777344, -39.327239990234375, -38.149147033691406, -36.97105407714844, -35.79296112060547, -34.6148681640625, -33.436771392822266, -32.2586784362793, -31.080585479736328, -29.90249252319336, -28.72439956665039, -27.54630470275879, -26.36821174621582, -25.19011878967285, -24.01202392578125, -22.833932876586914, -21.655839920043945, -20.477746963500977, -19.299652099609375, -18.121559143066406, -16.943466186523438, -15.765373229980469, -14.587279319763184, -13.409186363220215, -12.231093406677246, -11.052999496459961, -9.874906539916992, -8.696813583374023, -7.518719673156738, -6.3406267166137695, -5.162532806396484, -3.9844398498535156, -2.8063464164733887, -1.6282532215118408, -0.45016002655029297, 0.727933406829834, 1.906026840209961, 3.0841197967529297, 4.262213706970215, 5.440306663513184, 6.6184000968933105, 7.7964935302734375, 8.974586486816406, 10.152679443359375, 11.33077335357666, 12.508866310119629, 13.686960220336914, 14.865053176879883, 16.04314613342285, 17.22123908996582, 18.399333953857422, 19.57742691040039, 20.75551986694336, 21.933612823486328, 23.111705780029297, 24.289798736572266, 25.467891693115234, 26.645984649658203, 27.824077606201172, 29.002172470092773, 30.180265426635742, 31.35835838317871, 32.53645324707031, 33.71454620361328]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 8.0, 3.0, 10.0, 7.0, 13.0, 8.0, 18.0, 23.0, 15.0, 20.0, 21.0, 30.0, 22.0, 24.0, 29.0, 36.0, 38.0, 45.0, 42.0, 44.0, 43.0, 51.0, 34.0, 31.0, 40.0, 41.0, 36.0, 33.0, 19.0, 27.0, 30.0, 25.0, 22.0, 21.0, 12.0, 16.0, 12.0, 9.0, 8.0, 6.0, 10.0, 3.0, 6.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.25746536254883, -32.19170379638672, -31.125944137573242, -30.060182571411133, -28.994422912597656, -27.928661346435547, -26.862899780273438, -25.797138214111328, -24.73137855529785, -23.665616989135742, -22.599857330322266, -21.534095764160156, -20.468334197998047, -19.40257453918457, -18.33681297302246, -17.271053314208984, -16.205291748046875, -15.139531135559082, -14.073770523071289, -13.00800895690918, -11.942248344421387, -10.876487731933594, -9.810726165771484, -8.744965553283691, -7.679204940795898, -6.6134443283081055, -5.547683238983154, -4.481922149658203, -3.41616153717041, -2.350400924682617, -1.284639835357666, -0.21887874603271484, 0.8468818664550781, 1.9126427173614502, 2.9784035682678223, 4.044164657592773, 5.109925270080566, 6.175685882568359, 7.2414469718933105, 8.307208061218262, 9.372968673706055, 10.438729286193848, 11.50448989868164, 12.57025146484375, 13.636012077331543, 14.701772689819336, 15.767534255981445, 16.833293914794922, 17.89905548095703, 18.96481704711914, 20.030576705932617, 21.096338272094727, 22.162097930908203, 23.227859497070312, 24.293621063232422, 25.35938262939453, 26.425142288208008, 27.490903854370117, 28.556663513183594, 29.622425079345703, 30.688186645507812, 31.75394630432129, 32.819705963134766, 33.885467529296875, 34.951229095458984]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 11.0, 10.0, 23.0, 32.0, 38.0, 53.0, 67.0, 110.0, 156.0, 259.0, 379.0, 543.0, 809.0, 1284.0, 2078.0, 2982.0, 4781.0, 7460.0, 11775.0, 18716.0, 29679.0, 48776.0, 80301.0, 131647.0, 195806.0, 189278.0, 123607.0, 75086.0, 45860.0, 28325.0, 17684.0, 11063.0, 7063.0, 4359.0, 2944.0, 1880.0, 1214.0, 788.0, 561.0, 357.0, 238.0, 151.0, 105.0, 64.0, 50.0, 31.0, 31.0, 13.0, 11.0, 8.0, 5.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.78125, -36.56005859375, -35.3388671875, -34.11767578125, -32.896484375, -31.67529296875, -30.4541015625, -29.23291015625, -28.01171875, -26.79052734375, -25.5693359375, -24.34814453125, -23.126953125, -21.90576171875, -20.6845703125, -19.46337890625, -18.2421875, -17.02099609375, -15.7998046875, -14.57861328125, -13.357421875, -12.13623046875, -10.9150390625, -9.69384765625, -8.47265625, -7.25146484375, -6.0302734375, -4.80908203125, -3.587890625, -2.36669921875, -1.1455078125, 0.07568359375, 1.296875, 2.51806640625, 3.7392578125, 4.96044921875, 6.181640625, 7.40283203125, 8.6240234375, 9.84521484375, 11.06640625, 12.28759765625, 13.5087890625, 14.72998046875, 15.951171875, 17.17236328125, 18.3935546875, 19.61474609375, 20.8359375, 22.05712890625, 23.2783203125, 24.49951171875, 25.720703125, 26.94189453125, 28.1630859375, 29.38427734375, 30.60546875, 31.82666015625, 33.0478515625, 34.26904296875, 35.490234375, 36.71142578125, 37.9326171875, 39.15380859375, 40.375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 5.0, 6.0, 3.0, 5.0, 9.0, 14.0, 17.0, 18.0, 18.0, 18.0, 20.0, 32.0, 23.0, 29.0, 31.0, 33.0, 35.0, 43.0, 41.0, 47.0, 38.0, 48.0, 42.0, 49.0, 38.0, 48.0, 43.0, 35.0, 29.0, 26.0, 24.0, 20.0, 24.0, 17.0, 14.0, 8.0, 11.0, 7.0, 8.0, 7.0, 4.0, 7.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.53125, -34.4287109375, -33.326171875, -32.2236328125, -31.12109375, -30.0185546875, -28.916015625, -27.8134765625, -26.7109375, -25.6083984375, -24.505859375, -23.4033203125, -22.30078125, -21.1982421875, -20.095703125, -18.9931640625, -17.890625, -16.7880859375, -15.685546875, -14.5830078125, -13.48046875, -12.3779296875, -11.275390625, -10.1728515625, -9.0703125, -7.9677734375, -6.865234375, -5.7626953125, -4.66015625, -3.5576171875, -2.455078125, -1.3525390625, -0.25, 0.8525390625, 1.955078125, 3.0576171875, 4.16015625, 5.2626953125, 6.365234375, 7.4677734375, 8.5703125, 9.6728515625, 10.775390625, 11.8779296875, 12.98046875, 14.0830078125, 15.185546875, 16.2880859375, 17.390625, 18.4931640625, 19.595703125, 20.6982421875, 21.80078125, 22.9033203125, 24.005859375, 25.1083984375, 26.2109375, 27.3134765625, 28.416015625, 29.5185546875, 30.62109375, 31.7236328125, 32.826171875, 33.9287109375, 35.03125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 7.0, 20.0, 15.0, 29.0, 48.0, 79.0, 125.0, 215.0, 361.0, 549.0, 1014.0, 1725.0, 2846.0, 4721.0, 8072.0, 13563.0, 23207.0, 39727.0, 66573.0, 110994.0, 176970.0, 210911.0, 154943.0, 94981.0, 55834.0, 33490.0, 19159.0, 11608.0, 6909.0, 3992.0, 2421.0, 1373.0, 851.0, 469.0, 316.0, 165.0, 112.0, 58.0, 37.0, 22.0, 15.0, 11.0, 9.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.65625, -38.2568359375, -36.857421875, -35.4580078125, -34.05859375, -32.6591796875, -31.259765625, -29.8603515625, -28.4609375, -27.0615234375, -25.662109375, -24.2626953125, -22.86328125, -21.4638671875, -20.064453125, -18.6650390625, -17.265625, -15.8662109375, -14.466796875, -13.0673828125, -11.66796875, -10.2685546875, -8.869140625, -7.4697265625, -6.0703125, -4.6708984375, -3.271484375, -1.8720703125, -0.47265625, 0.9267578125, 2.326171875, 3.7255859375, 5.125, 6.5244140625, 7.923828125, 9.3232421875, 10.72265625, 12.1220703125, 13.521484375, 14.9208984375, 16.3203125, 17.7197265625, 19.119140625, 20.5185546875, 21.91796875, 23.3173828125, 24.716796875, 26.1162109375, 27.515625, 28.9150390625, 30.314453125, 31.7138671875, 33.11328125, 34.5126953125, 35.912109375, 37.3115234375, 38.7109375, 40.1103515625, 41.509765625, 42.9091796875, 44.30859375, 45.7080078125, 47.107421875, 48.5068359375, 49.90625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 3.0, 6.0, 9.0, 6.0, 7.0, 10.0, 14.0, 18.0, 12.0, 26.0, 17.0, 17.0, 22.0, 20.0, 29.0, 23.0, 29.0, 33.0, 34.0, 37.0, 28.0, 30.0, 21.0, 24.0, 32.0, 28.0, 34.0, 41.0, 36.0, 39.0, 39.0, 38.0, 29.0, 27.0, 22.0, 23.0, 20.0, 19.0, 17.0, 14.0, 11.0, 8.0, 6.0, 7.0, 8.0, 3.0, 9.0, 7.0, 4.0, 0.0, 4.0, 1.0, 3.0, 2.0], "bins": [-19.796875, -19.20751953125, -18.6181640625, -18.02880859375, -17.439453125, -16.85009765625, -16.2607421875, -15.67138671875, -15.08203125, -14.49267578125, -13.9033203125, -13.31396484375, -12.724609375, -12.13525390625, -11.5458984375, -10.95654296875, -10.3671875, -9.77783203125, -9.1884765625, -8.59912109375, -8.009765625, -7.42041015625, -6.8310546875, -6.24169921875, -5.65234375, -5.06298828125, -4.4736328125, -3.88427734375, -3.294921875, -2.70556640625, -2.1162109375, -1.52685546875, -0.9375, -0.34814453125, 0.2412109375, 0.83056640625, 1.419921875, 2.00927734375, 2.5986328125, 3.18798828125, 3.77734375, 4.36669921875, 4.9560546875, 5.54541015625, 6.134765625, 6.72412109375, 7.3134765625, 7.90283203125, 8.4921875, 9.08154296875, 9.6708984375, 10.26025390625, 10.849609375, 11.43896484375, 12.0283203125, 12.61767578125, 13.20703125, 13.79638671875, 14.3857421875, 14.97509765625, 15.564453125, 16.15380859375, 16.7431640625, 17.33251953125, 17.921875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 7.0, 18.0, 14.0, 16.0, 43.0, 48.0, 63.0, 124.0, 201.0, 276.0, 449.0, 648.0, 1215.0, 1803.0, 2890.0, 4934.0, 8529.0, 15266.0, 28317.0, 54122.0, 109481.0, 212633.0, 269052.0, 164224.0, 81927.0, 41280.0, 21710.0, 11869.0, 6807.0, 4105.0, 2418.0, 1516.0, 913.0, 551.0, 373.0, 261.0, 170.0, 88.0, 69.0, 30.0, 22.0, 26.0, 13.0, 8.0, 11.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-16.296875, -15.792236328125, -15.28759765625, -14.782958984375, -14.2783203125, -13.773681640625, -13.26904296875, -12.764404296875, -12.259765625, -11.755126953125, -11.25048828125, -10.745849609375, -10.2412109375, -9.736572265625, -9.23193359375, -8.727294921875, -8.22265625, -7.718017578125, -7.21337890625, -6.708740234375, -6.2041015625, -5.699462890625, -5.19482421875, -4.690185546875, -4.185546875, -3.680908203125, -3.17626953125, -2.671630859375, -2.1669921875, -1.662353515625, -1.15771484375, -0.653076171875, -0.1484375, 0.356201171875, 0.86083984375, 1.365478515625, 1.8701171875, 2.374755859375, 2.87939453125, 3.384033203125, 3.888671875, 4.393310546875, 4.89794921875, 5.402587890625, 5.9072265625, 6.411865234375, 6.91650390625, 7.421142578125, 7.92578125, 8.430419921875, 8.93505859375, 9.439697265625, 9.9443359375, 10.448974609375, 10.95361328125, 11.458251953125, 11.962890625, 12.467529296875, 12.97216796875, 13.476806640625, 13.9814453125, 14.486083984375, 14.99072265625, 15.495361328125, 16.0]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 8.0, 16.0, 20.0, 25.0, 34.0, 55.0, 71.0, 106.0, 137.0, 134.0, 123.0, 89.0, 62.0, 40.0, 28.0, 23.0, 8.0, 4.0, 1.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028667449951171875, -0.0027831196784973145, -0.0026994943618774414, -0.0026158690452575684, -0.0025322437286376953, -0.0024486184120178223, -0.0023649930953979492, -0.002281367778778076, -0.002197742462158203, -0.00211411714553833, -0.002030491828918457, -0.001946866512298584, -0.001863241195678711, -0.0017796158790588379, -0.0016959905624389648, -0.0016123652458190918, -0.0015287399291992188, -0.0014451146125793457, -0.0013614892959594727, -0.0012778639793395996, -0.0011942386627197266, -0.0011106133460998535, -0.0010269880294799805, -0.0009433627128601074, -0.0008597373962402344, -0.0007761120796203613, -0.0006924867630004883, -0.0006088614463806152, -0.0005252361297607422, -0.00044161081314086914, -0.0003579854965209961, -0.00027436017990112305, -0.00019073486328125, -0.00010710954666137695, -2.3484230041503906e-05, 6.014108657836914e-05, 0.0001437664031982422, 0.00022739171981811523, 0.0003110170364379883, 0.00039464235305786133, 0.0004782676696777344, 0.0005618929862976074, 0.0006455183029174805, 0.0007291436195373535, 0.0008127689361572266, 0.0008963942527770996, 0.0009800195693969727, 0.0010636448860168457, 0.0011472702026367188, 0.0012308955192565918, 0.0013145208358764648, 0.0013981461524963379, 0.001481771469116211, 0.001565396785736084, 0.001649022102355957, 0.00173264741897583, 0.0018162727355957031, 0.0018998980522155762, 0.0019835233688354492, 0.0020671486854553223, 0.0021507740020751953, 0.0022343993186950684, 0.0023180246353149414, 0.0024016499519348145, 0.0024852752685546875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 11.0, 14.0, 14.0, 18.0, 34.0, 49.0, 94.0, 136.0, 176.0, 299.0, 476.0, 889.0, 1398.0, 2365.0, 4209.0, 7195.0, 13135.0, 24536.0, 47046.0, 92638.0, 184090.0, 279658.0, 189629.0, 95699.0, 48234.0, 25263.0, 13455.0, 7481.0, 4198.0, 2382.0, 1452.0, 873.0, 528.0, 325.0, 214.0, 115.0, 81.0, 50.0, 38.0, 18.0, 14.0, 7.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.59375, -18.0390625, -17.484375, -16.9296875, -16.375, -15.8203125, -15.265625, -14.7109375, -14.15625, -13.6015625, -13.046875, -12.4921875, -11.9375, -11.3828125, -10.828125, -10.2734375, -9.71875, -9.1640625, -8.609375, -8.0546875, -7.5, -6.9453125, -6.390625, -5.8359375, -5.28125, -4.7265625, -4.171875, -3.6171875, -3.0625, -2.5078125, -1.953125, -1.3984375, -0.84375, -0.2890625, 0.265625, 0.8203125, 1.375, 1.9296875, 2.484375, 3.0390625, 3.59375, 4.1484375, 4.703125, 5.2578125, 5.8125, 6.3671875, 6.921875, 7.4765625, 8.03125, 8.5859375, 9.140625, 9.6953125, 10.25, 10.8046875, 11.359375, 11.9140625, 12.46875, 13.0234375, 13.578125, 14.1328125, 14.6875, 15.2421875, 15.796875, 16.3515625, 16.90625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 9.0, 7.0, 10.0, 5.0, 12.0, 13.0, 16.0, 25.0, 24.0, 18.0, 35.0, 42.0, 37.0, 54.0, 60.0, 54.0, 65.0, 62.0, 52.0, 70.0, 41.0, 39.0, 37.0, 27.0, 28.0, 29.0, 24.0, 27.0, 13.0, 13.0, 7.0, 7.0, 6.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.734375, -4.58251953125, -4.4306640625, -4.27880859375, -4.126953125, -3.97509765625, -3.8232421875, -3.67138671875, -3.51953125, -3.36767578125, -3.2158203125, -3.06396484375, -2.912109375, -2.76025390625, -2.6083984375, -2.45654296875, -2.3046875, -2.15283203125, -2.0009765625, -1.84912109375, -1.697265625, -1.54541015625, -1.3935546875, -1.24169921875, -1.08984375, -0.93798828125, -0.7861328125, -0.63427734375, -0.482421875, -0.33056640625, -0.1787109375, -0.02685546875, 0.125, 0.27685546875, 0.4287109375, 0.58056640625, 0.732421875, 0.88427734375, 1.0361328125, 1.18798828125, 1.33984375, 1.49169921875, 1.6435546875, 1.79541015625, 1.947265625, 2.09912109375, 2.2509765625, 2.40283203125, 2.5546875, 2.70654296875, 2.8583984375, 3.01025390625, 3.162109375, 3.31396484375, 3.4658203125, 3.61767578125, 3.76953125, 3.92138671875, 4.0732421875, 4.22509765625, 4.376953125, 4.52880859375, 4.6806640625, 4.83251953125, 4.984375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 0.0, 4.0, 3.0, 3.0, 9.0, 5.0, 3.0, 9.0, 14.0, 12.0, 8.0, 13.0, 26.0, 20.0, 33.0, 37.0, 35.0, 45.0, 68.0, 56.0, 50.0, 69.0, 69.0, 46.0, 47.0, 54.0, 40.0, 38.0, 29.0, 23.0, 25.0, 18.0, 21.0, 17.0, 14.0, 4.0, 8.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-35.427425384521484, -34.3779411315918, -33.32845687866211, -32.278968811035156, -31.2294864654541, -30.18000030517578, -29.130516052246094, -28.081031799316406, -27.03154754638672, -25.98206329345703, -24.93257713317871, -23.883092880249023, -22.833608627319336, -21.784122467041016, -20.734638214111328, -19.68515396118164, -18.63566780090332, -17.586183547973633, -16.536697387695312, -15.487213134765625, -14.437728881835938, -13.388243675231934, -12.33875846862793, -11.289274215698242, -10.239789009094238, -9.190303802490234, -8.140819549560547, -7.091334342956543, -6.041849613189697, -4.992364883422852, -3.9428796768188477, -2.893394947052002, -1.843912124633789, -0.7944272756576538, 0.25505757331848145, 1.3045425415039062, 2.354027271270752, 3.4035120010375977, 4.452997207641602, 5.502481937408447, 6.551966667175293, 7.601451396942139, 8.650936126708984, 9.700421333312988, 10.749906539916992, 11.79939079284668, 12.848875999450684, 13.898361206054688, 14.947845458984375, 15.997330665588379, 17.046815872192383, 18.09630012512207, 19.145784378051758, 20.195270538330078, 21.244754791259766, 22.294239044189453, 23.34372329711914, 24.393207550048828, 25.44269371032715, 26.492177963256836, 27.541662216186523, 28.591148376464844, 29.64063262939453, 30.69011688232422, 31.73960304260254]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 10.0, 4.0, 5.0, 7.0, 8.0, 12.0, 13.0, 13.0, 24.0, 19.0, 26.0, 26.0, 30.0, 29.0, 24.0, 39.0, 36.0, 43.0, 46.0, 26.0, 44.0, 54.0, 36.0, 49.0, 44.0, 27.0, 45.0, 28.0, 29.0, 29.0, 26.0, 23.0, 27.0, 17.0, 11.0, 12.0, 13.0, 10.0, 8.0, 5.0, 8.0, 1.0, 8.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.69272232055664, -34.54065704345703, -33.38859176635742, -32.23652648925781, -31.084461212158203, -29.932395935058594, -28.780332565307617, -27.628267288208008, -26.4762020111084, -25.32413673400879, -24.17207145690918, -23.02000617980957, -21.867942810058594, -20.715877532958984, -19.563812255859375, -18.411746978759766, -17.259681701660156, -16.107616424560547, -14.955551147460938, -13.803486824035645, -12.651421546936035, -11.499356269836426, -10.347291946411133, -9.195226669311523, -8.043161392211914, -6.891096115112305, -5.7390313148498535, -4.586966514587402, -3.434901237487793, -2.2828359603881836, -1.1307711601257324, 0.02129364013671875, 1.1733627319335938, 2.325427770614624, 3.4774928092956543, 4.6295576095581055, 5.781622886657715, 6.933688163757324, 8.085752487182617, 9.237817764282227, 10.389883041381836, 11.541948318481445, 12.694013595581055, 13.846077919006348, 14.998143196105957, 16.15020751953125, 17.30227279663086, 18.45433807373047, 19.606403350830078, 20.758468627929688, 21.910533905029297, 23.062599182128906, 24.214664459228516, 25.366729736328125, 26.5187931060791, 27.67085838317871, 28.82292366027832, 29.97498893737793, 31.12705421447754, 32.279117584228516, 33.431182861328125, 34.583248138427734, 35.735313415527344, 36.88737869262695, 38.03944396972656]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [6.0, 4.0, 1.0, 6.0, 10.0, 9.0, 9.0, 19.0, 19.0, 33.0, 49.0, 69.0, 92.0, 174.0, 243.0, 373.0, 595.0, 895.0, 1286.0, 2006.0, 3065.0, 4840.0, 8058.0, 14009.0, 24995.0, 50342.0, 118007.0, 335318.0, 944276.0, 1478702.0, 754540.0, 258088.0, 95391.0, 42832.0, 22583.0, 12591.0, 7594.0, 4630.0, 2943.0, 1893.0, 1278.0, 833.0, 525.0, 352.0, 221.0, 165.0, 108.0, 68.0, 54.0, 23.0, 19.0, 15.0, 14.0, 8.0, 10.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.375, -38.03515625, -36.6953125, -35.35546875, -34.015625, -32.67578125, -31.3359375, -29.99609375, -28.65625, -27.31640625, -25.9765625, -24.63671875, -23.296875, -21.95703125, -20.6171875, -19.27734375, -17.9375, -16.59765625, -15.2578125, -13.91796875, -12.578125, -11.23828125, -9.8984375, -8.55859375, -7.21875, -5.87890625, -4.5390625, -3.19921875, -1.859375, -0.51953125, 0.8203125, 2.16015625, 3.5, 4.83984375, 6.1796875, 7.51953125, 8.859375, 10.19921875, 11.5390625, 12.87890625, 14.21875, 15.55859375, 16.8984375, 18.23828125, 19.578125, 20.91796875, 22.2578125, 23.59765625, 24.9375, 26.27734375, 27.6171875, 28.95703125, 30.296875, 31.63671875, 32.9765625, 34.31640625, 35.65625, 36.99609375, 38.3359375, 39.67578125, 41.015625, 42.35546875, 43.6953125, 45.03515625, 46.375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 7.0, 3.0, 7.0, 6.0, 10.0, 8.0, 5.0, 14.0, 19.0, 13.0, 26.0, 26.0, 26.0, 25.0, 26.0, 27.0, 31.0, 37.0, 41.0, 47.0, 47.0, 44.0, 46.0, 45.0, 42.0, 46.0, 50.0, 36.0, 24.0, 29.0, 31.0, 24.0, 22.0, 18.0, 18.0, 11.0, 16.0, 13.0, 7.0, 7.0, 5.0, 4.0, 3.0, 3.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-33.5, -32.45068359375, -31.4013671875, -30.35205078125, -29.302734375, -28.25341796875, -27.2041015625, -26.15478515625, -25.10546875, -24.05615234375, -23.0068359375, -21.95751953125, -20.908203125, -19.85888671875, -18.8095703125, -17.76025390625, -16.7109375, -15.66162109375, -14.6123046875, -13.56298828125, -12.513671875, -11.46435546875, -10.4150390625, -9.36572265625, -8.31640625, -7.26708984375, -6.2177734375, -5.16845703125, -4.119140625, -3.06982421875, -2.0205078125, -0.97119140625, 0.078125, 1.12744140625, 2.1767578125, 3.22607421875, 4.275390625, 5.32470703125, 6.3740234375, 7.42333984375, 8.47265625, 9.52197265625, 10.5712890625, 11.62060546875, 12.669921875, 13.71923828125, 14.7685546875, 15.81787109375, 16.8671875, 17.91650390625, 18.9658203125, 20.01513671875, 21.064453125, 22.11376953125, 23.1630859375, 24.21240234375, 25.26171875, 26.31103515625, 27.3603515625, 28.40966796875, 29.458984375, 30.50830078125, 31.5576171875, 32.60693359375, 33.65625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 6.0, 23.0, 17.0, 35.0, 46.0, 90.0, 123.0, 179.0, 268.0, 415.0, 691.0, 1131.0, 1746.0, 2961.0, 5265.0, 8998.0, 16391.0, 31611.0, 63654.0, 134770.0, 316016.0, 841564.0, 1580156.0, 688738.0, 265503.0, 116633.0, 55129.0, 27653.0, 14738.0, 8049.0, 4574.0, 2725.0, 1616.0, 1015.0, 606.0, 391.0, 242.0, 166.0, 111.0, 84.0, 56.0, 27.0, 17.0, 12.0, 13.0, 11.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0], "bins": [-54.125, -52.5517578125, -50.978515625, -49.4052734375, -47.83203125, -46.2587890625, -44.685546875, -43.1123046875, -41.5390625, -39.9658203125, -38.392578125, -36.8193359375, -35.24609375, -33.6728515625, -32.099609375, -30.5263671875, -28.953125, -27.3798828125, -25.806640625, -24.2333984375, -22.66015625, -21.0869140625, -19.513671875, -17.9404296875, -16.3671875, -14.7939453125, -13.220703125, -11.6474609375, -10.07421875, -8.5009765625, -6.927734375, -5.3544921875, -3.78125, -2.2080078125, -0.634765625, 0.9384765625, 2.51171875, 4.0849609375, 5.658203125, 7.2314453125, 8.8046875, 10.3779296875, 11.951171875, 13.5244140625, 15.09765625, 16.6708984375, 18.244140625, 19.8173828125, 21.390625, 22.9638671875, 24.537109375, 26.1103515625, 27.68359375, 29.2568359375, 30.830078125, 32.4033203125, 33.9765625, 35.5498046875, 37.123046875, 38.6962890625, 40.26953125, 41.8427734375, 43.416015625, 44.9892578125, 46.5625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 7.0, 6.0, 9.0, 15.0, 12.0, 10.0, 20.0, 21.0, 29.0, 44.0, 52.0, 61.0, 86.0, 98.0, 113.0, 167.0, 182.0, 215.0, 281.0, 314.0, 351.0, 354.0, 309.0, 234.0, 233.0, 161.0, 138.0, 119.0, 100.0, 67.0, 59.0, 49.0, 34.0, 30.0, 23.0, 17.0, 19.0, 12.0, 11.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0], "bins": [-18.09375, -17.6011962890625, -17.108642578125, -16.6160888671875, -16.12353515625, -15.6309814453125, -15.138427734375, -14.6458740234375, -14.1533203125, -13.6607666015625, -13.168212890625, -12.6756591796875, -12.18310546875, -11.6905517578125, -11.197998046875, -10.7054443359375, -10.212890625, -9.7203369140625, -9.227783203125, -8.7352294921875, -8.24267578125, -7.7501220703125, -7.257568359375, -6.7650146484375, -6.2724609375, -5.7799072265625, -5.287353515625, -4.7947998046875, -4.30224609375, -3.8096923828125, -3.317138671875, -2.8245849609375, -2.33203125, -1.8394775390625, -1.346923828125, -0.8543701171875, -0.36181640625, 0.1307373046875, 0.623291015625, 1.1158447265625, 1.6083984375, 2.1009521484375, 2.593505859375, 3.0860595703125, 3.57861328125, 4.0711669921875, 4.563720703125, 5.0562744140625, 5.548828125, 6.0413818359375, 6.533935546875, 7.0264892578125, 7.51904296875, 8.0115966796875, 8.504150390625, 8.9967041015625, 9.4892578125, 9.9818115234375, 10.474365234375, 10.9669189453125, 11.45947265625, 11.9520263671875, 12.444580078125, 12.9371337890625, 13.4296875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 9.0, 6.0, 10.0, 7.0, 9.0, 14.0, 12.0, 14.0, 19.0, 29.0, 42.0, 43.0, 44.0, 64.0, 72.0, 74.0, 73.0, 64.0, 60.0, 50.0, 48.0, 41.0, 29.0, 25.0, 38.0, 19.0, 18.0, 18.0, 9.0, 5.0, 8.0, 9.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.86423110961914, -39.64664840698242, -38.42906188964844, -37.21147918701172, -35.993896484375, -34.77631378173828, -33.5587272644043, -32.34114456176758, -31.123559951782227, -29.905975341796875, -28.688392639160156, -27.470808029174805, -26.253223419189453, -25.035640716552734, -23.818056106567383, -22.60047149658203, -21.382888793945312, -20.16530418395996, -18.947721481323242, -17.73013687133789, -16.512554168701172, -15.29496955871582, -14.077384948730469, -12.859801292419434, -11.642217636108398, -10.424633979797363, -9.207050323486328, -7.989465713500977, -6.771882057189941, -5.554298400878906, -4.336714267730713, -3.1191301345825195, -1.9015426635742188, -0.6839587688446045, 0.5336251258850098, 1.751209020614624, 2.9687929153442383, 4.186376571655273, 5.403960704803467, 6.62154483795166, 7.839128494262695, 9.05671215057373, 10.274295806884766, 11.491880416870117, 12.709464073181152, 13.927047729492188, 15.144632339477539, 16.36221694946289, 17.57979965209961, 18.79738426208496, 20.01496696472168, 21.23255157470703, 22.45013427734375, 23.6677188873291, 24.885303497314453, 26.102886199951172, 27.320470809936523, 28.538055419921875, 29.755638122558594, 30.973222732543945, 32.1908073425293, 33.408390045166016, 34.625972747802734, 35.84355926513672, 37.06114196777344]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 8.0, 9.0, 8.0, 10.0, 18.0, 19.0, 32.0, 19.0, 27.0, 33.0, 29.0, 26.0, 37.0, 30.0, 40.0, 46.0, 41.0, 43.0, 41.0, 37.0, 51.0, 37.0, 44.0, 40.0, 27.0, 31.0, 43.0, 21.0, 30.0, 17.0, 16.0, 19.0, 15.0, 7.0, 14.0, 10.0, 4.0, 3.0, 8.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-42.64574432373047, -41.444091796875, -40.24243927001953, -39.04078674316406, -37.839134216308594, -36.63748550415039, -35.43583297729492, -34.23418045043945, -33.032527923583984, -31.830875396728516, -30.629222869873047, -29.42757225036621, -28.225919723510742, -27.024267196655273, -25.822616577148438, -24.62096405029297, -23.4193115234375, -22.21765899658203, -21.016006469726562, -19.814355850219727, -18.612703323364258, -17.41105079650879, -16.209400177001953, -15.007747650146484, -13.806095123291016, -12.604442596435547, -11.402791023254395, -10.201139450073242, -8.999486923217773, -7.797834873199463, -6.596182823181152, -5.39453125, -4.192882537841797, -2.9912304878234863, -1.7895784378051758, -0.5879263877868652, 0.6137256622314453, 1.8153777122497559, 3.0170297622680664, 4.218681335449219, 5.4203338623046875, 6.621985912322998, 7.823637962341309, 9.025289535522461, 10.22694206237793, 11.428594589233398, 12.63024616241455, 13.831897735595703, 15.033550262451172, 16.23520278930664, 17.43685531616211, 18.638505935668945, 19.840158462524414, 21.041810989379883, 22.24346160888672, 23.445114135742188, 24.646766662597656, 25.848419189453125, 27.050071716308594, 28.25172233581543, 29.4533748626709, 30.655027389526367, 31.856678009033203, 33.05833053588867, 34.25998306274414]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 11.0, 16.0, 22.0, 27.0, 28.0, 48.0, 89.0, 122.0, 177.0, 284.0, 360.0, 544.0, 813.0, 1276.0, 1832.0, 2682.0, 4327.0, 6478.0, 9975.0, 15518.0, 24432.0, 39346.0, 67176.0, 128860.0, 295937.0, 210478.0, 95300.0, 53253.0, 31746.0, 20216.0, 12879.0, 8318.0, 5354.0, 3552.0, 2350.0, 1562.0, 1010.0, 692.0, 474.0, 342.0, 217.0, 152.0, 95.0, 63.0, 44.0, 35.0, 15.0, 13.0, 11.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.25, -11.8387451171875, -11.427490234375, -11.0162353515625, -10.60498046875, -10.1937255859375, -9.782470703125, -9.3712158203125, -8.9599609375, -8.5487060546875, -8.137451171875, -7.7261962890625, -7.31494140625, -6.9036865234375, -6.492431640625, -6.0811767578125, -5.669921875, -5.2586669921875, -4.847412109375, -4.4361572265625, -4.02490234375, -3.6136474609375, -3.202392578125, -2.7911376953125, -2.3798828125, -1.9686279296875, -1.557373046875, -1.1461181640625, -0.73486328125, -0.3236083984375, 0.087646484375, 0.4989013671875, 0.91015625, 1.3214111328125, 1.732666015625, 2.1439208984375, 2.55517578125, 2.9664306640625, 3.377685546875, 3.7889404296875, 4.2001953125, 4.6114501953125, 5.022705078125, 5.4339599609375, 5.84521484375, 6.2564697265625, 6.667724609375, 7.0789794921875, 7.490234375, 7.9014892578125, 8.312744140625, 8.7239990234375, 9.13525390625, 9.5465087890625, 9.957763671875, 10.3690185546875, 10.7802734375, 11.1915283203125, 11.602783203125, 12.0140380859375, 12.42529296875, 12.8365478515625, 13.247802734375, 13.6590576171875, 14.0703125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 8.0, 4.0, 5.0, 7.0, 7.0, 13.0, 23.0, 18.0, 26.0, 21.0, 34.0, 27.0, 30.0, 32.0, 33.0, 37.0, 52.0, 47.0, 42.0, 47.0, 47.0, 47.0, 47.0, 30.0, 44.0, 29.0, 31.0, 34.0, 33.0, 20.0, 26.0, 20.0, 15.0, 10.0, 6.0, 13.0, 12.0, 9.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-44.8125, -43.5634765625, -42.314453125, -41.0654296875, -39.81640625, -38.5673828125, -37.318359375, -36.0693359375, -34.8203125, -33.5712890625, -32.322265625, -31.0732421875, -29.82421875, -28.5751953125, -27.326171875, -26.0771484375, -24.828125, -23.5791015625, -22.330078125, -21.0810546875, -19.83203125, -18.5830078125, -17.333984375, -16.0849609375, -14.8359375, -13.5869140625, -12.337890625, -11.0888671875, -9.83984375, -8.5908203125, -7.341796875, -6.0927734375, -4.84375, -3.5947265625, -2.345703125, -1.0966796875, 0.15234375, 1.4013671875, 2.650390625, 3.8994140625, 5.1484375, 6.3974609375, 7.646484375, 8.8955078125, 10.14453125, 11.3935546875, 12.642578125, 13.8916015625, 15.140625, 16.3896484375, 17.638671875, 18.8876953125, 20.13671875, 21.3857421875, 22.634765625, 23.8837890625, 25.1328125, 26.3818359375, 27.630859375, 28.8798828125, 30.12890625, 31.3779296875, 32.626953125, 33.8759765625, 35.125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 12.0, 11.0, 12.0, 32.0, 50.0, 59.0, 96.0, 129.0, 199.0, 288.0, 414.0, 613.0, 798.0, 1133.0, 1679.0, 2429.0, 3723.0, 5706.0, 9704.0, 18688.0, 59409.0, 621852.0, 246602.0, 36917.0, 14574.0, 8017.0, 5032.0, 3252.0, 2215.0, 1476.0, 1023.0, 740.0, 529.0, 357.0, 258.0, 181.0, 115.0, 79.0, 54.0, 30.0, 19.0, 18.0, 13.0, 9.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1875, -14.678466796875, -14.16943359375, -13.660400390625, -13.1513671875, -12.642333984375, -12.13330078125, -11.624267578125, -11.115234375, -10.606201171875, -10.09716796875, -9.588134765625, -9.0791015625, -8.570068359375, -8.06103515625, -7.552001953125, -7.04296875, -6.533935546875, -6.02490234375, -5.515869140625, -5.0068359375, -4.497802734375, -3.98876953125, -3.479736328125, -2.970703125, -2.461669921875, -1.95263671875, -1.443603515625, -0.9345703125, -0.425537109375, 0.08349609375, 0.592529296875, 1.1015625, 1.610595703125, 2.11962890625, 2.628662109375, 3.1376953125, 3.646728515625, 4.15576171875, 4.664794921875, 5.173828125, 5.682861328125, 6.19189453125, 6.700927734375, 7.2099609375, 7.718994140625, 8.22802734375, 8.737060546875, 9.24609375, 9.755126953125, 10.26416015625, 10.773193359375, 11.2822265625, 11.791259765625, 12.30029296875, 12.809326171875, 13.318359375, 13.827392578125, 14.33642578125, 14.845458984375, 15.3544921875, 15.863525390625, 16.37255859375, 16.881591796875, 17.390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 9.0, 11.0, 3.0, 14.0, 11.0, 14.0, 12.0, 16.0, 20.0, 28.0, 28.0, 26.0, 25.0, 35.0, 32.0, 32.0, 39.0, 40.0, 43.0, 42.0, 49.0, 44.0, 29.0, 37.0, 40.0, 33.0, 39.0, 29.0, 26.0, 39.0, 15.0, 28.0, 10.0, 19.0, 19.0, 14.0, 12.0, 11.0, 9.0, 9.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.625, -23.810546875, -22.99609375, -22.181640625, -21.3671875, -20.552734375, -19.73828125, -18.923828125, -18.109375, -17.294921875, -16.48046875, -15.666015625, -14.8515625, -14.037109375, -13.22265625, -12.408203125, -11.59375, -10.779296875, -9.96484375, -9.150390625, -8.3359375, -7.521484375, -6.70703125, -5.892578125, -5.078125, -4.263671875, -3.44921875, -2.634765625, -1.8203125, -1.005859375, -0.19140625, 0.623046875, 1.4375, 2.251953125, 3.06640625, 3.880859375, 4.6953125, 5.509765625, 6.32421875, 7.138671875, 7.953125, 8.767578125, 9.58203125, 10.396484375, 11.2109375, 12.025390625, 12.83984375, 13.654296875, 14.46875, 15.283203125, 16.09765625, 16.912109375, 17.7265625, 18.541015625, 19.35546875, 20.169921875, 20.984375, 21.798828125, 22.61328125, 23.427734375, 24.2421875, 25.056640625, 25.87109375, 26.685546875, 27.5]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 6.0, 10.0, 19.0, 21.0, 38.0, 62.0, 66.0, 105.0, 166.0, 266.0, 403.0, 643.0, 1162.0, 2042.0, 3844.0, 8198.0, 19319.0, 78904.0, 850255.0, 52076.0, 16106.0, 7026.0, 3387.0, 1750.0, 1024.0, 561.0, 408.0, 213.0, 159.0, 102.0, 53.0, 48.0, 40.0, 20.0, 21.0, 12.0, 3.0, 4.0, 3.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.3671875, -2.300323486328125, -2.23345947265625, -2.166595458984375, -2.0997314453125, -2.032867431640625, -1.96600341796875, -1.899139404296875, -1.832275390625, -1.765411376953125, -1.69854736328125, -1.631683349609375, -1.5648193359375, -1.497955322265625, -1.43109130859375, -1.364227294921875, -1.29736328125, -1.230499267578125, -1.16363525390625, -1.096771240234375, -1.0299072265625, -0.963043212890625, -0.89617919921875, -0.829315185546875, -0.762451171875, -0.695587158203125, -0.62872314453125, -0.561859130859375, -0.4949951171875, -0.428131103515625, -0.36126708984375, -0.294403076171875, -0.2275390625, -0.160675048828125, -0.09381103515625, -0.026947021484375, 0.0399169921875, 0.106781005859375, 0.17364501953125, 0.240509033203125, 0.307373046875, 0.374237060546875, 0.44110107421875, 0.507965087890625, 0.5748291015625, 0.641693115234375, 0.70855712890625, 0.775421142578125, 0.84228515625, 0.909149169921875, 0.97601318359375, 1.042877197265625, 1.1097412109375, 1.176605224609375, 1.24346923828125, 1.310333251953125, 1.377197265625, 1.444061279296875, 1.51092529296875, 1.577789306640625, 1.6446533203125, 1.711517333984375, 1.77838134765625, 1.845245361328125, 1.912109375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 8.0, 6.0, 6.0, 10.0, 15.0, 16.0, 24.0, 30.0, 39.0, 44.0, 45.0, 55.0, 55.0, 57.0, 57.0, 68.0, 61.0, 67.0, 46.0, 56.0, 30.0, 33.0, 31.0, 27.0, 17.0, 13.0, 17.0, 15.0, 7.0, 2.0, 6.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00010657310485839844, -0.00010285340249538422, -9.913370013237e-05, -9.541399776935577e-05, -9.169429540634155e-05, -8.797459304332733e-05, -8.425489068031311e-05, -8.053518831729889e-05, -7.681548595428467e-05, -7.309578359127045e-05, -6.937608122825623e-05, -6.5656378865242e-05, -6.193667650222778e-05, -5.821697413921356e-05, -5.449727177619934e-05, -5.077756941318512e-05, -4.70578670501709e-05, -4.333816468715668e-05, -3.9618462324142456e-05, -3.5898759961128235e-05, -3.2179057598114014e-05, -2.8459355235099792e-05, -2.473965287208557e-05, -2.101995050907135e-05, -1.730024814605713e-05, -1.3580545783042908e-05, -9.860843420028687e-06, -6.141141057014465e-06, -2.421438694000244e-06, 1.298263669013977e-06, 5.017966032028198e-06, 8.73766839504242e-06, 1.245737075805664e-05, 1.6177073121070862e-05, 1.9896775484085083e-05, 2.3616477847099304e-05, 2.7336180210113525e-05, 3.1055882573127747e-05, 3.477558493614197e-05, 3.849528729915619e-05, 4.221498966217041e-05, 4.593469202518463e-05, 4.965439438819885e-05, 5.3374096751213074e-05, 5.7093799114227295e-05, 6.0813501477241516e-05, 6.453320384025574e-05, 6.825290620326996e-05, 7.197260856628418e-05, 7.56923109292984e-05, 7.941201329231262e-05, 8.313171565532684e-05, 8.685141801834106e-05, 9.057112038135529e-05, 9.429082274436951e-05, 9.801052510738373e-05, 0.00010173022747039795, 0.00010544992983341217, 0.00010916963219642639, 0.00011288933455944061, 0.00011660903692245483, 0.00012032873928546906, 0.00012404844164848328, 0.0001277681440114975, 0.00013148784637451172]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 10.0, 7.0, 14.0, 21.0, 33.0, 57.0, 69.0, 101.0, 175.0, 284.0, 389.0, 588.0, 910.0, 1406.0, 2179.0, 3305.0, 5198.0, 8086.0, 12698.0, 20802.0, 35033.0, 62811.0, 115887.0, 212500.0, 240877.0, 141461.0, 76049.0, 42261.0, 24416.0, 15040.0, 9361.0, 5685.0, 3701.0, 2439.0, 1545.0, 1097.0, 713.0, 492.0, 295.0, 191.0, 130.0, 87.0, 48.0, 33.0, 28.0, 21.0, 9.0, 6.0, 6.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.197265625, -1.1600341796875, -1.122802734375, -1.0855712890625, -1.04833984375, -1.0111083984375, -0.973876953125, -0.9366455078125, -0.8994140625, -0.8621826171875, -0.824951171875, -0.7877197265625, -0.75048828125, -0.7132568359375, -0.676025390625, -0.6387939453125, -0.6015625, -0.5643310546875, -0.527099609375, -0.4898681640625, -0.45263671875, -0.4154052734375, -0.378173828125, -0.3409423828125, -0.3037109375, -0.2664794921875, -0.229248046875, -0.1920166015625, -0.15478515625, -0.1175537109375, -0.080322265625, -0.0430908203125, -0.005859375, 0.0313720703125, 0.068603515625, 0.1058349609375, 0.14306640625, 0.1802978515625, 0.217529296875, 0.2547607421875, 0.2919921875, 0.3292236328125, 0.366455078125, 0.4036865234375, 0.44091796875, 0.4781494140625, 0.515380859375, 0.5526123046875, 0.58984375, 0.6270751953125, 0.664306640625, 0.7015380859375, 0.73876953125, 0.7760009765625, 0.813232421875, 0.8504638671875, 0.8876953125, 0.9249267578125, 0.962158203125, 0.9993896484375, 1.03662109375, 1.0738525390625, 1.111083984375, 1.1483154296875, 1.185546875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 4.0, 6.0, 10.0, 5.0, 10.0, 10.0, 12.0, 16.0, 11.0, 19.0, 28.0, 21.0, 40.0, 26.0, 39.0, 45.0, 61.0, 60.0, 55.0, 66.0, 47.0, 64.0, 40.0, 43.0, 35.0, 39.0, 24.0, 30.0, 18.0, 14.0, 18.0, 15.0, 15.0, 8.0, 11.0, 12.0, 4.0, 8.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43115234375, -0.416015625, -0.40087890625, -0.3857421875, -0.37060546875, -0.35546875, -0.34033203125, -0.3251953125, -0.31005859375, -0.294921875, -0.27978515625, -0.2646484375, -0.24951171875, -0.234375, -0.21923828125, -0.2041015625, -0.18896484375, -0.173828125, -0.15869140625, -0.1435546875, -0.12841796875, -0.11328125, -0.09814453125, -0.0830078125, -0.06787109375, -0.052734375, -0.03759765625, -0.0224609375, -0.00732421875, 0.0078125, 0.02294921875, 0.0380859375, 0.05322265625, 0.068359375, 0.08349609375, 0.0986328125, 0.11376953125, 0.12890625, 0.14404296875, 0.1591796875, 0.17431640625, 0.189453125, 0.20458984375, 0.2197265625, 0.23486328125, 0.25, 0.26513671875, 0.2802734375, 0.29541015625, 0.310546875, 0.32568359375, 0.3408203125, 0.35595703125, 0.37109375, 0.38623046875, 0.4013671875, 0.41650390625, 0.431640625, 0.44677734375, 0.4619140625, 0.47705078125, 0.4921875, 0.50732421875, 0.5224609375, 0.53759765625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 5.0, 11.0, 6.0, 7.0, 11.0, 15.0, 18.0, 19.0, 28.0, 25.0, 48.0, 60.0, 59.0, 75.0, 73.0, 72.0, 56.0, 67.0, 62.0, 45.0, 32.0, 40.0, 32.0, 32.0, 18.0, 20.0, 15.0, 12.0, 6.0, 6.0, 9.0, 8.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.30769729614258, -44.071327209472656, -42.834957122802734, -41.59859085083008, -40.362220764160156, -39.125850677490234, -37.88948059082031, -36.65311050415039, -35.41674041748047, -34.18037033081055, -32.944000244140625, -31.707632064819336, -30.471263885498047, -29.234893798828125, -27.998523712158203, -26.76215362548828, -25.525787353515625, -24.289417266845703, -23.053049087524414, -21.816679000854492, -20.580310821533203, -19.34394073486328, -18.10757064819336, -16.871200561523438, -15.634832382202148, -14.398463249206543, -13.162094116210938, -11.925724029541016, -10.68935489654541, -9.452985763549805, -8.216615676879883, -6.980246543884277, -5.743877410888672, -4.507508277893066, -3.2711386680603027, -2.034769296646118, -0.7983999252319336, 0.4379692077636719, 1.6743388175964355, 2.910708427429199, 4.147077560424805, 5.38344669342041, 6.619816303253174, 7.8561859130859375, 9.092555046081543, 10.328924179077148, 11.56529426574707, 12.801663398742676, 14.038032531738281, 15.274401664733887, 16.510770797729492, 17.747140884399414, 18.983509063720703, 20.219879150390625, 21.456249237060547, 22.69261932373047, 23.928987503051758, 25.16535758972168, 26.40172576904297, 27.63809585571289, 28.874465942382812, 30.1108341217041, 31.347204208374023, 32.58357238769531, 33.819942474365234]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 6.0, 11.0, 8.0, 9.0, 16.0, 22.0, 31.0, 21.0, 25.0, 35.0, 27.0, 27.0, 37.0, 27.0, 39.0, 49.0, 42.0, 40.0, 45.0, 35.0, 48.0, 41.0, 42.0, 43.0, 25.0, 32.0, 42.0, 23.0, 25.0, 23.0, 15.0, 17.0, 15.0, 11.0, 11.0, 10.0, 5.0, 3.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-41.921695709228516, -40.73655319213867, -39.55141067504883, -38.36627197265625, -37.181129455566406, -35.99598693847656, -34.81084442138672, -33.625701904296875, -32.44055938720703, -31.255416870117188, -30.070276260375977, -28.885133743286133, -27.699993133544922, -26.514850616455078, -25.329708099365234, -24.14456558227539, -22.959426879882812, -21.77428436279297, -20.589143753051758, -19.404001235961914, -18.218860626220703, -17.03371810913086, -15.848575592041016, -14.663434028625488, -13.478292465209961, -12.293150901794434, -11.108009338378906, -9.922866821289062, -8.737725257873535, -7.552583694458008, -6.367441654205322, -5.182299613952637, -3.9971580505371094, -2.812016248703003, -1.6268744468688965, -0.44173264503479004, 0.7434091567993164, 1.9285507202148438, 3.1136927604675293, 4.298834800720215, 5.483976364135742, 6.6691179275512695, 7.854259967803955, 9.03940200805664, 10.224543571472168, 11.409685134887695, 12.594827651977539, 13.779969215393066, 14.965110778808594, 16.150253295898438, 17.33539390563965, 18.520536422729492, 19.705677032470703, 20.890819549560547, 22.07596206665039, 23.261104583740234, 24.446245193481445, 25.63138771057129, 26.8165283203125, 28.001670837402344, 29.186813354492188, 30.3719539642334, 31.557096481323242, 32.74223709106445, 33.9273796081543]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 7.0, 11.0, 28.0, 30.0, 46.0, 86.0, 103.0, 153.0, 284.0, 450.0, 749.0, 1223.0, 1894.0, 3098.0, 5300.0, 9160.0, 15612.0, 27023.0, 47604.0, 84836.0, 149208.0, 225623.0, 198985.0, 119578.0, 67377.0, 37616.0, 21401.0, 12438.0, 7308.0, 4448.0, 2627.0, 1613.0, 945.0, 606.0, 393.0, 245.0, 159.0, 107.0, 64.0, 31.0, 43.0, 15.0, 10.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-52.5625, -51.09423828125, -49.6259765625, -48.15771484375, -46.689453125, -45.22119140625, -43.7529296875, -42.28466796875, -40.81640625, -39.34814453125, -37.8798828125, -36.41162109375, -34.943359375, -33.47509765625, -32.0068359375, -30.53857421875, -29.0703125, -27.60205078125, -26.1337890625, -24.66552734375, -23.197265625, -21.72900390625, -20.2607421875, -18.79248046875, -17.32421875, -15.85595703125, -14.3876953125, -12.91943359375, -11.451171875, -9.98291015625, -8.5146484375, -7.04638671875, -5.578125, -4.10986328125, -2.6416015625, -1.17333984375, 0.294921875, 1.76318359375, 3.2314453125, 4.69970703125, 6.16796875, 7.63623046875, 9.1044921875, 10.57275390625, 12.041015625, 13.50927734375, 14.9775390625, 16.44580078125, 17.9140625, 19.38232421875, 20.8505859375, 22.31884765625, 23.787109375, 25.25537109375, 26.7236328125, 28.19189453125, 29.66015625, 31.12841796875, 32.5966796875, 34.06494140625, 35.533203125, 37.00146484375, 38.4697265625, 39.93798828125, 41.40625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 6.0, 11.0, 14.0, 19.0, 21.0, 29.0, 21.0, 31.0, 27.0, 34.0, 42.0, 31.0, 41.0, 53.0, 43.0, 50.0, 42.0, 33.0, 52.0, 46.0, 45.0, 47.0, 27.0, 33.0, 28.0, 33.0, 27.0, 20.0, 15.0, 13.0, 10.0, 16.0, 10.0, 5.0, 3.0, 0.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-44.40625, -43.1826171875, -41.958984375, -40.7353515625, -39.51171875, -38.2880859375, -37.064453125, -35.8408203125, -34.6171875, -33.3935546875, -32.169921875, -30.9462890625, -29.72265625, -28.4990234375, -27.275390625, -26.0517578125, -24.828125, -23.6044921875, -22.380859375, -21.1572265625, -19.93359375, -18.7099609375, -17.486328125, -16.2626953125, -15.0390625, -13.8154296875, -12.591796875, -11.3681640625, -10.14453125, -8.9208984375, -7.697265625, -6.4736328125, -5.25, -4.0263671875, -2.802734375, -1.5791015625, -0.35546875, 0.8681640625, 2.091796875, 3.3154296875, 4.5390625, 5.7626953125, 6.986328125, 8.2099609375, 9.43359375, 10.6572265625, 11.880859375, 13.1044921875, 14.328125, 15.5517578125, 16.775390625, 17.9990234375, 19.22265625, 20.4462890625, 21.669921875, 22.8935546875, 24.1171875, 25.3408203125, 26.564453125, 27.7880859375, 29.01171875, 30.2353515625, 31.458984375, 32.6826171875, 33.90625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 10.0, 10.0, 16.0, 22.0, 31.0, 54.0, 70.0, 123.0, 175.0, 286.0, 418.0, 762.0, 1185.0, 2068.0, 3155.0, 5330.0, 8860.0, 14698.0, 25547.0, 43898.0, 75236.0, 128402.0, 202312.0, 208056.0, 135677.0, 79535.0, 46112.0, 26705.0, 15945.0, 9351.0, 5766.0, 3419.0, 2060.0, 1287.0, 748.0, 488.0, 272.0, 166.0, 118.0, 71.0, 42.0, 34.0, 18.0, 10.0, 11.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-48.21875, -46.71435546875, -45.2099609375, -43.70556640625, -42.201171875, -40.69677734375, -39.1923828125, -37.68798828125, -36.18359375, -34.67919921875, -33.1748046875, -31.67041015625, -30.166015625, -28.66162109375, -27.1572265625, -25.65283203125, -24.1484375, -22.64404296875, -21.1396484375, -19.63525390625, -18.130859375, -16.62646484375, -15.1220703125, -13.61767578125, -12.11328125, -10.60888671875, -9.1044921875, -7.60009765625, -6.095703125, -4.59130859375, -3.0869140625, -1.58251953125, -0.078125, 1.42626953125, 2.9306640625, 4.43505859375, 5.939453125, 7.44384765625, 8.9482421875, 10.45263671875, 11.95703125, 13.46142578125, 14.9658203125, 16.47021484375, 17.974609375, 19.47900390625, 20.9833984375, 22.48779296875, 23.9921875, 25.49658203125, 27.0009765625, 28.50537109375, 30.009765625, 31.51416015625, 33.0185546875, 34.52294921875, 36.02734375, 37.53173828125, 39.0361328125, 40.54052734375, 42.044921875, 43.54931640625, 45.0537109375, 46.55810546875, 48.0625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 4.0, 5.0, 13.0, 11.0, 12.0, 20.0, 19.0, 23.0, 22.0, 31.0, 29.0, 39.0, 36.0, 36.0, 46.0, 35.0, 48.0, 41.0, 51.0, 43.0, 40.0, 47.0, 43.0, 39.0, 43.0, 30.0, 31.0, 26.0, 22.0, 18.0, 19.0, 13.0, 9.0, 8.0, 8.0, 5.0, 11.0, 5.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.046875, -24.247314453125, -23.44775390625, -22.648193359375, -21.8486328125, -21.049072265625, -20.24951171875, -19.449951171875, -18.650390625, -17.850830078125, -17.05126953125, -16.251708984375, -15.4521484375, -14.652587890625, -13.85302734375, -13.053466796875, -12.25390625, -11.454345703125, -10.65478515625, -9.855224609375, -9.0556640625, -8.256103515625, -7.45654296875, -6.656982421875, -5.857421875, -5.057861328125, -4.25830078125, -3.458740234375, -2.6591796875, -1.859619140625, -1.06005859375, -0.260498046875, 0.5390625, 1.338623046875, 2.13818359375, 2.937744140625, 3.7373046875, 4.536865234375, 5.33642578125, 6.135986328125, 6.935546875, 7.735107421875, 8.53466796875, 9.334228515625, 10.1337890625, 10.933349609375, 11.73291015625, 12.532470703125, 13.33203125, 14.131591796875, 14.93115234375, 15.730712890625, 16.5302734375, 17.329833984375, 18.12939453125, 18.928955078125, 19.728515625, 20.528076171875, 21.32763671875, 22.127197265625, 22.9267578125, 23.726318359375, 24.52587890625, 25.325439453125, 26.125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 6.0, 5.0, 7.0, 15.0, 14.0, 12.0, 34.0, 41.0, 82.0, 117.0, 134.0, 233.0, 335.0, 496.0, 784.0, 1164.0, 1878.0, 2988.0, 4936.0, 8175.0, 13709.0, 24187.0, 42858.0, 78231.0, 145393.0, 243020.0, 212395.0, 117993.0, 64116.0, 35448.0, 19949.0, 11413.0, 7003.0, 4056.0, 2606.0, 1584.0, 1101.0, 682.0, 443.0, 288.0, 195.0, 136.0, 102.0, 59.0, 34.0, 38.0, 22.0, 21.0, 14.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-16.28125, -15.800048828125, -15.31884765625, -14.837646484375, -14.3564453125, -13.875244140625, -13.39404296875, -12.912841796875, -12.431640625, -11.950439453125, -11.46923828125, -10.988037109375, -10.5068359375, -10.025634765625, -9.54443359375, -9.063232421875, -8.58203125, -8.100830078125, -7.61962890625, -7.138427734375, -6.6572265625, -6.176025390625, -5.69482421875, -5.213623046875, -4.732421875, -4.251220703125, -3.77001953125, -3.288818359375, -2.8076171875, -2.326416015625, -1.84521484375, -1.364013671875, -0.8828125, -0.401611328125, 0.07958984375, 0.560791015625, 1.0419921875, 1.523193359375, 2.00439453125, 2.485595703125, 2.966796875, 3.447998046875, 3.92919921875, 4.410400390625, 4.8916015625, 5.372802734375, 5.85400390625, 6.335205078125, 6.81640625, 7.297607421875, 7.77880859375, 8.260009765625, 8.7412109375, 9.222412109375, 9.70361328125, 10.184814453125, 10.666015625, 11.147216796875, 11.62841796875, 12.109619140625, 12.5908203125, 13.072021484375, 13.55322265625, 14.034423828125, 14.515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 10.0, 10.0, 9.0, 28.0, 37.0, 24.0, 54.0, 61.0, 83.0, 101.0, 131.0, 123.0, 74.0, 62.0, 39.0, 45.0, 24.0, 26.0, 13.0, 10.0, 6.0, 8.0, 9.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00222015380859375, -0.0021537840366363525, -0.002087414264678955, -0.0020210444927215576, -0.00195467472076416, -0.0018883049488067627, -0.0018219351768493652, -0.0017555654048919678, -0.0016891956329345703, -0.0016228258609771729, -0.0015564560890197754, -0.001490086317062378, -0.0014237165451049805, -0.001357346773147583, -0.0012909770011901855, -0.001224607229232788, -0.0011582374572753906, -0.0010918676853179932, -0.0010254979133605957, -0.0009591281414031982, -0.0008927583694458008, -0.0008263885974884033, -0.0007600188255310059, -0.0006936490535736084, -0.0006272792816162109, -0.0005609095096588135, -0.000494539737701416, -0.00042816996574401855, -0.0003618001937866211, -0.00029543042182922363, -0.00022906064987182617, -0.0001626908779144287, -9.632110595703125e-05, -2.995133399963379e-05, 3.641843795776367e-05, 0.00010278820991516113, 0.0001691579818725586, 0.00023552775382995605, 0.0003018975257873535, 0.000368267297744751, 0.00043463706970214844, 0.0005010068416595459, 0.0005673766136169434, 0.0006337463855743408, 0.0007001161575317383, 0.0007664859294891357, 0.0008328557014465332, 0.0008992254734039307, 0.0009655952453613281, 0.0010319650173187256, 0.001098334789276123, 0.0011647045612335205, 0.001231074333190918, 0.0012974441051483154, 0.0013638138771057129, 0.0014301836490631104, 0.0014965534210205078, 0.0015629231929779053, 0.0016292929649353027, 0.0016956627368927002, 0.0017620325088500977, 0.0018284022808074951, 0.0018947720527648926, 0.00196114182472229, 0.0020275115966796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 10.0, 8.0, 11.0, 15.0, 19.0, 32.0, 56.0, 92.0, 123.0, 134.0, 208.0, 345.0, 441.0, 683.0, 972.0, 1431.0, 2027.0, 3102.0, 4467.0, 6479.0, 9991.0, 14856.0, 23054.0, 36585.0, 58885.0, 96033.0, 151804.0, 195102.0, 161571.0, 104013.0, 63434.0, 39148.0, 25054.0, 15894.0, 10520.0, 7157.0, 4816.0, 3151.0, 2089.0, 1517.0, 1065.0, 693.0, 467.0, 314.0, 203.0, 158.0, 114.0, 79.0, 42.0, 28.0, 20.0, 17.0, 15.0, 9.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.2578125, -11.8433837890625, -11.428955078125, -11.0145263671875, -10.60009765625, -10.1856689453125, -9.771240234375, -9.3568115234375, -8.9423828125, -8.5279541015625, -8.113525390625, -7.6990966796875, -7.28466796875, -6.8702392578125, -6.455810546875, -6.0413818359375, -5.626953125, -5.2125244140625, -4.798095703125, -4.3836669921875, -3.96923828125, -3.5548095703125, -3.140380859375, -2.7259521484375, -2.3115234375, -1.8970947265625, -1.482666015625, -1.0682373046875, -0.65380859375, -0.2393798828125, 0.175048828125, 0.5894775390625, 1.00390625, 1.4183349609375, 1.832763671875, 2.2471923828125, 2.66162109375, 3.0760498046875, 3.490478515625, 3.9049072265625, 4.3193359375, 4.7337646484375, 5.148193359375, 5.5626220703125, 5.97705078125, 6.3914794921875, 6.805908203125, 7.2203369140625, 7.634765625, 8.0491943359375, 8.463623046875, 8.8780517578125, 9.29248046875, 9.7069091796875, 10.121337890625, 10.5357666015625, 10.9501953125, 11.3646240234375, 11.779052734375, 12.1934814453125, 12.60791015625, 13.0223388671875, 13.436767578125, 13.8511962890625, 14.265625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 6.0, 3.0, 5.0, 8.0, 18.0, 10.0, 20.0, 22.0, 25.0, 23.0, 27.0, 31.0, 44.0, 53.0, 48.0, 48.0, 36.0, 55.0, 40.0, 62.0, 54.0, 44.0, 34.0, 52.0, 33.0, 31.0, 29.0, 20.0, 25.0, 14.0, 15.0, 9.0, 6.0, 8.0, 10.0, 5.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.27734375, -5.10687255859375, -4.9364013671875, -4.76593017578125, -4.595458984375, -4.42498779296875, -4.2545166015625, -4.08404541015625, -3.91357421875, -3.74310302734375, -3.5726318359375, -3.40216064453125, -3.231689453125, -3.06121826171875, -2.8907470703125, -2.72027587890625, -2.5498046875, -2.37933349609375, -2.2088623046875, -2.03839111328125, -1.867919921875, -1.69744873046875, -1.5269775390625, -1.35650634765625, -1.18603515625, -1.01556396484375, -0.8450927734375, -0.67462158203125, -0.504150390625, -0.33367919921875, -0.1632080078125, 0.00726318359375, 0.177734375, 0.34820556640625, 0.5186767578125, 0.68914794921875, 0.859619140625, 1.03009033203125, 1.2005615234375, 1.37103271484375, 1.54150390625, 1.71197509765625, 1.8824462890625, 2.05291748046875, 2.223388671875, 2.39385986328125, 2.5643310546875, 2.73480224609375, 2.9052734375, 3.07574462890625, 3.2462158203125, 3.41668701171875, 3.587158203125, 3.75762939453125, 3.9281005859375, 4.09857177734375, 4.26904296875, 4.43951416015625, 4.6099853515625, 4.78045654296875, 4.950927734375, 5.12139892578125, 5.2918701171875, 5.46234130859375, 5.6328125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 5.0, 2.0, 4.0, 8.0, 6.0, 8.0, 6.0, 12.0, 15.0, 18.0, 27.0, 43.0, 39.0, 39.0, 42.0, 61.0, 61.0, 53.0, 72.0, 70.0, 50.0, 50.0, 48.0, 45.0, 31.0, 40.0, 32.0, 20.0, 17.0, 13.0, 12.0, 9.0, 9.0, 10.0, 4.0, 4.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-41.44779968261719, -40.31585693359375, -39.18391418457031, -38.051971435546875, -36.9200325012207, -35.788089752197266, -34.65614700317383, -33.52420425415039, -32.39226150512695, -31.260318756103516, -30.12837791442871, -28.996435165405273, -27.864492416381836, -26.73255157470703, -25.600608825683594, -24.468666076660156, -23.33672523498535, -22.204782485961914, -21.07284164428711, -19.940898895263672, -18.808956146240234, -17.677013397216797, -16.545072555541992, -15.413129806518555, -14.281188011169434, -13.149246215820312, -12.017303466796875, -10.885361671447754, -9.753419876098633, -8.621477127075195, -7.489535331726074, -6.357593059539795, -5.225648880004883, -4.0937066078186035, -2.9617645740509033, -1.8298225402832031, -0.6978802680969238, 0.43406200408935547, 1.5660037994384766, 2.697946071624756, 3.829888343811035, 4.9618306159973145, 6.093772888183594, 7.225714683532715, 8.357656478881836, 9.489599227905273, 10.621541023254395, 11.753482818603516, 12.885425567626953, 14.017367362976074, 15.149310111999512, 16.281251907348633, 17.41319465637207, 18.545135498046875, 19.677078247070312, 20.80902099609375, 21.940963745117188, 23.072906494140625, 24.20484733581543, 25.336790084838867, 26.468732833862305, 27.60067367553711, 28.732616424560547, 29.864559173583984, 30.99650001525879]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 0.0, 6.0, 8.0, 7.0, 14.0, 10.0, 14.0, 14.0, 22.0, 21.0, 20.0, 27.0, 26.0, 43.0, 40.0, 33.0, 36.0, 47.0, 36.0, 42.0, 37.0, 49.0, 26.0, 43.0, 39.0, 40.0, 44.0, 30.0, 27.0, 31.0, 21.0, 22.0, 20.0, 20.0, 15.0, 7.0, 11.0, 14.0, 11.0, 9.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0], "bins": [-44.825984954833984, -43.59872055053711, -42.3714599609375, -41.144195556640625, -39.91693115234375, -38.689666748046875, -37.46240234375, -36.23514175415039, -35.007877349853516, -33.78061294555664, -32.55335235595703, -31.326087951660156, -30.09882354736328, -28.871559143066406, -27.644296646118164, -26.417034149169922, -25.189769744873047, -23.962505340576172, -22.73524284362793, -21.507980346679688, -20.280715942382812, -19.053451538085938, -17.826189041137695, -16.598926544189453, -15.371662139892578, -14.14439868927002, -12.917135238647461, -11.689871788024902, -10.462608337402344, -9.235344886779785, -8.008081436157227, -6.780817985534668, -5.553554534912109, -4.326291084289551, -3.099027633666992, -1.8717641830444336, -0.644500732421875, 0.5827627182006836, 1.8100261688232422, 3.037289619445801, 4.264553070068359, 5.491816520690918, 6.719079971313477, 7.946343421936035, 9.173606872558594, 10.400870323181152, 11.628133773803711, 12.85539722442627, 14.082660675048828, 15.309924125671387, 16.537187576293945, 17.764450073242188, 18.991714477539062, 20.218978881835938, 21.44624137878418, 22.673503875732422, 23.900768280029297, 25.128032684326172, 26.355295181274414, 27.582557678222656, 28.80982208251953, 30.037086486816406, 31.26434898376465, 32.49161148071289, 33.718875885009766]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 2.0, 7.0, 10.0, 14.0, 14.0, 26.0, 29.0, 60.0, 80.0, 148.0, 197.0, 313.0, 540.0, 907.0, 1627.0, 2678.0, 4898.0, 9039.0, 17128.0, 33968.0, 74075.0, 198409.0, 624795.0, 1512840.0, 1116349.0, 370514.0, 122305.0, 51243.0, 24210.0, 12264.0, 6486.0, 3693.0, 2086.0, 1214.0, 748.0, 483.0, 299.0, 206.0, 116.0, 97.0, 49.0, 30.0, 30.0, 14.0, 14.0, 10.0, 12.0, 5.0, 1.0, 2.0, 0.0, 3.0], "bins": [-55.84375, -54.28271484375, -52.7216796875, -51.16064453125, -49.599609375, -48.03857421875, -46.4775390625, -44.91650390625, -43.35546875, -41.79443359375, -40.2333984375, -38.67236328125, -37.111328125, -35.55029296875, -33.9892578125, -32.42822265625, -30.8671875, -29.30615234375, -27.7451171875, -26.18408203125, -24.623046875, -23.06201171875, -21.5009765625, -19.93994140625, -18.37890625, -16.81787109375, -15.2568359375, -13.69580078125, -12.134765625, -10.57373046875, -9.0126953125, -7.45166015625, -5.890625, -4.32958984375, -2.7685546875, -1.20751953125, 0.353515625, 1.91455078125, 3.4755859375, 5.03662109375, 6.59765625, 8.15869140625, 9.7197265625, 11.28076171875, 12.841796875, 14.40283203125, 15.9638671875, 17.52490234375, 19.0859375, 20.64697265625, 22.2080078125, 23.76904296875, 25.330078125, 26.89111328125, 28.4521484375, 30.01318359375, 31.57421875, 33.13525390625, 34.6962890625, 36.25732421875, 37.818359375, 39.37939453125, 40.9404296875, 42.50146484375, 44.0625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 6.0, 6.0, 6.0, 11.0, 8.0, 14.0, 11.0, 19.0, 15.0, 19.0, 23.0, 27.0, 35.0, 36.0, 42.0, 26.0, 43.0, 44.0, 55.0, 36.0, 37.0, 40.0, 50.0, 44.0, 46.0, 36.0, 40.0, 29.0, 25.0, 18.0, 30.0, 22.0, 19.0, 8.0, 15.0, 13.0, 10.0, 9.0, 6.0, 8.0, 4.0, 4.0, 4.0, 3.0, 1.0, 3.0, 4.0, 1.0], "bins": [-41.90625, -40.759765625, -39.61328125, -38.466796875, -37.3203125, -36.173828125, -35.02734375, -33.880859375, -32.734375, -31.587890625, -30.44140625, -29.294921875, -28.1484375, -27.001953125, -25.85546875, -24.708984375, -23.5625, -22.416015625, -21.26953125, -20.123046875, -18.9765625, -17.830078125, -16.68359375, -15.537109375, -14.390625, -13.244140625, -12.09765625, -10.951171875, -9.8046875, -8.658203125, -7.51171875, -6.365234375, -5.21875, -4.072265625, -2.92578125, -1.779296875, -0.6328125, 0.513671875, 1.66015625, 2.806640625, 3.953125, 5.099609375, 6.24609375, 7.392578125, 8.5390625, 9.685546875, 10.83203125, 11.978515625, 13.125, 14.271484375, 15.41796875, 16.564453125, 17.7109375, 18.857421875, 20.00390625, 21.150390625, 22.296875, 23.443359375, 24.58984375, 25.736328125, 26.8828125, 28.029296875, 29.17578125, 30.322265625, 31.46875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 5.0, 5.0, 6.0, 11.0, 13.0, 20.0, 31.0, 41.0, 56.0, 85.0, 123.0, 149.0, 234.0, 361.0, 461.0, 691.0, 1043.0, 1515.0, 2126.0, 3273.0, 4918.0, 7572.0, 11573.0, 18861.0, 30677.0, 51646.0, 88587.0, 160155.0, 302681.0, 604025.0, 1131380.0, 847756.0, 419416.0, 216546.0, 117259.0, 66427.0, 39167.0, 23342.0, 14690.0, 9328.0, 5910.0, 3900.0, 2585.0, 1753.0, 1168.0, 831.0, 583.0, 382.0, 279.0, 211.0, 138.0, 88.0, 68.0, 38.0, 35.0, 25.0, 19.0, 15.0, 6.0, 9.0, 1.0, 2.0, 2.0], "bins": [-37.90625, -36.7119140625, -35.517578125, -34.3232421875, -33.12890625, -31.9345703125, -30.740234375, -29.5458984375, -28.3515625, -27.1572265625, -25.962890625, -24.7685546875, -23.57421875, -22.3798828125, -21.185546875, -19.9912109375, -18.796875, -17.6025390625, -16.408203125, -15.2138671875, -14.01953125, -12.8251953125, -11.630859375, -10.4365234375, -9.2421875, -8.0478515625, -6.853515625, -5.6591796875, -4.46484375, -3.2705078125, -2.076171875, -0.8818359375, 0.3125, 1.5068359375, 2.701171875, 3.8955078125, 5.08984375, 6.2841796875, 7.478515625, 8.6728515625, 9.8671875, 11.0615234375, 12.255859375, 13.4501953125, 14.64453125, 15.8388671875, 17.033203125, 18.2275390625, 19.421875, 20.6162109375, 21.810546875, 23.0048828125, 24.19921875, 25.3935546875, 26.587890625, 27.7822265625, 28.9765625, 30.1708984375, 31.365234375, 32.5595703125, 33.75390625, 34.9482421875, 36.142578125, 37.3369140625, 38.53125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 7.0, 9.0, 6.0, 13.0, 17.0, 23.0, 39.0, 50.0, 66.0, 58.0, 86.0, 97.0, 106.0, 174.0, 184.0, 230.0, 269.0, 302.0, 339.0, 335.0, 296.0, 258.0, 220.0, 185.0, 149.0, 115.0, 79.0, 75.0, 52.0, 50.0, 38.0, 31.0, 29.0, 13.0, 19.0, 16.0, 6.0, 7.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.40625, -15.877197265625, -15.34814453125, -14.819091796875, -14.2900390625, -13.760986328125, -13.23193359375, -12.702880859375, -12.173828125, -11.644775390625, -11.11572265625, -10.586669921875, -10.0576171875, -9.528564453125, -8.99951171875, -8.470458984375, -7.94140625, -7.412353515625, -6.88330078125, -6.354248046875, -5.8251953125, -5.296142578125, -4.76708984375, -4.238037109375, -3.708984375, -3.179931640625, -2.65087890625, -2.121826171875, -1.5927734375, -1.063720703125, -0.53466796875, -0.005615234375, 0.5234375, 1.052490234375, 1.58154296875, 2.110595703125, 2.6396484375, 3.168701171875, 3.69775390625, 4.226806640625, 4.755859375, 5.284912109375, 5.81396484375, 6.343017578125, 6.8720703125, 7.401123046875, 7.93017578125, 8.459228515625, 8.98828125, 9.517333984375, 10.04638671875, 10.575439453125, 11.1044921875, 11.633544921875, 12.16259765625, 12.691650390625, 13.220703125, 13.749755859375, 14.27880859375, 14.807861328125, 15.3369140625, 15.865966796875, 16.39501953125, 16.924072265625, 17.453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 2.0, 6.0, 5.0, 8.0, 7.0, 19.0, 20.0, 24.0, 24.0, 54.0, 43.0, 54.0, 73.0, 78.0, 74.0, 69.0, 72.0, 69.0, 56.0, 43.0, 43.0, 42.0, 25.0, 21.0, 19.0, 14.0, 8.0, 7.0, 4.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.03807830810547, -48.57343292236328, -47.108787536621094, -45.64413833618164, -44.17949295043945, -42.714847564697266, -41.25020217895508, -39.785552978515625, -38.32090759277344, -36.85626220703125, -35.39161682128906, -33.92696762084961, -32.46232223510742, -30.997676849365234, -29.533031463623047, -28.068384170532227, -26.60373878479004, -25.13909339904785, -23.67444610595703, -22.209800720214844, -20.745153427124023, -19.280508041381836, -17.815860748291016, -16.351215362548828, -14.886569023132324, -13.42192268371582, -11.957276344299316, -10.492630004882812, -9.027984619140625, -7.563337802886963, -6.098691940307617, -4.634045600891113, -3.1693992614746094, -1.704753041267395, -0.24010682106018066, 1.2245392799377441, 2.689185619354248, 4.153831958770752, 5.618477821350098, 7.083124160766602, 8.547770500183105, 10.01241683959961, 11.477063179016113, 12.941709518432617, 14.406354904174805, 15.871002197265625, 17.335647583007812, 18.80029296875, 20.26494026184082, 21.729585647583008, 23.194232940673828, 24.658878326416016, 26.123525619506836, 27.588171005249023, 29.052818298339844, 30.51746368408203, 31.98210906982422, 33.446754455566406, 34.911399841308594, 36.37604904174805, 37.840694427490234, 39.30533981323242, 40.76998519897461, 42.23463439941406, 43.69927978515625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 10.0, 4.0, 5.0, 7.0, 11.0, 12.0, 20.0, 27.0, 17.0, 24.0, 23.0, 36.0, 30.0, 34.0, 51.0, 40.0, 49.0, 47.0, 35.0, 44.0, 53.0, 31.0, 44.0, 41.0, 32.0, 37.0, 39.0, 25.0, 31.0, 21.0, 16.0, 25.0, 12.0, 13.0, 13.0, 6.0, 8.0, 6.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.723575592041016, -45.40193176269531, -44.080284118652344, -42.75864028930664, -41.43699645996094, -40.11534881591797, -38.793704986572266, -37.47206115722656, -36.150413513183594, -34.82876968383789, -33.50712203979492, -32.18547821044922, -30.863832473754883, -29.542186737060547, -28.220542907714844, -26.898897171020508, -25.577251434326172, -24.255605697631836, -22.9339599609375, -21.612316131591797, -20.29067039489746, -18.969024658203125, -17.647380828857422, -16.325735092163086, -15.00408935546875, -13.682443618774414, -12.360798835754395, -11.039154052734375, -9.717508316040039, -8.395862579345703, -7.074217796325684, -5.752573013305664, -4.430927276611328, -3.1092820167541504, -1.7876367568969727, -0.4659914970397949, 0.8556537628173828, 2.1772990226745605, 3.4989442825317383, 4.820589065551758, 6.142234802246094, 7.4638800621032715, 8.78552532196045, 10.107170104980469, 11.428815841674805, 12.75046157836914, 14.07210636138916, 15.39375114440918, 16.715396881103516, 18.03704261779785, 19.358688354492188, 20.68033218383789, 22.001977920532227, 23.323623657226562, 24.645267486572266, 25.9669132232666, 27.288558959960938, 28.610204696655273, 29.93185043334961, 31.253494262695312, 32.57514190673828, 33.896785736083984, 35.21842956542969, 36.540077209472656, 37.86172103881836]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 9.0, 25.0, 42.0, 46.0, 84.0, 113.0, 184.0, 274.0, 356.0, 562.0, 839.0, 1156.0, 1726.0, 2677.0, 3825.0, 6068.0, 9015.0, 13955.0, 21518.0, 34111.0, 56055.0, 97308.0, 200437.0, 281695.0, 128603.0, 70444.0, 41743.0, 26286.0, 16918.0, 11019.0, 7100.0, 4709.0, 3232.0, 2114.0, 1396.0, 955.0, 640.0, 407.0, 280.0, 204.0, 153.0, 83.0, 48.0, 47.0, 32.0, 21.0, 10.0, 10.0, 12.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-13.8984375, -13.467041015625, -13.03564453125, -12.604248046875, -12.1728515625, -11.741455078125, -11.31005859375, -10.878662109375, -10.447265625, -10.015869140625, -9.58447265625, -9.153076171875, -8.7216796875, -8.290283203125, -7.85888671875, -7.427490234375, -6.99609375, -6.564697265625, -6.13330078125, -5.701904296875, -5.2705078125, -4.839111328125, -4.40771484375, -3.976318359375, -3.544921875, -3.113525390625, -2.68212890625, -2.250732421875, -1.8193359375, -1.387939453125, -0.95654296875, -0.525146484375, -0.09375, 0.337646484375, 0.76904296875, 1.200439453125, 1.6318359375, 2.063232421875, 2.49462890625, 2.926025390625, 3.357421875, 3.788818359375, 4.22021484375, 4.651611328125, 5.0830078125, 5.514404296875, 5.94580078125, 6.377197265625, 6.80859375, 7.239990234375, 7.67138671875, 8.102783203125, 8.5341796875, 8.965576171875, 9.39697265625, 9.828369140625, 10.259765625, 10.691162109375, 11.12255859375, 11.553955078125, 11.9853515625, 12.416748046875, 12.84814453125, 13.279541015625, 13.7109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 7.0, 2.0, 11.0, 8.0, 12.0, 9.0, 22.0, 14.0, 21.0, 30.0, 31.0, 26.0, 33.0, 48.0, 50.0, 39.0, 37.0, 47.0, 44.0, 53.0, 43.0, 37.0, 44.0, 39.0, 33.0, 33.0, 32.0, 30.0, 23.0, 27.0, 15.0, 13.0, 30.0, 8.0, 9.0, 14.0, 4.0, 5.0, 3.0, 5.0, 4.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.5, -43.150390625, -41.80078125, -40.451171875, -39.1015625, -37.751953125, -36.40234375, -35.052734375, -33.703125, -32.353515625, -31.00390625, -29.654296875, -28.3046875, -26.955078125, -25.60546875, -24.255859375, -22.90625, -21.556640625, -20.20703125, -18.857421875, -17.5078125, -16.158203125, -14.80859375, -13.458984375, -12.109375, -10.759765625, -9.41015625, -8.060546875, -6.7109375, -5.361328125, -4.01171875, -2.662109375, -1.3125, 0.037109375, 1.38671875, 2.736328125, 4.0859375, 5.435546875, 6.78515625, 8.134765625, 9.484375, 10.833984375, 12.18359375, 13.533203125, 14.8828125, 16.232421875, 17.58203125, 18.931640625, 20.28125, 21.630859375, 22.98046875, 24.330078125, 25.6796875, 27.029296875, 28.37890625, 29.728515625, 31.078125, 32.427734375, 33.77734375, 35.126953125, 36.4765625, 37.826171875, 39.17578125, 40.525390625, 41.875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 8.0, 9.0, 13.0, 24.0, 31.0, 35.0, 58.0, 78.0, 125.0, 186.0, 245.0, 367.0, 525.0, 733.0, 1113.0, 1473.0, 2089.0, 3191.0, 4721.0, 7489.0, 13357.0, 31792.0, 191990.0, 675553.0, 65966.0, 19531.0, 9653.0, 5928.0, 3753.0, 2610.0, 1790.0, 1235.0, 832.0, 596.0, 464.0, 281.0, 228.0, 160.0, 106.0, 58.0, 41.0, 39.0, 21.0, 13.0, 13.0, 8.0, 3.0, 7.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-18.1875, -17.62353515625, -17.0595703125, -16.49560546875, -15.931640625, -15.36767578125, -14.8037109375, -14.23974609375, -13.67578125, -13.11181640625, -12.5478515625, -11.98388671875, -11.419921875, -10.85595703125, -10.2919921875, -9.72802734375, -9.1640625, -8.60009765625, -8.0361328125, -7.47216796875, -6.908203125, -6.34423828125, -5.7802734375, -5.21630859375, -4.65234375, -4.08837890625, -3.5244140625, -2.96044921875, -2.396484375, -1.83251953125, -1.2685546875, -0.70458984375, -0.140625, 0.42333984375, 0.9873046875, 1.55126953125, 2.115234375, 2.67919921875, 3.2431640625, 3.80712890625, 4.37109375, 4.93505859375, 5.4990234375, 6.06298828125, 6.626953125, 7.19091796875, 7.7548828125, 8.31884765625, 8.8828125, 9.44677734375, 10.0107421875, 10.57470703125, 11.138671875, 11.70263671875, 12.2666015625, 12.83056640625, 13.39453125, 13.95849609375, 14.5224609375, 15.08642578125, 15.650390625, 16.21435546875, 16.7783203125, 17.34228515625, 17.90625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 7.0, 5.0, 8.0, 9.0, 13.0, 15.0, 19.0, 17.0, 29.0, 24.0, 19.0, 39.0, 25.0, 38.0, 29.0, 26.0, 40.0, 42.0, 51.0, 54.0, 45.0, 48.0, 38.0, 46.0, 46.0, 45.0, 29.0, 40.0, 15.0, 33.0, 23.0, 16.0, 13.0, 15.0, 15.0, 8.0, 7.0, 9.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.6875, -33.719482421875, -32.75146484375, -31.783447265625, -30.8154296875, -29.847412109375, -28.87939453125, -27.911376953125, -26.943359375, -25.975341796875, -25.00732421875, -24.039306640625, -23.0712890625, -22.103271484375, -21.13525390625, -20.167236328125, -19.19921875, -18.231201171875, -17.26318359375, -16.295166015625, -15.3271484375, -14.359130859375, -13.39111328125, -12.423095703125, -11.455078125, -10.487060546875, -9.51904296875, -8.551025390625, -7.5830078125, -6.614990234375, -5.64697265625, -4.678955078125, -3.7109375, -2.742919921875, -1.77490234375, -0.806884765625, 0.1611328125, 1.129150390625, 2.09716796875, 3.065185546875, 4.033203125, 5.001220703125, 5.96923828125, 6.937255859375, 7.9052734375, 8.873291015625, 9.84130859375, 10.809326171875, 11.77734375, 12.745361328125, 13.71337890625, 14.681396484375, 15.6494140625, 16.617431640625, 17.58544921875, 18.553466796875, 19.521484375, 20.489501953125, 21.45751953125, 22.425537109375, 23.3935546875, 24.361572265625, 25.32958984375, 26.297607421875, 27.265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 7.0, 3.0, 9.0, 14.0, 23.0, 21.0, 38.0, 64.0, 99.0, 126.0, 163.0, 251.0, 413.0, 721.0, 1159.0, 1961.0, 3722.0, 7814.0, 20096.0, 126214.0, 824091.0, 38130.0, 11957.0, 5081.0, 2701.0, 1416.0, 806.0, 518.0, 311.0, 193.0, 119.0, 111.0, 61.0, 27.0, 34.0, 14.0, 14.0, 10.0, 9.0, 10.0, 3.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.517578125, -3.408477783203125, -3.29937744140625, -3.190277099609375, -3.0811767578125, -2.972076416015625, -2.86297607421875, -2.753875732421875, -2.644775390625, -2.535675048828125, -2.42657470703125, -2.317474365234375, -2.2083740234375, -2.099273681640625, -1.99017333984375, -1.881072998046875, -1.77197265625, -1.662872314453125, -1.55377197265625, -1.444671630859375, -1.3355712890625, -1.226470947265625, -1.11737060546875, -1.008270263671875, -0.899169921875, -0.790069580078125, -0.68096923828125, -0.571868896484375, -0.4627685546875, -0.353668212890625, -0.24456787109375, -0.135467529296875, -0.0263671875, 0.082733154296875, 0.19183349609375, 0.300933837890625, 0.4100341796875, 0.519134521484375, 0.62823486328125, 0.737335205078125, 0.846435546875, 0.955535888671875, 1.06463623046875, 1.173736572265625, 1.2828369140625, 1.391937255859375, 1.50103759765625, 1.610137939453125, 1.71923828125, 1.828338623046875, 1.93743896484375, 2.046539306640625, 2.1556396484375, 2.264739990234375, 2.37384033203125, 2.482940673828125, 2.592041015625, 2.701141357421875, 2.81024169921875, 2.919342041015625, 3.0284423828125, 3.137542724609375, 3.24664306640625, 3.355743408203125, 3.46484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 10.0, 9.0, 4.0, 9.0, 22.0, 20.0, 38.0, 43.0, 36.0, 54.0, 79.0, 85.0, 90.0, 87.0, 81.0, 77.0, 58.0, 41.0, 39.0, 27.0, 17.0, 18.0, 5.0, 14.0, 6.0, 5.0, 2.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019788742065429688, -0.0001916550099849701, -0.0001854225993156433, -0.00017919018864631653, -0.00017295777797698975, -0.00016672536730766296, -0.00016049295663833618, -0.0001542605459690094, -0.00014802813529968262, -0.00014179572463035583, -0.00013556331396102905, -0.00012933090329170227, -0.0001230984926223755, -0.0001168660819530487, -0.00011063367128372192, -0.00010440126061439514, -9.816884994506836e-05, -9.193643927574158e-05, -8.57040286064148e-05, -7.947161793708801e-05, -7.323920726776123e-05, -6.700679659843445e-05, -6.0774385929107666e-05, -5.4541975259780884e-05, -4.83095645904541e-05, -4.207715392112732e-05, -3.584474325180054e-05, -2.9612332582473755e-05, -2.3379921913146973e-05, -1.714751124382019e-05, -1.0915100574493408e-05, -4.682689905166626e-06, 1.5497207641601562e-06, 7.782131433486938e-06, 1.401454210281372e-05, 2.0246952772140503e-05, 2.6479363441467285e-05, 3.271177411079407e-05, 3.894418478012085e-05, 4.517659544944763e-05, 5.1409006118774414e-05, 5.7641416788101196e-05, 6.387382745742798e-05, 7.010623812675476e-05, 7.633864879608154e-05, 8.257105946540833e-05, 8.880347013473511e-05, 9.503588080406189e-05, 0.00010126829147338867, 0.00010750070214271545, 0.00011373311281204224, 0.00011996552348136902, 0.0001261979341506958, 0.00013243034482002258, 0.00013866275548934937, 0.00014489516615867615, 0.00015112757682800293, 0.0001573599874973297, 0.0001635923981666565, 0.00016982480883598328, 0.00017605721950531006, 0.00018228963017463684, 0.00018852204084396362, 0.0001947544515132904, 0.0002009868621826172]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 6.0, 8.0, 15.0, 23.0, 34.0, 44.0, 71.0, 90.0, 136.0, 197.0, 283.0, 440.0, 566.0, 844.0, 1170.0, 1743.0, 2607.0, 4139.0, 6503.0, 10932.0, 18743.0, 34814.0, 69799.0, 155098.0, 305974.0, 224936.0, 99869.0, 47487.0, 24759.0, 13782.0, 8351.0, 5129.0, 3224.0, 2162.0, 1373.0, 995.0, 649.0, 500.0, 313.0, 240.0, 150.0, 109.0, 83.0, 58.0, 45.0, 18.0, 12.0, 12.0, 8.0, 9.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7236328125, -1.6693115234375, -1.614990234375, -1.5606689453125, -1.50634765625, -1.4520263671875, -1.397705078125, -1.3433837890625, -1.2890625, -1.2347412109375, -1.180419921875, -1.1260986328125, -1.07177734375, -1.0174560546875, -0.963134765625, -0.9088134765625, -0.8544921875, -0.8001708984375, -0.745849609375, -0.6915283203125, -0.63720703125, -0.5828857421875, -0.528564453125, -0.4742431640625, -0.419921875, -0.3656005859375, -0.311279296875, -0.2569580078125, -0.20263671875, -0.1483154296875, -0.093994140625, -0.0396728515625, 0.0146484375, 0.0689697265625, 0.123291015625, 0.1776123046875, 0.23193359375, 0.2862548828125, 0.340576171875, 0.3948974609375, 0.44921875, 0.5035400390625, 0.557861328125, 0.6121826171875, 0.66650390625, 0.7208251953125, 0.775146484375, 0.8294677734375, 0.8837890625, 0.9381103515625, 0.992431640625, 1.0467529296875, 1.10107421875, 1.1553955078125, 1.209716796875, 1.2640380859375, 1.318359375, 1.3726806640625, 1.427001953125, 1.4813232421875, 1.53564453125, 1.5899658203125, 1.644287109375, 1.6986083984375, 1.7529296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 6.0, 4.0, 6.0, 4.0, 9.0, 14.0, 10.0, 14.0, 25.0, 29.0, 28.0, 38.0, 45.0, 62.0, 98.0, 87.0, 86.0, 73.0, 61.0, 54.0, 46.0, 37.0, 29.0, 25.0, 14.0, 15.0, 7.0, 5.0, 8.0, 9.0, 3.0, 2.0, 0.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5869140625, -0.5678863525390625, -0.548858642578125, -0.5298309326171875, -0.51080322265625, -0.4917755126953125, -0.472747802734375, -0.4537200927734375, -0.4346923828125, -0.4156646728515625, -0.396636962890625, -0.3776092529296875, -0.35858154296875, -0.3395538330078125, -0.320526123046875, -0.3014984130859375, -0.282470703125, -0.2634429931640625, -0.244415283203125, -0.2253875732421875, -0.20635986328125, -0.1873321533203125, -0.168304443359375, -0.1492767333984375, -0.1302490234375, -0.1112213134765625, -0.092193603515625, -0.0731658935546875, -0.05413818359375, -0.0351104736328125, -0.016082763671875, 0.0029449462890625, 0.02197265625, 0.0410003662109375, 0.060028076171875, 0.0790557861328125, 0.09808349609375, 0.1171112060546875, 0.136138916015625, 0.1551666259765625, 0.1741943359375, 0.1932220458984375, 0.212249755859375, 0.2312774658203125, 0.25030517578125, 0.2693328857421875, 0.288360595703125, 0.3073883056640625, 0.326416015625, 0.3454437255859375, 0.364471435546875, 0.3834991455078125, 0.40252685546875, 0.4215545654296875, 0.440582275390625, 0.4596099853515625, 0.4786376953125, 0.4976654052734375, 0.516693115234375, 0.5357208251953125, 0.55474853515625, 0.5737762451171875, 0.592803955078125, 0.6118316650390625, 0.630859375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 6.0, 8.0, 13.0, 10.0, 24.0, 20.0, 29.0, 41.0, 52.0, 57.0, 67.0, 65.0, 89.0, 75.0, 74.0, 73.0, 38.0, 56.0, 49.0, 47.0, 18.0, 16.0, 15.0, 16.0, 10.0, 5.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.29299545288086, -48.8133430480957, -47.33369064331055, -45.85403823852539, -44.3743896484375, -42.894737243652344, -41.41508483886719, -39.93543243408203, -38.455780029296875, -36.97612762451172, -35.49647521972656, -34.016822814941406, -32.53717041015625, -31.057519912719727, -29.577869415283203, -28.098217010498047, -26.61856460571289, -25.138912200927734, -23.659259796142578, -22.179609298706055, -20.6999568939209, -19.220304489135742, -17.74065399169922, -16.261001586914062, -14.781349182128906, -13.30169677734375, -11.82204532623291, -10.34239387512207, -8.862741470336914, -7.383089542388916, -5.903437614440918, -4.423786163330078, -2.9441299438476562, -1.4644780158996582, 0.015173912048339844, 1.494825839996338, 2.974477767944336, 4.454129695892334, 5.933781623840332, 7.413433074951172, 8.893085479736328, 10.372737884521484, 11.852389335632324, 13.332040786743164, 14.81169319152832, 16.291345596313477, 17.77099609375, 19.250648498535156, 20.730300903320312, 22.20995330810547, 23.689605712890625, 25.16925621032715, 26.648908615112305, 28.12856101989746, 29.608211517333984, 31.08786392211914, 32.5675163269043, 34.04716873168945, 35.52682113647461, 37.006473541259766, 38.486122131347656, 39.96577453613281, 41.44542694091797, 42.925079345703125, 44.40473175048828]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 3.0, 7.0, 6.0, 12.0, 16.0, 15.0, 32.0, 14.0, 22.0, 27.0, 36.0, 33.0, 30.0, 50.0, 42.0, 50.0, 47.0, 35.0, 45.0, 48.0, 35.0, 42.0, 42.0, 27.0, 42.0, 39.0, 26.0, 28.0, 20.0, 15.0, 24.0, 13.0, 13.0, 13.0, 5.0, 8.0, 6.0, 8.0, 4.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.716773986816406, -44.41510009765625, -43.11343002319336, -41.8117561340332, -40.51008605957031, -39.208412170410156, -37.906742095947266, -36.60506820678711, -35.30339813232422, -34.00172424316406, -32.70005416870117, -31.39838218688965, -30.096710205078125, -28.79503631591797, -27.493364334106445, -26.191692352294922, -24.890018463134766, -23.588346481323242, -22.28667449951172, -20.985002517700195, -19.683330535888672, -18.381656646728516, -17.079984664916992, -15.778312683105469, -14.476640701293945, -13.174968719482422, -11.873296737670898, -10.571623802185059, -9.269951820373535, -7.968279838562012, -6.66660737991333, -5.364934921264648, -4.063266754150391, -2.761594533920288, -1.4599223136901855, -0.158250093460083, 1.1434221267700195, 2.445094108581543, 3.7467665672302246, 5.048439025878906, 6.35011100769043, 7.651782989501953, 8.953454971313477, 10.255127906799316, 11.55679988861084, 12.858471870422363, 14.160144805908203, 15.461816787719727, 16.76348876953125, 18.065160751342773, 19.366832733154297, 20.66850471496582, 21.970176696777344, 23.2718505859375, 24.573522567749023, 25.875194549560547, 27.17686653137207, 28.478538513183594, 29.780210494995117, 31.08188247680664, 32.3835563659668, 33.68522644042969, 34.986900329589844, 36.28857421875, 37.59024429321289]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 6.0, 6.0, 12.0, 13.0, 17.0, 27.0, 62.0, 74.0, 109.0, 168.0, 216.0, 371.0, 515.0, 757.0, 1153.0, 1754.0, 2619.0, 3931.0, 6070.0, 9270.0, 14060.0, 21993.0, 33861.0, 52554.0, 81888.0, 124907.0, 173497.0, 171500.0, 122420.0, 79538.0, 50797.0, 32959.0, 21097.0, 13755.0, 9133.0, 5828.0, 3899.0, 2632.0, 1640.0, 1176.0, 765.0, 504.0, 341.0, 217.0, 142.0, 111.0, 68.0, 49.0, 28.0, 21.0, 12.0, 6.0, 9.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.03125, -35.83544921875, -34.6396484375, -33.44384765625, -32.248046875, -31.05224609375, -29.8564453125, -28.66064453125, -27.46484375, -26.26904296875, -25.0732421875, -23.87744140625, -22.681640625, -21.48583984375, -20.2900390625, -19.09423828125, -17.8984375, -16.70263671875, -15.5068359375, -14.31103515625, -13.115234375, -11.91943359375, -10.7236328125, -9.52783203125, -8.33203125, -7.13623046875, -5.9404296875, -4.74462890625, -3.548828125, -2.35302734375, -1.1572265625, 0.03857421875, 1.234375, 2.43017578125, 3.6259765625, 4.82177734375, 6.017578125, 7.21337890625, 8.4091796875, 9.60498046875, 10.80078125, 11.99658203125, 13.1923828125, 14.38818359375, 15.583984375, 16.77978515625, 17.9755859375, 19.17138671875, 20.3671875, 21.56298828125, 22.7587890625, 23.95458984375, 25.150390625, 26.34619140625, 27.5419921875, 28.73779296875, 29.93359375, 31.12939453125, 32.3251953125, 33.52099609375, 34.716796875, 35.91259765625, 37.1083984375, 38.30419921875, 39.5]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 2.0, 7.0, 3.0, 12.0, 11.0, 11.0, 14.0, 14.0, 14.0, 27.0, 18.0, 31.0, 35.0, 34.0, 40.0, 39.0, 31.0, 49.0, 43.0, 43.0, 49.0, 51.0, 38.0, 37.0, 38.0, 25.0, 33.0, 38.0, 37.0, 23.0, 24.0, 19.0, 12.0, 24.0, 16.0, 10.0, 9.0, 7.0, 8.0, 2.0, 6.0, 1.0, 5.0, 5.0, 1.0, 1.0, 2.0], "bins": [-43.65625, -42.4814453125, -41.306640625, -40.1318359375, -38.95703125, -37.7822265625, -36.607421875, -35.4326171875, -34.2578125, -33.0830078125, -31.908203125, -30.7333984375, -29.55859375, -28.3837890625, -27.208984375, -26.0341796875, -24.859375, -23.6845703125, -22.509765625, -21.3349609375, -20.16015625, -18.9853515625, -17.810546875, -16.6357421875, -15.4609375, -14.2861328125, -13.111328125, -11.9365234375, -10.76171875, -9.5869140625, -8.412109375, -7.2373046875, -6.0625, -4.8876953125, -3.712890625, -2.5380859375, -1.36328125, -0.1884765625, 0.986328125, 2.1611328125, 3.3359375, 4.5107421875, 5.685546875, 6.8603515625, 8.03515625, 9.2099609375, 10.384765625, 11.5595703125, 12.734375, 13.9091796875, 15.083984375, 16.2587890625, 17.43359375, 18.6083984375, 19.783203125, 20.9580078125, 22.1328125, 23.3076171875, 24.482421875, 25.6572265625, 26.83203125, 28.0068359375, 29.181640625, 30.3564453125, 31.53125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 9.0, 12.0, 17.0, 26.0, 32.0, 59.0, 94.0, 150.0, 227.0, 280.0, 501.0, 617.0, 1071.0, 1510.0, 2258.0, 3380.0, 4949.0, 7716.0, 11658.0, 17576.0, 27036.0, 41552.0, 64477.0, 98818.0, 144514.0, 175056.0, 148534.0, 103082.0, 67525.0, 43488.0, 28000.0, 18402.0, 11843.0, 7944.0, 5378.0, 3574.0, 2429.0, 1545.0, 1038.0, 731.0, 514.0, 325.0, 201.0, 136.0, 94.0, 74.0, 38.0, 18.0, 24.0, 17.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0], "bins": [-44.65625, -43.3251953125, -41.994140625, -40.6630859375, -39.33203125, -38.0009765625, -36.669921875, -35.3388671875, -34.0078125, -32.6767578125, -31.345703125, -30.0146484375, -28.68359375, -27.3525390625, -26.021484375, -24.6904296875, -23.359375, -22.0283203125, -20.697265625, -19.3662109375, -18.03515625, -16.7041015625, -15.373046875, -14.0419921875, -12.7109375, -11.3798828125, -10.048828125, -8.7177734375, -7.38671875, -6.0556640625, -4.724609375, -3.3935546875, -2.0625, -0.7314453125, 0.599609375, 1.9306640625, 3.26171875, 4.5927734375, 5.923828125, 7.2548828125, 8.5859375, 9.9169921875, 11.248046875, 12.5791015625, 13.91015625, 15.2412109375, 16.572265625, 17.9033203125, 19.234375, 20.5654296875, 21.896484375, 23.2275390625, 24.55859375, 25.8896484375, 27.220703125, 28.5517578125, 29.8828125, 31.2138671875, 32.544921875, 33.8759765625, 35.20703125, 36.5380859375, 37.869140625, 39.2001953125, 40.53125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 8.0, 1.0, 7.0, 7.0, 12.0, 18.0, 12.0, 19.0, 16.0, 19.0, 21.0, 32.0, 24.0, 32.0, 43.0, 41.0, 34.0, 47.0, 38.0, 45.0, 49.0, 45.0, 35.0, 39.0, 30.0, 28.0, 47.0, 32.0, 29.0, 29.0, 17.0, 17.0, 24.0, 17.0, 14.0, 16.0, 13.0, 13.0, 8.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-25.25, -24.47705078125, -23.7041015625, -22.93115234375, -22.158203125, -21.38525390625, -20.6123046875, -19.83935546875, -19.06640625, -18.29345703125, -17.5205078125, -16.74755859375, -15.974609375, -15.20166015625, -14.4287109375, -13.65576171875, -12.8828125, -12.10986328125, -11.3369140625, -10.56396484375, -9.791015625, -9.01806640625, -8.2451171875, -7.47216796875, -6.69921875, -5.92626953125, -5.1533203125, -4.38037109375, -3.607421875, -2.83447265625, -2.0615234375, -1.28857421875, -0.515625, 0.25732421875, 1.0302734375, 1.80322265625, 2.576171875, 3.34912109375, 4.1220703125, 4.89501953125, 5.66796875, 6.44091796875, 7.2138671875, 7.98681640625, 8.759765625, 9.53271484375, 10.3056640625, 11.07861328125, 11.8515625, 12.62451171875, 13.3974609375, 14.17041015625, 14.943359375, 15.71630859375, 16.4892578125, 17.26220703125, 18.03515625, 18.80810546875, 19.5810546875, 20.35400390625, 21.126953125, 21.89990234375, 22.6728515625, 23.44580078125, 24.21875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 10.0, 9.0, 18.0, 16.0, 38.0, 55.0, 71.0, 99.0, 109.0, 199.0, 303.0, 424.0, 726.0, 954.0, 1564.0, 2464.0, 3856.0, 6246.0, 10394.0, 17899.0, 32796.0, 62548.0, 125794.0, 244406.0, 254918.0, 133708.0, 66270.0, 34733.0, 19134.0, 10890.0, 6554.0, 3963.0, 2515.0, 1599.0, 1099.0, 701.0, 470.0, 332.0, 198.0, 149.0, 90.0, 80.0, 42.0, 36.0, 29.0, 20.0, 11.0, 7.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-25.703125, -24.92529296875, -24.1474609375, -23.36962890625, -22.591796875, -21.81396484375, -21.0361328125, -20.25830078125, -19.48046875, -18.70263671875, -17.9248046875, -17.14697265625, -16.369140625, -15.59130859375, -14.8134765625, -14.03564453125, -13.2578125, -12.47998046875, -11.7021484375, -10.92431640625, -10.146484375, -9.36865234375, -8.5908203125, -7.81298828125, -7.03515625, -6.25732421875, -5.4794921875, -4.70166015625, -3.923828125, -3.14599609375, -2.3681640625, -1.59033203125, -0.8125, -0.03466796875, 0.7431640625, 1.52099609375, 2.298828125, 3.07666015625, 3.8544921875, 4.63232421875, 5.41015625, 6.18798828125, 6.9658203125, 7.74365234375, 8.521484375, 9.29931640625, 10.0771484375, 10.85498046875, 11.6328125, 12.41064453125, 13.1884765625, 13.96630859375, 14.744140625, 15.52197265625, 16.2998046875, 17.07763671875, 17.85546875, 18.63330078125, 19.4111328125, 20.18896484375, 20.966796875, 21.74462890625, 22.5224609375, 23.30029296875, 24.078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 11.0, 14.0, 20.0, 15.0, 28.0, 46.0, 52.0, 81.0, 118.0, 131.0, 151.0, 97.0, 81.0, 42.0, 29.0, 18.0, 14.0, 10.0, 6.0, 4.0, 2.0, 9.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004322052001953125, -0.004204541444778442, -0.00408703088760376, -0.003969520330429077, -0.0038520097732543945, -0.003734499216079712, -0.0036169886589050293, -0.0034994781017303467, -0.003381967544555664, -0.0032644569873809814, -0.003146946430206299, -0.003029435873031616, -0.0029119253158569336, -0.002794414758682251, -0.0026769042015075684, -0.0025593936443328857, -0.002441883087158203, -0.0023243725299835205, -0.002206861972808838, -0.0020893514156341553, -0.0019718408584594727, -0.00185433030128479, -0.0017368197441101074, -0.0016193091869354248, -0.0015017986297607422, -0.0013842880725860596, -0.001266777515411377, -0.0011492669582366943, -0.0010317564010620117, -0.0009142458438873291, -0.0007967352867126465, -0.0006792247295379639, -0.0005617141723632812, -0.00044420361518859863, -0.000326693058013916, -0.0002091825008392334, -9.167194366455078e-05, 2.5838613510131836e-05, 0.00014334917068481445, 0.00026085972785949707, 0.0003783702850341797, 0.0004958808422088623, 0.0006133913993835449, 0.0007309019565582275, 0.0008484125137329102, 0.0009659230709075928, 0.0010834336280822754, 0.001200944185256958, 0.0013184547424316406, 0.0014359652996063232, 0.0015534758567810059, 0.0016709864139556885, 0.001788496971130371, 0.0019060075283050537, 0.0020235180854797363, 0.002141028642654419, 0.0022585391998291016, 0.002376049757003784, 0.002493560314178467, 0.0026110708713531494, 0.002728581428527832, 0.0028460919857025146, 0.0029636025428771973, 0.00308111310005188, 0.0031986236572265625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 2.0, 6.0, 15.0, 11.0, 25.0, 41.0, 48.0, 64.0, 107.0, 146.0, 226.0, 316.0, 502.0, 756.0, 1224.0, 1670.0, 2751.0, 4186.0, 6598.0, 10827.0, 18028.0, 31444.0, 57096.0, 107765.0, 206597.0, 262466.0, 151374.0, 79394.0, 42589.0, 24149.0, 14105.0, 8718.0, 5441.0, 3466.0, 2206.0, 1403.0, 959.0, 599.0, 392.0, 281.0, 180.0, 136.0, 79.0, 53.0, 38.0, 29.0, 17.0, 12.0, 4.0, 8.0, 4.0, 3.0, 1.0, 0.0, 3.0], "bins": [-25.203125, -24.467529296875, -23.73193359375, -22.996337890625, -22.2607421875, -21.525146484375, -20.78955078125, -20.053955078125, -19.318359375, -18.582763671875, -17.84716796875, -17.111572265625, -16.3759765625, -15.640380859375, -14.90478515625, -14.169189453125, -13.43359375, -12.697998046875, -11.96240234375, -11.226806640625, -10.4912109375, -9.755615234375, -9.02001953125, -8.284423828125, -7.548828125, -6.813232421875, -6.07763671875, -5.342041015625, -4.6064453125, -3.870849609375, -3.13525390625, -2.399658203125, -1.6640625, -0.928466796875, -0.19287109375, 0.542724609375, 1.2783203125, 2.013916015625, 2.74951171875, 3.485107421875, 4.220703125, 4.956298828125, 5.69189453125, 6.427490234375, 7.1630859375, 7.898681640625, 8.63427734375, 9.369873046875, 10.10546875, 10.841064453125, 11.57666015625, 12.312255859375, 13.0478515625, 13.783447265625, 14.51904296875, 15.254638671875, 15.990234375, 16.725830078125, 17.46142578125, 18.197021484375, 18.9326171875, 19.668212890625, 20.40380859375, 21.139404296875, 21.875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 8.0, 4.0, 11.0, 19.0, 13.0, 16.0, 27.0, 32.0, 25.0, 36.0, 56.0, 63.0, 70.0, 75.0, 63.0, 66.0, 81.0, 60.0, 58.0, 51.0, 37.0, 28.0, 16.0, 15.0, 10.0, 18.0, 12.0, 6.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.875, -9.5443115234375, -9.213623046875, -8.8829345703125, -8.55224609375, -8.2215576171875, -7.890869140625, -7.5601806640625, -7.2294921875, -6.8988037109375, -6.568115234375, -6.2374267578125, -5.90673828125, -5.5760498046875, -5.245361328125, -4.9146728515625, -4.583984375, -4.2532958984375, -3.922607421875, -3.5919189453125, -3.26123046875, -2.9305419921875, -2.599853515625, -2.2691650390625, -1.9384765625, -1.6077880859375, -1.277099609375, -0.9464111328125, -0.61572265625, -0.2850341796875, 0.045654296875, 0.3763427734375, 0.70703125, 1.0377197265625, 1.368408203125, 1.6990966796875, 2.02978515625, 2.3604736328125, 2.691162109375, 3.0218505859375, 3.3525390625, 3.6832275390625, 4.013916015625, 4.3446044921875, 4.67529296875, 5.0059814453125, 5.336669921875, 5.6673583984375, 5.998046875, 6.3287353515625, 6.659423828125, 6.9901123046875, 7.32080078125, 7.6514892578125, 7.982177734375, 8.3128662109375, 8.6435546875, 8.9742431640625, 9.304931640625, 9.6356201171875, 9.96630859375, 10.2969970703125, 10.627685546875, 10.9583740234375, 11.2890625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 6.0, 8.0, 17.0, 16.0, 12.0, 23.0, 24.0, 34.0, 28.0, 31.0, 40.0, 50.0, 57.0, 61.0, 55.0, 78.0, 70.0, 60.0, 53.0, 42.0, 44.0, 36.0, 26.0, 25.0, 23.0, 16.0, 9.0, 10.0, 11.0, 6.0, 4.0, 6.0, 0.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.91347885131836, -45.59896469116211, -44.284454345703125, -42.969940185546875, -41.655426025390625, -40.34091567993164, -39.02640151977539, -37.711891174316406, -36.397377014160156, -35.082862854003906, -33.76835250854492, -32.45383834838867, -31.139326095581055, -29.824813842773438, -28.510299682617188, -27.19578742980957, -25.881275177001953, -24.566762924194336, -23.25225067138672, -21.93773651123047, -20.62322425842285, -19.308712005615234, -17.994197845458984, -16.679685592651367, -15.36517333984375, -14.050661087036133, -12.7361478805542, -11.421634674072266, -10.107122421264648, -8.792610168457031, -7.478096961975098, -6.163583755493164, -4.849067687988281, -3.534554958343506, -2.2200422286987305, -0.9055294990539551, 0.4089832305908203, 1.7234959602355957, 3.038008689880371, 4.352521896362305, 5.667034149169922, 6.981546878814697, 8.296059608459473, 9.610572814941406, 10.925085067749023, 12.23959732055664, 13.554110527038574, 14.868623733520508, 16.183135986328125, 17.497648239135742, 18.81216049194336, 20.12667465209961, 21.441186904907227, 22.755699157714844, 24.070213317871094, 25.38472557067871, 26.699237823486328, 28.013750076293945, 29.328262329101562, 30.642776489257812, 31.95728874206543, 33.27180099487305, 34.5863151550293, 35.90082550048828, 37.21533966064453]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 6.0, 7.0, 11.0, 4.0, 10.0, 9.0, 17.0, 15.0, 19.0, 22.0, 21.0, 21.0, 39.0, 35.0, 38.0, 38.0, 32.0, 43.0, 48.0, 32.0, 45.0, 45.0, 49.0, 45.0, 33.0, 41.0, 34.0, 22.0, 36.0, 32.0, 17.0, 30.0, 16.0, 16.0, 14.0, 12.0, 10.0, 8.0, 3.0, 3.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-45.423152923583984, -44.04756546020508, -42.67197799682617, -41.296390533447266, -39.92080307006836, -38.54521560668945, -37.16962814331055, -35.79404067993164, -34.418453216552734, -33.04286575317383, -31.667278289794922, -30.291690826416016, -28.91610336303711, -27.540515899658203, -26.164928436279297, -24.78934097290039, -23.413755416870117, -22.03816795349121, -20.662580490112305, -19.2869930267334, -17.911405563354492, -16.535818099975586, -15.160231590270996, -13.78464412689209, -12.409056663513184, -11.033469200134277, -9.657881736755371, -8.282295227050781, -6.906707286834717, -5.5311198234558105, -4.1555328369140625, -2.7799453735351562, -1.40435791015625, -0.0287705659866333, 1.3468167781829834, 2.7224040031433105, 4.097991466522217, 5.473578929901123, 6.849165916442871, 8.224753379821777, 9.600340843200684, 10.97592830657959, 12.351515769958496, 13.727102279663086, 15.102689743041992, 16.4782772064209, 17.853864669799805, 19.22945213317871, 20.605039596557617, 21.980627059936523, 23.35621452331543, 24.731801986694336, 26.107389450073242, 27.48297691345215, 28.858562469482422, 30.234149932861328, 31.609737396240234, 32.98532485961914, 34.36091232299805, 35.73649978637695, 37.11208724975586, 38.487674713134766, 39.86326217651367, 41.23884963989258, 42.614437103271484]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 9.0, 8.0, 16.0, 17.0, 16.0, 28.0, 26.0, 25.0, 41.0, 53.0, 63.0, 85.0, 100.0, 134.0, 166.0, 202.0, 286.0, 359.0, 450.0, 589.0, 697.0, 1043945.0, 730.0, 582.0, 455.0, 347.0, 225.0, 197.0, 147.0, 109.0, 96.0, 78.0, 61.0, 58.0, 50.0, 25.0, 28.0, 26.0, 26.0, 7.0, 4.0, 7.0, 6.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-714.0451049804688, -691.9876708984375, -669.9302368164062, -647.872802734375, -625.8153686523438, -603.7579345703125, -581.7005004882812, -559.64306640625, -537.5856323242188, -515.5281982421875, -493.47076416015625, -471.413330078125, -449.35589599609375, -427.2984619140625, -405.24102783203125, -383.18359375, -361.12615966796875, -339.0687255859375, -317.01129150390625, -294.953857421875, -272.89642333984375, -250.8389892578125, -228.78155517578125, -206.72412109375, -184.66668701171875, -162.6092529296875, -140.55181884765625, -118.494384765625, -96.43695068359375, -74.3795166015625, -52.32208251953125, -30.2646484375, -8.207275390625, 13.85015869140625, 35.9075927734375, 57.96502685546875, 80.0224609375, 102.07989501953125, 124.1373291015625, 146.19476318359375, 168.252197265625, 190.30963134765625, 212.3670654296875, 234.42449951171875, 256.48193359375, 278.53936767578125, 300.5968017578125, 322.65423583984375, 344.711669921875, 366.76910400390625, 388.8265380859375, 410.88397216796875, 432.94140625, 454.99884033203125, 477.0562744140625, 499.11370849609375, 521.171142578125, 543.2285766601562, 565.2860107421875, 587.3434448242188, 609.40087890625, 631.4583129882812, 653.5157470703125, 675.5731811523438, 697.630615234375]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 1.0, 7.0, 7.0, 14.0, 18.0, 13.0, 17.0, 35.0, 27.0, 48.0, 57.0, 54.0, 78.0, 85.0, 121.0, 143.0, 154.0, 176.0, 230.0, 241.0, 380.0, 625.0, 1301.0, 51318996.0, 144589.0, 1306.0, 646.0, 394.0, 290.0, 221.0, 193.0, 155.0, 106.0, 118.0, 75.0, 81.0, 53.0, 48.0, 45.0, 41.0, 24.0, 26.0, 21.0, 13.0, 14.0, 4.0, 6.0, 7.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1786.1605224609375, -1730.3333740234375, -1674.5062255859375, -1618.6790771484375, -1562.8519287109375, -1507.0247802734375, -1451.1976318359375, -1395.3704833984375, -1339.5433349609375, -1283.7161865234375, -1227.8890380859375, -1172.0618896484375, -1116.2347412109375, -1060.4075927734375, -1004.5804443359375, -948.7532958984375, -892.9261474609375, -837.0989990234375, -781.2718505859375, -725.4447021484375, -669.6175537109375, -613.7904052734375, -557.9632568359375, -502.1361083984375, -446.3089599609375, -390.4818115234375, -334.6546630859375, -278.8275146484375, -223.0003662109375, -167.1732177734375, -111.3460693359375, -55.5189208984375, 0.308349609375, 56.135498046875, 111.962646484375, 167.789794921875, 223.616943359375, 279.444091796875, 335.271240234375, 391.098388671875, 446.925537109375, 502.752685546875, 558.579833984375, 614.406982421875, 670.234130859375, 726.061279296875, 781.888427734375, 837.715576171875, 893.542724609375, 949.369873046875, 1005.197021484375, 1061.024169921875, 1116.851318359375, 1172.678466796875, 1228.505615234375, 1284.332763671875, 1340.159912109375, 1395.987060546875, 1451.814208984375, 1507.641357421875, 1563.468505859375, 1619.295654296875, 1675.122802734375, 1730.949951171875, 1786.777099609375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 3.0, 6.0, 6.0, 11.0, 10.0, 20.0, 22.0, 21.0, 28.0, 35.0, 51.0, 73.0, 127.0, 123.0, 100.0, 78.0, 62.0, 47.0, 31.0, 33.0, 18.0, 14.0, 12.0, 12.0, 7.0, 8.0, 8.0, 6.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1279.698486328125, -1233.0745849609375, -1186.4508056640625, -1139.826904296875, -1093.203125, -1046.5792236328125, -999.955322265625, -953.3314819335938, -906.7076416015625, -860.0838012695312, -813.4599609375, -766.8360595703125, -720.2122192382812, -673.58837890625, -626.9644775390625, -580.3406372070312, -533.716796875, -487.09295654296875, -440.4690856933594, -393.84521484375, -347.22137451171875, -300.5975341796875, -253.97366333007812, -207.34979248046875, -160.7259521484375, -114.10209655761719, -67.47824096679688, -20.854385375976562, 25.76947021484375, 72.39332580566406, 119.01718139648438, 165.64105224609375, 212.2647705078125, 258.88861083984375, 305.5124816894531, 352.1363525390625, 398.76019287109375, 445.384033203125, 492.0079040527344, 538.6317749023438, 585.255615234375, 631.8794555664062, 678.5032958984375, 725.127197265625, 771.7510375976562, 818.3748779296875, 864.998779296875, 911.6226196289062, 958.2464599609375, 1004.8703002929688, 1051.494140625, 1098.1180419921875, 1144.741943359375, 1191.36572265625, 1237.9896240234375, 1284.613525390625, 1331.2373046875, 1377.8612060546875, 1424.4849853515625, 1471.10888671875, 1517.732666015625, 1564.3565673828125, 1610.98046875, 1657.604248046875, 1704.2281494140625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 8.0, 14.0, 15.0, 16.0, 20.0, 26.0, 23.0, 39.0, 27.0, 30.0, 38.0, 46.0, 55.0, 75.0, 64.0, 62.0, 55.0, 65.0, 38.0, 30.0, 31.0, 23.0, 24.0, 20.0, 24.0, 16.0, 15.0, 21.0, 7.0, 11.0, 7.0, 8.0, 9.0, 3.0, 3.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1612.0467529296875, -1564.2908935546875, -1516.534912109375, -1468.779052734375, -1421.023193359375, -1373.267333984375, -1325.511474609375, -1277.7554931640625, -1229.9996337890625, -1182.2437744140625, -1134.48779296875, -1086.73193359375, -1038.97607421875, -991.22021484375, -943.4642944335938, -895.7083740234375, -847.9525146484375, -800.1966552734375, -752.4407348632812, -704.684814453125, -656.928955078125, -609.173095703125, -561.4171752929688, -513.6612548828125, -465.9053955078125, -418.1495056152344, -370.39361572265625, -322.6377258300781, -274.8818359375, -227.12594604492188, -179.37005615234375, -131.61416625976562, -83.858154296875, -36.102264404296875, 11.65362548828125, 59.409515380859375, 107.1654052734375, 154.92129516601562, 202.67718505859375, 250.43307495117188, 298.18896484375, 345.9448547363281, 393.70074462890625, 441.4566345214844, 489.2125244140625, 536.9683837890625, 584.7243041992188, 632.480224609375, 680.236083984375, 727.991943359375, 775.7478637695312, 823.5037841796875, 871.2596435546875, 919.0155029296875, 966.7714233398438, 1014.52734375, 1062.283203125, 1110.0390625, 1157.794921875, 1205.5509033203125, 1253.3067626953125, 1301.0626220703125, 1348.818603515625, 1396.574462890625, 1444.330322265625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 9.0, 10.0, 12.0, 26.0, 34.0, 66.0, 92.0, 108.0, 177.0, 281.0, 415.0, 580.0, 932.0, 1343.0, 2071.0, 3285.0, 4980.0, 8122.0, 13395.0, 23531.0, 43091.0, 85659.0, 197450.0, 777587.0, 2531208.0, 270571.0, 105972.0, 51615.0, 28025.0, 15711.0, 9598.0, 6047.0, 3863.0, 2543.0, 1789.0, 1216.0, 827.0, 569.0, 410.0, 316.0, 211.0, 144.0, 116.0, 88.0, 52.0, 45.0, 30.0, 18.0, 20.0, 11.0, 10.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.578125, -25.634521484375, -24.69091796875, -23.747314453125, -22.8037109375, -21.860107421875, -20.91650390625, -19.972900390625, -19.029296875, -18.085693359375, -17.14208984375, -16.198486328125, -15.2548828125, -14.311279296875, -13.36767578125, -12.424072265625, -11.48046875, -10.536865234375, -9.59326171875, -8.649658203125, -7.7060546875, -6.762451171875, -5.81884765625, -4.875244140625, -3.931640625, -2.988037109375, -2.04443359375, -1.100830078125, -0.1572265625, 0.786376953125, 1.72998046875, 2.673583984375, 3.6171875, 4.560791015625, 5.50439453125, 6.447998046875, 7.3916015625, 8.335205078125, 9.27880859375, 10.222412109375, 11.166015625, 12.109619140625, 13.05322265625, 13.996826171875, 14.9404296875, 15.884033203125, 16.82763671875, 17.771240234375, 18.71484375, 19.658447265625, 20.60205078125, 21.545654296875, 22.4892578125, 23.432861328125, 24.37646484375, 25.320068359375, 26.263671875, 27.207275390625, 28.15087890625, 29.094482421875, 30.0380859375, 30.981689453125, 31.92529296875, 32.868896484375, 33.8125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 7.0, 2.0, 5.0, 4.0, 7.0, 9.0, 8.0, 12.0, 12.0, 18.0, 25.0, 25.0, 32.0, 39.0, 53.0, 60.0, 48.0, 65.0, 74.0, 73.0, 72.0, 55.0, 45.0, 56.0, 40.0, 36.0, 29.0, 16.0, 13.0, 15.0, 10.0, 10.0, 7.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.617706298828125, -2.52056884765625, -2.423431396484375, -2.3262939453125, -2.229156494140625, -2.13201904296875, -2.034881591796875, -1.937744140625, -1.840606689453125, -1.74346923828125, -1.646331787109375, -1.5491943359375, -1.452056884765625, -1.35491943359375, -1.257781982421875, -1.16064453125, -1.063507080078125, -0.96636962890625, -0.869232177734375, -0.7720947265625, -0.674957275390625, -0.57781982421875, -0.480682373046875, -0.383544921875, -0.286407470703125, -0.18927001953125, -0.092132568359375, 0.0050048828125, 0.102142333984375, 0.19927978515625, 0.296417236328125, 0.3935546875, 0.490692138671875, 0.58782958984375, 0.684967041015625, 0.7821044921875, 0.879241943359375, 0.97637939453125, 1.073516845703125, 1.170654296875, 1.267791748046875, 1.36492919921875, 1.462066650390625, 1.5592041015625, 1.656341552734375, 1.75347900390625, 1.850616455078125, 1.94775390625, 2.044891357421875, 2.14202880859375, 2.239166259765625, 2.3363037109375, 2.433441162109375, 2.53057861328125, 2.627716064453125, 2.724853515625, 2.821990966796875, 2.91912841796875, 3.016265869140625, 3.1134033203125, 3.210540771484375, 3.30767822265625, 3.404815673828125, 3.501953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 11.0, 21.0, 19.0, 20.0, 49.0, 66.0, 102.0, 256.0, 387.0, 670.0, 1250.0, 2367.0, 4601.0, 9543.0, 20680.0, 48211.0, 121742.0, 389460.0, 2598060.0, 699974.0, 177450.0, 66995.0, 27795.0, 12508.0, 5726.0, 2896.0, 1482.0, 843.0, 433.0, 257.0, 152.0, 103.0, 49.0, 35.0, 23.0, 19.0, 7.0, 14.0, 3.0, 1.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.90625, -22.18310546875, -21.4599609375, -20.73681640625, -20.013671875, -19.29052734375, -18.5673828125, -17.84423828125, -17.12109375, -16.39794921875, -15.6748046875, -14.95166015625, -14.228515625, -13.50537109375, -12.7822265625, -12.05908203125, -11.3359375, -10.61279296875, -9.8896484375, -9.16650390625, -8.443359375, -7.72021484375, -6.9970703125, -6.27392578125, -5.55078125, -4.82763671875, -4.1044921875, -3.38134765625, -2.658203125, -1.93505859375, -1.2119140625, -0.48876953125, 0.234375, 0.95751953125, 1.6806640625, 2.40380859375, 3.126953125, 3.85009765625, 4.5732421875, 5.29638671875, 6.01953125, 6.74267578125, 7.4658203125, 8.18896484375, 8.912109375, 9.63525390625, 10.3583984375, 11.08154296875, 11.8046875, 12.52783203125, 13.2509765625, 13.97412109375, 14.697265625, 15.42041015625, 16.1435546875, 16.86669921875, 17.58984375, 18.31298828125, 19.0361328125, 19.75927734375, 20.482421875, 21.20556640625, 21.9287109375, 22.65185546875, 23.375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 7.0, 9.0, 13.0, 13.0, 19.0, 29.0, 26.0, 31.0, 43.0, 50.0, 62.0, 80.0, 85.0, 100.0, 144.0, 182.0, 270.0, 489.0, 902.0, 387.0, 241.0, 174.0, 144.0, 93.0, 92.0, 74.0, 68.0, 54.0, 43.0, 52.0, 28.0, 17.0, 11.0, 15.0, 14.0, 4.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5703125, -6.353515625, -6.13671875, -5.919921875, -5.703125, -5.486328125, -5.26953125, -5.052734375, -4.8359375, -4.619140625, -4.40234375, -4.185546875, -3.96875, -3.751953125, -3.53515625, -3.318359375, -3.1015625, -2.884765625, -2.66796875, -2.451171875, -2.234375, -2.017578125, -1.80078125, -1.583984375, -1.3671875, -1.150390625, -0.93359375, -0.716796875, -0.5, -0.283203125, -0.06640625, 0.150390625, 0.3671875, 0.583984375, 0.80078125, 1.017578125, 1.234375, 1.451171875, 1.66796875, 1.884765625, 2.1015625, 2.318359375, 2.53515625, 2.751953125, 2.96875, 3.185546875, 3.40234375, 3.619140625, 3.8359375, 4.052734375, 4.26953125, 4.486328125, 4.703125, 4.919921875, 5.13671875, 5.353515625, 5.5703125, 5.787109375, 6.00390625, 6.220703125, 6.4375, 6.654296875, 6.87109375, 7.087890625, 7.3046875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 1.0, 3.0, 8.0, 11.0, 20.0, 36.0, 56.0, 100.0, 157.0, 213.0, 152.0, 111.0, 51.0, 42.0, 18.0, 9.0, 9.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.82499694824219, -104.59039306640625, -101.35578155517578, -98.12117767333984, -94.88656616210938, -91.65196228027344, -88.4173583984375, -85.18275451660156, -81.9481430053711, -78.71353912353516, -75.47892761230469, -72.24432373046875, -69.00971984863281, -65.77510833740234, -62.540504455566406, -59.3058967590332, -56.0712890625, -52.8366813659668, -49.602073669433594, -46.367469787597656, -43.13286209106445, -39.89825439453125, -36.66365051269531, -33.42904281616211, -30.194435119628906, -26.959827423095703, -23.725221633911133, -20.490615844726562, -17.25600814819336, -14.021400451660156, -10.786794662475586, -7.552188873291016, -4.3175811767578125, -1.0829744338989258, 2.151632308959961, 5.386239051818848, 8.620845794677734, 11.855453491210938, 15.090059280395508, 18.324665069580078, 21.55927276611328, 24.793880462646484, 28.028486251831055, 31.263092041015625, 34.49769973754883, 37.73230743408203, 40.96691131591797, 44.20151901245117, 47.436126708984375, 50.67073440551758, 53.90534210205078, 57.13994598388672, 60.37455368041992, 63.609161376953125, 66.84376525878906, 70.078369140625, 73.31298065185547, 76.5475845336914, 79.78219604492188, 83.01679992675781, 86.25140380859375, 89.48601531982422, 92.72061920166016, 95.95523071289062, 99.18983459472656]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 7.0, 13.0, 8.0, 15.0, 18.0, 11.0, 25.0, 29.0, 26.0, 36.0, 41.0, 45.0, 40.0, 50.0, 44.0, 58.0, 54.0, 60.0, 54.0, 46.0, 63.0, 50.0, 33.0, 33.0, 29.0, 25.0, 11.0, 15.0, 17.0, 12.0, 6.0, 8.0, 9.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.41141128540039, -38.95561218261719, -37.499813079833984, -36.04401397705078, -34.58821487426758, -33.132415771484375, -31.676616668701172, -30.22081756591797, -28.765018463134766, -27.309219360351562, -25.85342025756836, -24.397621154785156, -22.941822052001953, -21.48602294921875, -20.030223846435547, -18.574424743652344, -17.11862564086914, -15.662826538085938, -14.207027435302734, -12.751228332519531, -11.295429229736328, -9.839630126953125, -8.383831024169922, -6.928031921386719, -5.472232818603516, -4.0164337158203125, -2.5606346130371094, -1.1048355102539062, 0.3509635925292969, 1.8067626953125, 3.262561798095703, 4.718360900878906, 6.174163818359375, 7.629962921142578, 9.085762023925781, 10.541561126708984, 11.997360229492188, 13.45315933227539, 14.908958435058594, 16.364757537841797, 17.820556640625, 19.276355743408203, 20.732154846191406, 22.18795394897461, 23.643753051757812, 25.099552154541016, 26.55535125732422, 28.011150360107422, 29.466949462890625, 30.922748565673828, 32.37854766845703, 33.834346771240234, 35.29014587402344, 36.74594497680664, 38.201744079589844, 39.65754318237305, 41.11334228515625, 42.56914138793945, 44.024940490722656, 45.48073959350586, 46.93653869628906, 48.392337799072266, 49.84813690185547, 51.30393600463867, 52.759735107421875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 8.0, 9.0, 17.0, 19.0, 20.0, 37.0, 47.0, 68.0, 88.0, 109.0, 172.0, 238.0, 340.0, 538.0, 817.0, 1243.0, 2010.0, 3153.0, 5321.0, 9482.0, 17515.0, 34945.0, 74938.0, 206868.0, 435783.0, 137241.0, 56600.0, 27080.0, 14057.0, 7682.0, 4527.0, 2677.0, 1634.0, 1068.0, 682.0, 465.0, 312.0, 208.0, 146.0, 117.0, 65.0, 56.0, 51.0, 26.0, 22.0, 14.0, 14.0, 6.0, 4.0, 12.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-12.71875, -12.29931640625, -11.8798828125, -11.46044921875, -11.041015625, -10.62158203125, -10.2021484375, -9.78271484375, -9.36328125, -8.94384765625, -8.5244140625, -8.10498046875, -7.685546875, -7.26611328125, -6.8466796875, -6.42724609375, -6.0078125, -5.58837890625, -5.1689453125, -4.74951171875, -4.330078125, -3.91064453125, -3.4912109375, -3.07177734375, -2.65234375, -2.23291015625, -1.8134765625, -1.39404296875, -0.974609375, -0.55517578125, -0.1357421875, 0.28369140625, 0.703125, 1.12255859375, 1.5419921875, 1.96142578125, 2.380859375, 2.80029296875, 3.2197265625, 3.63916015625, 4.05859375, 4.47802734375, 4.8974609375, 5.31689453125, 5.736328125, 6.15576171875, 6.5751953125, 6.99462890625, 7.4140625, 7.83349609375, 8.2529296875, 8.67236328125, 9.091796875, 9.51123046875, 9.9306640625, 10.35009765625, 10.76953125, 11.18896484375, 11.6083984375, 12.02783203125, 12.447265625, 12.86669921875, 13.2861328125, 13.70556640625, 14.125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 11.0, 10.0, 13.0, 11.0, 30.0, 22.0, 33.0, 49.0, 32.0, 39.0, 68.0, 53.0, 63.0, 65.0, 74.0, 74.0, 59.0, 40.0, 54.0, 37.0, 29.0, 22.0, 23.0, 26.0, 7.0, 6.0, 8.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.16015625, -3.053375244140625, -2.94659423828125, -2.839813232421875, -2.7330322265625, -2.626251220703125, -2.51947021484375, -2.412689208984375, -2.305908203125, -2.199127197265625, -2.09234619140625, -1.985565185546875, -1.8787841796875, -1.772003173828125, -1.66522216796875, -1.558441162109375, -1.45166015625, -1.344879150390625, -1.23809814453125, -1.131317138671875, -1.0245361328125, -0.917755126953125, -0.81097412109375, -0.704193115234375, -0.597412109375, -0.490631103515625, -0.38385009765625, -0.277069091796875, -0.1702880859375, -0.063507080078125, 0.04327392578125, 0.150054931640625, 0.2568359375, 0.363616943359375, 0.47039794921875, 0.577178955078125, 0.6839599609375, 0.790740966796875, 0.89752197265625, 1.004302978515625, 1.111083984375, 1.217864990234375, 1.32464599609375, 1.431427001953125, 1.5382080078125, 1.644989013671875, 1.75177001953125, 1.858551025390625, 1.96533203125, 2.072113037109375, 2.17889404296875, 2.285675048828125, 2.3924560546875, 2.499237060546875, 2.60601806640625, 2.712799072265625, 2.819580078125, 2.926361083984375, 3.03314208984375, 3.139923095703125, 3.2467041015625, 3.353485107421875, 3.46026611328125, 3.567047119140625, 3.673828125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 11.0, 13.0, 21.0, 20.0, 23.0, 36.0, 64.0, 83.0, 156.0, 297.0, 728.0, 1693.0, 5409.0, 22065.0, 161376.0, 763423.0, 74016.0, 13141.0, 3522.0, 1315.0, 499.0, 243.0, 126.0, 85.0, 49.0, 41.0, 18.0, 18.0, 11.0, 11.0, 8.0, 3.0, 6.0, 1.0, 5.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-31.34375, -30.374267578125, -29.40478515625, -28.435302734375, -27.4658203125, -26.496337890625, -25.52685546875, -24.557373046875, -23.587890625, -22.618408203125, -21.64892578125, -20.679443359375, -19.7099609375, -18.740478515625, -17.77099609375, -16.801513671875, -15.83203125, -14.862548828125, -13.89306640625, -12.923583984375, -11.9541015625, -10.984619140625, -10.01513671875, -9.045654296875, -8.076171875, -7.106689453125, -6.13720703125, -5.167724609375, -4.1982421875, -3.228759765625, -2.25927734375, -1.289794921875, -0.3203125, 0.649169921875, 1.61865234375, 2.588134765625, 3.5576171875, 4.527099609375, 5.49658203125, 6.466064453125, 7.435546875, 8.405029296875, 9.37451171875, 10.343994140625, 11.3134765625, 12.282958984375, 13.25244140625, 14.221923828125, 15.19140625, 16.160888671875, 17.13037109375, 18.099853515625, 19.0693359375, 20.038818359375, 21.00830078125, 21.977783203125, 22.947265625, 23.916748046875, 24.88623046875, 25.855712890625, 26.8251953125, 27.794677734375, 28.76416015625, 29.733642578125, 30.703125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 2.0, 2.0, 6.0, 3.0, 10.0, 13.0, 6.0, 9.0, 16.0, 13.0, 12.0, 17.0, 25.0, 20.0, 19.0, 37.0, 24.0, 31.0, 46.0, 45.0, 46.0, 35.0, 44.0, 43.0, 36.0, 46.0, 40.0, 44.0, 40.0, 30.0, 34.0, 22.0, 24.0, 21.0, 22.0, 26.0, 21.0, 12.0, 13.0, 10.0, 8.0, 3.0, 5.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.3203125, -10.96435546875, -10.6083984375, -10.25244140625, -9.896484375, -9.54052734375, -9.1845703125, -8.82861328125, -8.47265625, -8.11669921875, -7.7607421875, -7.40478515625, -7.048828125, -6.69287109375, -6.3369140625, -5.98095703125, -5.625, -5.26904296875, -4.9130859375, -4.55712890625, -4.201171875, -3.84521484375, -3.4892578125, -3.13330078125, -2.77734375, -2.42138671875, -2.0654296875, -1.70947265625, -1.353515625, -0.99755859375, -0.6416015625, -0.28564453125, 0.0703125, 0.42626953125, 0.7822265625, 1.13818359375, 1.494140625, 1.85009765625, 2.2060546875, 2.56201171875, 2.91796875, 3.27392578125, 3.6298828125, 3.98583984375, 4.341796875, 4.69775390625, 5.0537109375, 5.40966796875, 5.765625, 6.12158203125, 6.4775390625, 6.83349609375, 7.189453125, 7.54541015625, 7.9013671875, 8.25732421875, 8.61328125, 8.96923828125, 9.3251953125, 9.68115234375, 10.037109375, 10.39306640625, 10.7490234375, 11.10498046875, 11.4609375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 4.0, 10.0, 9.0, 22.0, 30.0, 38.0, 91.0, 132.0, 326.0, 786.0, 2562.0, 15816.0, 771468.0, 244392.0, 9695.0, 1934.0, 625.0, 276.0, 124.0, 78.0, 43.0, 28.0, 19.0, 11.0, 15.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.8125, -41.27734375, -39.7421875, -38.20703125, -36.671875, -35.13671875, -33.6015625, -32.06640625, -30.53125, -28.99609375, -27.4609375, -25.92578125, -24.390625, -22.85546875, -21.3203125, -19.78515625, -18.25, -16.71484375, -15.1796875, -13.64453125, -12.109375, -10.57421875, -9.0390625, -7.50390625, -5.96875, -4.43359375, -2.8984375, -1.36328125, 0.171875, 1.70703125, 3.2421875, 4.77734375, 6.3125, 7.84765625, 9.3828125, 10.91796875, 12.453125, 13.98828125, 15.5234375, 17.05859375, 18.59375, 20.12890625, 21.6640625, 23.19921875, 24.734375, 26.26953125, 27.8046875, 29.33984375, 30.875, 32.41015625, 33.9453125, 35.48046875, 37.015625, 38.55078125, 40.0859375, 41.62109375, 43.15625, 44.69140625, 46.2265625, 47.76171875, 49.296875, 50.83203125, 52.3671875, 53.90234375, 55.4375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 2.0, 6.0, 5.0, 4.0, 3.0, 5.0, 15.0, 9.0, 5.0, 17.0, 18.0, 28.0, 42.0, 30.0, 54.0, 70.0, 64.0, 88.0, 84.0, 81.0, 73.0, 50.0, 69.0, 32.0, 30.0, 23.0, 23.0, 11.0, 8.0, 10.0, 3.0, 6.0, 10.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008544921875, -0.0008272528648376465, -0.000800013542175293, -0.0007727742195129395, -0.0007455348968505859, -0.0007182955741882324, -0.0006910562515258789, -0.0006638169288635254, -0.0006365776062011719, -0.0006093382835388184, -0.0005820989608764648, -0.0005548596382141113, -0.0005276203155517578, -0.0005003809928894043, -0.0004731416702270508, -0.00044590234756469727, -0.00041866302490234375, -0.00039142370223999023, -0.0003641843795776367, -0.0003369450569152832, -0.0003097057342529297, -0.00028246641159057617, -0.00025522708892822266, -0.00022798776626586914, -0.00020074844360351562, -0.0001735091209411621, -0.0001462697982788086, -0.00011903047561645508, -9.179115295410156e-05, -6.455183029174805e-05, -3.731250762939453e-05, -1.0073184967041016e-05, 1.71661376953125e-05, 4.4405460357666016e-05, 7.164478302001953e-05, 9.888410568237305e-05, 0.00012612342834472656, 0.00015336275100708008, 0.0001806020736694336, 0.0002078413963317871, 0.00023508071899414062, 0.00026232004165649414, 0.00028955936431884766, 0.00031679868698120117, 0.0003440380096435547, 0.0003712773323059082, 0.0003985166549682617, 0.00042575597763061523, 0.00045299530029296875, 0.00048023462295532227, 0.0005074739456176758, 0.0005347132682800293, 0.0005619525909423828, 0.0005891919136047363, 0.0006164312362670898, 0.0006436705589294434, 0.0006709098815917969, 0.0006981492042541504, 0.0007253885269165039, 0.0007526278495788574, 0.0007798671722412109, 0.0008071064949035645, 0.000834345817565918, 0.0008615851402282715, 0.000888824462890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 8.0, 13.0, 17.0, 25.0, 22.0, 41.0, 52.0, 78.0, 130.0, 198.0, 310.0, 487.0, 807.0, 1364.0, 2474.0, 4792.0, 10393.0, 26000.0, 87835.0, 505057.0, 310596.0, 60742.0, 19642.0, 8292.0, 3913.0, 2083.0, 1214.0, 738.0, 421.0, 264.0, 166.0, 121.0, 72.0, 61.0, 39.0, 27.0, 15.0, 13.0, 7.0, 10.0, 2.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-16.234375, -15.7550048828125, -15.275634765625, -14.7962646484375, -14.31689453125, -13.8375244140625, -13.358154296875, -12.8787841796875, -12.3994140625, -11.9200439453125, -11.440673828125, -10.9613037109375, -10.48193359375, -10.0025634765625, -9.523193359375, -9.0438232421875, -8.564453125, -8.0850830078125, -7.605712890625, -7.1263427734375, -6.64697265625, -6.1676025390625, -5.688232421875, -5.2088623046875, -4.7294921875, -4.2501220703125, -3.770751953125, -3.2913818359375, -2.81201171875, -2.3326416015625, -1.853271484375, -1.3739013671875, -0.89453125, -0.4151611328125, 0.064208984375, 0.5435791015625, 1.02294921875, 1.5023193359375, 1.981689453125, 2.4610595703125, 2.9404296875, 3.4197998046875, 3.899169921875, 4.3785400390625, 4.85791015625, 5.3372802734375, 5.816650390625, 6.2960205078125, 6.775390625, 7.2547607421875, 7.734130859375, 8.2135009765625, 8.69287109375, 9.1722412109375, 9.651611328125, 10.1309814453125, 10.6103515625, 11.0897216796875, 11.569091796875, 12.0484619140625, 12.52783203125, 13.0072021484375, 13.486572265625, 13.9659423828125, 14.4453125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 5.0, 5.0, 2.0, 7.0, 10.0, 12.0, 10.0, 13.0, 20.0, 21.0, 27.0, 38.0, 36.0, 42.0, 50.0, 43.0, 60.0, 68.0, 64.0, 64.0, 63.0, 52.0, 55.0, 47.0, 28.0, 30.0, 21.0, 11.0, 18.0, 8.0, 9.0, 12.0, 9.0, 8.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.76953125, -7.52935791015625, -7.2891845703125, -7.04901123046875, -6.808837890625, -6.56866455078125, -6.3284912109375, -6.08831787109375, -5.84814453125, -5.60797119140625, -5.3677978515625, -5.12762451171875, -4.887451171875, -4.64727783203125, -4.4071044921875, -4.16693115234375, -3.9267578125, -3.68658447265625, -3.4464111328125, -3.20623779296875, -2.966064453125, -2.72589111328125, -2.4857177734375, -2.24554443359375, -2.00537109375, -1.76519775390625, -1.5250244140625, -1.28485107421875, -1.044677734375, -0.80450439453125, -0.5643310546875, -0.32415771484375, -0.083984375, 0.15618896484375, 0.3963623046875, 0.63653564453125, 0.876708984375, 1.11688232421875, 1.3570556640625, 1.59722900390625, 1.83740234375, 2.07757568359375, 2.3177490234375, 2.55792236328125, 2.798095703125, 3.03826904296875, 3.2784423828125, 3.51861572265625, 3.7587890625, 3.99896240234375, 4.2391357421875, 4.47930908203125, 4.719482421875, 4.95965576171875, 5.1998291015625, 5.44000244140625, 5.68017578125, 5.92034912109375, 6.1605224609375, 6.40069580078125, 6.640869140625, 6.88104248046875, 7.1212158203125, 7.36138916015625, 7.6015625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 9.0, 8.0, 9.0, 18.0, 35.0, 57.0, 137.0, 234.0, 227.0, 136.0, 61.0, 26.0, 17.0, 14.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-256.1457824707031, -249.74057006835938, -243.33535766601562, -236.93014526367188, -230.52491760253906, -224.1197052001953, -217.71449279785156, -211.3092803955078, -204.904052734375, -198.49884033203125, -192.0936279296875, -185.68841552734375, -179.28318786621094, -172.8779754638672, -166.47276306152344, -160.0675506591797, -153.66233825683594, -147.2571258544922, -140.85191345214844, -134.44668579101562, -128.04147338867188, -121.63626098632812, -115.23104858398438, -108.82583618164062, -102.42061614990234, -96.0154037475586, -89.61018371582031, -83.20497131347656, -76.79975891113281, -70.39453887939453, -63.98932647705078, -57.584110260009766, -51.17890930175781, -44.7736930847168, -38.36847686767578, -31.96326446533203, -25.558048248291016, -19.15283203125, -12.74761962890625, -6.342403411865234, 0.06281280517578125, 6.4680280685424805, 12.87324333190918, 19.278457641601562, 25.683673858642578, 32.088890075683594, 38.494102478027344, 44.89931869506836, 51.304534912109375, 57.70975112915039, 64.1149673461914, 70.52017974853516, 76.92539978027344, 83.33061218261719, 89.73582458496094, 96.14103698730469, 102.54625701904297, 108.95146942138672, 115.356689453125, 121.76190185546875, 128.1671142578125, 134.57232666015625, 140.9775390625, 147.3827667236328, 153.78797912597656]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 1.0, 9.0, 4.0, 9.0, 10.0, 12.0, 32.0, 42.0, 74.0, 88.0, 110.0, 137.0, 127.0, 99.0, 73.0, 48.0, 38.0, 16.0, 15.0, 5.0, 6.0, 5.0, 7.0, 5.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-273.7947692871094, -266.71441650390625, -259.6340637207031, -252.55369567871094, -245.47332763671875, -238.39297485351562, -231.31260681152344, -224.2322540283203, -217.15188598632812, -210.071533203125, -202.9911651611328, -195.9108123779297, -188.8304443359375, -181.75009155273438, -174.6697235107422, -167.58937072753906, -160.50900268554688, -153.42864990234375, -146.34828186035156, -139.26792907714844, -132.18756103515625, -125.10720825195312, -118.02684020996094, -110.94648742675781, -103.86613464355469, -96.78577423095703, -89.70541381835938, -82.62505340576172, -75.54469299316406, -68.46434020996094, -61.383975982666016, -54.30361557006836, -47.22325134277344, -40.14289093017578, -33.062530517578125, -25.9821720123291, -18.901811599731445, -11.821453094482422, -4.741092681884766, 2.3392677307128906, 9.419628143310547, 16.499988555908203, 23.58034896850586, 30.660707473754883, 37.741065979003906, 44.82142639160156, 51.90178680419922, 58.982147216796875, 66.06250762939453, 73.14286804199219, 80.22322845458984, 87.3035888671875, 94.38394927978516, 101.46430969238281, 108.54466247558594, 115.62503051757812, 122.70538330078125, 129.78573608398438, 136.86610412597656, 143.9464569091797, 151.02682495117188, 158.107177734375, 165.1875457763672, 172.2678985595703, 179.3482666015625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 7.0, 6.0, 18.0, 12.0, 16.0, 38.0, 46.0, 58.0, 95.0, 153.0, 252.0, 461.0, 793.0, 1527.0, 3276.0, 7821.0, 22855.0, 97458.0, 3759496.0, 241640.0, 36912.0, 11739.0, 4654.0, 2159.0, 1094.0, 641.0, 351.0, 210.0, 164.0, 105.0, 70.0, 43.0, 27.0, 18.0, 16.0, 18.0, 9.0, 7.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-72.0625, -69.71484375, -67.3671875, -65.01953125, -62.671875, -60.32421875, -57.9765625, -55.62890625, -53.28125, -50.93359375, -48.5859375, -46.23828125, -43.890625, -41.54296875, -39.1953125, -36.84765625, -34.5, -32.15234375, -29.8046875, -27.45703125, -25.109375, -22.76171875, -20.4140625, -18.06640625, -15.71875, -13.37109375, -11.0234375, -8.67578125, -6.328125, -3.98046875, -1.6328125, 0.71484375, 3.0625, 5.41015625, 7.7578125, 10.10546875, 12.453125, 14.80078125, 17.1484375, 19.49609375, 21.84375, 24.19140625, 26.5390625, 28.88671875, 31.234375, 33.58203125, 35.9296875, 38.27734375, 40.625, 42.97265625, 45.3203125, 47.66796875, 50.015625, 52.36328125, 54.7109375, 57.05859375, 59.40625, 61.75390625, 64.1015625, 66.44921875, 68.796875, 71.14453125, 73.4921875, 75.83984375, 78.1875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 6.0, 5.0, 9.0, 10.0, 8.0, 5.0, 10.0, 16.0, 14.0, 20.0, 33.0, 42.0, 29.0, 38.0, 50.0, 48.0, 56.0, 64.0, 52.0, 68.0, 67.0, 61.0, 37.0, 48.0, 30.0, 32.0, 31.0, 25.0, 18.0, 11.0, 17.0, 7.0, 10.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.01953125, -2.920623779296875, -2.82171630859375, -2.722808837890625, -2.6239013671875, -2.524993896484375, -2.42608642578125, -2.327178955078125, -2.228271484375, -2.129364013671875, -2.03045654296875, -1.931549072265625, -1.8326416015625, -1.733734130859375, -1.63482666015625, -1.535919189453125, -1.43701171875, -1.338104248046875, -1.23919677734375, -1.140289306640625, -1.0413818359375, -0.942474365234375, -0.84356689453125, -0.744659423828125, -0.645751953125, -0.546844482421875, -0.44793701171875, -0.349029541015625, -0.2501220703125, -0.151214599609375, -0.05230712890625, 0.046600341796875, 0.1455078125, 0.244415283203125, 0.34332275390625, 0.442230224609375, 0.5411376953125, 0.640045166015625, 0.73895263671875, 0.837860107421875, 0.936767578125, 1.035675048828125, 1.13458251953125, 1.233489990234375, 1.3323974609375, 1.431304931640625, 1.53021240234375, 1.629119873046875, 1.72802734375, 1.826934814453125, 1.92584228515625, 2.024749755859375, 2.1236572265625, 2.222564697265625, 2.32147216796875, 2.420379638671875, 2.519287109375, 2.618194580078125, 2.71710205078125, 2.816009521484375, 2.9149169921875, 3.013824462890625, 3.11273193359375, 3.211639404296875, 3.310546875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 5.0, 9.0, 12.0, 7.0, 27.0, 42.0, 55.0, 81.0, 139.0, 205.0, 344.0, 502.0, 829.0, 1393.0, 2390.0, 4198.0, 7750.0, 14968.0, 31671.0, 78155.0, 297245.0, 3331789.0, 282929.0, 76400.0, 30783.0, 14610.0, 7694.0, 4100.0, 2391.0, 1363.0, 812.0, 521.0, 327.0, 174.0, 122.0, 77.0, 61.0, 29.0, 25.0, 20.0, 9.0, 6.0, 8.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.03125, -33.84326171875, -32.6552734375, -31.46728515625, -30.279296875, -29.09130859375, -27.9033203125, -26.71533203125, -25.52734375, -24.33935546875, -23.1513671875, -21.96337890625, -20.775390625, -19.58740234375, -18.3994140625, -17.21142578125, -16.0234375, -14.83544921875, -13.6474609375, -12.45947265625, -11.271484375, -10.08349609375, -8.8955078125, -7.70751953125, -6.51953125, -5.33154296875, -4.1435546875, -2.95556640625, -1.767578125, -0.57958984375, 0.6083984375, 1.79638671875, 2.984375, 4.17236328125, 5.3603515625, 6.54833984375, 7.736328125, 8.92431640625, 10.1123046875, 11.30029296875, 12.48828125, 13.67626953125, 14.8642578125, 16.05224609375, 17.240234375, 18.42822265625, 19.6162109375, 20.80419921875, 21.9921875, 23.18017578125, 24.3681640625, 25.55615234375, 26.744140625, 27.93212890625, 29.1201171875, 30.30810546875, 31.49609375, 32.68408203125, 33.8720703125, 35.06005859375, 36.248046875, 37.43603515625, 38.6240234375, 39.81201171875, 41.0]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 2.0, 4.0, 6.0, 3.0, 9.0, 8.0, 10.0, 22.0, 6.0, 11.0, 21.0, 30.0, 28.0, 50.0, 60.0, 77.0, 116.0, 188.0, 334.0, 2009.0, 411.0, 196.0, 111.0, 73.0, 43.0, 51.0, 39.0, 26.0, 20.0, 21.0, 21.0, 8.0, 9.0, 8.0, 11.0, 7.0, 5.0, 10.0, 0.0, 4.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.47265625, -5.29412841796875, -5.1156005859375, -4.93707275390625, -4.758544921875, -4.58001708984375, -4.4014892578125, -4.22296142578125, -4.04443359375, -3.86590576171875, -3.6873779296875, -3.50885009765625, -3.330322265625, -3.15179443359375, -2.9732666015625, -2.79473876953125, -2.6162109375, -2.43768310546875, -2.2591552734375, -2.08062744140625, -1.902099609375, -1.72357177734375, -1.5450439453125, -1.36651611328125, -1.18798828125, -1.00946044921875, -0.8309326171875, -0.65240478515625, -0.473876953125, -0.29534912109375, -0.1168212890625, 0.06170654296875, 0.240234375, 0.41876220703125, 0.5972900390625, 0.77581787109375, 0.954345703125, 1.13287353515625, 1.3114013671875, 1.48992919921875, 1.66845703125, 1.84698486328125, 2.0255126953125, 2.20404052734375, 2.382568359375, 2.56109619140625, 2.7396240234375, 2.91815185546875, 3.0966796875, 3.27520751953125, 3.4537353515625, 3.63226318359375, 3.810791015625, 3.98931884765625, 4.1678466796875, 4.34637451171875, 4.52490234375, 4.70343017578125, 4.8819580078125, 5.06048583984375, 5.239013671875, 5.41754150390625, 5.5960693359375, 5.77459716796875, 5.953125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 3.0, 12.0, 25.0, 50.0, 85.0, 130.0, 201.0, 201.0, 140.0, 70.0, 34.0, 22.0, 8.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.876670837402344, -35.98329162597656, -34.08991241455078, -32.196533203125, -30.303150177001953, -28.409770965576172, -26.51639175415039, -24.62301254272461, -22.729631423950195, -20.836252212524414, -18.94287109375, -17.04949188232422, -15.156111717224121, -13.262731552124023, -11.369352340698242, -9.475972175598145, -7.582592010498047, -5.689211845397949, -3.7958321571350098, -1.9024524688720703, -0.009072303771972656, 1.884307861328125, 3.7776870727539062, 5.671067237854004, 7.564447402954102, 9.4578275680542, 11.351207733154297, 13.244586944580078, 15.137967109680176, 17.031347274780273, 18.924726486206055, 20.81810760498047, 22.71148681640625, 24.60486602783203, 26.498247146606445, 28.391626358032227, 30.28500747680664, 32.17838668823242, 34.0717658996582, 35.965145111083984, 37.85852813720703, 39.75190734863281, 41.645286560058594, 43.538665771484375, 45.43204879760742, 47.3254280090332, 49.218807220458984, 51.112186431884766, 53.00556564331055, 54.89894485473633, 56.79232406616211, 58.685707092285156, 60.57908630371094, 62.47246551513672, 64.3658447265625, 66.25922393798828, 68.15260314941406, 70.04598236083984, 71.93936157226562, 73.8327407836914, 75.72611999511719, 77.6195068359375, 79.51287841796875, 81.40626525878906, 83.29964447021484]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 7.0, 6.0, 7.0, 11.0, 10.0, 11.0, 17.0, 18.0, 21.0, 36.0, 26.0, 30.0, 41.0, 36.0, 37.0, 46.0, 45.0, 55.0, 51.0, 42.0, 50.0, 40.0, 54.0, 40.0, 43.0, 27.0, 31.0, 31.0, 24.0, 20.0, 22.0, 18.0, 8.0, 6.0, 4.0, 3.0, 9.0, 4.0, 4.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.90411949157715, -18.21017837524414, -17.516237258911133, -16.822296142578125, -16.128353118896484, -15.434412956237793, -14.740470886230469, -14.046529769897461, -13.352588653564453, -12.658647537231445, -11.964706420898438, -11.270764350891113, -10.576823234558105, -9.882882118225098, -9.188940048217773, -8.494998931884766, -7.801057815551758, -7.10711669921875, -6.413175106048584, -5.719233512878418, -5.02529239654541, -4.331351280212402, -3.6374096870422363, -2.9434680938720703, -2.2495269775390625, -1.5555856227874756, -0.8616442680358887, -0.16770291328430176, 0.5262384414672852, 1.220179796218872, 1.914121150970459, 2.608062744140625, 3.302003860473633, 3.9959452152252197, 4.689886569976807, 5.383828163146973, 6.0777692794799805, 6.771710395812988, 7.465651988983154, 8.15959358215332, 8.853534698486328, 9.547475814819336, 10.241416931152344, 10.935359001159668, 11.629300117492676, 12.323241233825684, 13.017183303833008, 13.711124420166016, 14.405065536499023, 15.099006652832031, 15.792947769165039, 16.486888885498047, 17.180831909179688, 17.874773025512695, 18.568714141845703, 19.26265525817871, 19.95659637451172, 20.650537490844727, 21.344478607177734, 22.038419723510742, 22.73236083984375, 23.42630386352539, 24.1202449798584, 24.814186096191406, 25.508127212524414]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 6.0, 6.0, 9.0, 9.0, 9.0, 23.0, 14.0, 31.0, 61.0, 77.0, 98.0, 132.0, 243.0, 372.0, 639.0, 1041.0, 1825.0, 3468.0, 6497.0, 13271.0, 29266.0, 68498.0, 208904.0, 462752.0, 149587.0, 54525.0, 23738.0, 10975.0, 5549.0, 2899.0, 1535.0, 950.0, 546.0, 343.0, 243.0, 140.0, 99.0, 67.0, 34.0, 24.0, 17.0, 10.0, 12.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-29.3125, -28.279296875, -27.24609375, -26.212890625, -25.1796875, -24.146484375, -23.11328125, -22.080078125, -21.046875, -20.013671875, -18.98046875, -17.947265625, -16.9140625, -15.880859375, -14.84765625, -13.814453125, -12.78125, -11.748046875, -10.71484375, -9.681640625, -8.6484375, -7.615234375, -6.58203125, -5.548828125, -4.515625, -3.482421875, -2.44921875, -1.416015625, -0.3828125, 0.650390625, 1.68359375, 2.716796875, 3.75, 4.783203125, 5.81640625, 6.849609375, 7.8828125, 8.916015625, 9.94921875, 10.982421875, 12.015625, 13.048828125, 14.08203125, 15.115234375, 16.1484375, 17.181640625, 18.21484375, 19.248046875, 20.28125, 21.314453125, 22.34765625, 23.380859375, 24.4140625, 25.447265625, 26.48046875, 27.513671875, 28.546875, 29.580078125, 30.61328125, 31.646484375, 32.6796875, 33.712890625, 34.74609375, 35.779296875, 36.8125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 6.0, 9.0, 5.0, 6.0, 6.0, 13.0, 13.0, 21.0, 22.0, 29.0, 28.0, 33.0, 39.0, 42.0, 32.0, 60.0, 59.0, 64.0, 67.0, 57.0, 52.0, 57.0, 47.0, 34.0, 25.0, 31.0, 24.0, 26.0, 20.0, 23.0, 8.0, 7.0, 12.0, 13.0, 3.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.79296875, -2.693695068359375, -2.59442138671875, -2.495147705078125, -2.3958740234375, -2.296600341796875, -2.19732666015625, -2.098052978515625, -1.998779296875, -1.899505615234375, -1.80023193359375, -1.700958251953125, -1.6016845703125, -1.502410888671875, -1.40313720703125, -1.303863525390625, -1.20458984375, -1.105316162109375, -1.00604248046875, -0.906768798828125, -0.8074951171875, -0.708221435546875, -0.60894775390625, -0.509674072265625, -0.410400390625, -0.311126708984375, -0.21185302734375, -0.112579345703125, -0.0133056640625, 0.085968017578125, 0.18524169921875, 0.284515380859375, 0.3837890625, 0.483062744140625, 0.58233642578125, 0.681610107421875, 0.7808837890625, 0.880157470703125, 0.97943115234375, 1.078704833984375, 1.177978515625, 1.277252197265625, 1.37652587890625, 1.475799560546875, 1.5750732421875, 1.674346923828125, 1.77362060546875, 1.872894287109375, 1.97216796875, 2.071441650390625, 2.17071533203125, 2.269989013671875, 2.3692626953125, 2.468536376953125, 2.56781005859375, 2.667083740234375, 2.766357421875, 2.865631103515625, 2.96490478515625, 3.064178466796875, 3.1634521484375, 3.262725830078125, 3.36199951171875, 3.461273193359375, 3.560546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 7.0, 11.0, 11.0, 20.0, 15.0, 36.0, 46.0, 66.0, 102.0, 131.0, 187.0, 299.0, 498.0, 860.0, 1506.0, 2996.0, 6423.0, 14908.0, 39402.0, 123822.0, 493835.0, 253832.0, 66643.0, 23659.0, 9687.0, 4401.0, 2153.0, 1158.0, 677.0, 386.0, 221.0, 164.0, 107.0, 75.0, 57.0, 46.0, 27.0, 29.0, 14.0, 9.0, 3.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-31.375, -30.4453125, -29.515625, -28.5859375, -27.65625, -26.7265625, -25.796875, -24.8671875, -23.9375, -23.0078125, -22.078125, -21.1484375, -20.21875, -19.2890625, -18.359375, -17.4296875, -16.5, -15.5703125, -14.640625, -13.7109375, -12.78125, -11.8515625, -10.921875, -9.9921875, -9.0625, -8.1328125, -7.203125, -6.2734375, -5.34375, -4.4140625, -3.484375, -2.5546875, -1.625, -0.6953125, 0.234375, 1.1640625, 2.09375, 3.0234375, 3.953125, 4.8828125, 5.8125, 6.7421875, 7.671875, 8.6015625, 9.53125, 10.4609375, 11.390625, 12.3203125, 13.25, 14.1796875, 15.109375, 16.0390625, 16.96875, 17.8984375, 18.828125, 19.7578125, 20.6875, 21.6171875, 22.546875, 23.4765625, 24.40625, 25.3359375, 26.265625, 27.1953125, 28.125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 11.0, 7.0, 7.0, 10.0, 29.0, 22.0, 34.0, 48.0, 51.0, 43.0, 48.0, 55.0, 63.0, 59.0, 72.0, 69.0, 71.0, 53.0, 48.0, 41.0, 40.0, 20.0, 24.0, 24.0, 10.0, 9.0, 11.0, 7.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.796875, -17.200439453125, -16.60400390625, -16.007568359375, -15.4111328125, -14.814697265625, -14.21826171875, -13.621826171875, -13.025390625, -12.428955078125, -11.83251953125, -11.236083984375, -10.6396484375, -10.043212890625, -9.44677734375, -8.850341796875, -8.25390625, -7.657470703125, -7.06103515625, -6.464599609375, -5.8681640625, -5.271728515625, -4.67529296875, -4.078857421875, -3.482421875, -2.885986328125, -2.28955078125, -1.693115234375, -1.0966796875, -0.500244140625, 0.09619140625, 0.692626953125, 1.2890625, 1.885498046875, 2.48193359375, 3.078369140625, 3.6748046875, 4.271240234375, 4.86767578125, 5.464111328125, 6.060546875, 6.656982421875, 7.25341796875, 7.849853515625, 8.4462890625, 9.042724609375, 9.63916015625, 10.235595703125, 10.83203125, 11.428466796875, 12.02490234375, 12.621337890625, 13.2177734375, 13.814208984375, 14.41064453125, 15.007080078125, 15.603515625, 16.199951171875, 16.79638671875, 17.392822265625, 17.9892578125, 18.585693359375, 19.18212890625, 19.778564453125, 20.375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 8.0, 8.0, 15.0, 21.0, 24.0, 44.0, 88.0, 160.0, 335.0, 830.0, 2244.0, 7429.0, 36664.0, 523613.0, 434304.0, 32318.0, 6910.0, 2114.0, 723.0, 353.0, 141.0, 81.0, 49.0, 32.0, 14.0, 13.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-59.40625, -57.919921875, -56.43359375, -54.947265625, -53.4609375, -51.974609375, -50.48828125, -49.001953125, -47.515625, -46.029296875, -44.54296875, -43.056640625, -41.5703125, -40.083984375, -38.59765625, -37.111328125, -35.625, -34.138671875, -32.65234375, -31.166015625, -29.6796875, -28.193359375, -26.70703125, -25.220703125, -23.734375, -22.248046875, -20.76171875, -19.275390625, -17.7890625, -16.302734375, -14.81640625, -13.330078125, -11.84375, -10.357421875, -8.87109375, -7.384765625, -5.8984375, -4.412109375, -2.92578125, -1.439453125, 0.046875, 1.533203125, 3.01953125, 4.505859375, 5.9921875, 7.478515625, 8.96484375, 10.451171875, 11.9375, 13.423828125, 14.91015625, 16.396484375, 17.8828125, 19.369140625, 20.85546875, 22.341796875, 23.828125, 25.314453125, 26.80078125, 28.287109375, 29.7734375, 31.259765625, 32.74609375, 34.232421875, 35.71875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 10.0, 11.0, 11.0, 24.0, 22.0, 42.0, 65.0, 93.0, 134.0, 145.0, 148.0, 90.0, 52.0, 32.0, 23.0, 17.0, 13.0, 12.0, 11.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0031375885009765625, -0.003019005060195923, -0.002900421619415283, -0.0027818381786346436, -0.002663254737854004, -0.0025446712970733643, -0.0024260878562927246, -0.002307504415512085, -0.0021889209747314453, -0.0020703375339508057, -0.001951754093170166, -0.0018331706523895264, -0.0017145872116088867, -0.001596003770828247, -0.0014774203300476074, -0.0013588368892669678, -0.0012402534484863281, -0.0011216700077056885, -0.0010030865669250488, -0.0008845031261444092, -0.0007659196853637695, -0.0006473362445831299, -0.0005287528038024902, -0.0004101693630218506, -0.00029158592224121094, -0.0001730024814605713, -5.441904067993164e-05, 6.416440010070801e-05, 0.00018274784088134766, 0.0003013312816619873, 0.00041991472244262695, 0.0005384981632232666, 0.0006570816040039062, 0.0007756650447845459, 0.0008942484855651855, 0.0010128319263458252, 0.0011314153671264648, 0.0012499988079071045, 0.0013685822486877441, 0.0014871656894683838, 0.0016057491302490234, 0.001724332571029663, 0.0018429160118103027, 0.0019614994525909424, 0.002080082893371582, 0.0021986663341522217, 0.0023172497749328613, 0.002435833215713501, 0.0025544166564941406, 0.0026730000972747803, 0.00279158353805542, 0.0029101669788360596, 0.0030287504196166992, 0.003147333860397339, 0.0032659173011779785, 0.003384500741958618, 0.003503084182739258, 0.0036216676235198975, 0.003740251064300537, 0.0038588345050811768, 0.003977417945861816, 0.004096001386642456, 0.004214584827423096, 0.004333168268203735, 0.004451751708984375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 9.0, 4.0, 18.0, 19.0, 32.0, 35.0, 72.0, 84.0, 153.0, 246.0, 443.0, 815.0, 1517.0, 3084.0, 6899.0, 18638.0, 65528.0, 362233.0, 468622.0, 83452.0, 21955.0, 7858.0, 3379.0, 1543.0, 802.0, 470.0, 235.0, 145.0, 95.0, 64.0, 36.0, 25.0, 11.0, 13.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.734375, -25.92626953125, -25.1181640625, -24.31005859375, -23.501953125, -22.69384765625, -21.8857421875, -21.07763671875, -20.26953125, -19.46142578125, -18.6533203125, -17.84521484375, -17.037109375, -16.22900390625, -15.4208984375, -14.61279296875, -13.8046875, -12.99658203125, -12.1884765625, -11.38037109375, -10.572265625, -9.76416015625, -8.9560546875, -8.14794921875, -7.33984375, -6.53173828125, -5.7236328125, -4.91552734375, -4.107421875, -3.29931640625, -2.4912109375, -1.68310546875, -0.875, -0.06689453125, 0.7412109375, 1.54931640625, 2.357421875, 3.16552734375, 3.9736328125, 4.78173828125, 5.58984375, 6.39794921875, 7.2060546875, 8.01416015625, 8.822265625, 9.63037109375, 10.4384765625, 11.24658203125, 12.0546875, 12.86279296875, 13.6708984375, 14.47900390625, 15.287109375, 16.09521484375, 16.9033203125, 17.71142578125, 18.51953125, 19.32763671875, 20.1357421875, 20.94384765625, 21.751953125, 22.56005859375, 23.3681640625, 24.17626953125, 24.984375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 7.0, 4.0, 4.0, 5.0, 15.0, 15.0, 17.0, 20.0, 27.0, 30.0, 59.0, 56.0, 64.0, 74.0, 79.0, 73.0, 87.0, 74.0, 63.0, 49.0, 43.0, 27.0, 26.0, 20.0, 9.0, 19.0, 3.0, 6.0, 5.0, 8.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.6796875, -13.3135986328125, -12.947509765625, -12.5814208984375, -12.21533203125, -11.8492431640625, -11.483154296875, -11.1170654296875, -10.7509765625, -10.3848876953125, -10.018798828125, -9.6527099609375, -9.28662109375, -8.9205322265625, -8.554443359375, -8.1883544921875, -7.822265625, -7.4561767578125, -7.090087890625, -6.7239990234375, -6.35791015625, -5.9918212890625, -5.625732421875, -5.2596435546875, -4.8935546875, -4.5274658203125, -4.161376953125, -3.7952880859375, -3.42919921875, -3.0631103515625, -2.697021484375, -2.3309326171875, -1.96484375, -1.5987548828125, -1.232666015625, -0.8665771484375, -0.50048828125, -0.1343994140625, 0.231689453125, 0.5977783203125, 0.9638671875, 1.3299560546875, 1.696044921875, 2.0621337890625, 2.42822265625, 2.7943115234375, 3.160400390625, 3.5264892578125, 3.892578125, 4.2586669921875, 4.624755859375, 4.9908447265625, 5.35693359375, 5.7230224609375, 6.089111328125, 6.4552001953125, 6.8212890625, 7.1873779296875, 7.553466796875, 7.9195556640625, 8.28564453125, 8.6517333984375, 9.017822265625, 9.3839111328125, 9.75]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 12.0, 16.0, 21.0, 61.0, 130.0, 285.0, 246.0, 101.0, 61.0, 30.0, 14.0, 13.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-263.111572265625, -253.68032836914062, -244.24908447265625, -234.81784057617188, -225.3865966796875, -215.95535278320312, -206.52410888671875, -197.09286499023438, -187.66162109375, -178.23037719726562, -168.79913330078125, -159.36788940429688, -149.9366455078125, -140.50540161132812, -131.07415771484375, -121.64290618896484, -112.21165466308594, -102.78041076660156, -93.34916687011719, -83.91792297363281, -74.48667907714844, -65.05543518066406, -55.624183654785156, -46.19293975830078, -36.761695861816406, -27.33045196533203, -17.899206161499023, -8.467960357666016, 0.9632835388183594, 10.394527435302734, 19.825775146484375, 29.25701904296875, 38.688262939453125, 48.1195068359375, 57.550750732421875, 66.98199462890625, 76.41323852539062, 85.844482421875, 95.2757339477539, 104.70697784423828, 114.13822174072266, 123.56946563720703, 133.00071716308594, 142.4319610595703, 151.8632049560547, 161.29444885253906, 170.72569274902344, 180.1569366455078, 189.5881805419922, 199.01942443847656, 208.45066833496094, 217.8819122314453, 227.3131561279297, 236.74440002441406, 246.1756591796875, 255.60690307617188, 265.03814697265625, 274.4693908691406, 283.900634765625, 293.3318786621094, 302.76312255859375, 312.1943664550781, 321.6256103515625, 331.0568542480469, 340.48809814453125]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 5.0, 7.0, 4.0, 11.0, 18.0, 18.0, 23.0, 40.0, 45.0, 44.0, 58.0, 64.0, 55.0, 65.0, 77.0, 69.0, 69.0, 49.0, 50.0, 50.0, 47.0, 32.0, 16.0, 16.0, 12.0, 14.0, 11.0, 3.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-147.695556640625, -143.18995666503906, -138.68435668945312, -134.1787567138672, -129.67315673828125, -125.16755676269531, -120.66195678710938, -116.15635681152344, -111.6507568359375, -107.14515686035156, -102.63955688476562, -98.13395690917969, -93.62835693359375, -89.12275695800781, -84.61715698242188, -80.11155700683594, -75.60596466064453, -71.1003646850586, -66.59476470947266, -62.08916473388672, -57.58356475830078, -53.077964782714844, -48.57236862182617, -44.066768646240234, -39.5611686706543, -35.05556869506836, -30.549968719482422, -26.044370651245117, -21.53877067565918, -17.033170700073242, -12.527572631835938, -8.02197265625, -3.5163726806640625, 0.9892268180847168, 5.494826316833496, 10.000425338745117, 14.506025314331055, 19.011625289916992, 23.517223358154297, 28.022823333740234, 32.52842330932617, 37.03402328491211, 41.53962326049805, 46.04521942138672, 50.550819396972656, 55.056419372558594, 59.56201934814453, 64.06761932373047, 68.5732192993164, 73.07881927490234, 77.58441925048828, 82.09001922607422, 86.59561920166016, 91.1012191772461, 95.6068115234375, 100.11241149902344, 104.61801147460938, 109.12361145019531, 113.62921142578125, 118.13481140136719, 122.64041137695312, 127.14601135253906, 131.651611328125, 136.15721130371094, 140.66281127929688]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 7.0, 2.0, 7.0, 8.0, 20.0, 24.0, 38.0, 57.0, 91.0, 170.0, 250.0, 417.0, 739.0, 1304.0, 2416.0, 4483.0, 8787.0, 18481.0, 45212.0, 161359.0, 3551847.0, 291888.0, 60603.0, 22537.0, 10469.0, 5368.0, 2867.0, 1713.0, 965.0, 636.0, 433.0, 295.0, 203.0, 144.0, 110.0, 61.0, 63.0, 54.0, 32.0, 26.0, 21.0, 13.0, 27.0, 7.0, 4.0, 7.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-51.28125, -49.11279296875, -46.9443359375, -44.77587890625, -42.607421875, -40.43896484375, -38.2705078125, -36.10205078125, -33.93359375, -31.76513671875, -29.5966796875, -27.42822265625, -25.259765625, -23.09130859375, -20.9228515625, -18.75439453125, -16.5859375, -14.41748046875, -12.2490234375, -10.08056640625, -7.912109375, -5.74365234375, -3.5751953125, -1.40673828125, 0.76171875, 2.93017578125, 5.0986328125, 7.26708984375, 9.435546875, 11.60400390625, 13.7724609375, 15.94091796875, 18.109375, 20.27783203125, 22.4462890625, 24.61474609375, 26.783203125, 28.95166015625, 31.1201171875, 33.28857421875, 35.45703125, 37.62548828125, 39.7939453125, 41.96240234375, 44.130859375, 46.29931640625, 48.4677734375, 50.63623046875, 52.8046875, 54.97314453125, 57.1416015625, 59.31005859375, 61.478515625, 63.64697265625, 65.8154296875, 67.98388671875, 70.15234375, 72.32080078125, 74.4892578125, 76.65771484375, 78.826171875, 80.99462890625, 83.1630859375, 85.33154296875, 87.5]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 12.0, 14.0, 21.0, 20.0, 32.0, 48.0, 51.0, 56.0, 69.0, 83.0, 94.0, 90.0, 72.0, 81.0, 54.0, 52.0, 52.0, 32.0, 18.0, 18.0, 13.0, 7.0, 4.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.66796875, -3.5091552734375, -3.350341796875, -3.1915283203125, -3.03271484375, -2.8739013671875, -2.715087890625, -2.5562744140625, -2.3974609375, -2.2386474609375, -2.079833984375, -1.9210205078125, -1.76220703125, -1.6033935546875, -1.444580078125, -1.2857666015625, -1.126953125, -0.9681396484375, -0.809326171875, -0.6505126953125, -0.49169921875, -0.3328857421875, -0.174072265625, -0.0152587890625, 0.1435546875, 0.3023681640625, 0.461181640625, 0.6199951171875, 0.77880859375, 0.9376220703125, 1.096435546875, 1.2552490234375, 1.4140625, 1.5728759765625, 1.731689453125, 1.8905029296875, 2.04931640625, 2.2081298828125, 2.366943359375, 2.5257568359375, 2.6845703125, 2.8433837890625, 3.002197265625, 3.1610107421875, 3.31982421875, 3.4786376953125, 3.637451171875, 3.7962646484375, 3.955078125, 4.1138916015625, 4.272705078125, 4.4315185546875, 4.59033203125, 4.7491455078125, 4.907958984375, 5.0667724609375, 5.2255859375, 5.3843994140625, 5.543212890625, 5.7020263671875, 5.86083984375, 6.0196533203125, 6.178466796875, 6.3372802734375, 6.49609375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 9.0, 10.0, 20.0, 23.0, 31.0, 50.0, 105.0, 189.0, 346.0, 897.0, 2348.0, 7774.0, 34785.0, 348887.0, 3681356.0, 94429.0, 16271.0, 4238.0, 1412.0, 525.0, 247.0, 123.0, 61.0, 42.0, 33.0, 13.0, 7.0, 11.0, 9.0, 7.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.4375, -99.3427734375, -95.248046875, -91.1533203125, -87.05859375, -82.9638671875, -78.869140625, -74.7744140625, -70.6796875, -66.5849609375, -62.490234375, -58.3955078125, -54.30078125, -50.2060546875, -46.111328125, -42.0166015625, -37.921875, -33.8271484375, -29.732421875, -25.6376953125, -21.54296875, -17.4482421875, -13.353515625, -9.2587890625, -5.1640625, -1.0693359375, 3.025390625, 7.1201171875, 11.21484375, 15.3095703125, 19.404296875, 23.4990234375, 27.59375, 31.6884765625, 35.783203125, 39.8779296875, 43.97265625, 48.0673828125, 52.162109375, 56.2568359375, 60.3515625, 64.4462890625, 68.541015625, 72.6357421875, 76.73046875, 80.8251953125, 84.919921875, 89.0146484375, 93.109375, 97.2041015625, 101.298828125, 105.3935546875, 109.48828125, 113.5830078125, 117.677734375, 121.7724609375, 125.8671875, 129.9619140625, 134.056640625, 138.1513671875, 142.24609375, 146.3408203125, 150.435546875, 154.5302734375, 158.625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 8.0, 8.0, 3.0, 8.0, 18.0, 15.0, 17.0, 22.0, 45.0, 38.0, 49.0, 84.0, 113.0, 185.0, 424.0, 1924.0, 469.0, 204.0, 125.0, 81.0, 54.0, 43.0, 30.0, 22.0, 20.0, 12.0, 14.0, 9.0, 7.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-13.328125, -12.9730224609375, -12.617919921875, -12.2628173828125, -11.90771484375, -11.5526123046875, -11.197509765625, -10.8424072265625, -10.4873046875, -10.1322021484375, -9.777099609375, -9.4219970703125, -9.06689453125, -8.7117919921875, -8.356689453125, -8.0015869140625, -7.646484375, -7.2913818359375, -6.936279296875, -6.5811767578125, -6.22607421875, -5.8709716796875, -5.515869140625, -5.1607666015625, -4.8056640625, -4.4505615234375, -4.095458984375, -3.7403564453125, -3.38525390625, -3.0301513671875, -2.675048828125, -2.3199462890625, -1.96484375, -1.6097412109375, -1.254638671875, -0.8995361328125, -0.54443359375, -0.1893310546875, 0.165771484375, 0.5208740234375, 0.8759765625, 1.2310791015625, 1.586181640625, 1.9412841796875, 2.29638671875, 2.6514892578125, 3.006591796875, 3.3616943359375, 3.716796875, 4.0718994140625, 4.427001953125, 4.7821044921875, 5.13720703125, 5.4923095703125, 5.847412109375, 6.2025146484375, 6.5576171875, 6.9127197265625, 7.267822265625, 7.6229248046875, 7.97802734375, 8.3331298828125, 8.688232421875, 9.0433349609375, 9.3984375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 9.0, 11.0, 20.0, 34.0, 67.0, 128.0, 209.0, 225.0, 120.0, 70.0, 36.0, 22.0, 19.0, 15.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.61849594116211, -58.402278900146484, -55.186065673828125, -51.9698486328125, -48.753631591796875, -45.53741455078125, -42.32120132446289, -39.104984283447266, -35.888771057128906, -32.67255401611328, -29.45633888244629, -26.240123748779297, -23.023906707763672, -19.80769157409668, -16.591476440429688, -13.375259399414062, -10.159042358398438, -6.942826271057129, -3.7266106605529785, -0.5103950500488281, 2.7058210372924805, 5.922037124633789, 9.138252258300781, 12.354469299316406, 15.570684432983398, 18.78689956665039, 22.003116607666016, 25.219331741333008, 28.435546875, 31.651763916015625, 34.86798095703125, 38.084197998046875, 41.30040740966797, 44.516624450683594, 47.73283767700195, 50.94905471801758, 54.1652717590332, 57.38148498535156, 60.59770202636719, 63.81391906738281, 67.03013610839844, 70.24635314941406, 73.46257019042969, 76.67878723144531, 79.8949966430664, 83.11121368408203, 86.32743072509766, 89.54364776611328, 92.75985717773438, 95.97607421875, 99.19229125976562, 102.40850830078125, 105.62471771240234, 108.84093475341797, 112.0571517944336, 115.27336883544922, 118.48958587646484, 121.70580291748047, 124.9220199584961, 128.1382293701172, 131.3544464111328, 134.57066345214844, 137.78688049316406, 141.0030975341797, 144.2193145751953]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 9.0, 10.0, 9.0, 13.0, 13.0, 16.0, 26.0, 29.0, 40.0, 43.0, 49.0, 39.0, 46.0, 48.0, 45.0, 40.0, 59.0, 62.0, 43.0, 47.0, 48.0, 43.0, 39.0, 29.0, 37.0, 30.0, 20.0, 19.0, 13.0, 14.0, 11.0, 6.0, 2.0, 7.0, 2.0, 2.0], "bins": [-67.78295135498047, -66.23178100585938, -64.68061828613281, -63.12944793701172, -61.578277587890625, -60.02710723876953, -58.4759407043457, -56.924774169921875, -55.37360382080078, -53.82243347167969, -52.27126693725586, -50.72010040283203, -49.16893005371094, -47.617759704589844, -46.066593170166016, -44.51542663574219, -42.964256286621094, -41.4130859375, -39.86191940307617, -38.310752868652344, -36.75958251953125, -35.208412170410156, -33.65724563598633, -32.1060791015625, -30.554908752441406, -29.003740310668945, -27.452571868896484, -25.901403427124023, -24.350234985351562, -22.7990665435791, -21.24789810180664, -19.69672966003418, -18.14556121826172, -16.594392776489258, -15.043224334716797, -13.492055892944336, -11.940887451171875, -10.389719009399414, -8.838550567626953, -7.287382125854492, -5.736213684082031, -4.18504524230957, -2.6338768005371094, -1.0827083587646484, 0.4684600830078125, 2.0196285247802734, 3.5707969665527344, 5.121965408325195, 6.673133850097656, 8.224302291870117, 9.775470733642578, 11.326639175415039, 12.8778076171875, 14.428976058959961, 15.980144500732422, 17.531312942504883, 19.082481384277344, 20.633649826049805, 22.184818267822266, 23.735986709594727, 25.287155151367188, 26.83832359313965, 28.38949203491211, 29.94066047668457, 31.49182891845703]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 4.0, 6.0, 6.0, 10.0, 12.0, 14.0, 22.0, 31.0, 46.0, 50.0, 79.0, 112.0, 170.0, 278.0, 434.0, 663.0, 1080.0, 1748.0, 2998.0, 4979.0, 8993.0, 17210.0, 33552.0, 69483.0, 157766.0, 333117.0, 225723.0, 95642.0, 44482.0, 22300.0, 11601.0, 6476.0, 3563.0, 2251.0, 1306.0, 822.0, 509.0, 339.0, 205.0, 136.0, 93.0, 69.0, 46.0, 36.0, 28.0, 19.0, 12.0, 14.0, 9.0, 4.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.28125, -30.32470703125, -29.3681640625, -28.41162109375, -27.455078125, -26.49853515625, -25.5419921875, -24.58544921875, -23.62890625, -22.67236328125, -21.7158203125, -20.75927734375, -19.802734375, -18.84619140625, -17.8896484375, -16.93310546875, -15.9765625, -15.02001953125, -14.0634765625, -13.10693359375, -12.150390625, -11.19384765625, -10.2373046875, -9.28076171875, -8.32421875, -7.36767578125, -6.4111328125, -5.45458984375, -4.498046875, -3.54150390625, -2.5849609375, -1.62841796875, -0.671875, 0.28466796875, 1.2412109375, 2.19775390625, 3.154296875, 4.11083984375, 5.0673828125, 6.02392578125, 6.98046875, 7.93701171875, 8.8935546875, 9.85009765625, 10.806640625, 11.76318359375, 12.7197265625, 13.67626953125, 14.6328125, 15.58935546875, 16.5458984375, 17.50244140625, 18.458984375, 19.41552734375, 20.3720703125, 21.32861328125, 22.28515625, 23.24169921875, 24.1982421875, 25.15478515625, 26.111328125, 27.06787109375, 28.0244140625, 28.98095703125, 29.9375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 11.0, 6.0, 5.0, 19.0, 21.0, 26.0, 23.0, 38.0, 33.0, 39.0, 48.0, 45.0, 58.0, 54.0, 58.0, 45.0, 50.0, 51.0, 60.0, 54.0, 47.0, 36.0, 27.0, 31.0, 23.0, 19.0, 17.0, 13.0, 8.0, 11.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.568359375, -3.450469970703125, -3.33258056640625, -3.214691162109375, -3.0968017578125, -2.978912353515625, -2.86102294921875, -2.743133544921875, -2.625244140625, -2.507354736328125, -2.38946533203125, -2.271575927734375, -2.1536865234375, -2.035797119140625, -1.91790771484375, -1.800018310546875, -1.68212890625, -1.564239501953125, -1.44635009765625, -1.328460693359375, -1.2105712890625, -1.092681884765625, -0.97479248046875, -0.856903076171875, -0.739013671875, -0.621124267578125, -0.50323486328125, -0.385345458984375, -0.2674560546875, -0.149566650390625, -0.03167724609375, 0.086212158203125, 0.2041015625, 0.321990966796875, 0.43988037109375, 0.557769775390625, 0.6756591796875, 0.793548583984375, 0.91143798828125, 1.029327392578125, 1.147216796875, 1.265106201171875, 1.38299560546875, 1.500885009765625, 1.6187744140625, 1.736663818359375, 1.85455322265625, 1.972442626953125, 2.09033203125, 2.208221435546875, 2.32611083984375, 2.444000244140625, 2.5618896484375, 2.679779052734375, 2.79766845703125, 2.915557861328125, 3.033447265625, 3.151336669921875, 3.26922607421875, 3.387115478515625, 3.5050048828125, 3.622894287109375, 3.74078369140625, 3.858673095703125, 3.9765625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 6.0, 4.0, 12.0, 14.0, 34.0, 23.0, 35.0, 58.0, 79.0, 130.0, 199.0, 309.0, 569.0, 1181.0, 2152.0, 4854.0, 11649.0, 31397.0, 104597.0, 480432.0, 301607.0, 70087.0, 22683.0, 8738.0, 3729.0, 1815.0, 907.0, 438.0, 283.0, 182.0, 107.0, 75.0, 45.0, 33.0, 24.0, 24.0, 10.0, 10.0, 9.0, 2.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-51.25, -49.58837890625, -47.9267578125, -46.26513671875, -44.603515625, -42.94189453125, -41.2802734375, -39.61865234375, -37.95703125, -36.29541015625, -34.6337890625, -32.97216796875, -31.310546875, -29.64892578125, -27.9873046875, -26.32568359375, -24.6640625, -23.00244140625, -21.3408203125, -19.67919921875, -18.017578125, -16.35595703125, -14.6943359375, -13.03271484375, -11.37109375, -9.70947265625, -8.0478515625, -6.38623046875, -4.724609375, -3.06298828125, -1.4013671875, 0.26025390625, 1.921875, 3.58349609375, 5.2451171875, 6.90673828125, 8.568359375, 10.22998046875, 11.8916015625, 13.55322265625, 15.21484375, 16.87646484375, 18.5380859375, 20.19970703125, 21.861328125, 23.52294921875, 25.1845703125, 26.84619140625, 28.5078125, 30.16943359375, 31.8310546875, 33.49267578125, 35.154296875, 36.81591796875, 38.4775390625, 40.13916015625, 41.80078125, 43.46240234375, 45.1240234375, 46.78564453125, 48.447265625, 50.10888671875, 51.7705078125, 53.43212890625, 55.09375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 4.0, 15.0, 6.0, 11.0, 4.0, 16.0, 15.0, 25.0, 24.0, 23.0, 32.0, 41.0, 42.0, 45.0, 47.0, 49.0, 52.0, 54.0, 56.0, 44.0, 66.0, 41.0, 33.0, 40.0, 50.0, 27.0, 18.0, 22.0, 8.0, 14.0, 23.0, 11.0, 9.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.46875, -21.705322265625, -20.94189453125, -20.178466796875, -19.4150390625, -18.651611328125, -17.88818359375, -17.124755859375, -16.361328125, -15.597900390625, -14.83447265625, -14.071044921875, -13.3076171875, -12.544189453125, -11.78076171875, -11.017333984375, -10.25390625, -9.490478515625, -8.72705078125, -7.963623046875, -7.2001953125, -6.436767578125, -5.67333984375, -4.909912109375, -4.146484375, -3.383056640625, -2.61962890625, -1.856201171875, -1.0927734375, -0.329345703125, 0.43408203125, 1.197509765625, 1.9609375, 2.724365234375, 3.48779296875, 4.251220703125, 5.0146484375, 5.778076171875, 6.54150390625, 7.304931640625, 8.068359375, 8.831787109375, 9.59521484375, 10.358642578125, 11.1220703125, 11.885498046875, 12.64892578125, 13.412353515625, 14.17578125, 14.939208984375, 15.70263671875, 16.466064453125, 17.2294921875, 17.992919921875, 18.75634765625, 19.519775390625, 20.283203125, 21.046630859375, 21.81005859375, 22.573486328125, 23.3369140625, 24.100341796875, 24.86376953125, 25.627197265625, 26.390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 7.0, 8.0, 8.0, 16.0, 32.0, 35.0, 61.0, 90.0, 151.0, 257.0, 434.0, 879.0, 1670.0, 3308.0, 7394.0, 18929.0, 56520.0, 228179.0, 512420.0, 150862.0, 40918.0, 14502.0, 5977.0, 2804.0, 1420.0, 701.0, 382.0, 208.0, 124.0, 83.0, 53.0, 42.0, 24.0, 17.0, 11.0, 10.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.5625, -26.65478515625, -25.7470703125, -24.83935546875, -23.931640625, -23.02392578125, -22.1162109375, -21.20849609375, -20.30078125, -19.39306640625, -18.4853515625, -17.57763671875, -16.669921875, -15.76220703125, -14.8544921875, -13.94677734375, -13.0390625, -12.13134765625, -11.2236328125, -10.31591796875, -9.408203125, -8.50048828125, -7.5927734375, -6.68505859375, -5.77734375, -4.86962890625, -3.9619140625, -3.05419921875, -2.146484375, -1.23876953125, -0.3310546875, 0.57666015625, 1.484375, 2.39208984375, 3.2998046875, 4.20751953125, 5.115234375, 6.02294921875, 6.9306640625, 7.83837890625, 8.74609375, 9.65380859375, 10.5615234375, 11.46923828125, 12.376953125, 13.28466796875, 14.1923828125, 15.10009765625, 16.0078125, 16.91552734375, 17.8232421875, 18.73095703125, 19.638671875, 20.54638671875, 21.4541015625, 22.36181640625, 23.26953125, 24.17724609375, 25.0849609375, 25.99267578125, 26.900390625, 27.80810546875, 28.7158203125, 29.62353515625, 30.53125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 4.0, 6.0, 3.0, 3.0, 17.0, 8.0, 20.0, 19.0, 31.0, 48.0, 79.0, 102.0, 122.0, 140.0, 113.0, 79.0, 45.0, 53.0, 24.0, 18.0, 14.0, 13.0, 7.0, 7.0, 7.0, 3.0, 7.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00626373291015625, -0.006099998950958252, -0.005936264991760254, -0.005772531032562256, -0.005608797073364258, -0.00544506311416626, -0.005281329154968262, -0.005117595195770264, -0.004953861236572266, -0.004790127277374268, -0.0046263933181762695, -0.0044626593589782715, -0.0042989253997802734, -0.004135191440582275, -0.003971457481384277, -0.0038077235221862793, -0.0036439895629882812, -0.003480255603790283, -0.003316521644592285, -0.003152787685394287, -0.002989053726196289, -0.002825319766998291, -0.002661585807800293, -0.002497851848602295, -0.002334117889404297, -0.002170383930206299, -0.0020066499710083008, -0.0018429160118103027, -0.0016791820526123047, -0.0015154480934143066, -0.0013517141342163086, -0.0011879801750183105, -0.0010242462158203125, -0.0008605122566223145, -0.0006967782974243164, -0.0005330443382263184, -0.0003693103790283203, -0.00020557641983032227, -4.184246063232422e-05, 0.00012189149856567383, 0.0002856254577636719, 0.0004493594169616699, 0.000613093376159668, 0.000776827335357666, 0.0009405612945556641, 0.0011042952537536621, 0.0012680292129516602, 0.0014317631721496582, 0.0015954971313476562, 0.0017592310905456543, 0.0019229650497436523, 0.0020866990089416504, 0.0022504329681396484, 0.0024141669273376465, 0.0025779008865356445, 0.0027416348457336426, 0.0029053688049316406, 0.0030691027641296387, 0.0032328367233276367, 0.0033965706825256348, 0.003560304641723633, 0.003724038600921631, 0.003887772560119629, 0.004051506519317627, 0.004215240478515625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 7.0, 7.0, 8.0, 27.0, 22.0, 51.0, 52.0, 74.0, 88.0, 178.0, 258.0, 487.0, 922.0, 1789.0, 3825.0, 8999.0, 23856.0, 76512.0, 310262.0, 448964.0, 116729.0, 33715.0, 12092.0, 4969.0, 2208.0, 1015.0, 548.0, 337.0, 185.0, 117.0, 68.0, 55.0, 40.0, 20.0, 16.0, 13.0, 10.0, 10.0, 6.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.03125, -29.152099609375, -28.27294921875, -27.393798828125, -26.5146484375, -25.635498046875, -24.75634765625, -23.877197265625, -22.998046875, -22.118896484375, -21.23974609375, -20.360595703125, -19.4814453125, -18.602294921875, -17.72314453125, -16.843994140625, -15.96484375, -15.085693359375, -14.20654296875, -13.327392578125, -12.4482421875, -11.569091796875, -10.68994140625, -9.810791015625, -8.931640625, -8.052490234375, -7.17333984375, -6.294189453125, -5.4150390625, -4.535888671875, -3.65673828125, -2.777587890625, -1.8984375, -1.019287109375, -0.14013671875, 0.739013671875, 1.6181640625, 2.497314453125, 3.37646484375, 4.255615234375, 5.134765625, 6.013916015625, 6.89306640625, 7.772216796875, 8.6513671875, 9.530517578125, 10.40966796875, 11.288818359375, 12.16796875, 13.047119140625, 13.92626953125, 14.805419921875, 15.6845703125, 16.563720703125, 17.44287109375, 18.322021484375, 19.201171875, 20.080322265625, 20.95947265625, 21.838623046875, 22.7177734375, 23.596923828125, 24.47607421875, 25.355224609375, 26.234375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 10.0, 11.0, 6.0, 7.0, 9.0, 9.0, 11.0, 26.0, 20.0, 20.0, 28.0, 38.0, 43.0, 57.0, 51.0, 52.0, 53.0, 62.0, 53.0, 39.0, 55.0, 49.0, 51.0, 45.0, 46.0, 27.0, 18.0, 18.0, 9.0, 13.0, 19.0, 9.0, 8.0, 4.0, 8.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.75, -11.392578125, -11.03515625, -10.677734375, -10.3203125, -9.962890625, -9.60546875, -9.248046875, -8.890625, -8.533203125, -8.17578125, -7.818359375, -7.4609375, -7.103515625, -6.74609375, -6.388671875, -6.03125, -5.673828125, -5.31640625, -4.958984375, -4.6015625, -4.244140625, -3.88671875, -3.529296875, -3.171875, -2.814453125, -2.45703125, -2.099609375, -1.7421875, -1.384765625, -1.02734375, -0.669921875, -0.3125, 0.044921875, 0.40234375, 0.759765625, 1.1171875, 1.474609375, 1.83203125, 2.189453125, 2.546875, 2.904296875, 3.26171875, 3.619140625, 3.9765625, 4.333984375, 4.69140625, 5.048828125, 5.40625, 5.763671875, 6.12109375, 6.478515625, 6.8359375, 7.193359375, 7.55078125, 7.908203125, 8.265625, 8.623046875, 8.98046875, 9.337890625, 9.6953125, 10.052734375, 10.41015625, 10.767578125, 11.125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 5.0, 2.0, 7.0, 11.0, 13.0, 23.0, 26.0, 52.0, 75.0, 110.0, 153.0, 148.0, 133.0, 83.0, 54.0, 37.0, 23.0, 14.0, 7.0, 8.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-220.2195587158203, -211.78562927246094, -203.3516845703125, -194.91775512695312, -186.48382568359375, -178.04989624023438, -169.615966796875, -161.18202209472656, -152.7480926513672, -144.3141632080078, -135.88021850585938, -127.4462890625, -119.01235961914062, -110.57843017578125, -102.14449310302734, -93.71055603027344, -85.27662658691406, -76.84269714355469, -68.40876007080078, -59.97482681274414, -51.5408935546875, -43.10696029663086, -34.67302703857422, -26.239093780517578, -17.805160522460938, -9.371227264404297, -0.9372940063476562, 7.496639251708984, 15.930572509765625, 24.364505767822266, 32.798439025878906, 41.23237228393555, 49.66632080078125, 58.10025405883789, 66.53418731689453, 74.96812438964844, 83.40205383300781, 91.83598327636719, 100.2699203491211, 108.703857421875, 117.13778686523438, 125.57171630859375, 134.00564575195312, 142.43959045410156, 150.87351989746094, 159.3074493408203, 167.74139404296875, 176.17532348632812, 184.6092529296875, 193.04318237304688, 201.47711181640625, 209.9110565185547, 218.34498596191406, 226.77891540527344, 235.21286010742188, 243.64678955078125, 252.08071899414062, 260.5146484375, 268.9485778808594, 277.38250732421875, 285.81646728515625, 294.2503967285156, 302.684326171875, 311.1182556152344, 319.55218505859375]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 8.0, 12.0, 13.0, 16.0, 26.0, 20.0, 21.0, 26.0, 29.0, 33.0, 42.0, 52.0, 48.0, 48.0, 64.0, 46.0, 68.0, 47.0, 46.0, 55.0, 44.0, 38.0, 34.0, 22.0, 28.0, 29.0, 13.0, 10.0, 10.0, 7.0, 9.0, 6.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-193.78839111328125, -187.7338409423828, -181.6792755126953, -175.62472534179688, -169.57017517089844, -163.515625, -157.4610595703125, -151.40650939941406, -145.35195922851562, -139.2974090576172, -133.2428436279297, -127.18829345703125, -121.13374328613281, -115.07918548583984, -109.02462768554688, -102.97007751464844, -96.91551208496094, -90.86095428466797, -84.80640411376953, -78.75184631347656, -72.69729614257812, -66.64273834228516, -60.58818054199219, -54.533626556396484, -48.47907257080078, -42.42451858520508, -36.369964599609375, -30.315406799316406, -24.260852813720703, -18.206298828125, -12.151741027832031, -6.097187042236328, -0.0426483154296875, 6.011906623840332, 12.066461563110352, 18.121017456054688, 24.17557144165039, 30.230125427246094, 36.28468322753906, 42.339237213134766, 48.39379119873047, 54.44834518432617, 60.502899169921875, 66.55745697021484, 72.61201477050781, 78.66656494140625, 84.72112274169922, 90.77568054199219, 96.83023071289062, 102.8847885131836, 108.93933868408203, 114.993896484375, 121.04844665527344, 127.1030044555664, 133.15756225585938, 139.2121124267578, 145.26666259765625, 151.3212127685547, 157.3757781982422, 163.43032836914062, 169.48487854003906, 175.5394287109375, 181.593994140625, 187.64854431152344, 193.70310974121094]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 7.0, 3.0, 10.0, 12.0, 11.0, 18.0, 27.0, 36.0, 49.0, 67.0, 85.0, 129.0, 182.0, 263.0, 431.0, 747.0, 1235.0, 2362.0, 4338.0, 9233.0, 21611.0, 61188.0, 313240.0, 3540044.0, 164641.0, 42470.0, 16342.0, 7225.0, 3539.0, 1930.0, 1032.0, 618.0, 391.0, 249.0, 166.0, 93.0, 81.0, 46.0, 32.0, 24.0, 15.0, 19.0, 10.0, 6.0, 5.0, 5.0, 2.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-78.3125, -75.9638671875, -73.615234375, -71.2666015625, -68.91796875, -66.5693359375, -64.220703125, -61.8720703125, -59.5234375, -57.1748046875, -54.826171875, -52.4775390625, -50.12890625, -47.7802734375, -45.431640625, -43.0830078125, -40.734375, -38.3857421875, -36.037109375, -33.6884765625, -31.33984375, -28.9912109375, -26.642578125, -24.2939453125, -21.9453125, -19.5966796875, -17.248046875, -14.8994140625, -12.55078125, -10.2021484375, -7.853515625, -5.5048828125, -3.15625, -0.8076171875, 1.541015625, 3.8896484375, 6.23828125, 8.5869140625, 10.935546875, 13.2841796875, 15.6328125, 17.9814453125, 20.330078125, 22.6787109375, 25.02734375, 27.3759765625, 29.724609375, 32.0732421875, 34.421875, 36.7705078125, 39.119140625, 41.4677734375, 43.81640625, 46.1650390625, 48.513671875, 50.8623046875, 53.2109375, 55.5595703125, 57.908203125, 60.2568359375, 62.60546875, 64.9541015625, 67.302734375, 69.6513671875, 72.0]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 6.0, 5.0, 6.0, 19.0, 23.0, 22.0, 26.0, 39.0, 48.0, 60.0, 65.0, 54.0, 70.0, 71.0, 68.0, 53.0, 61.0, 56.0, 44.0, 50.0, 33.0, 30.0, 22.0, 17.0, 15.0, 4.0, 7.0, 4.0, 6.0, 5.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.67578125, -5.4912109375, -5.306640625, -5.1220703125, -4.9375, -4.7529296875, -4.568359375, -4.3837890625, -4.19921875, -4.0146484375, -3.830078125, -3.6455078125, -3.4609375, -3.2763671875, -3.091796875, -2.9072265625, -2.72265625, -2.5380859375, -2.353515625, -2.1689453125, -1.984375, -1.7998046875, -1.615234375, -1.4306640625, -1.24609375, -1.0615234375, -0.876953125, -0.6923828125, -0.5078125, -0.3232421875, -0.138671875, 0.0458984375, 0.23046875, 0.4150390625, 0.599609375, 0.7841796875, 0.96875, 1.1533203125, 1.337890625, 1.5224609375, 1.70703125, 1.8916015625, 2.076171875, 2.2607421875, 2.4453125, 2.6298828125, 2.814453125, 2.9990234375, 3.18359375, 3.3681640625, 3.552734375, 3.7373046875, 3.921875, 4.1064453125, 4.291015625, 4.4755859375, 4.66015625, 4.8447265625, 5.029296875, 5.2138671875, 5.3984375, 5.5830078125, 5.767578125, 5.9521484375, 6.13671875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 8.0, 10.0, 14.0, 9.0, 19.0, 28.0, 34.0, 46.0, 80.0, 130.0, 264.0, 710.0, 2404.0, 12377.0, 135029.0, 3906469.0, 121727.0, 11303.0, 2300.0, 735.0, 259.0, 125.0, 66.0, 36.0, 24.0, 25.0, 16.0, 6.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 0.0, 0.0, 2.0, 1.0], "bins": [-229.625, -223.658203125, -217.69140625, -211.724609375, -205.7578125, -199.791015625, -193.82421875, -187.857421875, -181.890625, -175.923828125, -169.95703125, -163.990234375, -158.0234375, -152.056640625, -146.08984375, -140.123046875, -134.15625, -128.189453125, -122.22265625, -116.255859375, -110.2890625, -104.322265625, -98.35546875, -92.388671875, -86.421875, -80.455078125, -74.48828125, -68.521484375, -62.5546875, -56.587890625, -50.62109375, -44.654296875, -38.6875, -32.720703125, -26.75390625, -20.787109375, -14.8203125, -8.853515625, -2.88671875, 3.080078125, 9.046875, 15.013671875, 20.98046875, 26.947265625, 32.9140625, 38.880859375, 44.84765625, 50.814453125, 56.78125, 62.748046875, 68.71484375, 74.681640625, 80.6484375, 86.615234375, 92.58203125, 98.548828125, 104.515625, 110.482421875, 116.44921875, 122.416015625, 128.3828125, 134.349609375, 140.31640625, 146.283203125, 152.25]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 14.0, 20.0, 32.0, 45.0, 76.0, 127.0, 245.0, 989.0, 1902.0, 270.0, 137.0, 86.0, 52.0, 24.0, 14.0, 16.0, 9.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.5625, -34.674560546875, -33.78662109375, -32.898681640625, -32.0107421875, -31.122802734375, -30.23486328125, -29.346923828125, -28.458984375, -27.571044921875, -26.68310546875, -25.795166015625, -24.9072265625, -24.019287109375, -23.13134765625, -22.243408203125, -21.35546875, -20.467529296875, -19.57958984375, -18.691650390625, -17.8037109375, -16.915771484375, -16.02783203125, -15.139892578125, -14.251953125, -13.364013671875, -12.47607421875, -11.588134765625, -10.7001953125, -9.812255859375, -8.92431640625, -8.036376953125, -7.1484375, -6.260498046875, -5.37255859375, -4.484619140625, -3.5966796875, -2.708740234375, -1.82080078125, -0.932861328125, -0.044921875, 0.843017578125, 1.73095703125, 2.618896484375, 3.5068359375, 4.394775390625, 5.28271484375, 6.170654296875, 7.05859375, 7.946533203125, 8.83447265625, 9.722412109375, 10.6103515625, 11.498291015625, 12.38623046875, 13.274169921875, 14.162109375, 15.050048828125, 15.93798828125, 16.825927734375, 17.7138671875, 18.601806640625, 19.48974609375, 20.377685546875, 21.265625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 8.0, 10.0, 15.0, 14.0, 26.0, 46.0, 88.0, 117.0, 192.0, 187.0, 143.0, 64.0, 34.0, 24.0, 15.0, 9.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-189.19717407226562, -184.57598876953125, -179.95480346679688, -175.33363342285156, -170.7124481201172, -166.0912628173828, -161.47007751464844, -156.84890747070312, -152.22772216796875, -147.60653686523438, -142.9853515625, -138.3641815185547, -133.7429962158203, -129.12181091308594, -124.50062561035156, -119.87944793701172, -115.25826263427734, -110.63707733154297, -106.01589965820312, -101.39471435546875, -96.7735366821289, -92.15235137939453, -87.53117370605469, -82.90998840332031, -78.28880310058594, -73.66761779785156, -69.04644012451172, -64.42525482177734, -59.8040771484375, -55.182891845703125, -50.561710357666016, -45.940528869628906, -41.31934356689453, -36.69816207885742, -32.07698059082031, -27.45579719543457, -22.83461570739746, -18.21343421936035, -13.59225082397461, -8.9710693359375, -4.349887847900391, 0.27129411697387695, 4.8924760818481445, 9.51365852355957, 14.13484001159668, 18.75602149963379, 23.37720489501953, 27.99838638305664, 32.61956787109375, 37.24074935913086, 41.86193084716797, 46.483116149902344, 51.10429382324219, 55.72547912597656, 60.34666061401367, 64.96784210205078, 69.58901977539062, 74.210205078125, 78.83138275146484, 83.45256805419922, 88.07374572753906, 92.69493103027344, 97.31611633300781, 101.93729400634766, 106.55847930908203]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 12.0, 12.0, 19.0, 13.0, 24.0, 24.0, 31.0, 27.0, 44.0, 45.0, 48.0, 52.0, 62.0, 67.0, 61.0, 53.0, 53.0, 48.0, 41.0, 45.0, 40.0, 24.0, 27.0, 19.0, 24.0, 17.0, 18.0, 10.0, 10.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.23884582519531, -61.92860412597656, -59.61836624145508, -57.30812454223633, -54.997886657714844, -52.687644958496094, -50.377403259277344, -48.06716537475586, -45.756927490234375, -43.446685791015625, -41.13644790649414, -38.82620620727539, -36.515968322753906, -34.205726623535156, -31.89548683166504, -29.585247039794922, -27.275005340576172, -24.964765548706055, -22.654525756835938, -20.344284057617188, -18.034046173095703, -15.72380542755127, -13.413564682006836, -11.103324890136719, -8.793085098266602, -6.482845306396484, -4.172605037689209, -1.8623647689819336, 0.4478750228881836, 2.758114814758301, 5.068355560302734, 7.378595352172852, 9.688835144042969, 11.999074935913086, 14.309314727783203, 16.619556427001953, 18.929794311523438, 21.240036010742188, 23.550275802612305, 25.860515594482422, 28.17075538635254, 30.480995178222656, 32.791236877441406, 35.10147476196289, 37.41171646118164, 39.721954345703125, 42.032196044921875, 44.342437744140625, 46.65267562866211, 48.96291732788086, 51.273155212402344, 53.583396911621094, 55.89363479614258, 58.20387649536133, 60.51411437988281, 62.82435607910156, 65.13459777832031, 67.44483947753906, 69.75508117675781, 72.06531524658203, 74.37555694580078, 76.68579864501953, 78.99604034423828, 81.3062744140625, 83.61651611328125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 7.0, 9.0, 18.0, 22.0, 22.0, 48.0, 53.0, 61.0, 91.0, 164.0, 248.0, 378.0, 607.0, 1041.0, 1806.0, 3371.0, 6296.0, 13200.0, 30055.0, 78474.0, 231757.0, 413005.0, 164919.0, 57597.0, 23030.0, 10364.0, 5231.0, 2783.0, 1497.0, 871.0, 521.0, 346.0, 193.0, 141.0, 91.0, 61.0, 42.0, 36.0, 28.0, 16.0, 12.0, 10.0, 11.0, 3.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-42.71875, -41.35595703125, -39.9931640625, -38.63037109375, -37.267578125, -35.90478515625, -34.5419921875, -33.17919921875, -31.81640625, -30.45361328125, -29.0908203125, -27.72802734375, -26.365234375, -25.00244140625, -23.6396484375, -22.27685546875, -20.9140625, -19.55126953125, -18.1884765625, -16.82568359375, -15.462890625, -14.10009765625, -12.7373046875, -11.37451171875, -10.01171875, -8.64892578125, -7.2861328125, -5.92333984375, -4.560546875, -3.19775390625, -1.8349609375, -0.47216796875, 0.890625, 2.25341796875, 3.6162109375, 4.97900390625, 6.341796875, 7.70458984375, 9.0673828125, 10.43017578125, 11.79296875, 13.15576171875, 14.5185546875, 15.88134765625, 17.244140625, 18.60693359375, 19.9697265625, 21.33251953125, 22.6953125, 24.05810546875, 25.4208984375, 26.78369140625, 28.146484375, 29.50927734375, 30.8720703125, 32.23486328125, 33.59765625, 34.96044921875, 36.3232421875, 37.68603515625, 39.048828125, 40.41162109375, 41.7744140625, 43.13720703125, 44.5]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 10.0, 12.0, 16.0, 16.0, 17.0, 23.0, 32.0, 45.0, 54.0, 43.0, 55.0, 57.0, 85.0, 79.0, 59.0, 62.0, 62.0, 53.0, 52.0, 38.0, 24.0, 22.0, 23.0, 14.0, 8.0, 8.0, 10.0, 6.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.06640625, -6.85394287109375, -6.6414794921875, -6.42901611328125, -6.216552734375, -6.00408935546875, -5.7916259765625, -5.57916259765625, -5.36669921875, -5.15423583984375, -4.9417724609375, -4.72930908203125, -4.516845703125, -4.30438232421875, -4.0919189453125, -3.87945556640625, -3.6669921875, -3.45452880859375, -3.2420654296875, -3.02960205078125, -2.817138671875, -2.60467529296875, -2.3922119140625, -2.17974853515625, -1.96728515625, -1.75482177734375, -1.5423583984375, -1.32989501953125, -1.117431640625, -0.90496826171875, -0.6925048828125, -0.48004150390625, -0.267578125, -0.05511474609375, 0.1573486328125, 0.36981201171875, 0.582275390625, 0.79473876953125, 1.0072021484375, 1.21966552734375, 1.43212890625, 1.64459228515625, 1.8570556640625, 2.06951904296875, 2.281982421875, 2.49444580078125, 2.7069091796875, 2.91937255859375, 3.1318359375, 3.34429931640625, 3.5567626953125, 3.76922607421875, 3.981689453125, 4.19415283203125, 4.4066162109375, 4.61907958984375, 4.83154296875, 5.04400634765625, 5.2564697265625, 5.46893310546875, 5.681396484375, 5.89385986328125, 6.1063232421875, 6.31878662109375, 6.53125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 7.0, 5.0, 12.0, 10.0, 18.0, 9.0, 13.0, 19.0, 36.0, 43.0, 61.0, 116.0, 119.0, 210.0, 334.0, 543.0, 971.0, 1737.0, 3297.0, 6617.0, 14642.0, 36731.0, 110571.0, 393290.0, 330548.0, 92059.0, 31317.0, 12744.0, 5808.0, 2957.0, 1529.0, 842.0, 508.0, 282.0, 175.0, 106.0, 73.0, 54.0, 38.0, 28.0, 28.0, 18.0, 14.0, 8.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.53125, -52.875, -51.21875, -49.5625, -47.90625, -46.25, -44.59375, -42.9375, -41.28125, -39.625, -37.96875, -36.3125, -34.65625, -33.0, -31.34375, -29.6875, -28.03125, -26.375, -24.71875, -23.0625, -21.40625, -19.75, -18.09375, -16.4375, -14.78125, -13.125, -11.46875, -9.8125, -8.15625, -6.5, -4.84375, -3.1875, -1.53125, 0.125, 1.78125, 3.4375, 5.09375, 6.75, 8.40625, 10.0625, 11.71875, 13.375, 15.03125, 16.6875, 18.34375, 20.0, 21.65625, 23.3125, 24.96875, 26.625, 28.28125, 29.9375, 31.59375, 33.25, 34.90625, 36.5625, 38.21875, 39.875, 41.53125, 43.1875, 44.84375, 46.5, 48.15625, 49.8125, 51.46875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 3.0, 6.0, 6.0, 8.0, 9.0, 13.0, 17.0, 12.0, 12.0, 23.0, 20.0, 31.0, 34.0, 33.0, 43.0, 34.0, 47.0, 44.0, 39.0, 33.0, 43.0, 41.0, 53.0, 52.0, 38.0, 38.0, 31.0, 39.0, 35.0, 31.0, 18.0, 23.0, 9.0, 10.0, 16.0, 7.0, 11.0, 9.0, 2.0, 9.0, 2.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.40625, -30.4423828125, -29.478515625, -28.5146484375, -27.55078125, -26.5869140625, -25.623046875, -24.6591796875, -23.6953125, -22.7314453125, -21.767578125, -20.8037109375, -19.83984375, -18.8759765625, -17.912109375, -16.9482421875, -15.984375, -15.0205078125, -14.056640625, -13.0927734375, -12.12890625, -11.1650390625, -10.201171875, -9.2373046875, -8.2734375, -7.3095703125, -6.345703125, -5.3818359375, -4.41796875, -3.4541015625, -2.490234375, -1.5263671875, -0.5625, 0.4013671875, 1.365234375, 2.3291015625, 3.29296875, 4.2568359375, 5.220703125, 6.1845703125, 7.1484375, 8.1123046875, 9.076171875, 10.0400390625, 11.00390625, 11.9677734375, 12.931640625, 13.8955078125, 14.859375, 15.8232421875, 16.787109375, 17.7509765625, 18.71484375, 19.6787109375, 20.642578125, 21.6064453125, 22.5703125, 23.5341796875, 24.498046875, 25.4619140625, 26.42578125, 27.3896484375, 28.353515625, 29.3173828125, 30.28125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 11.0, 20.0, 31.0, 49.0, 44.0, 67.0, 106.0, 153.0, 232.0, 324.0, 457.0, 695.0, 1035.0, 1460.0, 2100.0, 3271.0, 5364.0, 9288.0, 20146.0, 60397.0, 291035.0, 487473.0, 104811.0, 29304.0, 12501.0, 6425.0, 3953.0, 2465.0, 1744.0, 1118.0, 762.0, 506.0, 380.0, 260.0, 171.0, 128.0, 96.0, 64.0, 34.0, 33.0, 13.0, 13.0, 6.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.109375, -24.21875, -23.328125, -22.4375, -21.546875, -20.65625, -19.765625, -18.875, -17.984375, -17.09375, -16.203125, -15.3125, -14.421875, -13.53125, -12.640625, -11.75, -10.859375, -9.96875, -9.078125, -8.1875, -7.296875, -6.40625, -5.515625, -4.625, -3.734375, -2.84375, -1.953125, -1.0625, -0.171875, 0.71875, 1.609375, 2.5, 3.390625, 4.28125, 5.171875, 6.0625, 6.953125, 7.84375, 8.734375, 9.625, 10.515625, 11.40625, 12.296875, 13.1875, 14.078125, 14.96875, 15.859375, 16.75, 17.640625, 18.53125, 19.421875, 20.3125, 21.203125, 22.09375, 22.984375, 23.875, 24.765625, 25.65625, 26.546875, 27.4375, 28.328125, 29.21875, 30.109375, 31.0, 31.890625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 11.0, 7.0, 18.0, 20.0, 25.0, 53.0, 113.0, 162.0, 201.0, 156.0, 86.0, 54.0, 26.0, 20.0, 11.0, 11.0, 6.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00714111328125, -0.006860613822937012, -0.0065801143646240234, -0.006299614906311035, -0.006019115447998047, -0.005738615989685059, -0.00545811653137207, -0.005177617073059082, -0.004897117614746094, -0.0046166181564331055, -0.004336118698120117, -0.004055619239807129, -0.0037751197814941406, -0.0034946203231811523, -0.003214120864868164, -0.0029336214065551758, -0.0026531219482421875, -0.0023726224899291992, -0.002092123031616211, -0.0018116235733032227, -0.0015311241149902344, -0.001250624656677246, -0.0009701251983642578, -0.0006896257400512695, -0.00040912628173828125, -0.00012862682342529297, 0.0001518726348876953, 0.0004323720932006836, 0.0007128715515136719, 0.0009933710098266602, 0.0012738704681396484, 0.0015543699264526367, 0.001834869384765625, 0.0021153688430786133, 0.0023958683013916016, 0.00267636775970459, 0.002956867218017578, 0.0032373666763305664, 0.0035178661346435547, 0.003798365592956543, 0.004078865051269531, 0.0043593645095825195, 0.004639863967895508, 0.004920363426208496, 0.005200862884521484, 0.005481362342834473, 0.005761861801147461, 0.006042361259460449, 0.0063228607177734375, 0.006603360176086426, 0.006883859634399414, 0.007164359092712402, 0.007444858551025391, 0.007725358009338379, 0.008005857467651367, 0.008286356925964355, 0.008566856384277344, 0.008847355842590332, 0.00912785530090332, 0.009408354759216309, 0.009688854217529297, 0.009969353675842285, 0.010249853134155273, 0.010530352592468262, 0.01081085205078125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 9.0, 13.0, 13.0, 13.0, 24.0, 42.0, 46.0, 93.0, 120.0, 201.0, 409.0, 640.0, 1258.0, 2463.0, 5335.0, 14037.0, 68065.0, 754202.0, 165265.0, 22428.0, 7191.0, 3109.0, 1591.0, 825.0, 480.0, 251.0, 160.0, 88.0, 50.0, 42.0, 23.0, 24.0, 10.0, 5.0, 4.0, 3.0, 8.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.40625, -58.5576171875, -56.708984375, -54.8603515625, -53.01171875, -51.1630859375, -49.314453125, -47.4658203125, -45.6171875, -43.7685546875, -41.919921875, -40.0712890625, -38.22265625, -36.3740234375, -34.525390625, -32.6767578125, -30.828125, -28.9794921875, -27.130859375, -25.2822265625, -23.43359375, -21.5849609375, -19.736328125, -17.8876953125, -16.0390625, -14.1904296875, -12.341796875, -10.4931640625, -8.64453125, -6.7958984375, -4.947265625, -3.0986328125, -1.25, 0.5986328125, 2.447265625, 4.2958984375, 6.14453125, 7.9931640625, 9.841796875, 11.6904296875, 13.5390625, 15.3876953125, 17.236328125, 19.0849609375, 20.93359375, 22.7822265625, 24.630859375, 26.4794921875, 28.328125, 30.1767578125, 32.025390625, 33.8740234375, 35.72265625, 37.5712890625, 39.419921875, 41.2685546875, 43.1171875, 44.9658203125, 46.814453125, 48.6630859375, 50.51171875, 52.3603515625, 54.208984375, 56.0576171875, 57.90625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 9.0, 2.0, 13.0, 15.0, 27.0, 46.0, 64.0, 92.0, 158.0, 144.0, 139.0, 80.0, 54.0, 30.0, 18.0, 12.0, 13.0, 13.0, 9.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.890625, -28.9658203125, -28.041015625, -27.1162109375, -26.19140625, -25.2666015625, -24.341796875, -23.4169921875, -22.4921875, -21.5673828125, -20.642578125, -19.7177734375, -18.79296875, -17.8681640625, -16.943359375, -16.0185546875, -15.09375, -14.1689453125, -13.244140625, -12.3193359375, -11.39453125, -10.4697265625, -9.544921875, -8.6201171875, -7.6953125, -6.7705078125, -5.845703125, -4.9208984375, -3.99609375, -3.0712890625, -2.146484375, -1.2216796875, -0.296875, 0.6279296875, 1.552734375, 2.4775390625, 3.40234375, 4.3271484375, 5.251953125, 6.1767578125, 7.1015625, 8.0263671875, 8.951171875, 9.8759765625, 10.80078125, 11.7255859375, 12.650390625, 13.5751953125, 14.5, 15.4248046875, 16.349609375, 17.2744140625, 18.19921875, 19.1240234375, 20.048828125, 20.9736328125, 21.8984375, 22.8232421875, 23.748046875, 24.6728515625, 25.59765625, 26.5224609375, 27.447265625, 28.3720703125, 29.296875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 8.0, 8.0, 5.0, 10.0, 14.0, 36.0, 44.0, 92.0, 101.0, 141.0, 186.0, 126.0, 71.0, 55.0, 39.0, 16.0, 14.0, 19.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-296.50390625, -284.24200439453125, -271.9801330566406, -259.7182312011719, -247.4563446044922, -235.1944580078125, -222.93255615234375, -210.67066955566406, -198.40878295898438, -186.1468963623047, -173.88499450683594, -161.62310791015625, -149.36122131347656, -137.09933471679688, -124.83743286132812, -112.57554626464844, -100.31364440917969, -88.05175018310547, -75.78986358642578, -63.52796936035156, -51.26607894897461, -39.004188537597656, -26.742294311523438, -14.48040771484375, -2.2185134887695312, 10.043377876281738, 22.305269241333008, 34.567161560058594, 46.82905197143555, 59.0909423828125, 71.35283660888672, 83.6147232055664, 95.87661743164062, 108.13851165771484, 120.40039825439453, 132.66229248046875, 144.92417907714844, 157.18606567382812, 169.44796752929688, 181.70985412597656, 193.97174072265625, 206.23362731933594, 218.4955291748047, 230.75741577148438, 243.01930236816406, 255.28118896484375, 267.5430908203125, 279.80499267578125, 292.06689453125, 304.32879638671875, 316.5906677246094, 328.8525695800781, 341.1144714355469, 353.3763427734375, 365.63824462890625, 377.900146484375, 390.1620178222656, 402.4239196777344, 414.685791015625, 426.94769287109375, 439.2095947265625, 451.4714660644531, 463.7333679199219, 475.9952392578125, 488.25714111328125]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 1.0, 3.0, 7.0, 11.0, 6.0, 11.0, 9.0, 12.0, 14.0, 19.0, 13.0, 28.0, 26.0, 31.0, 26.0, 32.0, 35.0, 28.0, 41.0, 51.0, 46.0, 36.0, 34.0, 41.0, 51.0, 48.0, 41.0, 42.0, 34.0, 29.0, 35.0, 33.0, 14.0, 27.0, 14.0, 9.0, 16.0, 16.0, 8.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-254.588623046875, -247.61636352539062, -240.64410400390625, -233.67184448242188, -226.69956970214844, -219.72731018066406, -212.7550506591797, -205.7827911376953, -198.81051635742188, -191.8382568359375, -184.86599731445312, -177.89373779296875, -170.9214630126953, -163.94920349121094, -156.97694396972656, -150.0046844482422, -143.0324249267578, -136.06016540527344, -129.08790588378906, -122.11563873291016, -115.14337158203125, -108.17111206054688, -101.1988525390625, -94.22659301757812, -87.25432586669922, -80.28206634521484, -73.30979919433594, -66.33753967285156, -59.36527633666992, -52.39301300048828, -45.420753479003906, -38.448490142822266, -31.476242065429688, -24.503978729248047, -17.53171730041504, -10.559455871582031, -3.5871925354003906, 3.38507080078125, 10.357330322265625, 17.329593658447266, 24.301856994628906, 31.274120330810547, 38.24638366699219, 45.21864318847656, 52.1909065246582, 59.163169860839844, 66.13542938232422, 73.10769653320312, 80.0799560546875, 87.05221557617188, 94.02448272705078, 100.99674224853516, 107.96900939941406, 114.94126892089844, 121.91352844238281, 128.8857879638672, 135.85806274414062, 142.830322265625, 149.80258178710938, 156.77484130859375, 163.7471160888672, 170.71937561035156, 177.69163513183594, 184.6638946533203, 191.6361541748047]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 8.0, 5.0, 3.0, 7.0, 6.0, 9.0, 15.0, 22.0, 17.0, 47.0, 61.0, 79.0, 104.0, 180.0, 262.0, 416.0, 730.0, 1196.0, 2180.0, 4479.0, 10078.0, 26491.0, 97076.0, 3627172.0, 341345.0, 50854.0, 16644.0, 6961.0, 3430.0, 1742.0, 993.0, 619.0, 350.0, 229.0, 152.0, 103.0, 70.0, 49.0, 36.0, 19.0, 10.0, 9.0, 2.0, 5.0, 4.0, 5.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-68.6875, -66.5263671875, -64.365234375, -62.2041015625, -60.04296875, -57.8818359375, -55.720703125, -53.5595703125, -51.3984375, -49.2373046875, -47.076171875, -44.9150390625, -42.75390625, -40.5927734375, -38.431640625, -36.2705078125, -34.109375, -31.9482421875, -29.787109375, -27.6259765625, -25.46484375, -23.3037109375, -21.142578125, -18.9814453125, -16.8203125, -14.6591796875, -12.498046875, -10.3369140625, -8.17578125, -6.0146484375, -3.853515625, -1.6923828125, 0.46875, 2.6298828125, 4.791015625, 6.9521484375, 9.11328125, 11.2744140625, 13.435546875, 15.5966796875, 17.7578125, 19.9189453125, 22.080078125, 24.2412109375, 26.40234375, 28.5634765625, 30.724609375, 32.8857421875, 35.046875, 37.2080078125, 39.369140625, 41.5302734375, 43.69140625, 45.8525390625, 48.013671875, 50.1748046875, 52.3359375, 54.4970703125, 56.658203125, 58.8193359375, 60.98046875, 63.1416015625, 65.302734375, 67.4638671875, 69.625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 10.0, 8.0, 13.0, 12.0, 23.0, 29.0, 36.0, 36.0, 30.0, 49.0, 50.0, 56.0, 65.0, 57.0, 59.0, 54.0, 61.0, 43.0, 43.0, 35.0, 50.0, 32.0, 33.0, 27.0, 17.0, 13.0, 9.0, 9.0, 10.0, 10.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.046875, -5.825927734375, -5.60498046875, -5.384033203125, -5.1630859375, -4.942138671875, -4.72119140625, -4.500244140625, -4.279296875, -4.058349609375, -3.83740234375, -3.616455078125, -3.3955078125, -3.174560546875, -2.95361328125, -2.732666015625, -2.51171875, -2.290771484375, -2.06982421875, -1.848876953125, -1.6279296875, -1.406982421875, -1.18603515625, -0.965087890625, -0.744140625, -0.523193359375, -0.30224609375, -0.081298828125, 0.1396484375, 0.360595703125, 0.58154296875, 0.802490234375, 1.0234375, 1.244384765625, 1.46533203125, 1.686279296875, 1.9072265625, 2.128173828125, 2.34912109375, 2.570068359375, 2.791015625, 3.011962890625, 3.23291015625, 3.453857421875, 3.6748046875, 3.895751953125, 4.11669921875, 4.337646484375, 4.55859375, 4.779541015625, 5.00048828125, 5.221435546875, 5.4423828125, 5.663330078125, 5.88427734375, 6.105224609375, 6.326171875, 6.547119140625, 6.76806640625, 6.989013671875, 7.2099609375, 7.430908203125, 7.65185546875, 7.872802734375, 8.09375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 5.0, 9.0, 8.0, 18.0, 35.0, 23.0, 36.0, 40.0, 75.0, 112.0, 205.0, 343.0, 651.0, 1324.0, 2777.0, 6446.0, 18874.0, 83110.0, 3353880.0, 644200.0, 57770.0, 14358.0, 5254.0, 2252.0, 1094.0, 581.0, 287.0, 179.0, 105.0, 69.0, 52.0, 38.0, 22.0, 22.0, 10.0, 9.0, 5.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.25, -90.4150390625, -87.580078125, -84.7451171875, -81.91015625, -79.0751953125, -76.240234375, -73.4052734375, -70.5703125, -67.7353515625, -64.900390625, -62.0654296875, -59.23046875, -56.3955078125, -53.560546875, -50.7255859375, -47.890625, -45.0556640625, -42.220703125, -39.3857421875, -36.55078125, -33.7158203125, -30.880859375, -28.0458984375, -25.2109375, -22.3759765625, -19.541015625, -16.7060546875, -13.87109375, -11.0361328125, -8.201171875, -5.3662109375, -2.53125, 0.3037109375, 3.138671875, 5.9736328125, 8.80859375, 11.6435546875, 14.478515625, 17.3134765625, 20.1484375, 22.9833984375, 25.818359375, 28.6533203125, 31.48828125, 34.3232421875, 37.158203125, 39.9931640625, 42.828125, 45.6630859375, 48.498046875, 51.3330078125, 54.16796875, 57.0029296875, 59.837890625, 62.6728515625, 65.5078125, 68.3427734375, 71.177734375, 74.0126953125, 76.84765625, 79.6826171875, 82.517578125, 85.3525390625, 88.1875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 12.0, 12.0, 15.0, 19.0, 27.0, 53.0, 79.0, 157.0, 415.0, 2587.0, 327.0, 156.0, 81.0, 40.0, 34.0, 15.0, 12.0, 7.0, 6.0, 2.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.5625, -27.732666015625, -26.90283203125, -26.072998046875, -25.2431640625, -24.413330078125, -23.58349609375, -22.753662109375, -21.923828125, -21.093994140625, -20.26416015625, -19.434326171875, -18.6044921875, -17.774658203125, -16.94482421875, -16.114990234375, -15.28515625, -14.455322265625, -13.62548828125, -12.795654296875, -11.9658203125, -11.135986328125, -10.30615234375, -9.476318359375, -8.646484375, -7.816650390625, -6.98681640625, -6.156982421875, -5.3271484375, -4.497314453125, -3.66748046875, -2.837646484375, -2.0078125, -1.177978515625, -0.34814453125, 0.481689453125, 1.3115234375, 2.141357421875, 2.97119140625, 3.801025390625, 4.630859375, 5.460693359375, 6.29052734375, 7.120361328125, 7.9501953125, 8.780029296875, 9.60986328125, 10.439697265625, 11.26953125, 12.099365234375, 12.92919921875, 13.759033203125, 14.5888671875, 15.418701171875, 16.24853515625, 17.078369140625, 17.908203125, 18.738037109375, 19.56787109375, 20.397705078125, 21.2275390625, 22.057373046875, 22.88720703125, 23.717041015625, 24.546875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 11.0, 22.0, 27.0, 36.0, 61.0, 104.0, 132.0, 155.0, 143.0, 125.0, 70.0, 45.0, 25.0, 19.0, 10.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.69446563720703, -111.07264709472656, -107.45083618164062, -103.82901763916016, -100.20720672607422, -96.58538818359375, -92.96357727050781, -89.34175872802734, -85.7199478149414, -82.09812927246094, -78.476318359375, -74.85449981689453, -71.2326889038086, -67.61087036132812, -63.98905944824219, -60.36724090576172, -56.745426177978516, -53.12361145019531, -49.50179672241211, -45.879981994628906, -42.2581672668457, -38.6363525390625, -35.01453399658203, -31.39272117614746, -27.770906448364258, -24.149091720581055, -20.52727699279785, -16.905460357666016, -13.283646583557129, -9.66183090209961, -6.040016174316406, -2.418201446533203, 1.20361328125, 4.825428009033203, 8.447242736816406, 12.069058418273926, 15.690873146057129, 19.31268882751465, 22.93450355529785, 26.556318283081055, 30.178133010864258, 33.799949645996094, 37.4217643737793, 41.0435791015625, 44.6653938293457, 48.287208557128906, 51.90902328491211, 55.53083801269531, 59.152652740478516, 62.77446746826172, 66.39628601074219, 70.01809692382812, 73.6399154663086, 77.26172637939453, 80.883544921875, 84.50535583496094, 88.1271743774414, 91.74899291992188, 95.37080383300781, 98.99262237548828, 102.61443328857422, 106.23625183105469, 109.85806274414062, 113.4798812866211, 117.10169219970703]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 6.0, 2.0, 1.0, 2.0, 3.0, 6.0, 7.0, 8.0, 8.0, 18.0, 16.0, 18.0, 23.0, 28.0, 25.0, 22.0, 21.0, 34.0, 31.0, 38.0, 38.0, 37.0, 39.0, 34.0, 41.0, 27.0, 38.0, 41.0, 51.0, 35.0, 30.0, 38.0, 21.0, 29.0, 27.0, 17.0, 28.0, 26.0, 17.0, 10.0, 16.0, 12.0, 12.0, 6.0, 4.0, 2.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.5582389831543, -44.98756408691406, -43.41688537597656, -41.84620666503906, -40.27553176879883, -38.704856872558594, -37.134178161621094, -35.563499450683594, -33.99282455444336, -32.422149658203125, -30.851470947265625, -29.280794143676758, -27.71011734008789, -26.139440536499023, -24.568763732910156, -22.99808692932129, -21.427410125732422, -19.856733322143555, -18.286056518554688, -16.71537971496582, -15.144702911376953, -13.574026107788086, -12.003349304199219, -10.432672500610352, -8.861995697021484, -7.291318893432617, -5.72064208984375, -4.149965286254883, -2.5792884826660156, -1.0086116790771484, 0.5620651245117188, 2.132741928100586, 3.7034225463867188, 5.274099349975586, 6.844776153564453, 8.41545295715332, 9.986129760742188, 11.556806564331055, 13.127483367919922, 14.698160171508789, 16.268836975097656, 17.839513778686523, 19.41019058227539, 20.980867385864258, 22.551544189453125, 24.122220993041992, 25.69289779663086, 27.263574600219727, 28.834251403808594, 30.40492820739746, 31.975605010986328, 33.54627990722656, 35.11695861816406, 36.68763732910156, 38.2583122253418, 39.82898712158203, 41.39966583251953, 42.97034454345703, 44.541019439697266, 46.1116943359375, 47.682373046875, 49.2530517578125, 50.823726654052734, 52.39440155029297, 53.96508026123047]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 2.0, 0.0, 7.0, 9.0, 13.0, 22.0, 34.0, 35.0, 55.0, 100.0, 102.0, 233.0, 366.0, 566.0, 926.0, 1650.0, 2944.0, 5763.0, 11578.0, 24762.0, 57560.0, 148383.0, 368619.0, 255669.0, 94931.0, 39032.0, 17239.0, 8284.0, 4204.0, 2244.0, 1198.0, 752.0, 459.0, 278.0, 169.0, 122.0, 74.0, 50.0, 38.0, 24.0, 16.0, 17.0, 14.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.125, -34.91162109375, -33.6982421875, -32.48486328125, -31.271484375, -30.05810546875, -28.8447265625, -27.63134765625, -26.41796875, -25.20458984375, -23.9912109375, -22.77783203125, -21.564453125, -20.35107421875, -19.1376953125, -17.92431640625, -16.7109375, -15.49755859375, -14.2841796875, -13.07080078125, -11.857421875, -10.64404296875, -9.4306640625, -8.21728515625, -7.00390625, -5.79052734375, -4.5771484375, -3.36376953125, -2.150390625, -0.93701171875, 0.2763671875, 1.48974609375, 2.703125, 3.91650390625, 5.1298828125, 6.34326171875, 7.556640625, 8.77001953125, 9.9833984375, 11.19677734375, 12.41015625, 13.62353515625, 14.8369140625, 16.05029296875, 17.263671875, 18.47705078125, 19.6904296875, 20.90380859375, 22.1171875, 23.33056640625, 24.5439453125, 25.75732421875, 26.970703125, 28.18408203125, 29.3974609375, 30.61083984375, 31.82421875, 33.03759765625, 34.2509765625, 35.46435546875, 36.677734375, 37.89111328125, 39.1044921875, 40.31787109375, 41.53125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 8.0, 10.0, 8.0, 13.0, 28.0, 38.0, 40.0, 40.0, 47.0, 70.0, 68.0, 59.0, 66.0, 72.0, 62.0, 54.0, 66.0, 50.0, 36.0, 29.0, 33.0, 23.0, 16.0, 14.0, 8.0, 15.0, 9.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.71875, -8.4537353515625, -8.188720703125, -7.9237060546875, -7.65869140625, -7.3936767578125, -7.128662109375, -6.8636474609375, -6.5986328125, -6.3336181640625, -6.068603515625, -5.8035888671875, -5.53857421875, -5.2735595703125, -5.008544921875, -4.7435302734375, -4.478515625, -4.2135009765625, -3.948486328125, -3.6834716796875, -3.41845703125, -3.1534423828125, -2.888427734375, -2.6234130859375, -2.3583984375, -2.0933837890625, -1.828369140625, -1.5633544921875, -1.29833984375, -1.0333251953125, -0.768310546875, -0.5032958984375, -0.23828125, 0.0267333984375, 0.291748046875, 0.5567626953125, 0.82177734375, 1.0867919921875, 1.351806640625, 1.6168212890625, 1.8818359375, 2.1468505859375, 2.411865234375, 2.6768798828125, 2.94189453125, 3.2069091796875, 3.471923828125, 3.7369384765625, 4.001953125, 4.2669677734375, 4.531982421875, 4.7969970703125, 5.06201171875, 5.3270263671875, 5.592041015625, 5.8570556640625, 6.1220703125, 6.3870849609375, 6.652099609375, 6.9171142578125, 7.18212890625, 7.4471435546875, 7.712158203125, 7.9771728515625, 8.2421875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 8.0, 7.0, 8.0, 16.0, 28.0, 34.0, 42.0, 67.0, 117.0, 194.0, 280.0, 458.0, 818.0, 1335.0, 2284.0, 4323.0, 8027.0, 16583.0, 36610.0, 96332.0, 310286.0, 372038.0, 117124.0, 42833.0, 18752.0, 8981.0, 4652.0, 2597.0, 1429.0, 819.0, 512.0, 349.0, 180.0, 133.0, 100.0, 58.0, 39.0, 27.0, 18.0, 17.0, 12.0, 13.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-44.75, -43.3974609375, -42.044921875, -40.6923828125, -39.33984375, -37.9873046875, -36.634765625, -35.2822265625, -33.9296875, -32.5771484375, -31.224609375, -29.8720703125, -28.51953125, -27.1669921875, -25.814453125, -24.4619140625, -23.109375, -21.7568359375, -20.404296875, -19.0517578125, -17.69921875, -16.3466796875, -14.994140625, -13.6416015625, -12.2890625, -10.9365234375, -9.583984375, -8.2314453125, -6.87890625, -5.5263671875, -4.173828125, -2.8212890625, -1.46875, -0.1162109375, 1.236328125, 2.5888671875, 3.94140625, 5.2939453125, 6.646484375, 7.9990234375, 9.3515625, 10.7041015625, 12.056640625, 13.4091796875, 14.76171875, 16.1142578125, 17.466796875, 18.8193359375, 20.171875, 21.5244140625, 22.876953125, 24.2294921875, 25.58203125, 26.9345703125, 28.287109375, 29.6396484375, 30.9921875, 32.3447265625, 33.697265625, 35.0498046875, 36.40234375, 37.7548828125, 39.107421875, 40.4599609375, 41.8125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 12.0, 6.0, 7.0, 9.0, 10.0, 13.0, 19.0, 16.0, 23.0, 39.0, 32.0, 37.0, 46.0, 51.0, 50.0, 52.0, 57.0, 42.0, 53.0, 54.0, 48.0, 38.0, 40.0, 36.0, 29.0, 26.0, 25.0, 22.0, 24.0, 16.0, 10.0, 14.0, 15.0, 10.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.78125, -42.5419921875, -41.302734375, -40.0634765625, -38.82421875, -37.5849609375, -36.345703125, -35.1064453125, -33.8671875, -32.6279296875, -31.388671875, -30.1494140625, -28.91015625, -27.6708984375, -26.431640625, -25.1923828125, -23.953125, -22.7138671875, -21.474609375, -20.2353515625, -18.99609375, -17.7568359375, -16.517578125, -15.2783203125, -14.0390625, -12.7998046875, -11.560546875, -10.3212890625, -9.08203125, -7.8427734375, -6.603515625, -5.3642578125, -4.125, -2.8857421875, -1.646484375, -0.4072265625, 0.83203125, 2.0712890625, 3.310546875, 4.5498046875, 5.7890625, 7.0283203125, 8.267578125, 9.5068359375, 10.74609375, 11.9853515625, 13.224609375, 14.4638671875, 15.703125, 16.9423828125, 18.181640625, 19.4208984375, 20.66015625, 21.8994140625, 23.138671875, 24.3779296875, 25.6171875, 26.8564453125, 28.095703125, 29.3349609375, 30.57421875, 31.8134765625, 33.052734375, 34.2919921875, 35.53125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 14.0, 17.0, 17.0, 22.0, 17.0, 40.0, 70.0, 109.0, 131.0, 145.0, 222.0, 365.0, 493.0, 721.0, 1161.0, 1887.0, 3991.0, 11952.0, 76858.0, 765024.0, 156605.0, 17371.0, 5159.0, 2313.0, 1262.0, 818.0, 557.0, 352.0, 263.0, 182.0, 111.0, 84.0, 52.0, 46.0, 40.0, 32.0, 9.0, 17.0, 4.0, 4.0, 3.0, 6.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.4375, -39.990234375, -38.54296875, -37.095703125, -35.6484375, -34.201171875, -32.75390625, -31.306640625, -29.859375, -28.412109375, -26.96484375, -25.517578125, -24.0703125, -22.623046875, -21.17578125, -19.728515625, -18.28125, -16.833984375, -15.38671875, -13.939453125, -12.4921875, -11.044921875, -9.59765625, -8.150390625, -6.703125, -5.255859375, -3.80859375, -2.361328125, -0.9140625, 0.533203125, 1.98046875, 3.427734375, 4.875, 6.322265625, 7.76953125, 9.216796875, 10.6640625, 12.111328125, 13.55859375, 15.005859375, 16.453125, 17.900390625, 19.34765625, 20.794921875, 22.2421875, 23.689453125, 25.13671875, 26.583984375, 28.03125, 29.478515625, 30.92578125, 32.373046875, 33.8203125, 35.267578125, 36.71484375, 38.162109375, 39.609375, 41.056640625, 42.50390625, 43.951171875, 45.3984375, 46.845703125, 48.29296875, 49.740234375, 51.1875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 3.0, 21.0, 30.0, 121.0, 446.0, 253.0, 72.0, 24.0, 16.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0269775390625, -0.0263746976852417, -0.0257718563079834, -0.025169014930725098, -0.024566173553466797, -0.023963332176208496, -0.023360490798950195, -0.022757649421691895, -0.022154808044433594, -0.021551966667175293, -0.020949125289916992, -0.02034628391265869, -0.01974344253540039, -0.01914060115814209, -0.01853775978088379, -0.01793491840362549, -0.017332077026367188, -0.016729235649108887, -0.016126394271850586, -0.015523552894592285, -0.014920711517333984, -0.014317870140075684, -0.013715028762817383, -0.013112187385559082, -0.012509346008300781, -0.01190650463104248, -0.01130366325378418, -0.010700821876525879, -0.010097980499267578, -0.009495139122009277, -0.008892297744750977, -0.008289456367492676, -0.007686614990234375, -0.007083773612976074, -0.0064809322357177734, -0.005878090858459473, -0.005275249481201172, -0.004672408103942871, -0.00406956672668457, -0.0034667253494262695, -0.0028638839721679688, -0.002261042594909668, -0.0016582012176513672, -0.0010553598403930664, -0.0004525184631347656, 0.00015032291412353516, 0.0007531642913818359, 0.0013560056686401367, 0.0019588470458984375, 0.0025616884231567383, 0.003164529800415039, 0.00376737117767334, 0.004370212554931641, 0.004973053932189941, 0.005575895309448242, 0.006178736686706543, 0.006781578063964844, 0.0073844194412231445, 0.007987260818481445, 0.008590102195739746, 0.009192943572998047, 0.009795784950256348, 0.010398626327514648, 0.01100146770477295, 0.01160430908203125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 11.0, 10.0, 32.0, 33.0, 35.0, 52.0, 69.0, 103.0, 164.0, 264.0, 379.0, 594.0, 934.0, 1616.0, 3179.0, 8660.0, 45211.0, 661392.0, 289432.0, 24171.0, 5950.0, 2449.0, 1415.0, 854.0, 493.0, 342.0, 209.0, 163.0, 106.0, 65.0, 52.0, 28.0, 24.0, 11.0, 16.0, 7.0, 6.0, 7.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-56.09375, -54.611328125, -53.12890625, -51.646484375, -50.1640625, -48.681640625, -47.19921875, -45.716796875, -44.234375, -42.751953125, -41.26953125, -39.787109375, -38.3046875, -36.822265625, -35.33984375, -33.857421875, -32.375, -30.892578125, -29.41015625, -27.927734375, -26.4453125, -24.962890625, -23.48046875, -21.998046875, -20.515625, -19.033203125, -17.55078125, -16.068359375, -14.5859375, -13.103515625, -11.62109375, -10.138671875, -8.65625, -7.173828125, -5.69140625, -4.208984375, -2.7265625, -1.244140625, 0.23828125, 1.720703125, 3.203125, 4.685546875, 6.16796875, 7.650390625, 9.1328125, 10.615234375, 12.09765625, 13.580078125, 15.0625, 16.544921875, 18.02734375, 19.509765625, 20.9921875, 22.474609375, 23.95703125, 25.439453125, 26.921875, 28.404296875, 29.88671875, 31.369140625, 32.8515625, 34.333984375, 35.81640625, 37.298828125, 38.78125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 8.0, 4.0, 11.0, 19.0, 27.0, 46.0, 66.0, 112.0, 168.0, 176.0, 132.0, 85.0, 54.0, 24.0, 22.0, 17.0, 8.0, 6.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-38.09375, -37.0986328125, -36.103515625, -35.1083984375, -34.11328125, -33.1181640625, -32.123046875, -31.1279296875, -30.1328125, -29.1376953125, -28.142578125, -27.1474609375, -26.15234375, -25.1572265625, -24.162109375, -23.1669921875, -22.171875, -21.1767578125, -20.181640625, -19.1865234375, -18.19140625, -17.1962890625, -16.201171875, -15.2060546875, -14.2109375, -13.2158203125, -12.220703125, -11.2255859375, -10.23046875, -9.2353515625, -8.240234375, -7.2451171875, -6.25, -5.2548828125, -4.259765625, -3.2646484375, -2.26953125, -1.2744140625, -0.279296875, 0.7158203125, 1.7109375, 2.7060546875, 3.701171875, 4.6962890625, 5.69140625, 6.6865234375, 7.681640625, 8.6767578125, 9.671875, 10.6669921875, 11.662109375, 12.6572265625, 13.65234375, 14.6474609375, 15.642578125, 16.6376953125, 17.6328125, 18.6279296875, 19.623046875, 20.6181640625, 21.61328125, 22.6083984375, 23.603515625, 24.5986328125, 25.59375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 7.0, 8.0, 9.0, 14.0, 18.0, 21.0, 38.0, 35.0, 48.0, 62.0, 87.0, 103.0, 91.0, 93.0, 76.0, 68.0, 56.0, 40.0, 25.0, 25.0, 25.0, 13.0, 9.0, 7.0, 2.0, 6.0, 3.0, 7.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-176.0668182373047, -168.53146362304688, -160.99612426757812, -153.4607696533203, -145.9254150390625, -138.39007568359375, -130.85472106933594, -123.31936645507812, -115.78401947021484, -108.24867248535156, -100.71331787109375, -93.17797088623047, -85.64262390136719, -78.10726928710938, -70.5719223022461, -63.03657150268555, -55.501220703125, -47.96586990356445, -40.430519104003906, -32.895172119140625, -25.359821319580078, -17.82447052001953, -10.28912353515625, -2.753772735595703, 4.781578063964844, 12.316927909851074, 19.852277755737305, 27.38762664794922, 34.922977447509766, 42.45832824707031, 49.993675231933594, 57.52902603149414, 65.06439208984375, 72.59973907470703, 80.13509368896484, 87.67044067382812, 95.20579528808594, 102.74114227294922, 110.2764892578125, 117.81184387207031, 125.3471908569336, 132.88253784179688, 140.4178924560547, 147.9532470703125, 155.48858642578125, 163.02394104003906, 170.55929565429688, 178.09463500976562, 185.62998962402344, 193.16534423828125, 200.70068359375, 208.2360382080078, 215.77139282226562, 223.30673217773438, 230.8420867919922, 238.37744140625, 245.91278076171875, 253.44813537597656, 260.9834899902344, 268.5188293457031, 276.0541687011719, 283.58953857421875, 291.1248779296875, 298.66021728515625, 306.1955871582031]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 4.0, 5.0, 5.0, 6.0, 8.0, 11.0, 18.0, 12.0, 22.0, 22.0, 21.0, 29.0, 31.0, 38.0, 46.0, 32.0, 36.0, 47.0, 39.0, 58.0, 45.0, 59.0, 31.0, 37.0, 32.0, 51.0, 32.0, 35.0, 30.0, 21.0, 30.0, 19.0, 17.0, 13.0, 13.0, 5.0, 5.0, 12.0, 9.0, 6.0, 1.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-201.77781677246094, -195.5265350341797, -189.27525329589844, -183.0239715576172, -176.77268981933594, -170.52142333984375, -164.2701416015625, -158.01885986328125, -151.767578125, -145.51629638671875, -139.2650146484375, -133.01373291015625, -126.76245880126953, -120.51117706298828, -114.25989532470703, -108.00862121582031, -101.75733184814453, -95.50605010986328, -89.25476837158203, -83.00349426269531, -76.75221252441406, -70.50093078613281, -64.24964904785156, -57.99837112426758, -51.74708938598633, -45.49580764770508, -39.244529724121094, -32.993247985839844, -26.741968154907227, -20.49068832397461, -14.23940658569336, -7.988128662109375, -1.736846923828125, 4.51443338394165, 10.765713691711426, 17.01699447631836, 23.268274307250977, 29.519554138183594, 35.770835876464844, 42.02211380004883, 48.27339553833008, 54.52467727661133, 60.77595520019531, 67.02723693847656, 73.27851867675781, 79.52980041503906, 85.78108215332031, 92.03235626220703, 98.28363800048828, 104.53491973876953, 110.78620147705078, 117.0374755859375, 123.28875732421875, 129.5400390625, 135.79132080078125, 142.0426025390625, 148.29388427734375, 154.545166015625, 160.79644775390625, 167.0477294921875, 173.29901123046875, 179.55029296875, 185.80157470703125, 192.05284118652344, 198.3041229248047]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 2.0, 8.0, 12.0, 11.0, 20.0, 34.0, 41.0, 77.0, 116.0, 178.0, 297.0, 564.0, 993.0, 2302.0, 5913.0, 20776.0, 162451.0, 3920404.0, 60440.0, 12126.0, 4065.0, 1609.0, 817.0, 401.0, 227.0, 134.0, 87.0, 68.0, 37.0, 23.0, 16.0, 11.0, 10.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-101.5, -98.541015625, -95.58203125, -92.623046875, -89.6640625, -86.705078125, -83.74609375, -80.787109375, -77.828125, -74.869140625, -71.91015625, -68.951171875, -65.9921875, -63.033203125, -60.07421875, -57.115234375, -54.15625, -51.197265625, -48.23828125, -45.279296875, -42.3203125, -39.361328125, -36.40234375, -33.443359375, -30.484375, -27.525390625, -24.56640625, -21.607421875, -18.6484375, -15.689453125, -12.73046875, -9.771484375, -6.8125, -3.853515625, -0.89453125, 2.064453125, 5.0234375, 7.982421875, 10.94140625, 13.900390625, 16.859375, 19.818359375, 22.77734375, 25.736328125, 28.6953125, 31.654296875, 34.61328125, 37.572265625, 40.53125, 43.490234375, 46.44921875, 49.408203125, 52.3671875, 55.326171875, 58.28515625, 61.244140625, 64.203125, 67.162109375, 70.12109375, 73.080078125, 76.0390625, 78.998046875, 81.95703125, 84.916015625, 87.875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 18.0, 22.0, 22.0, 23.0, 20.0, 36.0, 39.0, 44.0, 51.0, 55.0, 63.0, 52.0, 55.0, 67.0, 43.0, 58.0, 51.0, 39.0, 36.0, 42.0, 28.0, 20.0, 18.0, 16.0, 12.0, 18.0, 14.0, 7.0, 5.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.3671875, -8.11834716796875, -7.8695068359375, -7.62066650390625, -7.371826171875, -7.12298583984375, -6.8741455078125, -6.62530517578125, -6.37646484375, -6.12762451171875, -5.8787841796875, -5.62994384765625, -5.381103515625, -5.13226318359375, -4.8834228515625, -4.63458251953125, -4.3857421875, -4.13690185546875, -3.8880615234375, -3.63922119140625, -3.390380859375, -3.14154052734375, -2.8927001953125, -2.64385986328125, -2.39501953125, -2.14617919921875, -1.8973388671875, -1.64849853515625, -1.399658203125, -1.15081787109375, -0.9019775390625, -0.65313720703125, -0.404296875, -0.15545654296875, 0.0933837890625, 0.34222412109375, 0.591064453125, 0.83990478515625, 1.0887451171875, 1.33758544921875, 1.58642578125, 1.83526611328125, 2.0841064453125, 2.33294677734375, 2.581787109375, 2.83062744140625, 3.0794677734375, 3.32830810546875, 3.5771484375, 3.82598876953125, 4.0748291015625, 4.32366943359375, 4.572509765625, 4.82135009765625, 5.0701904296875, 5.31903076171875, 5.56787109375, 5.81671142578125, 6.0655517578125, 6.31439208984375, 6.563232421875, 6.81207275390625, 7.0609130859375, 7.30975341796875, 7.55859375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 4.0, 11.0, 12.0, 15.0, 18.0, 32.0, 50.0, 65.0, 104.0, 143.0, 264.0, 345.0, 683.0, 1351.0, 2935.0, 8085.0, 30215.0, 251723.0, 3780167.0, 91730.0, 17007.0, 5146.0, 2133.0, 929.0, 459.0, 270.0, 153.0, 93.0, 45.0, 31.0, 18.0, 18.0, 9.0, 11.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-112.625, -109.60546875, -106.5859375, -103.56640625, -100.546875, -97.52734375, -94.5078125, -91.48828125, -88.46875, -85.44921875, -82.4296875, -79.41015625, -76.390625, -73.37109375, -70.3515625, -67.33203125, -64.3125, -61.29296875, -58.2734375, -55.25390625, -52.234375, -49.21484375, -46.1953125, -43.17578125, -40.15625, -37.13671875, -34.1171875, -31.09765625, -28.078125, -25.05859375, -22.0390625, -19.01953125, -16.0, -12.98046875, -9.9609375, -6.94140625, -3.921875, -0.90234375, 2.1171875, 5.13671875, 8.15625, 11.17578125, 14.1953125, 17.21484375, 20.234375, 23.25390625, 26.2734375, 29.29296875, 32.3125, 35.33203125, 38.3515625, 41.37109375, 44.390625, 47.41015625, 50.4296875, 53.44921875, 56.46875, 59.48828125, 62.5078125, 65.52734375, 68.546875, 71.56640625, 74.5859375, 77.60546875, 80.625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 8.0, 9.0, 3.0, 15.0, 12.0, 24.0, 37.0, 64.0, 91.0, 179.0, 726.0, 2322.0, 237.0, 125.0, 63.0, 54.0, 37.0, 12.0, 13.0, 4.0, 5.0, 10.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-27.625, -26.953369140625, -26.28173828125, -25.610107421875, -24.9384765625, -24.266845703125, -23.59521484375, -22.923583984375, -22.251953125, -21.580322265625, -20.90869140625, -20.237060546875, -19.5654296875, -18.893798828125, -18.22216796875, -17.550537109375, -16.87890625, -16.207275390625, -15.53564453125, -14.864013671875, -14.1923828125, -13.520751953125, -12.84912109375, -12.177490234375, -11.505859375, -10.834228515625, -10.16259765625, -9.490966796875, -8.8193359375, -8.147705078125, -7.47607421875, -6.804443359375, -6.1328125, -5.461181640625, -4.78955078125, -4.117919921875, -3.4462890625, -2.774658203125, -2.10302734375, -1.431396484375, -0.759765625, -0.088134765625, 0.58349609375, 1.255126953125, 1.9267578125, 2.598388671875, 3.27001953125, 3.941650390625, 4.61328125, 5.284912109375, 5.95654296875, 6.628173828125, 7.2998046875, 7.971435546875, 8.64306640625, 9.314697265625, 9.986328125, 10.657958984375, 11.32958984375, 12.001220703125, 12.6728515625, 13.344482421875, 14.01611328125, 14.687744140625, 15.359375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 7.0, 11.0, 16.0, 43.0, 60.0, 77.0, 106.0, 162.0, 174.0, 128.0, 89.0, 52.0, 29.0, 14.0, 16.0, 7.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.265480041503906, -59.545352935791016, -55.82522201538086, -52.10509490966797, -48.38496398925781, -44.66483688354492, -40.94470977783203, -37.224578857421875, -33.504451751708984, -29.78432273864746, -26.064193725585938, -22.344066619873047, -18.623937606811523, -14.90380859375, -11.18368148803711, -7.463552474975586, -3.7434234619140625, -0.023294925689697266, 3.696833610534668, 7.416961669921875, 11.137090682983398, 14.857219696044922, 18.577346801757812, 22.297475814819336, 26.01760482788086, 29.737733840942383, 33.457862854003906, 37.1779899597168, 40.89811706542969, 44.618247985839844, 48.338375091552734, 52.058502197265625, 55.77862548828125, 59.49875259399414, 63.2188835144043, 66.93901062011719, 70.65914154052734, 74.3792724609375, 78.09939575195312, 81.81952667236328, 85.53965759277344, 89.2597885131836, 92.97991180419922, 96.70004272460938, 100.42017364501953, 104.14030456542969, 107.86042785644531, 111.58055877685547, 115.3006820678711, 119.02081298828125, 122.74093627929688, 126.46106719970703, 130.1811981201172, 133.9013214111328, 137.6214599609375, 141.34158325195312, 145.06170654296875, 148.78182983398438, 152.50196838378906, 156.2220916748047, 159.9422149658203, 163.662353515625, 167.38247680664062, 171.10260009765625, 174.82273864746094]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 12.0, 5.0, 11.0, 13.0, 15.0, 14.0, 19.0, 18.0, 28.0, 28.0, 32.0, 31.0, 28.0, 39.0, 42.0, 38.0, 35.0, 39.0, 41.0, 37.0, 30.0, 43.0, 41.0, 24.0, 44.0, 34.0, 28.0, 33.0, 23.0, 28.0, 26.0, 16.0, 15.0, 9.0, 13.0, 9.0, 14.0, 9.0, 4.0, 6.0, 5.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.437034606933594, -45.999656677246094, -44.562278747558594, -43.124900817871094, -41.687522888183594, -40.250144958496094, -38.812767028808594, -37.375389099121094, -35.938011169433594, -34.500633239746094, -33.063255310058594, -31.625877380371094, -30.188499450683594, -28.751121520996094, -27.313745498657227, -25.876367568969727, -24.43899154663086, -23.00161361694336, -21.56423568725586, -20.12685775756836, -18.68947982788086, -17.25210189819336, -15.814725875854492, -14.377347946166992, -12.939970016479492, -11.502592086791992, -10.065214157104492, -8.627837181091309, -7.190459251403809, -5.753081321716309, -4.315704345703125, -2.878326416015625, -1.440948486328125, -0.0035707950592041016, 1.4338068962097168, 2.8711843490600586, 4.308562278747559, 5.745940208435059, 7.183317184448242, 8.620695114135742, 10.058073043823242, 11.495450973510742, 12.932828903198242, 14.370205879211426, 15.807583808898926, 17.24496078491211, 18.68233871459961, 20.11971664428711, 21.55709457397461, 22.99447250366211, 24.43185043334961, 25.86922836303711, 27.30660629272461, 28.74398422241211, 30.181360244750977, 31.618738174438477, 33.056114196777344, 34.493492126464844, 35.930870056152344, 37.368247985839844, 38.805625915527344, 40.243003845214844, 41.680381774902344, 43.117759704589844, 44.555137634277344]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 15.0, 9.0, 17.0, 20.0, 31.0, 42.0, 60.0, 102.0, 126.0, 185.0, 319.0, 436.0, 694.0, 1026.0, 1598.0, 2609.0, 4432.0, 7734.0, 13947.0, 26872.0, 55572.0, 121814.0, 269241.0, 287012.0, 131082.0, 59679.0, 28649.0, 14827.0, 8101.0, 4649.0, 2795.0, 1693.0, 1090.0, 689.0, 401.0, 327.0, 204.0, 125.0, 104.0, 64.0, 51.0, 29.0, 24.0, 21.0, 12.0, 9.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-33.3125, -32.304443359375, -31.29638671875, -30.288330078125, -29.2802734375, -28.272216796875, -27.26416015625, -26.256103515625, -25.248046875, -24.239990234375, -23.23193359375, -22.223876953125, -21.2158203125, -20.207763671875, -19.19970703125, -18.191650390625, -17.18359375, -16.175537109375, -15.16748046875, -14.159423828125, -13.1513671875, -12.143310546875, -11.13525390625, -10.127197265625, -9.119140625, -8.111083984375, -7.10302734375, -6.094970703125, -5.0869140625, -4.078857421875, -3.07080078125, -2.062744140625, -1.0546875, -0.046630859375, 0.96142578125, 1.969482421875, 2.9775390625, 3.985595703125, 4.99365234375, 6.001708984375, 7.009765625, 8.017822265625, 9.02587890625, 10.033935546875, 11.0419921875, 12.050048828125, 13.05810546875, 14.066162109375, 15.07421875, 16.082275390625, 17.09033203125, 18.098388671875, 19.1064453125, 20.114501953125, 21.12255859375, 22.130615234375, 23.138671875, 24.146728515625, 25.15478515625, 26.162841796875, 27.1708984375, 28.178955078125, 29.18701171875, 30.195068359375, 31.203125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 0.0, 3.0, 6.0, 5.0, 7.0, 4.0, 12.0, 17.0, 14.0, 25.0, 22.0, 21.0, 28.0, 31.0, 39.0, 38.0, 37.0, 47.0, 38.0, 45.0, 43.0, 51.0, 42.0, 47.0, 41.0, 43.0, 33.0, 27.0, 23.0, 41.0, 37.0, 23.0, 27.0, 12.0, 9.0, 16.0, 3.0, 12.0, 10.0, 3.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.828125, -6.62347412109375, -6.4188232421875, -6.21417236328125, -6.009521484375, -5.80487060546875, -5.6002197265625, -5.39556884765625, -5.19091796875, -4.98626708984375, -4.7816162109375, -4.57696533203125, -4.372314453125, -4.16766357421875, -3.9630126953125, -3.75836181640625, -3.5537109375, -3.34906005859375, -3.1444091796875, -2.93975830078125, -2.735107421875, -2.53045654296875, -2.3258056640625, -2.12115478515625, -1.91650390625, -1.71185302734375, -1.5072021484375, -1.30255126953125, -1.097900390625, -0.89324951171875, -0.6885986328125, -0.48394775390625, -0.279296875, -0.07464599609375, 0.1300048828125, 0.33465576171875, 0.539306640625, 0.74395751953125, 0.9486083984375, 1.15325927734375, 1.35791015625, 1.56256103515625, 1.7672119140625, 1.97186279296875, 2.176513671875, 2.38116455078125, 2.5858154296875, 2.79046630859375, 2.9951171875, 3.19976806640625, 3.4044189453125, 3.60906982421875, 3.813720703125, 4.01837158203125, 4.2230224609375, 4.42767333984375, 4.63232421875, 4.83697509765625, 5.0416259765625, 5.24627685546875, 5.450927734375, 5.65557861328125, 5.8602294921875, 6.06488037109375, 6.26953125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 12.0, 13.0, 25.0, 19.0, 57.0, 71.0, 121.0, 206.0, 325.0, 723.0, 1420.0, 3420.0, 9279.0, 30119.0, 123839.0, 523893.0, 270807.0, 58135.0, 16382.0, 5491.0, 2176.0, 914.0, 496.0, 260.0, 127.0, 70.0, 58.0, 33.0, 22.0, 11.0, 8.0, 8.0, 4.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.625, -49.94580078125, -48.2666015625, -46.58740234375, -44.908203125, -43.22900390625, -41.5498046875, -39.87060546875, -38.19140625, -36.51220703125, -34.8330078125, -33.15380859375, -31.474609375, -29.79541015625, -28.1162109375, -26.43701171875, -24.7578125, -23.07861328125, -21.3994140625, -19.72021484375, -18.041015625, -16.36181640625, -14.6826171875, -13.00341796875, -11.32421875, -9.64501953125, -7.9658203125, -6.28662109375, -4.607421875, -2.92822265625, -1.2490234375, 0.43017578125, 2.109375, 3.78857421875, 5.4677734375, 7.14697265625, 8.826171875, 10.50537109375, 12.1845703125, 13.86376953125, 15.54296875, 17.22216796875, 18.9013671875, 20.58056640625, 22.259765625, 23.93896484375, 25.6181640625, 27.29736328125, 28.9765625, 30.65576171875, 32.3349609375, 34.01416015625, 35.693359375, 37.37255859375, 39.0517578125, 40.73095703125, 42.41015625, 44.08935546875, 45.7685546875, 47.44775390625, 49.126953125, 50.80615234375, 52.4853515625, 54.16455078125, 55.84375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 7.0, 5.0, 9.0, 12.0, 13.0, 19.0, 36.0, 20.0, 31.0, 43.0, 44.0, 53.0, 47.0, 58.0, 51.0, 72.0, 66.0, 63.0, 59.0, 54.0, 45.0, 45.0, 46.0, 23.0, 15.0, 10.0, 14.0, 12.0, 17.0, 8.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.6875, -41.357421875, -40.02734375, -38.697265625, -37.3671875, -36.037109375, -34.70703125, -33.376953125, -32.046875, -30.716796875, -29.38671875, -28.056640625, -26.7265625, -25.396484375, -24.06640625, -22.736328125, -21.40625, -20.076171875, -18.74609375, -17.416015625, -16.0859375, -14.755859375, -13.42578125, -12.095703125, -10.765625, -9.435546875, -8.10546875, -6.775390625, -5.4453125, -4.115234375, -2.78515625, -1.455078125, -0.125, 1.205078125, 2.53515625, 3.865234375, 5.1953125, 6.525390625, 7.85546875, 9.185546875, 10.515625, 11.845703125, 13.17578125, 14.505859375, 15.8359375, 17.166015625, 18.49609375, 19.826171875, 21.15625, 22.486328125, 23.81640625, 25.146484375, 26.4765625, 27.806640625, 29.13671875, 30.466796875, 31.796875, 33.126953125, 34.45703125, 35.787109375, 37.1171875, 38.447265625, 39.77734375, 41.107421875, 42.4375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 10.0, 16.0, 18.0, 23.0, 35.0, 53.0, 87.0, 119.0, 149.0, 222.0, 337.0, 545.0, 746.0, 1187.0, 1968.0, 3286.0, 5846.0, 12178.0, 29283.0, 95436.0, 437259.0, 338813.0, 73265.0, 24144.0, 10299.0, 5104.0, 2941.0, 1706.0, 1115.0, 711.0, 493.0, 329.0, 235.0, 180.0, 120.0, 63.0, 75.0, 40.0, 29.0, 23.0, 23.0, 18.0, 8.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-21.109375, -20.42626953125, -19.7431640625, -19.06005859375, -18.376953125, -17.69384765625, -17.0107421875, -16.32763671875, -15.64453125, -14.96142578125, -14.2783203125, -13.59521484375, -12.912109375, -12.22900390625, -11.5458984375, -10.86279296875, -10.1796875, -9.49658203125, -8.8134765625, -8.13037109375, -7.447265625, -6.76416015625, -6.0810546875, -5.39794921875, -4.71484375, -4.03173828125, -3.3486328125, -2.66552734375, -1.982421875, -1.29931640625, -0.6162109375, 0.06689453125, 0.75, 1.43310546875, 2.1162109375, 2.79931640625, 3.482421875, 4.16552734375, 4.8486328125, 5.53173828125, 6.21484375, 6.89794921875, 7.5810546875, 8.26416015625, 8.947265625, 9.63037109375, 10.3134765625, 10.99658203125, 11.6796875, 12.36279296875, 13.0458984375, 13.72900390625, 14.412109375, 15.09521484375, 15.7783203125, 16.46142578125, 17.14453125, 17.82763671875, 18.5107421875, 19.19384765625, 19.876953125, 20.56005859375, 21.2431640625, 21.92626953125, 22.609375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 8.0, 8.0, 11.0, 30.0, 41.0, 52.0, 98.0, 204.0, 197.0, 132.0, 94.0, 38.0, 25.0, 18.0, 12.0, 11.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0107421875, -0.010418534278869629, -0.010094881057739258, -0.009771227836608887, -0.009447574615478516, -0.009123921394348145, -0.008800268173217773, -0.008476614952087402, -0.008152961730957031, -0.00782930850982666, -0.007505655288696289, -0.007182002067565918, -0.006858348846435547, -0.006534695625305176, -0.006211042404174805, -0.005887389183044434, -0.0055637359619140625, -0.005240082740783691, -0.00491642951965332, -0.004592776298522949, -0.004269123077392578, -0.003945469856262207, -0.003621816635131836, -0.003298163414001465, -0.0029745101928710938, -0.0026508569717407227, -0.0023272037506103516, -0.0020035505294799805, -0.0016798973083496094, -0.0013562440872192383, -0.0010325908660888672, -0.0007089376449584961, -0.000385284423828125, -6.16312026977539e-05, 0.0002620220184326172, 0.0005856752395629883, 0.0009093284606933594, 0.0012329816818237305, 0.0015566349029541016, 0.0018802881240844727, 0.0022039413452148438, 0.002527594566345215, 0.002851247787475586, 0.003174901008605957, 0.003498554229736328, 0.0038222074508666992, 0.00414586067199707, 0.004469513893127441, 0.0047931671142578125, 0.005116820335388184, 0.005440473556518555, 0.005764126777648926, 0.006087779998779297, 0.006411433219909668, 0.006735086441040039, 0.00705873966217041, 0.007382392883300781, 0.007706046104431152, 0.008029699325561523, 0.008353352546691895, 0.008677005767822266, 0.009000658988952637, 0.009324312210083008, 0.009647965431213379, 0.00997161865234375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 7.0, 5.0, 7.0, 9.0, 11.0, 23.0, 27.0, 36.0, 73.0, 110.0, 139.0, 259.0, 445.0, 693.0, 1299.0, 2448.0, 5251.0, 13152.0, 43899.0, 331098.0, 551898.0, 67068.0, 17310.0, 6610.0, 3000.0, 1525.0, 867.0, 476.0, 301.0, 176.0, 103.0, 91.0, 47.0, 22.0, 26.0, 12.0, 13.0, 5.0, 11.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.0625, -36.007568359375, -34.95263671875, -33.897705078125, -32.8427734375, -31.787841796875, -30.73291015625, -29.677978515625, -28.623046875, -27.568115234375, -26.51318359375, -25.458251953125, -24.4033203125, -23.348388671875, -22.29345703125, -21.238525390625, -20.18359375, -19.128662109375, -18.07373046875, -17.018798828125, -15.9638671875, -14.908935546875, -13.85400390625, -12.799072265625, -11.744140625, -10.689208984375, -9.63427734375, -8.579345703125, -7.5244140625, -6.469482421875, -5.41455078125, -4.359619140625, -3.3046875, -2.249755859375, -1.19482421875, -0.139892578125, 0.9150390625, 1.969970703125, 3.02490234375, 4.079833984375, 5.134765625, 6.189697265625, 7.24462890625, 8.299560546875, 9.3544921875, 10.409423828125, 11.46435546875, 12.519287109375, 13.57421875, 14.629150390625, 15.68408203125, 16.739013671875, 17.7939453125, 18.848876953125, 19.90380859375, 20.958740234375, 22.013671875, 23.068603515625, 24.12353515625, 25.178466796875, 26.2333984375, 27.288330078125, 28.34326171875, 29.398193359375, 30.453125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 6.0, 6.0, 9.0, 16.0, 19.0, 22.0, 39.0, 66.0, 85.0, 111.0, 126.0, 142.0, 109.0, 79.0, 46.0, 31.0, 24.0, 18.0, 12.0, 6.0, 5.0, 5.0, 1.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.96875, -28.182373046875, -27.39599609375, -26.609619140625, -25.8232421875, -25.036865234375, -24.25048828125, -23.464111328125, -22.677734375, -21.891357421875, -21.10498046875, -20.318603515625, -19.5322265625, -18.745849609375, -17.95947265625, -17.173095703125, -16.38671875, -15.600341796875, -14.81396484375, -14.027587890625, -13.2412109375, -12.454833984375, -11.66845703125, -10.882080078125, -10.095703125, -9.309326171875, -8.52294921875, -7.736572265625, -6.9501953125, -6.163818359375, -5.37744140625, -4.591064453125, -3.8046875, -3.018310546875, -2.23193359375, -1.445556640625, -0.6591796875, 0.127197265625, 0.91357421875, 1.699951171875, 2.486328125, 3.272705078125, 4.05908203125, 4.845458984375, 5.6318359375, 6.418212890625, 7.20458984375, 7.990966796875, 8.77734375, 9.563720703125, 10.35009765625, 11.136474609375, 11.9228515625, 12.709228515625, 13.49560546875, 14.281982421875, 15.068359375, 15.854736328125, 16.64111328125, 17.427490234375, 18.2138671875, 19.000244140625, 19.78662109375, 20.572998046875, 21.359375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 10.0, 30.0, 55.0, 90.0, 123.0, 173.0, 175.0, 151.0, 92.0, 44.0, 31.0, 12.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-419.60833740234375, -406.0770568847656, -392.5458068847656, -379.0145263671875, -365.4832458496094, -351.95196533203125, -338.42071533203125, -324.8894348144531, -311.358154296875, -297.8268737792969, -284.2956237792969, -270.76434326171875, -257.2330627441406, -243.70179748535156, -230.1705322265625, -216.63925170898438, -203.10800170898438, -189.5767364501953, -176.0454559326172, -162.51419067382812, -148.98291015625, -135.45164489746094, -121.92037963867188, -108.38910675048828, -94.85783386230469, -81.3265609741211, -67.7952880859375, -54.26402282714844, -40.732749938964844, -27.20147705078125, -13.670211791992188, -0.13893890380859375, 13.392333984375, 26.92360496520996, 40.45487594604492, 53.98614501953125, 67.51741790771484, 81.04869079589844, 94.5799560546875, 108.1112289428711, 121.64250183105469, 135.17376708984375, 148.70504760742188, 162.23631286621094, 175.767578125, 189.29885864257812, 202.8301239013672, 216.36138916015625, 229.89266967773438, 243.42393493652344, 256.9552001953125, 270.4864807128906, 284.01776123046875, 297.54901123046875, 311.0802917480469, 324.611572265625, 338.142822265625, 351.6741027832031, 365.2053527832031, 378.73663330078125, 392.2679138183594, 405.7991943359375, 419.3304443359375, 432.8617248535156, 446.39300537109375]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 6.0, 7.0, 6.0, 8.0, 9.0, 7.0, 17.0, 17.0, 18.0, 25.0, 28.0, 38.0, 36.0, 32.0, 36.0, 46.0, 38.0, 39.0, 51.0, 29.0, 50.0, 39.0, 48.0, 40.0, 36.0, 36.0, 27.0, 31.0, 27.0, 19.0, 17.0, 27.0, 15.0, 18.0, 10.0, 15.0, 8.0, 8.0, 9.0, 3.0, 4.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-155.17877197265625, -149.85716247558594, -144.5355682373047, -139.21395874023438, -133.89234924316406, -128.57073974609375, -123.2491455078125, -117.92753601074219, -112.6059341430664, -107.28433227539062, -101.96272277832031, -96.64112091064453, -91.31951904296875, -85.99790954589844, -80.67630767822266, -75.35470581054688, -70.03309631347656, -64.71149444580078, -59.38988494873047, -54.06828308105469, -48.74667739868164, -43.425071716308594, -38.10346984863281, -32.781864166259766, -27.46025848388672, -22.138652801513672, -16.817049026489258, -11.495444297790527, -6.173839569091797, -0.85223388671875, 4.469369888305664, 9.790973663330078, 15.112564086914062, 20.43416976928711, 25.755773544311523, 31.077377319335938, 36.398983001708984, 41.72058868408203, 47.04219055175781, 52.36379623413086, 57.685401916503906, 63.00700759887695, 68.32861328125, 73.65021514892578, 78.97181701660156, 84.29342651367188, 89.61502838134766, 94.93663024902344, 100.25823974609375, 105.57984161376953, 110.90145111083984, 116.22305297851562, 121.54466247558594, 126.86626434326172, 132.1878662109375, 137.5094757080078, 142.83108520507812, 148.15269470214844, 153.4742889404297, 158.7958984375, 164.1175079345703, 169.43911743164062, 174.76071166992188, 180.0823211669922, 185.40391540527344]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 9.0, 10.0, 13.0, 11.0, 19.0, 28.0, 43.0, 45.0, 79.0, 109.0, 132.0, 177.0, 315.0, 436.0, 661.0, 1042.0, 1773.0, 2896.0, 5403.0, 11295.0, 26660.0, 84689.0, 2448620.0, 1475847.0, 84464.0, 26111.0, 10902.0, 5448.0, 2827.0, 1657.0, 932.0, 539.0, 364.0, 236.0, 130.0, 117.0, 78.0, 44.0, 29.0, 20.0, 23.0, 10.0, 8.0, 7.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-52.96875, -51.36328125, -49.7578125, -48.15234375, -46.546875, -44.94140625, -43.3359375, -41.73046875, -40.125, -38.51953125, -36.9140625, -35.30859375, -33.703125, -32.09765625, -30.4921875, -28.88671875, -27.28125, -25.67578125, -24.0703125, -22.46484375, -20.859375, -19.25390625, -17.6484375, -16.04296875, -14.4375, -12.83203125, -11.2265625, -9.62109375, -8.015625, -6.41015625, -4.8046875, -3.19921875, -1.59375, 0.01171875, 1.6171875, 3.22265625, 4.828125, 6.43359375, 8.0390625, 9.64453125, 11.25, 12.85546875, 14.4609375, 16.06640625, 17.671875, 19.27734375, 20.8828125, 22.48828125, 24.09375, 25.69921875, 27.3046875, 28.91015625, 30.515625, 32.12109375, 33.7265625, 35.33203125, 36.9375, 38.54296875, 40.1484375, 41.75390625, 43.359375, 44.96484375, 46.5703125, 48.17578125, 49.78125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 10.0, 8.0, 9.0, 18.0, 20.0, 11.0, 15.0, 25.0, 25.0, 30.0, 55.0, 44.0, 40.0, 52.0, 40.0, 57.0, 60.0, 44.0, 59.0, 48.0, 36.0, 43.0, 39.0, 35.0, 29.0, 26.0, 22.0, 18.0, 12.0, 19.0, 9.0, 10.0, 9.0, 7.0, 2.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.6875, -7.45819091796875, -7.2288818359375, -6.99957275390625, -6.770263671875, -6.54095458984375, -6.3116455078125, -6.08233642578125, -5.85302734375, -5.62371826171875, -5.3944091796875, -5.16510009765625, -4.935791015625, -4.70648193359375, -4.4771728515625, -4.24786376953125, -4.0185546875, -3.78924560546875, -3.5599365234375, -3.33062744140625, -3.101318359375, -2.87200927734375, -2.6427001953125, -2.41339111328125, -2.18408203125, -1.95477294921875, -1.7254638671875, -1.49615478515625, -1.266845703125, -1.03753662109375, -0.8082275390625, -0.57891845703125, -0.349609375, -0.12030029296875, 0.1090087890625, 0.33831787109375, 0.567626953125, 0.79693603515625, 1.0262451171875, 1.25555419921875, 1.48486328125, 1.71417236328125, 1.9434814453125, 2.17279052734375, 2.402099609375, 2.63140869140625, 2.8607177734375, 3.09002685546875, 3.3193359375, 3.54864501953125, 3.7779541015625, 4.00726318359375, 4.236572265625, 4.46588134765625, 4.6951904296875, 4.92449951171875, 5.15380859375, 5.38311767578125, 5.6124267578125, 5.84173583984375, 6.071044921875, 6.30035400390625, 6.5296630859375, 6.75897216796875, 6.98828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 11.0, 13.0, 23.0, 34.0, 72.0, 122.0, 188.0, 373.0, 634.0, 1372.0, 2958.0, 7501.0, 22356.0, 100530.0, 3363580.0, 607953.0, 60733.0, 15602.0, 5560.0, 2393.0, 1086.0, 535.0, 272.0, 146.0, 90.0, 71.0, 31.0, 17.0, 5.0, 11.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-72.125, -69.708984375, -67.29296875, -64.876953125, -62.4609375, -60.044921875, -57.62890625, -55.212890625, -52.796875, -50.380859375, -47.96484375, -45.548828125, -43.1328125, -40.716796875, -38.30078125, -35.884765625, -33.46875, -31.052734375, -28.63671875, -26.220703125, -23.8046875, -21.388671875, -18.97265625, -16.556640625, -14.140625, -11.724609375, -9.30859375, -6.892578125, -4.4765625, -2.060546875, 0.35546875, 2.771484375, 5.1875, 7.603515625, 10.01953125, 12.435546875, 14.8515625, 17.267578125, 19.68359375, 22.099609375, 24.515625, 26.931640625, 29.34765625, 31.763671875, 34.1796875, 36.595703125, 39.01171875, 41.427734375, 43.84375, 46.259765625, 48.67578125, 51.091796875, 53.5078125, 55.923828125, 58.33984375, 60.755859375, 63.171875, 65.587890625, 68.00390625, 70.419921875, 72.8359375, 75.251953125, 77.66796875, 80.083984375, 82.5]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 4.0, 5.0, 12.0, 11.0, 13.0, 14.0, 17.0, 26.0, 52.0, 58.0, 91.0, 122.0, 237.0, 716.0, 1842.0, 324.0, 168.0, 111.0, 66.0, 52.0, 21.0, 25.0, 13.0, 12.0, 14.0, 13.0, 7.0, 6.0, 4.0, 4.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.671875, -19.9384765625, -19.205078125, -18.4716796875, -17.73828125, -17.0048828125, -16.271484375, -15.5380859375, -14.8046875, -14.0712890625, -13.337890625, -12.6044921875, -11.87109375, -11.1376953125, -10.404296875, -9.6708984375, -8.9375, -8.2041015625, -7.470703125, -6.7373046875, -6.00390625, -5.2705078125, -4.537109375, -3.8037109375, -3.0703125, -2.3369140625, -1.603515625, -0.8701171875, -0.13671875, 0.5966796875, 1.330078125, 2.0634765625, 2.796875, 3.5302734375, 4.263671875, 4.9970703125, 5.73046875, 6.4638671875, 7.197265625, 7.9306640625, 8.6640625, 9.3974609375, 10.130859375, 10.8642578125, 11.59765625, 12.3310546875, 13.064453125, 13.7978515625, 14.53125, 15.2646484375, 15.998046875, 16.7314453125, 17.46484375, 18.1982421875, 18.931640625, 19.6650390625, 20.3984375, 21.1318359375, 21.865234375, 22.5986328125, 23.33203125, 24.0654296875, 24.798828125, 25.5322265625, 26.265625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 7.0, 4.0, 5.0, 15.0, 33.0, 62.0, 107.0, 171.0, 176.0, 144.0, 115.0, 74.0, 41.0, 22.0, 9.0, 8.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-252.1884002685547, -245.286865234375, -238.38534545898438, -231.4838104248047, -224.582275390625, -217.68075561523438, -210.7792205810547, -203.877685546875, -196.9761505126953, -190.07461547851562, -183.173095703125, -176.2715606689453, -169.37002563476562, -162.468505859375, -155.5669708251953, -148.66543579101562, -141.763916015625, -134.8623809814453, -127.96085357666016, -121.059326171875, -114.15779113769531, -107.25626373291016, -100.354736328125, -93.45320129394531, -86.55166625976562, -79.65013885498047, -72.74860382080078, -65.84707641601562, -58.94554138183594, -52.04401397705078, -45.14248275756836, -38.24095153808594, -31.33941650390625, -24.437885284423828, -17.536354064941406, -10.634824752807617, -3.7332935333251953, 3.1682357788085938, 10.069766998291016, 16.971298217773438, 23.87282943725586, 30.77436065673828, 37.6758918762207, 44.577423095703125, 51.47895050048828, 58.3804817199707, 65.28201293945312, 72.18354797363281, 79.08507537841797, 85.98660278320312, 92.88813781738281, 99.78966522216797, 106.69120025634766, 113.59272766113281, 120.4942626953125, 127.39579010009766, 134.2973175048828, 141.1988525390625, 148.10037231445312, 155.0019073486328, 161.9034423828125, 168.80496215820312, 175.7064971923828, 182.6080322265625, 189.5095672607422]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 4.0, 6.0, 10.0, 7.0, 14.0, 20.0, 18.0, 19.0, 34.0, 25.0, 30.0, 30.0, 33.0, 37.0, 41.0, 39.0, 40.0, 38.0, 37.0, 45.0, 51.0, 39.0, 36.0, 32.0, 31.0, 37.0, 33.0, 29.0, 23.0, 23.0, 18.0, 14.0, 22.0, 11.0, 10.0, 15.0, 20.0, 4.0, 3.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-81.61823272705078, -79.24981689453125, -76.88140106201172, -74.51298522949219, -72.14456939697266, -69.77615356445312, -67.4077377319336, -65.03932189941406, -62.670902252197266, -60.302486419677734, -57.9340705871582, -55.56565475463867, -53.197235107421875, -50.828819274902344, -48.46040344238281, -46.09198760986328, -43.72357177734375, -41.35515594482422, -38.98674011230469, -36.618324279785156, -34.249908447265625, -31.88149070739746, -29.513072967529297, -27.144657135009766, -24.776241302490234, -22.407825469970703, -20.039409637451172, -17.670991897583008, -15.302576065063477, -12.934160232543945, -10.565743446350098, -8.19732666015625, -5.828910827636719, -3.4604945182800293, -1.0920782089233398, 1.2763381004333496, 3.644754409790039, 6.01317024230957, 8.381587028503418, 10.750003814697266, 13.118419647216797, 15.486835479736328, 17.85525131225586, 20.223669052124023, 22.592084884643555, 24.960500717163086, 27.32891845703125, 29.69733428955078, 32.06575012207031, 34.434165954589844, 36.802581787109375, 39.170997619628906, 41.53941345214844, 43.90782928466797, 46.276248931884766, 48.6446647644043, 51.01308059692383, 53.38149642944336, 55.74991226196289, 58.11832809448242, 60.48674774169922, 62.85516357421875, 65.22357940673828, 67.59199523925781, 69.96041107177734]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 8.0, 11.0, 7.0, 7.0, 12.0, 17.0, 23.0, 25.0, 42.0, 59.0, 96.0, 158.0, 247.0, 390.0, 645.0, 1117.0, 2008.0, 3880.0, 7998.0, 18202.0, 47043.0, 135850.0, 436516.0, 259539.0, 80161.0, 30071.0, 12284.0, 5538.0, 2828.0, 1557.0, 821.0, 526.0, 303.0, 192.0, 109.0, 87.0, 67.0, 31.0, 30.0, 19.0, 14.0, 9.0, 7.0, 6.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-52.59375, -50.93798828125, -49.2822265625, -47.62646484375, -45.970703125, -44.31494140625, -42.6591796875, -41.00341796875, -39.34765625, -37.69189453125, -36.0361328125, -34.38037109375, -32.724609375, -31.06884765625, -29.4130859375, -27.75732421875, -26.1015625, -24.44580078125, -22.7900390625, -21.13427734375, -19.478515625, -17.82275390625, -16.1669921875, -14.51123046875, -12.85546875, -11.19970703125, -9.5439453125, -7.88818359375, -6.232421875, -4.57666015625, -2.9208984375, -1.26513671875, 0.390625, 2.04638671875, 3.7021484375, 5.35791015625, 7.013671875, 8.66943359375, 10.3251953125, 11.98095703125, 13.63671875, 15.29248046875, 16.9482421875, 18.60400390625, 20.259765625, 21.91552734375, 23.5712890625, 25.22705078125, 26.8828125, 28.53857421875, 30.1943359375, 31.85009765625, 33.505859375, 35.16162109375, 36.8173828125, 38.47314453125, 40.12890625, 41.78466796875, 43.4404296875, 45.09619140625, 46.751953125, 48.40771484375, 50.0634765625, 51.71923828125, 53.375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 3.0, 7.0, 8.0, 11.0, 12.0, 25.0, 21.0, 20.0, 28.0, 16.0, 34.0, 36.0, 33.0, 43.0, 55.0, 49.0, 55.0, 51.0, 51.0, 40.0, 57.0, 51.0, 31.0, 40.0, 33.0, 26.0, 25.0, 33.0, 21.0, 20.0, 19.0, 12.0, 5.0, 6.0, 5.0, 7.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.56640625, -7.34234619140625, -7.1182861328125, -6.89422607421875, -6.670166015625, -6.44610595703125, -6.2220458984375, -5.99798583984375, -5.77392578125, -5.54986572265625, -5.3258056640625, -5.10174560546875, -4.877685546875, -4.65362548828125, -4.4295654296875, -4.20550537109375, -3.9814453125, -3.75738525390625, -3.5333251953125, -3.30926513671875, -3.085205078125, -2.86114501953125, -2.6370849609375, -2.41302490234375, -2.18896484375, -1.96490478515625, -1.7408447265625, -1.51678466796875, -1.292724609375, -1.06866455078125, -0.8446044921875, -0.62054443359375, -0.396484375, -0.17242431640625, 0.0516357421875, 0.27569580078125, 0.499755859375, 0.72381591796875, 0.9478759765625, 1.17193603515625, 1.39599609375, 1.62005615234375, 1.8441162109375, 2.06817626953125, 2.292236328125, 2.51629638671875, 2.7403564453125, 2.96441650390625, 3.1884765625, 3.41253662109375, 3.6365966796875, 3.86065673828125, 4.084716796875, 4.30877685546875, 4.5328369140625, 4.75689697265625, 4.98095703125, 5.20501708984375, 5.4290771484375, 5.65313720703125, 5.877197265625, 6.10125732421875, 6.3253173828125, 6.54937744140625, 6.7734375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 7.0, 7.0, 11.0, 20.0, 19.0, 35.0, 44.0, 71.0, 108.0, 139.0, 238.0, 331.0, 560.0, 848.0, 1543.0, 2566.0, 4732.0, 9431.0, 22068.0, 58255.0, 184229.0, 462945.0, 194652.0, 61392.0, 22691.0, 9966.0, 4910.0, 2682.0, 1481.0, 912.0, 563.0, 364.0, 250.0, 157.0, 108.0, 59.0, 51.0, 30.0, 20.0, 15.0, 13.0, 6.0, 7.0, 4.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.34375, -39.943359375, -38.54296875, -37.142578125, -35.7421875, -34.341796875, -32.94140625, -31.541015625, -30.140625, -28.740234375, -27.33984375, -25.939453125, -24.5390625, -23.138671875, -21.73828125, -20.337890625, -18.9375, -17.537109375, -16.13671875, -14.736328125, -13.3359375, -11.935546875, -10.53515625, -9.134765625, -7.734375, -6.333984375, -4.93359375, -3.533203125, -2.1328125, -0.732421875, 0.66796875, 2.068359375, 3.46875, 4.869140625, 6.26953125, 7.669921875, 9.0703125, 10.470703125, 11.87109375, 13.271484375, 14.671875, 16.072265625, 17.47265625, 18.873046875, 20.2734375, 21.673828125, 23.07421875, 24.474609375, 25.875, 27.275390625, 28.67578125, 30.076171875, 31.4765625, 32.876953125, 34.27734375, 35.677734375, 37.078125, 38.478515625, 39.87890625, 41.279296875, 42.6796875, 44.080078125, 45.48046875, 46.880859375, 48.28125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 12.0, 8.0, 12.0, 8.0, 18.0, 10.0, 20.0, 26.0, 17.0, 25.0, 27.0, 35.0, 39.0, 44.0, 59.0, 44.0, 55.0, 52.0, 49.0, 44.0, 45.0, 45.0, 48.0, 34.0, 36.0, 27.0, 26.0, 28.0, 26.0, 15.0, 15.0, 10.0, 10.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-35.25, -34.06298828125, -32.8759765625, -31.68896484375, -30.501953125, -29.31494140625, -28.1279296875, -26.94091796875, -25.75390625, -24.56689453125, -23.3798828125, -22.19287109375, -21.005859375, -19.81884765625, -18.6318359375, -17.44482421875, -16.2578125, -15.07080078125, -13.8837890625, -12.69677734375, -11.509765625, -10.32275390625, -9.1357421875, -7.94873046875, -6.76171875, -5.57470703125, -4.3876953125, -3.20068359375, -2.013671875, -0.82666015625, 0.3603515625, 1.54736328125, 2.734375, 3.92138671875, 5.1083984375, 6.29541015625, 7.482421875, 8.66943359375, 9.8564453125, 11.04345703125, 12.23046875, 13.41748046875, 14.6044921875, 15.79150390625, 16.978515625, 18.16552734375, 19.3525390625, 20.53955078125, 21.7265625, 22.91357421875, 24.1005859375, 25.28759765625, 26.474609375, 27.66162109375, 28.8486328125, 30.03564453125, 31.22265625, 32.40966796875, 33.5966796875, 34.78369140625, 35.970703125, 37.15771484375, 38.3447265625, 39.53173828125, 40.71875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 9.0, 14.0, 21.0, 48.0, 68.0, 111.0, 210.0, 346.0, 650.0, 1109.0, 2253.0, 4577.0, 10473.0, 31340.0, 263216.0, 651300.0, 55709.0, 14897.0, 6100.0, 2768.0, 1522.0, 786.0, 461.0, 219.0, 133.0, 90.0, 39.0, 41.0, 17.0, 9.0, 6.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.3125, -50.634765625, -48.95703125, -47.279296875, -45.6015625, -43.923828125, -42.24609375, -40.568359375, -38.890625, -37.212890625, -35.53515625, -33.857421875, -32.1796875, -30.501953125, -28.82421875, -27.146484375, -25.46875, -23.791015625, -22.11328125, -20.435546875, -18.7578125, -17.080078125, -15.40234375, -13.724609375, -12.046875, -10.369140625, -8.69140625, -7.013671875, -5.3359375, -3.658203125, -1.98046875, -0.302734375, 1.375, 3.052734375, 4.73046875, 6.408203125, 8.0859375, 9.763671875, 11.44140625, 13.119140625, 14.796875, 16.474609375, 18.15234375, 19.830078125, 21.5078125, 23.185546875, 24.86328125, 26.541015625, 28.21875, 29.896484375, 31.57421875, 33.251953125, 34.9296875, 36.607421875, 38.28515625, 39.962890625, 41.640625, 43.318359375, 44.99609375, 46.673828125, 48.3515625, 50.029296875, 51.70703125, 53.384765625, 55.0625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 8.0, 2.0, 5.0, 11.0, 11.0, 25.0, 34.0, 80.0, 194.0, 326.0, 142.0, 60.0, 26.0, 21.0, 17.0, 8.0, 4.0, 6.0, 3.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.01534271240234375, -0.014820694923400879, -0.014298677444458008, -0.013776659965515137, -0.013254642486572266, -0.012732625007629395, -0.012210607528686523, -0.011688590049743652, -0.011166572570800781, -0.01064455509185791, -0.010122537612915039, -0.009600520133972168, -0.009078502655029297, -0.008556485176086426, -0.008034467697143555, -0.007512450218200684, -0.0069904327392578125, -0.006468415260314941, -0.00594639778137207, -0.005424380302429199, -0.004902362823486328, -0.004380345344543457, -0.003858327865600586, -0.003336310386657715, -0.0028142929077148438, -0.0022922754287719727, -0.0017702579498291016, -0.0012482404708862305, -0.0007262229919433594, -0.00020420551300048828, 0.0003178119659423828, 0.0008398294448852539, 0.001361846923828125, 0.001883864402770996, 0.002405881881713867, 0.0029278993606567383, 0.0034499168395996094, 0.0039719343185424805, 0.0044939517974853516, 0.005015969276428223, 0.005537986755371094, 0.006060004234313965, 0.006582021713256836, 0.007104039192199707, 0.007626056671142578, 0.00814807415008545, 0.00867009162902832, 0.009192109107971191, 0.009714126586914062, 0.010236144065856934, 0.010758161544799805, 0.011280179023742676, 0.011802196502685547, 0.012324213981628418, 0.012846231460571289, 0.01336824893951416, 0.013890266418457031, 0.014412283897399902, 0.014934301376342773, 0.015456318855285645, 0.015978336334228516, 0.016500353813171387, 0.017022371292114258, 0.01754438877105713, 0.01806640625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 5.0, 14.0, 24.0, 21.0, 42.0, 50.0, 80.0, 119.0, 184.0, 301.0, 432.0, 809.0, 1331.0, 2286.0, 4218.0, 8859.0, 21641.0, 76130.0, 531628.0, 316489.0, 51570.0, 16608.0, 7057.0, 3613.0, 2005.0, 1133.0, 674.0, 421.0, 246.0, 175.0, 114.0, 86.0, 52.0, 36.0, 33.0, 14.0, 9.0, 12.0, 9.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-41.90625, -40.73779296875, -39.5693359375, -38.40087890625, -37.232421875, -36.06396484375, -34.8955078125, -33.72705078125, -32.55859375, -31.39013671875, -30.2216796875, -29.05322265625, -27.884765625, -26.71630859375, -25.5478515625, -24.37939453125, -23.2109375, -22.04248046875, -20.8740234375, -19.70556640625, -18.537109375, -17.36865234375, -16.2001953125, -15.03173828125, -13.86328125, -12.69482421875, -11.5263671875, -10.35791015625, -9.189453125, -8.02099609375, -6.8525390625, -5.68408203125, -4.515625, -3.34716796875, -2.1787109375, -1.01025390625, 0.158203125, 1.32666015625, 2.4951171875, 3.66357421875, 4.83203125, 6.00048828125, 7.1689453125, 8.33740234375, 9.505859375, 10.67431640625, 11.8427734375, 13.01123046875, 14.1796875, 15.34814453125, 16.5166015625, 17.68505859375, 18.853515625, 20.02197265625, 21.1904296875, 22.35888671875, 23.52734375, 24.69580078125, 25.8642578125, 27.03271484375, 28.201171875, 29.36962890625, 30.5380859375, 31.70654296875, 32.875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 7.0, 8.0, 9.0, 19.0, 18.0, 21.0, 38.0, 43.0, 59.0, 84.0, 116.0, 125.0, 116.0, 95.0, 57.0, 39.0, 24.0, 32.0, 10.0, 13.0, 10.0, 13.0, 3.0, 7.0, 2.0, 3.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-32.71875, -31.846435546875, -30.97412109375, -30.101806640625, -29.2294921875, -28.357177734375, -27.48486328125, -26.612548828125, -25.740234375, -24.867919921875, -23.99560546875, -23.123291015625, -22.2509765625, -21.378662109375, -20.50634765625, -19.634033203125, -18.76171875, -17.889404296875, -17.01708984375, -16.144775390625, -15.2724609375, -14.400146484375, -13.52783203125, -12.655517578125, -11.783203125, -10.910888671875, -10.03857421875, -9.166259765625, -8.2939453125, -7.421630859375, -6.54931640625, -5.677001953125, -4.8046875, -3.932373046875, -3.06005859375, -2.187744140625, -1.3154296875, -0.443115234375, 0.42919921875, 1.301513671875, 2.173828125, 3.046142578125, 3.91845703125, 4.790771484375, 5.6630859375, 6.535400390625, 7.40771484375, 8.280029296875, 9.15234375, 10.024658203125, 10.89697265625, 11.769287109375, 12.6416015625, 13.513916015625, 14.38623046875, 15.258544921875, 16.130859375, 17.003173828125, 17.87548828125, 18.747802734375, 19.6201171875, 20.492431640625, 21.36474609375, 22.237060546875, 23.109375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 14.0, 30.0, 78.0, 168.0, 327.0, 228.0, 100.0, 47.0, 14.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1513.858642578125, -1484.44580078125, -1455.032958984375, -1425.6202392578125, -1396.2073974609375, -1366.7945556640625, -1337.3817138671875, -1307.968994140625, -1278.55615234375, -1249.143310546875, -1219.73046875, -1190.3177490234375, -1160.9049072265625, -1131.4920654296875, -1102.0792236328125, -1072.66650390625, -1043.253662109375, -1013.8408203125, -984.4280395507812, -955.0151977539062, -925.6024169921875, -896.1895751953125, -866.7767944335938, -837.3639526367188, -807.9511108398438, -778.5382690429688, -749.12548828125, -719.712646484375, -690.2998657226562, -660.8870239257812, -631.4742431640625, -602.0614013671875, -572.6485595703125, -543.2357177734375, -513.8229370117188, -484.4101257324219, -454.997314453125, -425.58447265625, -396.17169189453125, -366.75885009765625, -337.3460693359375, -307.9332580566406, -278.52044677734375, -249.10763549804688, -219.69482421875, -190.28199768066406, -160.8691864013672, -131.4563751220703, -102.0435791015625, -72.63076782226562, -43.217952728271484, -13.805137634277344, 15.607673645019531, 45.02049255371094, 74.43330383300781, 103.84611511230469, 133.25892639160156, 162.67173767089844, 192.0845489501953, 221.49737548828125, 250.91018676757812, 280.322998046875, 309.7358093261719, 339.14862060546875, 368.5614318847656]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 4.0, 14.0, 7.0, 12.0, 15.0, 18.0, 29.0, 30.0, 36.0, 26.0, 42.0, 46.0, 38.0, 38.0, 56.0, 50.0, 54.0, 51.0, 46.0, 37.0, 52.0, 44.0, 36.0, 39.0, 29.0, 26.0, 25.0, 21.0, 24.0, 13.0, 12.0, 7.0, 6.0, 5.0, 1.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-302.77764892578125, -294.8313293457031, -286.8850402832031, -278.938720703125, -270.9924011230469, -263.0461120605469, -255.09979248046875, -247.1534881591797, -239.20718383789062, -231.26087951660156, -223.31455993652344, -215.36825561523438, -207.4219512939453, -199.47564697265625, -191.52932739257812, -183.58302307128906, -175.63671875, -167.69041442871094, -159.7440948486328, -151.79779052734375, -143.8514862060547, -135.90518188476562, -127.9588623046875, -120.01255798339844, -112.06623840332031, -104.11992645263672, -96.17362213134766, -88.22731018066406, -80.281005859375, -72.3346939086914, -64.38838195800781, -56.44207763671875, -48.49577331542969, -40.54946517944336, -32.60315704345703, -24.65684700012207, -16.710538864135742, -8.764228820800781, -0.8179206848144531, 7.128387451171875, 15.074695587158203, 23.02100372314453, 30.96731185913086, 38.91361999511719, 46.85993194580078, 54.80624008178711, 62.75254821777344, 70.6988525390625, 78.6451644897461, 86.59147644042969, 94.53778076171875, 102.48409271240234, 110.4303970336914, 118.376708984375, 126.32301330566406, 134.26931762695312, 142.21563720703125, 150.1619415283203, 158.10826110839844, 166.0545654296875, 174.00086975097656, 181.94717407226562, 189.89349365234375, 197.8397979736328, 205.78610229492188]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 6.0, 21.0, 14.0, 16.0, 20.0, 43.0, 62.0, 85.0, 101.0, 199.0, 295.0, 482.0, 726.0, 1374.0, 2404.0, 5073.0, 12297.0, 41160.0, 669584.0, 3389823.0, 47142.0, 12729.0, 4977.0, 2478.0, 1304.0, 727.0, 409.0, 254.0, 155.0, 102.0, 76.0, 56.0, 26.0, 22.0, 19.0, 5.0, 5.0, 4.0, 9.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.125, -74.5576171875, -71.990234375, -69.4228515625, -66.85546875, -64.2880859375, -61.720703125, -59.1533203125, -56.5859375, -54.0185546875, -51.451171875, -48.8837890625, -46.31640625, -43.7490234375, -41.181640625, -38.6142578125, -36.046875, -33.4794921875, -30.912109375, -28.3447265625, -25.77734375, -23.2099609375, -20.642578125, -18.0751953125, -15.5078125, -12.9404296875, -10.373046875, -7.8056640625, -5.23828125, -2.6708984375, -0.103515625, 2.4638671875, 5.03125, 7.5986328125, 10.166015625, 12.7333984375, 15.30078125, 17.8681640625, 20.435546875, 23.0029296875, 25.5703125, 28.1376953125, 30.705078125, 33.2724609375, 35.83984375, 38.4072265625, 40.974609375, 43.5419921875, 46.109375, 48.6767578125, 51.244140625, 53.8115234375, 56.37890625, 58.9462890625, 61.513671875, 64.0810546875, 66.6484375, 69.2158203125, 71.783203125, 74.3505859375, 76.91796875, 79.4853515625, 82.052734375, 84.6201171875, 87.1875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 8.0, 9.0, 9.0, 10.0, 10.0, 12.0, 16.0, 14.0, 22.0, 27.0, 22.0, 40.0, 33.0, 29.0, 35.0, 46.0, 45.0, 36.0, 37.0, 41.0, 46.0, 52.0, 48.0, 41.0, 35.0, 39.0, 23.0, 16.0, 20.0, 29.0, 19.0, 27.0, 20.0, 22.0, 10.0, 9.0, 8.0, 7.0, 6.0, 4.0, 3.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.59765625, -7.376708984375, -7.15576171875, -6.934814453125, -6.7138671875, -6.492919921875, -6.27197265625, -6.051025390625, -5.830078125, -5.609130859375, -5.38818359375, -5.167236328125, -4.9462890625, -4.725341796875, -4.50439453125, -4.283447265625, -4.0625, -3.841552734375, -3.62060546875, -3.399658203125, -3.1787109375, -2.957763671875, -2.73681640625, -2.515869140625, -2.294921875, -2.073974609375, -1.85302734375, -1.632080078125, -1.4111328125, -1.190185546875, -0.96923828125, -0.748291015625, -0.52734375, -0.306396484375, -0.08544921875, 0.135498046875, 0.3564453125, 0.577392578125, 0.79833984375, 1.019287109375, 1.240234375, 1.461181640625, 1.68212890625, 1.903076171875, 2.1240234375, 2.344970703125, 2.56591796875, 2.786865234375, 3.0078125, 3.228759765625, 3.44970703125, 3.670654296875, 3.8916015625, 4.112548828125, 4.33349609375, 4.554443359375, 4.775390625, 4.996337890625, 5.21728515625, 5.438232421875, 5.6591796875, 5.880126953125, 6.10107421875, 6.322021484375, 6.54296875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 8.0, 2.0, 14.0, 15.0, 19.0, 32.0, 42.0, 54.0, 83.0, 130.0, 172.0, 257.0, 414.0, 664.0, 1109.0, 1867.0, 3218.0, 6208.0, 13354.0, 35289.0, 145323.0, 3687889.0, 222128.0, 43772.0, 15862.0, 7145.0, 3708.0, 2063.0, 1255.0, 785.0, 485.0, 299.0, 173.0, 141.0, 74.0, 69.0, 40.0, 28.0, 16.0, 24.0, 13.0, 6.0, 10.0, 5.0, 4.0, 3.0, 4.0, 0.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-73.125, -70.654296875, -68.18359375, -65.712890625, -63.2421875, -60.771484375, -58.30078125, -55.830078125, -53.359375, -50.888671875, -48.41796875, -45.947265625, -43.4765625, -41.005859375, -38.53515625, -36.064453125, -33.59375, -31.123046875, -28.65234375, -26.181640625, -23.7109375, -21.240234375, -18.76953125, -16.298828125, -13.828125, -11.357421875, -8.88671875, -6.416015625, -3.9453125, -1.474609375, 0.99609375, 3.466796875, 5.9375, 8.408203125, 10.87890625, 13.349609375, 15.8203125, 18.291015625, 20.76171875, 23.232421875, 25.703125, 28.173828125, 30.64453125, 33.115234375, 35.5859375, 38.056640625, 40.52734375, 42.998046875, 45.46875, 47.939453125, 50.41015625, 52.880859375, 55.3515625, 57.822265625, 60.29296875, 62.763671875, 65.234375, 67.705078125, 70.17578125, 72.646484375, 75.1171875, 77.587890625, 80.05859375, 82.529296875, 85.0]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 3.0, 5.0, 6.0, 12.0, 22.0, 18.0, 50.0, 67.0, 141.0, 446.0, 2714.0, 274.0, 123.0, 51.0, 41.0, 26.0, 19.0, 16.0, 7.0, 4.0, 3.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.296875, -28.092041015625, -26.88720703125, -25.682373046875, -24.4775390625, -23.272705078125, -22.06787109375, -20.863037109375, -19.658203125, -18.453369140625, -17.24853515625, -16.043701171875, -14.8388671875, -13.634033203125, -12.42919921875, -11.224365234375, -10.01953125, -8.814697265625, -7.60986328125, -6.405029296875, -5.2001953125, -3.995361328125, -2.79052734375, -1.585693359375, -0.380859375, 0.823974609375, 2.02880859375, 3.233642578125, 4.4384765625, 5.643310546875, 6.84814453125, 8.052978515625, 9.2578125, 10.462646484375, 11.66748046875, 12.872314453125, 14.0771484375, 15.281982421875, 16.48681640625, 17.691650390625, 18.896484375, 20.101318359375, 21.30615234375, 22.510986328125, 23.7158203125, 24.920654296875, 26.12548828125, 27.330322265625, 28.53515625, 29.739990234375, 30.94482421875, 32.149658203125, 33.3544921875, 34.559326171875, 35.76416015625, 36.968994140625, 38.173828125, 39.378662109375, 40.58349609375, 41.788330078125, 42.9931640625, 44.197998046875, 45.40283203125, 46.607666015625, 47.8125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 8.0, 25.0, 47.0, 102.0, 209.0, 278.0, 186.0, 82.0, 32.0, 23.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-204.7943572998047, -192.905517578125, -181.0166778564453, -169.12783813476562, -157.23899841308594, -145.35015869140625, -133.46133422851562, -121.5724868774414, -109.68364715576172, -97.79480743408203, -85.90596771240234, -74.01713562011719, -62.128292083740234, -50.23945236206055, -38.350616455078125, -26.461776733398438, -14.57293701171875, -2.684098243713379, 9.204740524291992, 21.093578338623047, 32.982418060302734, 44.87125778198242, 56.760093688964844, 68.64893341064453, 80.53777313232422, 92.4266128540039, 104.3154525756836, 116.20428466796875, 128.09312438964844, 139.98196411132812, 151.8708038330078, 163.7596435546875, 175.64846801757812, 187.5373077392578, 199.4261474609375, 211.3149871826172, 223.20382690429688, 235.09266662597656, 246.98150634765625, 258.8703308105469, 270.7591857910156, 282.64801025390625, 294.536865234375, 306.4256896972656, 318.3145446777344, 330.203369140625, 342.09222412109375, 353.9810485839844, 365.869873046875, 377.7586975097656, 389.6475524902344, 401.536376953125, 413.42523193359375, 425.3140563964844, 437.2029113769531, 449.09173583984375, 460.9805908203125, 472.8694152832031, 484.7582702636719, 496.6470947265625, 508.53594970703125, 520.4248046875, 532.3135986328125, 544.2024536132812, 556.09130859375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 4.0, 5.0, 3.0, 12.0, 3.0, 6.0, 10.0, 15.0, 20.0, 15.0, 11.0, 25.0, 24.0, 35.0, 34.0, 31.0, 33.0, 37.0, 47.0, 46.0, 43.0, 45.0, 50.0, 42.0, 35.0, 50.0, 35.0, 38.0, 24.0, 31.0, 36.0, 20.0, 33.0, 12.0, 20.0, 13.0, 10.0, 13.0, 6.0, 7.0, 5.0, 6.0, 2.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.41522216796875, -79.52839660644531, -76.64156341552734, -73.7547378540039, -70.86790466308594, -67.9810791015625, -65.09425354003906, -62.207420349121094, -59.32059097290039, -56.43376159667969, -53.546932220458984, -50.66010284423828, -47.773277282714844, -44.886444091796875, -41.99961853027344, -39.112789154052734, -36.22595977783203, -33.33913040161133, -30.452301025390625, -27.565473556518555, -24.67864418029785, -21.79181480407715, -18.904987335205078, -16.018157958984375, -13.131328582763672, -10.244499206542969, -7.357670783996582, -4.470842361450195, -1.5840129852294922, 1.302816390991211, 4.189643859863281, 7.076473236083984, 9.963294982910156, 12.85012435913086, 15.736952781677246, 18.623781204223633, 21.510610580444336, 24.39743995666504, 27.28426742553711, 30.171096801757812, 33.057926177978516, 35.94475555419922, 38.83158493041992, 41.718414306640625, 44.60523986816406, 47.49207305908203, 50.37889862060547, 53.26572799682617, 56.152557373046875, 59.03938674926758, 61.92621612548828, 64.81304168701172, 67.69987487792969, 70.58670043945312, 73.47352600097656, 76.36035919189453, 79.2471923828125, 82.13401794433594, 85.0208511352539, 87.90767669677734, 90.79450988769531, 93.68133544921875, 96.56816101074219, 99.45499420166016, 102.3418197631836]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 6.0, 4.0, 12.0, 27.0, 19.0, 33.0, 60.0, 71.0, 123.0, 155.0, 236.0, 341.0, 536.0, 793.0, 1213.0, 2009.0, 3267.0, 5289.0, 9001.0, 15877.0, 30032.0, 62521.0, 148231.0, 350947.0, 233010.0, 92307.0, 41932.0, 20894.0, 11551.0, 6700.0, 4075.0, 2484.0, 1638.0, 1054.0, 662.0, 447.0, 313.0, 230.0, 139.0, 94.0, 65.0, 29.0, 38.0, 16.0, 23.0, 14.0, 11.0, 8.0, 6.0, 1.0, 1.0, 2.0, 1.0, 5.0], "bins": [-47.96875, -46.546875, -45.125, -43.703125, -42.28125, -40.859375, -39.4375, -38.015625, -36.59375, -35.171875, -33.75, -32.328125, -30.90625, -29.484375, -28.0625, -26.640625, -25.21875, -23.796875, -22.375, -20.953125, -19.53125, -18.109375, -16.6875, -15.265625, -13.84375, -12.421875, -11.0, -9.578125, -8.15625, -6.734375, -5.3125, -3.890625, -2.46875, -1.046875, 0.375, 1.796875, 3.21875, 4.640625, 6.0625, 7.484375, 8.90625, 10.328125, 11.75, 13.171875, 14.59375, 16.015625, 17.4375, 18.859375, 20.28125, 21.703125, 23.125, 24.546875, 25.96875, 27.390625, 28.8125, 30.234375, 31.65625, 33.078125, 34.5, 35.921875, 37.34375, 38.765625, 40.1875, 41.609375, 43.03125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 10.0, 6.0, 5.0, 6.0, 11.0, 14.0, 15.0, 13.0, 10.0, 14.0, 26.0, 17.0, 19.0, 29.0, 37.0, 19.0, 40.0, 41.0, 46.0, 43.0, 40.0, 49.0, 47.0, 36.0, 40.0, 25.0, 56.0, 38.0, 39.0, 28.0, 22.0, 31.0, 24.0, 18.0, 18.0, 17.0, 9.0, 9.0, 11.0, 8.0, 6.0, 2.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.40625, -8.1561279296875, -7.906005859375, -7.6558837890625, -7.40576171875, -7.1556396484375, -6.905517578125, -6.6553955078125, -6.4052734375, -6.1551513671875, -5.905029296875, -5.6549072265625, -5.40478515625, -5.1546630859375, -4.904541015625, -4.6544189453125, -4.404296875, -4.1541748046875, -3.904052734375, -3.6539306640625, -3.40380859375, -3.1536865234375, -2.903564453125, -2.6534423828125, -2.4033203125, -2.1531982421875, -1.903076171875, -1.6529541015625, -1.40283203125, -1.1527099609375, -0.902587890625, -0.6524658203125, -0.40234375, -0.1522216796875, 0.097900390625, 0.3480224609375, 0.59814453125, 0.8482666015625, 1.098388671875, 1.3485107421875, 1.5986328125, 1.8487548828125, 2.098876953125, 2.3489990234375, 2.59912109375, 2.8492431640625, 3.099365234375, 3.3494873046875, 3.599609375, 3.8497314453125, 4.099853515625, 4.3499755859375, 4.60009765625, 4.8502197265625, 5.100341796875, 5.3504638671875, 5.6005859375, 5.8507080078125, 6.100830078125, 6.3509521484375, 6.60107421875, 6.8511962890625, 7.101318359375, 7.3514404296875, 7.6015625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 15.0, 17.0, 8.0, 7.0, 12.0, 19.0, 35.0, 53.0, 71.0, 124.0, 210.0, 349.0, 593.0, 1046.0, 1867.0, 3754.0, 7898.0, 18215.0, 47131.0, 152896.0, 489353.0, 219346.0, 62822.0, 23228.0, 9805.0, 4536.0, 2270.0, 1175.0, 649.0, 365.0, 238.0, 125.0, 94.0, 65.0, 39.0, 22.0, 24.0, 10.0, 13.0, 10.0, 16.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-59.59375, -57.873046875, -56.15234375, -54.431640625, -52.7109375, -50.990234375, -49.26953125, -47.548828125, -45.828125, -44.107421875, -42.38671875, -40.666015625, -38.9453125, -37.224609375, -35.50390625, -33.783203125, -32.0625, -30.341796875, -28.62109375, -26.900390625, -25.1796875, -23.458984375, -21.73828125, -20.017578125, -18.296875, -16.576171875, -14.85546875, -13.134765625, -11.4140625, -9.693359375, -7.97265625, -6.251953125, -4.53125, -2.810546875, -1.08984375, 0.630859375, 2.3515625, 4.072265625, 5.79296875, 7.513671875, 9.234375, 10.955078125, 12.67578125, 14.396484375, 16.1171875, 17.837890625, 19.55859375, 21.279296875, 23.0, 24.720703125, 26.44140625, 28.162109375, 29.8828125, 31.603515625, 33.32421875, 35.044921875, 36.765625, 38.486328125, 40.20703125, 41.927734375, 43.6484375, 45.369140625, 47.08984375, 48.810546875, 50.53125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 8.0, 13.0, 8.0, 15.0, 14.0, 12.0, 13.0, 19.0, 34.0, 38.0, 34.0, 33.0, 28.0, 41.0, 44.0, 42.0, 45.0, 50.0, 47.0, 37.0, 48.0, 47.0, 40.0, 42.0, 38.0, 31.0, 25.0, 23.0, 19.0, 15.0, 17.0, 12.0, 10.0, 12.0, 9.0, 7.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 5.0, 0.0, 0.0, 2.0], "bins": [-49.28125, -47.8896484375, -46.498046875, -45.1064453125, -43.71484375, -42.3232421875, -40.931640625, -39.5400390625, -38.1484375, -36.7568359375, -35.365234375, -33.9736328125, -32.58203125, -31.1904296875, -29.798828125, -28.4072265625, -27.015625, -25.6240234375, -24.232421875, -22.8408203125, -21.44921875, -20.0576171875, -18.666015625, -17.2744140625, -15.8828125, -14.4912109375, -13.099609375, -11.7080078125, -10.31640625, -8.9248046875, -7.533203125, -6.1416015625, -4.75, -3.3583984375, -1.966796875, -0.5751953125, 0.81640625, 2.2080078125, 3.599609375, 4.9912109375, 6.3828125, 7.7744140625, 9.166015625, 10.5576171875, 11.94921875, 13.3408203125, 14.732421875, 16.1240234375, 17.515625, 18.9072265625, 20.298828125, 21.6904296875, 23.08203125, 24.4736328125, 25.865234375, 27.2568359375, 28.6484375, 30.0400390625, 31.431640625, 32.8232421875, 34.21484375, 35.6064453125, 36.998046875, 38.3896484375, 39.78125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 5.0, 8.0, 10.0, 16.0, 25.0, 39.0, 47.0, 65.0, 97.0, 135.0, 187.0, 362.0, 587.0, 1115.0, 2112.0, 5004.0, 15196.0, 73578.0, 705039.0, 203583.0, 27125.0, 7722.0, 3077.0, 1431.0, 720.0, 411.0, 273.0, 203.0, 107.0, 73.0, 56.0, 29.0, 39.0, 23.0, 14.0, 10.0, 6.0, 6.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.5, -58.5302734375, -56.560546875, -54.5908203125, -52.62109375, -50.6513671875, -48.681640625, -46.7119140625, -44.7421875, -42.7724609375, -40.802734375, -38.8330078125, -36.86328125, -34.8935546875, -32.923828125, -30.9541015625, -28.984375, -27.0146484375, -25.044921875, -23.0751953125, -21.10546875, -19.1357421875, -17.166015625, -15.1962890625, -13.2265625, -11.2568359375, -9.287109375, -7.3173828125, -5.34765625, -3.3779296875, -1.408203125, 0.5615234375, 2.53125, 4.5009765625, 6.470703125, 8.4404296875, 10.41015625, 12.3798828125, 14.349609375, 16.3193359375, 18.2890625, 20.2587890625, 22.228515625, 24.1982421875, 26.16796875, 28.1376953125, 30.107421875, 32.0771484375, 34.046875, 36.0166015625, 37.986328125, 39.9560546875, 41.92578125, 43.8955078125, 45.865234375, 47.8349609375, 49.8046875, 51.7744140625, 53.744140625, 55.7138671875, 57.68359375, 59.6533203125, 61.623046875, 63.5927734375, 65.5625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 4.0, 9.0, 15.0, 18.0, 30.0, 42.0, 73.0, 103.0, 220.0, 175.0, 96.0, 65.0, 33.0, 27.0, 21.0, 11.0, 7.0, 6.0, 8.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0171966552734375, -0.016753792762756348, -0.016310930252075195, -0.015868067741394043, -0.01542520523071289, -0.014982342720031738, -0.014539480209350586, -0.014096617698669434, -0.013653755187988281, -0.013210892677307129, -0.012768030166625977, -0.012325167655944824, -0.011882305145263672, -0.01143944263458252, -0.010996580123901367, -0.010553717613220215, -0.010110855102539062, -0.00966799259185791, -0.009225130081176758, -0.008782267570495605, -0.008339405059814453, -0.0078965425491333, -0.0074536800384521484, -0.007010817527770996, -0.006567955017089844, -0.006125092506408691, -0.005682229995727539, -0.005239367485046387, -0.004796504974365234, -0.004353642463684082, -0.00391077995300293, -0.0034679174423217773, -0.003025054931640625, -0.0025821924209594727, -0.0021393299102783203, -0.001696467399597168, -0.0012536048889160156, -0.0008107423782348633, -0.00036787986755371094, 7.49826431274414e-05, 0.0005178451538085938, 0.0009607076644897461, 0.0014035701751708984, 0.0018464326858520508, 0.002289295196533203, 0.0027321577072143555, 0.003175020217895508, 0.00361788272857666, 0.0040607452392578125, 0.004503607749938965, 0.004946470260620117, 0.0053893327713012695, 0.005832195281982422, 0.006275057792663574, 0.0067179203033447266, 0.007160782814025879, 0.007603645324707031, 0.008046507835388184, 0.008489370346069336, 0.008932232856750488, 0.00937509536743164, 0.009817957878112793, 0.010260820388793945, 0.010703682899475098, 0.01114654541015625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 3.0, 4.0, 7.0, 10.0, 8.0, 17.0, 27.0, 25.0, 45.0, 60.0, 101.0, 126.0, 209.0, 365.0, 695.0, 1272.0, 3044.0, 9331.0, 47280.0, 604757.0, 337984.0, 31165.0, 6946.0, 2413.0, 1144.0, 591.0, 325.0, 194.0, 125.0, 83.0, 51.0, 40.0, 26.0, 17.0, 13.0, 7.0, 11.0, 7.0, 8.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-77.875, -75.705078125, -73.53515625, -71.365234375, -69.1953125, -67.025390625, -64.85546875, -62.685546875, -60.515625, -58.345703125, -56.17578125, -54.005859375, -51.8359375, -49.666015625, -47.49609375, -45.326171875, -43.15625, -40.986328125, -38.81640625, -36.646484375, -34.4765625, -32.306640625, -30.13671875, -27.966796875, -25.796875, -23.626953125, -21.45703125, -19.287109375, -17.1171875, -14.947265625, -12.77734375, -10.607421875, -8.4375, -6.267578125, -4.09765625, -1.927734375, 0.2421875, 2.412109375, 4.58203125, 6.751953125, 8.921875, 11.091796875, 13.26171875, 15.431640625, 17.6015625, 19.771484375, 21.94140625, 24.111328125, 26.28125, 28.451171875, 30.62109375, 32.791015625, 34.9609375, 37.130859375, 39.30078125, 41.470703125, 43.640625, 45.810546875, 47.98046875, 50.150390625, 52.3203125, 54.490234375, 56.66015625, 58.830078125, 61.0]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 9.0, 4.0, 10.0, 12.0, 15.0, 22.0, 39.0, 49.0, 66.0, 96.0, 137.0, 147.0, 116.0, 75.0, 56.0, 52.0, 19.0, 21.0, 15.0, 15.0, 6.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.46875, -38.11572265625, -36.7626953125, -35.40966796875, -34.056640625, -32.70361328125, -31.3505859375, -29.99755859375, -28.64453125, -27.29150390625, -25.9384765625, -24.58544921875, -23.232421875, -21.87939453125, -20.5263671875, -19.17333984375, -17.8203125, -16.46728515625, -15.1142578125, -13.76123046875, -12.408203125, -11.05517578125, -9.7021484375, -8.34912109375, -6.99609375, -5.64306640625, -4.2900390625, -2.93701171875, -1.583984375, -0.23095703125, 1.1220703125, 2.47509765625, 3.828125, 5.18115234375, 6.5341796875, 7.88720703125, 9.240234375, 10.59326171875, 11.9462890625, 13.29931640625, 14.65234375, 16.00537109375, 17.3583984375, 18.71142578125, 20.064453125, 21.41748046875, 22.7705078125, 24.12353515625, 25.4765625, 26.82958984375, 28.1826171875, 29.53564453125, 30.888671875, 32.24169921875, 33.5947265625, 34.94775390625, 36.30078125, 37.65380859375, 39.0068359375, 40.35986328125, 41.712890625, 43.06591796875, 44.4189453125, 45.77197265625, 47.125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 10.0, 15.0, 30.0, 42.0, 97.0, 125.0, 186.0, 166.0, 152.0, 83.0, 42.0, 33.0, 17.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-615.23486328125, -594.6429443359375, -574.051025390625, -553.4590454101562, -532.8671264648438, -512.2752075195312, -491.6832580566406, -471.09130859375, -450.4993896484375, -429.907470703125, -409.3155212402344, -388.72357177734375, -368.13165283203125, -347.53973388671875, -326.9477844238281, -306.3558349609375, -285.763916015625, -265.1719970703125, -244.58004760742188, -223.9881134033203, -203.39617919921875, -182.8042449951172, -162.21231079101562, -141.62037658691406, -121.0284423828125, -100.43650817871094, -79.84457397460938, -59.25263977050781, -38.66070556640625, -18.068771362304688, 2.523162841796875, 23.115097045898438, 43.70703125, 64.29896545410156, 84.89089965820312, 105.48283386230469, 126.07476806640625, 146.6667022705078, 167.25863647460938, 187.85057067871094, 208.4425048828125, 229.03443908691406, 249.62637329101562, 270.21832275390625, 290.81024169921875, 311.40216064453125, 331.9941101074219, 352.5860595703125, 373.177978515625, 393.7698974609375, 414.3618469238281, 434.95379638671875, 455.54571533203125, 476.13763427734375, 496.7295837402344, 517.321533203125, 537.9134521484375, 558.50537109375, 579.0972900390625, 599.6892700195312, 620.2811889648438, 640.8731079101562, 661.465087890625, 682.0570068359375, 702.64892578125]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 8.0, 7.0, 7.0, 14.0, 19.0, 14.0, 21.0, 26.0, 39.0, 39.0, 48.0, 42.0, 55.0, 46.0, 58.0, 47.0, 37.0, 53.0, 54.0, 49.0, 53.0, 37.0, 28.0, 36.0, 22.0, 22.0, 24.0, 17.0, 26.0, 19.0, 5.0, 8.0, 6.0, 4.0, 5.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-262.41778564453125, -253.11940002441406, -243.82102966308594, -234.52264404296875, -225.22427368164062, -215.92588806152344, -206.62750244140625, -197.32913208007812, -188.03076171875, -178.7323760986328, -169.4340057373047, -160.1356201171875, -150.83724975585938, -141.5388641357422, -132.240478515625, -122.94210815429688, -113.64372253417969, -104.34534454345703, -95.04696655273438, -85.74858093261719, -76.45021057128906, -67.15182495117188, -57.85344696044922, -48.55506896972656, -39.256690979003906, -29.95831298828125, -20.65993309020996, -11.361553192138672, -2.0631752014160156, 7.235202789306641, 16.533584594726562, 25.83196258544922, 35.130340576171875, 44.42871856689453, 53.72709655761719, 63.02547836303711, 72.3238525390625, 81.62223815917969, 90.92061614990234, 100.218994140625, 109.51737213134766, 118.81575012207031, 128.1141357421875, 137.41250610351562, 146.7108917236328, 156.00926208496094, 165.30764770507812, 174.60601806640625, 183.90440368652344, 193.20278930664062, 202.50115966796875, 211.79954528808594, 221.09791564941406, 230.39630126953125, 239.69467163085938, 248.99305725097656, 258.29144287109375, 267.5898132324219, 276.8882141113281, 286.18658447265625, 295.4849548339844, 304.7833251953125, 314.08172607421875, 323.3800964355469, 332.678466796875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 6.0, 9.0, 11.0, 8.0, 15.0, 26.0, 25.0, 29.0, 38.0, 76.0, 109.0, 138.0, 208.0, 289.0, 383.0, 662.0, 1040.0, 1643.0, 2888.0, 5753.0, 12699.0, 35250.0, 168500.0, 3749113.0, 155736.0, 34505.0, 12215.0, 5537.0, 3012.0, 1606.0, 968.0, 589.0, 393.0, 243.0, 183.0, 102.0, 80.0, 56.0, 42.0, 29.0, 22.0, 15.0, 7.0, 13.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-84.0, -81.697265625, -79.39453125, -77.091796875, -74.7890625, -72.486328125, -70.18359375, -67.880859375, -65.578125, -63.275390625, -60.97265625, -58.669921875, -56.3671875, -54.064453125, -51.76171875, -49.458984375, -47.15625, -44.853515625, -42.55078125, -40.248046875, -37.9453125, -35.642578125, -33.33984375, -31.037109375, -28.734375, -26.431640625, -24.12890625, -21.826171875, -19.5234375, -17.220703125, -14.91796875, -12.615234375, -10.3125, -8.009765625, -5.70703125, -3.404296875, -1.1015625, 1.201171875, 3.50390625, 5.806640625, 8.109375, 10.412109375, 12.71484375, 15.017578125, 17.3203125, 19.623046875, 21.92578125, 24.228515625, 26.53125, 28.833984375, 31.13671875, 33.439453125, 35.7421875, 38.044921875, 40.34765625, 42.650390625, 44.953125, 47.255859375, 49.55859375, 51.861328125, 54.1640625, 56.466796875, 58.76953125, 61.072265625, 63.375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 11.0, 12.0, 9.0, 17.0, 17.0, 19.0, 27.0, 38.0, 45.0, 52.0, 40.0, 61.0, 67.0, 55.0, 56.0, 49.0, 73.0, 53.0, 49.0, 42.0, 52.0, 38.0, 26.0, 26.0, 22.0, 14.0, 5.0, 12.0, 6.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.3515625, -10.9781494140625, -10.604736328125, -10.2313232421875, -9.85791015625, -9.4844970703125, -9.111083984375, -8.7376708984375, -8.3642578125, -7.9908447265625, -7.617431640625, -7.2440185546875, -6.87060546875, -6.4971923828125, -6.123779296875, -5.7503662109375, -5.376953125, -5.0035400390625, -4.630126953125, -4.2567138671875, -3.88330078125, -3.5098876953125, -3.136474609375, -2.7630615234375, -2.3896484375, -2.0162353515625, -1.642822265625, -1.2694091796875, -0.89599609375, -0.5225830078125, -0.149169921875, 0.2242431640625, 0.59765625, 0.9710693359375, 1.344482421875, 1.7178955078125, 2.09130859375, 2.4647216796875, 2.838134765625, 3.2115478515625, 3.5849609375, 3.9583740234375, 4.331787109375, 4.7052001953125, 5.07861328125, 5.4520263671875, 5.825439453125, 6.1988525390625, 6.572265625, 6.9456787109375, 7.319091796875, 7.6925048828125, 8.06591796875, 8.4393310546875, 8.812744140625, 9.1861572265625, 9.5595703125, 9.9329833984375, 10.306396484375, 10.6798095703125, 11.05322265625, 11.4266357421875, 11.800048828125, 12.1734619140625, 12.546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 7.0, 12.0, 13.0, 21.0, 12.0, 41.0, 47.0, 69.0, 95.0, 151.0, 259.0, 436.0, 778.0, 1341.0, 2937.0, 7484.0, 25647.0, 138519.0, 3726715.0, 237815.0, 34971.0, 9546.0, 3561.0, 1601.0, 862.0, 483.0, 287.0, 173.0, 122.0, 91.0, 55.0, 42.0, 24.0, 20.0, 13.0, 5.0, 8.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.1875, -111.6552734375, -108.123046875, -104.5908203125, -101.05859375, -97.5263671875, -93.994140625, -90.4619140625, -86.9296875, -83.3974609375, -79.865234375, -76.3330078125, -72.80078125, -69.2685546875, -65.736328125, -62.2041015625, -58.671875, -55.1396484375, -51.607421875, -48.0751953125, -44.54296875, -41.0107421875, -37.478515625, -33.9462890625, -30.4140625, -26.8818359375, -23.349609375, -19.8173828125, -16.28515625, -12.7529296875, -9.220703125, -5.6884765625, -2.15625, 1.3759765625, 4.908203125, 8.4404296875, 11.97265625, 15.5048828125, 19.037109375, 22.5693359375, 26.1015625, 29.6337890625, 33.166015625, 36.6982421875, 40.23046875, 43.7626953125, 47.294921875, 50.8271484375, 54.359375, 57.8916015625, 61.423828125, 64.9560546875, 68.48828125, 72.0205078125, 75.552734375, 79.0849609375, 82.6171875, 86.1494140625, 89.681640625, 93.2138671875, 96.74609375, 100.2783203125, 103.810546875, 107.3427734375, 110.875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 6.0, 11.0, 18.0, 28.0, 36.0, 72.0, 137.0, 374.0, 2595.0, 454.0, 139.0, 84.0, 50.0, 24.0, 8.0, 11.0, 7.0, 10.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.46875, -36.59814453125, -34.7275390625, -32.85693359375, -30.986328125, -29.11572265625, -27.2451171875, -25.37451171875, -23.50390625, -21.63330078125, -19.7626953125, -17.89208984375, -16.021484375, -14.15087890625, -12.2802734375, -10.40966796875, -8.5390625, -6.66845703125, -4.7978515625, -2.92724609375, -1.056640625, 0.81396484375, 2.6845703125, 4.55517578125, 6.42578125, 8.29638671875, 10.1669921875, 12.03759765625, 13.908203125, 15.77880859375, 17.6494140625, 19.52001953125, 21.390625, 23.26123046875, 25.1318359375, 27.00244140625, 28.873046875, 30.74365234375, 32.6142578125, 34.48486328125, 36.35546875, 38.22607421875, 40.0966796875, 41.96728515625, 43.837890625, 45.70849609375, 47.5791015625, 49.44970703125, 51.3203125, 53.19091796875, 55.0615234375, 56.93212890625, 58.802734375, 60.67333984375, 62.5439453125, 64.41455078125, 66.28515625, 68.15576171875, 70.0263671875, 71.89697265625, 73.767578125, 75.63818359375, 77.5087890625, 79.37939453125, 81.25]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 27.0, 181.0, 367.0, 298.0, 99.0, 24.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-877.7890625, -853.2758178710938, -828.7625122070312, -804.249267578125, -779.7360229492188, -755.2227172851562, -730.70947265625, -706.1961669921875, -681.6829223632812, -657.169677734375, -632.6563720703125, -608.1431274414062, -583.6298828125, -559.1165771484375, -534.6033325195312, -510.0900573730469, -485.5768127441406, -461.06353759765625, -436.55029296875, -412.0370178222656, -387.52374267578125, -363.010498046875, -338.4972229003906, -313.98394775390625, -289.470703125, -264.9574279785156, -240.4441680908203, -215.930908203125, -191.41763305664062, -166.9043731689453, -142.39111328125, -117.87783813476562, -93.36456298828125, -68.8512954711914, -44.33803176879883, -19.82476806640625, 4.688499450683594, 29.201766967773438, 53.71502685546875, 78.22830200195312, 102.74156188964844, 127.25482940673828, 151.76809692382812, 176.28135681152344, 200.79461669921875, 225.30789184570312, 249.82115173339844, 274.33441162109375, 298.8476867675781, 323.3609619140625, 347.87420654296875, 372.3874816894531, 396.9007568359375, 421.41400146484375, 445.9272766113281, 470.4405517578125, 494.95379638671875, 519.467041015625, 543.9803466796875, 568.4935913085938, 593.0068359375, 617.5201416015625, 642.0333862304688, 666.546630859375, 691.0599365234375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 4.0, 6.0, 7.0, 11.0, 14.0, 10.0, 18.0, 25.0, 19.0, 26.0, 32.0, 38.0, 34.0, 44.0, 61.0, 40.0, 51.0, 37.0, 54.0, 61.0, 56.0, 41.0, 47.0, 32.0, 41.0, 28.0, 23.0, 27.0, 27.0, 22.0, 17.0, 9.0, 10.0, 5.0, 6.0, 12.0, 3.0, 5.0, 2.0, 1.0, 5.0, 1.0], "bins": [-179.501708984375, -175.03573608398438, -170.56976318359375, -166.1038055419922, -161.63783264160156, -157.17185974121094, -152.7058868408203, -148.2399139404297, -143.77395629882812, -139.3079833984375, -134.84201049804688, -130.3760528564453, -125.91007995605469, -121.44410705566406, -116.97813415527344, -112.51216125488281, -108.04618835449219, -103.58021545410156, -99.11425018310547, -94.64827728271484, -90.18231201171875, -85.71633911132812, -81.2503662109375, -76.78439331054688, -72.31842803955078, -67.85245513916016, -63.38648986816406, -58.92051696777344, -54.45454788208008, -49.98857879638672, -45.522605895996094, -41.056636810302734, -36.590660095214844, -32.124691009521484, -27.658720016479492, -23.1927490234375, -18.72677993774414, -14.260810852050781, -9.794839859008789, -5.328868865966797, -0.8628997802734375, 3.6030702590942383, 8.069040298461914, 12.53501033782959, 17.000980377197266, 21.466949462890625, 25.932920455932617, 30.39889144897461, 34.86486053466797, 39.33082962036133, 43.79679870605469, 48.26277160644531, 52.72874069213867, 57.19470977783203, 61.660682678222656, 66.12664794921875, 70.59262084960938, 75.05859375, 79.5245590209961, 83.99053192138672, 88.45649719238281, 92.92247009277344, 97.38844299316406, 101.85441589355469, 106.32038116455078]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 9.0, 5.0, 6.0, 18.0, 24.0, 19.0, 38.0, 43.0, 64.0, 99.0, 121.0, 191.0, 268.0, 429.0, 580.0, 833.0, 1305.0, 1930.0, 3130.0, 5075.0, 8766.0, 16071.0, 32696.0, 73764.0, 210944.0, 438712.0, 139970.0, 55173.0, 25586.0, 13107.0, 7473.0, 4335.0, 2622.0, 1697.0, 1111.0, 750.0, 514.0, 339.0, 210.0, 152.0, 119.0, 79.0, 59.0, 37.0, 26.0, 20.0, 12.0, 18.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-51.8125, -50.30322265625, -48.7939453125, -47.28466796875, -45.775390625, -44.26611328125, -42.7568359375, -41.24755859375, -39.73828125, -38.22900390625, -36.7197265625, -35.21044921875, -33.701171875, -32.19189453125, -30.6826171875, -29.17333984375, -27.6640625, -26.15478515625, -24.6455078125, -23.13623046875, -21.626953125, -20.11767578125, -18.6083984375, -17.09912109375, -15.58984375, -14.08056640625, -12.5712890625, -11.06201171875, -9.552734375, -8.04345703125, -6.5341796875, -5.02490234375, -3.515625, -2.00634765625, -0.4970703125, 1.01220703125, 2.521484375, 4.03076171875, 5.5400390625, 7.04931640625, 8.55859375, 10.06787109375, 11.5771484375, 13.08642578125, 14.595703125, 16.10498046875, 17.6142578125, 19.12353515625, 20.6328125, 22.14208984375, 23.6513671875, 25.16064453125, 26.669921875, 28.17919921875, 29.6884765625, 31.19775390625, 32.70703125, 34.21630859375, 35.7255859375, 37.23486328125, 38.744140625, 40.25341796875, 41.7626953125, 43.27197265625, 44.78125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 8.0, 5.0, 5.0, 4.0, 8.0, 15.0, 7.0, 13.0, 13.0, 12.0, 19.0, 18.0, 23.0, 32.0, 34.0, 22.0, 24.0, 46.0, 46.0, 35.0, 39.0, 37.0, 51.0, 47.0, 43.0, 38.0, 42.0, 42.0, 37.0, 29.0, 24.0, 37.0, 22.0, 19.0, 18.0, 16.0, 9.0, 9.0, 11.0, 15.0, 5.0, 5.0, 5.0, 6.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-9.859375, -9.57177734375, -9.2841796875, -8.99658203125, -8.708984375, -8.42138671875, -8.1337890625, -7.84619140625, -7.55859375, -7.27099609375, -6.9833984375, -6.69580078125, -6.408203125, -6.12060546875, -5.8330078125, -5.54541015625, -5.2578125, -4.97021484375, -4.6826171875, -4.39501953125, -4.107421875, -3.81982421875, -3.5322265625, -3.24462890625, -2.95703125, -2.66943359375, -2.3818359375, -2.09423828125, -1.806640625, -1.51904296875, -1.2314453125, -0.94384765625, -0.65625, -0.36865234375, -0.0810546875, 0.20654296875, 0.494140625, 0.78173828125, 1.0693359375, 1.35693359375, 1.64453125, 1.93212890625, 2.2197265625, 2.50732421875, 2.794921875, 3.08251953125, 3.3701171875, 3.65771484375, 3.9453125, 4.23291015625, 4.5205078125, 4.80810546875, 5.095703125, 5.38330078125, 5.6708984375, 5.95849609375, 6.24609375, 6.53369140625, 6.8212890625, 7.10888671875, 7.396484375, 7.68408203125, 7.9716796875, 8.25927734375, 8.546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 3.0, 8.0, 6.0, 6.0, 9.0, 16.0, 18.0, 26.0, 27.0, 45.0, 73.0, 107.0, 146.0, 252.0, 330.0, 654.0, 1102.0, 2111.0, 4371.0, 10326.0, 30793.0, 137655.0, 655767.0, 151399.0, 32849.0, 10712.0, 4624.0, 2209.0, 1148.0, 643.0, 374.0, 246.0, 161.0, 97.0, 50.0, 43.0, 38.0, 32.0, 18.0, 21.0, 12.0, 5.0, 4.0, 10.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-76.875, -74.58203125, -72.2890625, -69.99609375, -67.703125, -65.41015625, -63.1171875, -60.82421875, -58.53125, -56.23828125, -53.9453125, -51.65234375, -49.359375, -47.06640625, -44.7734375, -42.48046875, -40.1875, -37.89453125, -35.6015625, -33.30859375, -31.015625, -28.72265625, -26.4296875, -24.13671875, -21.84375, -19.55078125, -17.2578125, -14.96484375, -12.671875, -10.37890625, -8.0859375, -5.79296875, -3.5, -1.20703125, 1.0859375, 3.37890625, 5.671875, 7.96484375, 10.2578125, 12.55078125, 14.84375, 17.13671875, 19.4296875, 21.72265625, 24.015625, 26.30859375, 28.6015625, 30.89453125, 33.1875, 35.48046875, 37.7734375, 40.06640625, 42.359375, 44.65234375, 46.9453125, 49.23828125, 51.53125, 53.82421875, 56.1171875, 58.41015625, 60.703125, 62.99609375, 65.2890625, 67.58203125, 69.875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 10.0, 9.0, 6.0, 9.0, 12.0, 14.0, 26.0, 34.0, 27.0, 35.0, 41.0, 60.0, 45.0, 71.0, 60.0, 71.0, 50.0, 69.0, 58.0, 57.0, 42.0, 45.0, 40.0, 22.0, 18.0, 18.0, 12.0, 6.0, 10.0, 7.0, 2.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-72.4375, -70.33984375, -68.2421875, -66.14453125, -64.046875, -61.94921875, -59.8515625, -57.75390625, -55.65625, -53.55859375, -51.4609375, -49.36328125, -47.265625, -45.16796875, -43.0703125, -40.97265625, -38.875, -36.77734375, -34.6796875, -32.58203125, -30.484375, -28.38671875, -26.2890625, -24.19140625, -22.09375, -19.99609375, -17.8984375, -15.80078125, -13.703125, -11.60546875, -9.5078125, -7.41015625, -5.3125, -3.21484375, -1.1171875, 0.98046875, 3.078125, 5.17578125, 7.2734375, 9.37109375, 11.46875, 13.56640625, 15.6640625, 17.76171875, 19.859375, 21.95703125, 24.0546875, 26.15234375, 28.25, 30.34765625, 32.4453125, 34.54296875, 36.640625, 38.73828125, 40.8359375, 42.93359375, 45.03125, 47.12890625, 49.2265625, 51.32421875, 53.421875, 55.51953125, 57.6171875, 59.71484375, 61.8125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 12.0, 24.0, 27.0, 35.0, 50.0, 63.0, 106.0, 162.0, 251.0, 449.0, 836.0, 1766.0, 4758.0, 17489.0, 175248.0, 797914.0, 36437.0, 7731.0, 2564.0, 1144.0, 572.0, 328.0, 194.0, 111.0, 73.0, 61.0, 46.0, 24.0, 14.0, 14.0, 14.0, 10.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.0625, -79.2529296875, -76.443359375, -73.6337890625, -70.82421875, -68.0146484375, -65.205078125, -62.3955078125, -59.5859375, -56.7763671875, -53.966796875, -51.1572265625, -48.34765625, -45.5380859375, -42.728515625, -39.9189453125, -37.109375, -34.2998046875, -31.490234375, -28.6806640625, -25.87109375, -23.0615234375, -20.251953125, -17.4423828125, -14.6328125, -11.8232421875, -9.013671875, -6.2041015625, -3.39453125, -0.5849609375, 2.224609375, 5.0341796875, 7.84375, 10.6533203125, 13.462890625, 16.2724609375, 19.08203125, 21.8916015625, 24.701171875, 27.5107421875, 30.3203125, 33.1298828125, 35.939453125, 38.7490234375, 41.55859375, 44.3681640625, 47.177734375, 49.9873046875, 52.796875, 55.6064453125, 58.416015625, 61.2255859375, 64.03515625, 66.8447265625, 69.654296875, 72.4638671875, 75.2734375, 78.0830078125, 80.892578125, 83.7021484375, 86.51171875, 89.3212890625, 92.130859375, 94.9404296875, 97.75]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 4.0, 5.0, 7.0, 9.0, 38.0, 42.0, 120.0, 472.0, 175.0, 55.0, 27.0, 20.0, 12.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019866943359375, -0.018901824951171875, -0.01793670654296875, -0.016971588134765625, -0.0160064697265625, -0.015041351318359375, -0.01407623291015625, -0.013111114501953125, -0.01214599609375, -0.011180877685546875, -0.01021575927734375, -0.009250640869140625, -0.0082855224609375, -0.007320404052734375, -0.00635528564453125, -0.005390167236328125, -0.004425048828125, -0.003459930419921875, -0.00249481201171875, -0.001529693603515625, -0.0005645751953125, 0.000400543212890625, 0.00136566162109375, 0.002330780029296875, 0.0032958984375, 0.004261016845703125, 0.00522613525390625, 0.006191253662109375, 0.0071563720703125, 0.008121490478515625, 0.00908660888671875, 0.010051727294921875, 0.011016845703125, 0.011981964111328125, 0.01294708251953125, 0.013912200927734375, 0.0148773193359375, 0.015842437744140625, 0.01680755615234375, 0.017772674560546875, 0.01873779296875, 0.019702911376953125, 0.02066802978515625, 0.021633148193359375, 0.0225982666015625, 0.023563385009765625, 0.02452850341796875, 0.025493621826171875, 0.026458740234375, 0.027423858642578125, 0.02838897705078125, 0.029354095458984375, 0.0303192138671875, 0.031284332275390625, 0.03224945068359375, 0.033214569091796875, 0.0341796875, 0.035144805908203125, 0.03610992431640625, 0.037075042724609375, 0.0380401611328125, 0.039005279541015625, 0.03997039794921875, 0.040935516357421875, 0.041900634765625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 4.0, 2.0, 8.0, 6.0, 9.0, 9.0, 13.0, 13.0, 27.0, 41.0, 67.0, 120.0, 168.0, 331.0, 676.0, 1490.0, 3596.0, 13201.0, 117970.0, 852035.0, 46419.0, 7606.0, 2488.0, 1106.0, 515.0, 232.0, 159.0, 92.0, 62.0, 26.0, 21.0, 14.0, 6.0, 5.0, 4.0, 6.0, 1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.0625, -78.2978515625, -75.533203125, -72.7685546875, -70.00390625, -67.2392578125, -64.474609375, -61.7099609375, -58.9453125, -56.1806640625, -53.416015625, -50.6513671875, -47.88671875, -45.1220703125, -42.357421875, -39.5927734375, -36.828125, -34.0634765625, -31.298828125, -28.5341796875, -25.76953125, -23.0048828125, -20.240234375, -17.4755859375, -14.7109375, -11.9462890625, -9.181640625, -6.4169921875, -3.65234375, -0.8876953125, 1.876953125, 4.6416015625, 7.40625, 10.1708984375, 12.935546875, 15.7001953125, 18.46484375, 21.2294921875, 23.994140625, 26.7587890625, 29.5234375, 32.2880859375, 35.052734375, 37.8173828125, 40.58203125, 43.3466796875, 46.111328125, 48.8759765625, 51.640625, 54.4052734375, 57.169921875, 59.9345703125, 62.69921875, 65.4638671875, 68.228515625, 70.9931640625, 73.7578125, 76.5224609375, 79.287109375, 82.0517578125, 84.81640625, 87.5810546875, 90.345703125, 93.1103515625, 95.875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 5.0, 10.0, 16.0, 25.0, 33.0, 52.0, 67.0, 181.0, 288.0, 135.0, 59.0, 36.0, 28.0, 23.0, 11.0, 9.0, 4.0, 4.0, 0.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.96875, -49.99560546875, -48.0224609375, -46.04931640625, -44.076171875, -42.10302734375, -40.1298828125, -38.15673828125, -36.18359375, -34.21044921875, -32.2373046875, -30.26416015625, -28.291015625, -26.31787109375, -24.3447265625, -22.37158203125, -20.3984375, -18.42529296875, -16.4521484375, -14.47900390625, -12.505859375, -10.53271484375, -8.5595703125, -6.58642578125, -4.61328125, -2.64013671875, -0.6669921875, 1.30615234375, 3.279296875, 5.25244140625, 7.2255859375, 9.19873046875, 11.171875, 13.14501953125, 15.1181640625, 17.09130859375, 19.064453125, 21.03759765625, 23.0107421875, 24.98388671875, 26.95703125, 28.93017578125, 30.9033203125, 32.87646484375, 34.849609375, 36.82275390625, 38.7958984375, 40.76904296875, 42.7421875, 44.71533203125, 46.6884765625, 48.66162109375, 50.634765625, 52.60791015625, 54.5810546875, 56.55419921875, 58.52734375, 60.50048828125, 62.4736328125, 64.44677734375, 66.419921875, 68.39306640625, 70.3662109375, 72.33935546875, 74.3125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 12.0, 25.0, 64.0, 100.0, 156.0, 216.0, 180.0, 101.0, 71.0, 33.0, 20.0, 13.0, 3.0, 7.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-337.5392150878906, -312.78826904296875, -288.03729248046875, -263.2863464355469, -238.53538513183594, -213.784423828125, -189.03347778320312, -164.2825164794922, -139.53155517578125, -114.78059387207031, -90.0296401977539, -65.2786865234375, -40.52772521972656, -15.776763916015625, 8.97418212890625, 33.72514343261719, 58.476104736328125, 83.22706604003906, 107.97801971435547, 132.72897338867188, 157.4799346923828, 182.23089599609375, 206.98184204101562, 231.73280334472656, 256.4837646484375, 281.2347106933594, 305.9856872558594, 330.73663330078125, 355.48760986328125, 380.2385559082031, 404.989501953125, 429.740478515625, 454.491455078125, 479.2424011230469, 503.9933776855469, 528.7443237304688, 553.4953002929688, 578.2462158203125, 602.9971923828125, 627.7481689453125, 652.4991455078125, 677.2501220703125, 702.0010375976562, 726.7520141601562, 751.5029907226562, 776.25390625, 801.0048828125, 825.755859375, 850.5067749023438, 875.2577514648438, 900.0086669921875, 924.7596435546875, 949.5106201171875, 974.2615966796875, 999.0125122070312, 1023.7634887695312, 1048.514404296875, 1073.265380859375, 1098.016357421875, 1122.767333984375, 1147.5181884765625, 1172.2691650390625, 1197.0201416015625, 1221.7711181640625, 1246.5220947265625]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 5.0, 3.0, 6.0, 3.0, 4.0, 8.0, 20.0, 10.0, 12.0, 19.0, 24.0, 30.0, 21.0, 35.0, 39.0, 39.0, 36.0, 49.0, 41.0, 36.0, 38.0, 31.0, 48.0, 48.0, 41.0, 34.0, 29.0, 41.0, 21.0, 33.0, 26.0, 27.0, 23.0, 13.0, 21.0, 22.0, 13.0, 16.0, 9.0, 4.0, 9.0, 3.0, 7.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-248.39794921875, -240.1319122314453, -231.86585998535156, -223.59982299804688, -215.33377075195312, -207.06773376464844, -198.80169677734375, -190.53564453125, -182.2696075439453, -174.00357055664062, -165.73751831054688, -157.4714813232422, -149.2054443359375, -140.93939208984375, -132.67335510253906, -124.40731048583984, -116.14126586914062, -107.8752212524414, -99.60917663574219, -91.3431396484375, -83.07709503173828, -74.81105041503906, -66.54501342773438, -58.278968811035156, -50.01292419433594, -41.74687957763672, -33.480838775634766, -25.21479606628418, -16.948753356933594, -8.682708740234375, -0.4166679382324219, 7.849372863769531, 16.11541748046875, 24.381460189819336, 32.64750289916992, 40.913543701171875, 49.179588317871094, 57.44563293457031, 65.711669921875, 73.97771453857422, 82.24375915527344, 90.50980377197266, 98.77584838867188, 107.04188537597656, 115.30792999267578, 123.573974609375, 131.8400115966797, 140.10604858398438, 148.37210083007812, 156.6381378173828, 164.90419006347656, 173.17022705078125, 181.436279296875, 189.7023162841797, 197.96835327148438, 206.23440551757812, 214.5004425048828, 222.7664794921875, 231.03253173828125, 239.29856872558594, 247.56460571289062, 255.83065795898438, 264.0967102050781, 272.36273193359375, 280.6287841796875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 7.0, 11.0, 12.0, 9.0, 25.0, 31.0, 32.0, 46.0, 66.0, 93.0, 145.0, 214.0, 310.0, 427.0, 722.0, 1266.0, 2296.0, 4295.0, 9354.0, 24143.0, 93548.0, 3796123.0, 198910.0, 36788.0, 12879.0, 5696.0, 2759.0, 1511.0, 880.0, 566.0, 363.0, 228.0, 152.0, 96.0, 80.0, 45.0, 40.0, 35.0, 27.0, 11.0, 15.0, 6.0, 8.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-78.5625, -76.08203125, -73.6015625, -71.12109375, -68.640625, -66.16015625, -63.6796875, -61.19921875, -58.71875, -56.23828125, -53.7578125, -51.27734375, -48.796875, -46.31640625, -43.8359375, -41.35546875, -38.875, -36.39453125, -33.9140625, -31.43359375, -28.953125, -26.47265625, -23.9921875, -21.51171875, -19.03125, -16.55078125, -14.0703125, -11.58984375, -9.109375, -6.62890625, -4.1484375, -1.66796875, 0.8125, 3.29296875, 5.7734375, 8.25390625, 10.734375, 13.21484375, 15.6953125, 18.17578125, 20.65625, 23.13671875, 25.6171875, 28.09765625, 30.578125, 33.05859375, 35.5390625, 38.01953125, 40.5, 42.98046875, 45.4609375, 47.94140625, 50.421875, 52.90234375, 55.3828125, 57.86328125, 60.34375, 62.82421875, 65.3046875, 67.78515625, 70.265625, 72.74609375, 75.2265625, 77.70703125, 80.1875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 8.0, 3.0, 11.0, 6.0, 11.0, 9.0, 19.0, 15.0, 17.0, 28.0, 30.0, 31.0, 41.0, 27.0, 32.0, 35.0, 50.0, 49.0, 53.0, 56.0, 53.0, 49.0, 48.0, 50.0, 38.0, 36.0, 28.0, 30.0, 37.0, 17.0, 21.0, 11.0, 13.0, 11.0, 8.0, 9.0, 6.0, 1.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.875, -12.4864501953125, -12.097900390625, -11.7093505859375, -11.32080078125, -10.9322509765625, -10.543701171875, -10.1551513671875, -9.7666015625, -9.3780517578125, -8.989501953125, -8.6009521484375, -8.21240234375, -7.8238525390625, -7.435302734375, -7.0467529296875, -6.658203125, -6.2696533203125, -5.881103515625, -5.4925537109375, -5.10400390625, -4.7154541015625, -4.326904296875, -3.9383544921875, -3.5498046875, -3.1612548828125, -2.772705078125, -2.3841552734375, -1.99560546875, -1.6070556640625, -1.218505859375, -0.8299560546875, -0.44140625, -0.0528564453125, 0.335693359375, 0.7242431640625, 1.11279296875, 1.5013427734375, 1.889892578125, 2.2784423828125, 2.6669921875, 3.0555419921875, 3.444091796875, 3.8326416015625, 4.22119140625, 4.6097412109375, 4.998291015625, 5.3868408203125, 5.775390625, 6.1639404296875, 6.552490234375, 6.9410400390625, 7.32958984375, 7.7181396484375, 8.106689453125, 8.4952392578125, 8.8837890625, 9.2723388671875, 9.660888671875, 10.0494384765625, 10.43798828125, 10.8265380859375, 11.215087890625, 11.6036376953125, 11.9921875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 8.0, 12.0, 8.0, 11.0, 8.0, 8.0, 16.0, 26.0, 23.0, 32.0, 50.0, 64.0, 98.0, 177.0, 289.0, 524.0, 1182.0, 2705.0, 7353.0, 25661.0, 168876.0, 3843375.0, 112526.0, 20486.0, 6191.0, 2341.0, 1077.0, 416.0, 292.0, 150.0, 94.0, 61.0, 34.0, 34.0, 18.0, 10.0, 8.0, 10.0, 7.0, 7.0, 3.0, 6.0, 4.0, 8.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-135.5, -131.4453125, -127.390625, -123.3359375, -119.28125, -115.2265625, -111.171875, -107.1171875, -103.0625, -99.0078125, -94.953125, -90.8984375, -86.84375, -82.7890625, -78.734375, -74.6796875, -70.625, -66.5703125, -62.515625, -58.4609375, -54.40625, -50.3515625, -46.296875, -42.2421875, -38.1875, -34.1328125, -30.078125, -26.0234375, -21.96875, -17.9140625, -13.859375, -9.8046875, -5.75, -1.6953125, 2.359375, 6.4140625, 10.46875, 14.5234375, 18.578125, 22.6328125, 26.6875, 30.7421875, 34.796875, 38.8515625, 42.90625, 46.9609375, 51.015625, 55.0703125, 59.125, 63.1796875, 67.234375, 71.2890625, 75.34375, 79.3984375, 83.453125, 87.5078125, 91.5625, 95.6171875, 99.671875, 103.7265625, 107.78125, 111.8359375, 115.890625, 119.9453125, 124.0]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 13.0, 10.0, 21.0, 25.0, 44.0, 102.0, 271.0, 2695.0, 558.0, 156.0, 64.0, 40.0, 21.0, 17.0, 12.0, 5.0, 7.0, 0.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-85.0, -83.1015625, -81.203125, -79.3046875, -77.40625, -75.5078125, -73.609375, -71.7109375, -69.8125, -67.9140625, -66.015625, -64.1171875, -62.21875, -60.3203125, -58.421875, -56.5234375, -54.625, -52.7265625, -50.828125, -48.9296875, -47.03125, -45.1328125, -43.234375, -41.3359375, -39.4375, -37.5390625, -35.640625, -33.7421875, -31.84375, -29.9453125, -28.046875, -26.1484375, -24.25, -22.3515625, -20.453125, -18.5546875, -16.65625, -14.7578125, -12.859375, -10.9609375, -9.0625, -7.1640625, -5.265625, -3.3671875, -1.46875, 0.4296875, 2.328125, 4.2265625, 6.125, 8.0234375, 9.921875, 11.8203125, 13.71875, 15.6171875, 17.515625, 19.4140625, 21.3125, 23.2109375, 25.109375, 27.0078125, 28.90625, 30.8046875, 32.703125, 34.6015625, 36.5]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 7.0, 7.0, 14.0, 15.0, 18.0, 39.0, 50.0, 93.0, 113.0, 135.0, 146.0, 125.0, 78.0, 67.0, 40.0, 21.0, 13.0, 10.0, 1.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-305.647216796875, -298.75439453125, -291.8615417480469, -284.9687194824219, -278.07586669921875, -271.18304443359375, -264.29022216796875, -257.3973693847656, -250.50453186035156, -243.6116943359375, -236.71885681152344, -229.82601928710938, -222.93319702148438, -216.0403594970703, -209.14752197265625, -202.2546844482422, -195.36184692382812, -188.46900939941406, -181.576171875, -174.683349609375, -167.79051208496094, -160.89767456054688, -154.0048370361328, -147.11199951171875, -140.21917724609375, -133.3263397216797, -126.43350982666016, -119.5406723022461, -112.64783477783203, -105.7550048828125, -98.86216735839844, -91.96932983398438, -85.07649230957031, -78.18365478515625, -71.29082489013672, -64.39798736572266, -57.505149841308594, -50.6123161315918, -43.719482421875, -36.82664489746094, -29.93381118774414, -23.04097557067871, -16.14813995361328, -9.255306243896484, -2.3624706268310547, 4.530364990234375, 11.423198699951172, 18.316036224365234, 25.20886993408203, 32.10170364379883, 38.99454116821289, 45.88737487792969, 52.78021240234375, 59.67304611206055, 66.56587982177734, 73.4587173461914, 80.35154724121094, 87.244384765625, 94.13721466064453, 101.0300521850586, 107.92288970947266, 114.81571960449219, 121.70855712890625, 128.6013946533203, 135.49423217773438]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 1.0, 7.0, 5.0, 11.0, 11.0, 8.0, 7.0, 23.0, 27.0, 17.0, 35.0, 24.0, 34.0, 32.0, 42.0, 37.0, 51.0, 39.0, 46.0, 44.0, 43.0, 58.0, 38.0, 47.0, 31.0, 41.0, 34.0, 31.0, 33.0, 26.0, 20.0, 22.0, 19.0, 13.0, 12.0, 7.0, 7.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.66360473632812, -123.73861694335938, -119.81362915039062, -115.88864135742188, -111.96365356445312, -108.03866577148438, -104.11367797851562, -100.18869018554688, -96.26370239257812, -92.33871459960938, -88.41372680664062, -84.48873901367188, -80.56375122070312, -76.63876342773438, -72.71377563476562, -68.78878784179688, -64.86380767822266, -60.938819885253906, -57.013832092285156, -53.088844299316406, -49.163856506347656, -45.238868713378906, -41.31388473510742, -37.38889694213867, -33.46390914916992, -29.538921356201172, -25.613933563232422, -21.688947677612305, -17.763959884643555, -13.838972091674805, -9.913986206054688, -5.9889984130859375, -2.0640106201171875, 1.8609766960144043, 5.785964012145996, 9.71095085144043, 13.63593864440918, 17.56092643737793, 21.485912322998047, 25.410900115966797, 29.335887908935547, 33.2608757019043, 37.18586349487305, 41.11084747314453, 45.03583526611328, 48.96082305908203, 52.88581085205078, 56.81079864501953, 60.73578643798828, 64.66077423095703, 68.58576202392578, 72.51074981689453, 76.43573760986328, 80.36072540283203, 84.28570556640625, 88.210693359375, 92.13568115234375, 96.0606689453125, 99.98565673828125, 103.91064453125, 107.83563232421875, 111.7606201171875, 115.68560791015625, 119.610595703125, 123.53558349609375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 2.0, 5.0, 8.0, 11.0, 14.0, 17.0, 24.0, 40.0, 55.0, 73.0, 92.0, 181.0, 281.0, 466.0, 743.0, 1386.0, 2496.0, 4436.0, 8255.0, 16363.0, 34279.0, 78570.0, 248041.0, 430775.0, 125094.0, 49333.0, 22821.0, 11211.0, 5899.0, 3245.0, 1731.0, 1022.0, 604.0, 348.0, 201.0, 119.0, 83.0, 63.0, 45.0, 36.0, 24.0, 13.0, 16.0, 15.0, 11.0, 3.0, 4.0, 6.0, 0.0, 1.0, 3.0], "bins": [-50.1875, -48.80224609375, -47.4169921875, -46.03173828125, -44.646484375, -43.26123046875, -41.8759765625, -40.49072265625, -39.10546875, -37.72021484375, -36.3349609375, -34.94970703125, -33.564453125, -32.17919921875, -30.7939453125, -29.40869140625, -28.0234375, -26.63818359375, -25.2529296875, -23.86767578125, -22.482421875, -21.09716796875, -19.7119140625, -18.32666015625, -16.94140625, -15.55615234375, -14.1708984375, -12.78564453125, -11.400390625, -10.01513671875, -8.6298828125, -7.24462890625, -5.859375, -4.47412109375, -3.0888671875, -1.70361328125, -0.318359375, 1.06689453125, 2.4521484375, 3.83740234375, 5.22265625, 6.60791015625, 7.9931640625, 9.37841796875, 10.763671875, 12.14892578125, 13.5341796875, 14.91943359375, 16.3046875, 17.68994140625, 19.0751953125, 20.46044921875, 21.845703125, 23.23095703125, 24.6162109375, 26.00146484375, 27.38671875, 28.77197265625, 30.1572265625, 31.54248046875, 32.927734375, 34.31298828125, 35.6982421875, 37.08349609375, 38.46875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 5.0, 4.0, 12.0, 12.0, 12.0, 12.0, 10.0, 15.0, 16.0, 19.0, 17.0, 22.0, 29.0, 30.0, 29.0, 41.0, 33.0, 37.0, 40.0, 52.0, 40.0, 34.0, 28.0, 40.0, 40.0, 38.0, 35.0, 41.0, 20.0, 29.0, 23.0, 26.0, 20.0, 26.0, 16.0, 17.0, 13.0, 13.0, 7.0, 8.0, 7.0, 8.0, 4.0, 3.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2421875, -10.894287109375, -10.54638671875, -10.198486328125, -9.8505859375, -9.502685546875, -9.15478515625, -8.806884765625, -8.458984375, -8.111083984375, -7.76318359375, -7.415283203125, -7.0673828125, -6.719482421875, -6.37158203125, -6.023681640625, -5.67578125, -5.327880859375, -4.97998046875, -4.632080078125, -4.2841796875, -3.936279296875, -3.58837890625, -3.240478515625, -2.892578125, -2.544677734375, -2.19677734375, -1.848876953125, -1.5009765625, -1.153076171875, -0.80517578125, -0.457275390625, -0.109375, 0.238525390625, 0.58642578125, 0.934326171875, 1.2822265625, 1.630126953125, 1.97802734375, 2.325927734375, 2.673828125, 3.021728515625, 3.36962890625, 3.717529296875, 4.0654296875, 4.413330078125, 4.76123046875, 5.109130859375, 5.45703125, 5.804931640625, 6.15283203125, 6.500732421875, 6.8486328125, 7.196533203125, 7.54443359375, 7.892333984375, 8.240234375, 8.588134765625, 8.93603515625, 9.283935546875, 9.6318359375, 9.979736328125, 10.32763671875, 10.675537109375, 11.0234375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 9.0, 7.0, 11.0, 25.0, 24.0, 32.0, 43.0, 62.0, 68.0, 119.0, 171.0, 249.0, 472.0, 744.0, 1391.0, 2567.0, 5490.0, 14168.0, 52247.0, 541378.0, 363523.0, 42848.0, 12414.0, 4881.0, 2323.0, 1256.0, 708.0, 434.0, 292.0, 170.0, 115.0, 78.0, 56.0, 39.0, 26.0, 21.0, 14.0, 20.0, 16.0, 9.0, 7.0, 9.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.1875, -78.3818359375, -75.576171875, -72.7705078125, -69.96484375, -67.1591796875, -64.353515625, -61.5478515625, -58.7421875, -55.9365234375, -53.130859375, -50.3251953125, -47.51953125, -44.7138671875, -41.908203125, -39.1025390625, -36.296875, -33.4912109375, -30.685546875, -27.8798828125, -25.07421875, -22.2685546875, -19.462890625, -16.6572265625, -13.8515625, -11.0458984375, -8.240234375, -5.4345703125, -2.62890625, 0.1767578125, 2.982421875, 5.7880859375, 8.59375, 11.3994140625, 14.205078125, 17.0107421875, 19.81640625, 22.6220703125, 25.427734375, 28.2333984375, 31.0390625, 33.8447265625, 36.650390625, 39.4560546875, 42.26171875, 45.0673828125, 47.873046875, 50.6787109375, 53.484375, 56.2900390625, 59.095703125, 61.9013671875, 64.70703125, 67.5126953125, 70.318359375, 73.1240234375, 75.9296875, 78.7353515625, 81.541015625, 84.3466796875, 87.15234375, 89.9580078125, 92.763671875, 95.5693359375, 98.375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 6.0, 6.0, 6.0, 8.0, 14.0, 13.0, 16.0, 24.0, 36.0, 38.0, 51.0, 67.0, 78.0, 75.0, 92.0, 57.0, 79.0, 73.0, 58.0, 49.0, 34.0, 26.0, 23.0, 16.0, 6.0, 11.0, 7.0, 2.0, 4.0, 2.0, 5.0, 0.0, 6.0, 0.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.6875, -88.693359375, -85.69921875, -82.705078125, -79.7109375, -76.716796875, -73.72265625, -70.728515625, -67.734375, -64.740234375, -61.74609375, -58.751953125, -55.7578125, -52.763671875, -49.76953125, -46.775390625, -43.78125, -40.787109375, -37.79296875, -34.798828125, -31.8046875, -28.810546875, -25.81640625, -22.822265625, -19.828125, -16.833984375, -13.83984375, -10.845703125, -7.8515625, -4.857421875, -1.86328125, 1.130859375, 4.125, 7.119140625, 10.11328125, 13.107421875, 16.1015625, 19.095703125, 22.08984375, 25.083984375, 28.078125, 31.072265625, 34.06640625, 37.060546875, 40.0546875, 43.048828125, 46.04296875, 49.037109375, 52.03125, 55.025390625, 58.01953125, 61.013671875, 64.0078125, 67.001953125, 69.99609375, 72.990234375, 75.984375, 78.978515625, 81.97265625, 84.966796875, 87.9609375, 90.955078125, 93.94921875, 96.943359375, 99.9375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 7.0, 3.0, 7.0, 10.0, 14.0, 18.0, 18.0, 32.0, 43.0, 65.0, 87.0, 126.0, 151.0, 253.0, 379.0, 516.0, 755.0, 1186.0, 2105.0, 4223.0, 11101.0, 54593.0, 860864.0, 86535.0, 14253.0, 4869.0, 2285.0, 1333.0, 882.0, 608.0, 370.0, 240.0, 156.0, 141.0, 93.0, 64.0, 49.0, 40.0, 21.0, 19.0, 12.0, 10.0, 11.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-67.25, -64.9775390625, -62.705078125, -60.4326171875, -58.16015625, -55.8876953125, -53.615234375, -51.3427734375, -49.0703125, -46.7978515625, -44.525390625, -42.2529296875, -39.98046875, -37.7080078125, -35.435546875, -33.1630859375, -30.890625, -28.6181640625, -26.345703125, -24.0732421875, -21.80078125, -19.5283203125, -17.255859375, -14.9833984375, -12.7109375, -10.4384765625, -8.166015625, -5.8935546875, -3.62109375, -1.3486328125, 0.923828125, 3.1962890625, 5.46875, 7.7412109375, 10.013671875, 12.2861328125, 14.55859375, 16.8310546875, 19.103515625, 21.3759765625, 23.6484375, 25.9208984375, 28.193359375, 30.4658203125, 32.73828125, 35.0107421875, 37.283203125, 39.5556640625, 41.828125, 44.1005859375, 46.373046875, 48.6455078125, 50.91796875, 53.1904296875, 55.462890625, 57.7353515625, 60.0078125, 62.2802734375, 64.552734375, 66.8251953125, 69.09765625, 71.3701171875, 73.642578125, 75.9150390625, 78.1875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 5.0, 8.0, 11.0, 16.0, 23.0, 37.0, 90.0, 365.0, 283.0, 71.0, 26.0, 20.0, 14.0, 11.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0207672119140625, -0.020022153854370117, -0.019277095794677734, -0.01853203773498535, -0.01778697967529297, -0.017041921615600586, -0.016296863555908203, -0.01555180549621582, -0.014806747436523438, -0.014061689376831055, -0.013316631317138672, -0.012571573257446289, -0.011826515197753906, -0.011081457138061523, -0.01033639907836914, -0.009591341018676758, -0.008846282958984375, -0.008101224899291992, -0.007356166839599609, -0.0066111087799072266, -0.005866050720214844, -0.005120992660522461, -0.004375934600830078, -0.0036308765411376953, -0.0028858184814453125, -0.0021407604217529297, -0.0013957023620605469, -0.0006506443023681641, 9.441375732421875e-05, 0.0008394718170166016, 0.0015845298767089844, 0.002329587936401367, 0.00307464599609375, 0.003819704055786133, 0.004564762115478516, 0.0053098201751708984, 0.006054878234863281, 0.006799936294555664, 0.007544994354248047, 0.00829005241394043, 0.009035110473632812, 0.009780168533325195, 0.010525226593017578, 0.011270284652709961, 0.012015342712402344, 0.012760400772094727, 0.01350545883178711, 0.014250516891479492, 0.014995574951171875, 0.015740633010864258, 0.01648569107055664, 0.017230749130249023, 0.017975807189941406, 0.01872086524963379, 0.019465923309326172, 0.020210981369018555, 0.020956039428710938, 0.02170109748840332, 0.022446155548095703, 0.023191213607788086, 0.02393627166748047, 0.02468132972717285, 0.025426387786865234, 0.026171445846557617, 0.02691650390625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 3.0, 10.0, 14.0, 14.0, 21.0, 36.0, 48.0, 88.0, 110.0, 179.0, 301.0, 593.0, 1039.0, 2298.0, 6538.0, 26083.0, 586647.0, 391077.0, 22932.0, 5878.0, 2262.0, 1022.0, 544.0, 307.0, 174.0, 115.0, 66.0, 42.0, 33.0, 25.0, 16.0, 5.0, 8.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.3125, -73.84765625, -71.3828125, -68.91796875, -66.453125, -63.98828125, -61.5234375, -59.05859375, -56.59375, -54.12890625, -51.6640625, -49.19921875, -46.734375, -44.26953125, -41.8046875, -39.33984375, -36.875, -34.41015625, -31.9453125, -29.48046875, -27.015625, -24.55078125, -22.0859375, -19.62109375, -17.15625, -14.69140625, -12.2265625, -9.76171875, -7.296875, -4.83203125, -2.3671875, 0.09765625, 2.5625, 5.02734375, 7.4921875, 9.95703125, 12.421875, 14.88671875, 17.3515625, 19.81640625, 22.28125, 24.74609375, 27.2109375, 29.67578125, 32.140625, 34.60546875, 37.0703125, 39.53515625, 42.0, 44.46484375, 46.9296875, 49.39453125, 51.859375, 54.32421875, 56.7890625, 59.25390625, 61.71875, 64.18359375, 66.6484375, 69.11328125, 71.578125, 74.04296875, 76.5078125, 78.97265625, 81.4375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 12.0, 7.0, 14.0, 19.0, 43.0, 98.0, 325.0, 257.0, 107.0, 31.0, 20.0, 17.0, 9.0, 7.0, 6.0, 7.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.125, -69.7880859375, -67.451171875, -65.1142578125, -62.77734375, -60.4404296875, -58.103515625, -55.7666015625, -53.4296875, -51.0927734375, -48.755859375, -46.4189453125, -44.08203125, -41.7451171875, -39.408203125, -37.0712890625, -34.734375, -32.3974609375, -30.060546875, -27.7236328125, -25.38671875, -23.0498046875, -20.712890625, -18.3759765625, -16.0390625, -13.7021484375, -11.365234375, -9.0283203125, -6.69140625, -4.3544921875, -2.017578125, 0.3193359375, 2.65625, 4.9931640625, 7.330078125, 9.6669921875, 12.00390625, 14.3408203125, 16.677734375, 19.0146484375, 21.3515625, 23.6884765625, 26.025390625, 28.3623046875, 30.69921875, 33.0361328125, 35.373046875, 37.7099609375, 40.046875, 42.3837890625, 44.720703125, 47.0576171875, 49.39453125, 51.7314453125, 54.068359375, 56.4052734375, 58.7421875, 61.0791015625, 63.416015625, 65.7529296875, 68.08984375, 70.4267578125, 72.763671875, 75.1005859375, 77.4375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 10.0, 10.0, 28.0, 60.0, 105.0, 190.0, 198.0, 182.0, 102.0, 47.0, 36.0, 21.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-445.5379943847656, -416.69622802734375, -387.8544921875, -359.0127258300781, -330.1709899902344, -301.3292236328125, -272.48748779296875, -243.64572143554688, -214.80397033691406, -185.96221923828125, -157.12046813964844, -128.27871704101562, -99.43695831298828, -70.59519958496094, -41.753448486328125, -12.911697387695312, 15.9300537109375, 44.77180480957031, 73.61355590820312, 102.45531463623047, 131.29705810546875, 160.13882446289062, 188.98057556152344, 217.82232666015625, 246.66407775878906, 275.5058288574219, 304.34759521484375, 333.1893310546875, 362.0310974121094, 390.87286376953125, 419.714599609375, 448.55633544921875, 477.39813232421875, 506.2398986816406, 535.0816650390625, 563.9234008789062, 592.76513671875, 621.60693359375, 650.4486694335938, 679.2904052734375, 708.1321411132812, 736.973876953125, 765.815673828125, 794.6574096679688, 823.4991455078125, 852.3409423828125, 881.1826782226562, 910.0244140625, 938.8662109375, 967.7079467773438, 996.5497436523438, 1025.3914794921875, 1054.2332763671875, 1083.074951171875, 1111.916748046875, 1140.758544921875, 1169.6002197265625, 1198.4420166015625, 1227.28369140625, 1256.12548828125, 1284.96728515625, 1313.8089599609375, 1342.6507568359375, 1371.492431640625, 1400.334228515625]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 2.0, 4.0, 10.0, 3.0, 11.0, 9.0, 9.0, 15.0, 14.0, 10.0, 23.0, 21.0, 22.0, 25.0, 15.0, 35.0, 37.0, 27.0, 30.0, 30.0, 39.0, 44.0, 41.0, 39.0, 43.0, 45.0, 47.0, 41.0, 37.0, 26.0, 31.0, 33.0, 17.0, 21.0, 21.0, 19.0, 24.0, 17.0, 10.0, 7.0, 10.0, 5.0, 10.0, 4.0, 3.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-278.5648193359375, -269.580322265625, -260.5958251953125, -251.611328125, -242.62681579589844, -233.64231872558594, -224.65782165527344, -215.67332458496094, -206.68881225585938, -197.70431518554688, -188.71981811523438, -179.73532104492188, -170.7508087158203, -161.7663116455078, -152.7818145751953, -143.7973175048828, -134.8128204345703, -125.82832336425781, -116.84381866455078, -107.85932159423828, -98.87481689453125, -89.89031982421875, -80.90582275390625, -71.92132568359375, -62.93682098388672, -53.95232009887695, -44.96781921386719, -35.98332214355469, -26.998821258544922, -18.014320373535156, -9.029823303222656, -0.045322418212890625, 8.939178466796875, 17.92367935180664, 26.908178329467773, 35.892677307128906, 44.87717819213867, 53.86167907714844, 62.84617614746094, 71.83067321777344, 80.81517791748047, 89.79967498779297, 98.7841796875, 107.7686767578125, 116.753173828125, 125.73767852783203, 134.72216796875, 143.70668029785156, 152.69117736816406, 161.67567443847656, 170.66017150878906, 179.64468383789062, 188.62918090820312, 197.61367797851562, 206.59817504882812, 215.58267211914062, 224.56716918945312, 233.55166625976562, 242.53616333007812, 251.52066040039062, 260.5051574707031, 269.48968505859375, 278.47418212890625, 287.45867919921875, 296.44317626953125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 3.0, 4.0, 5.0, 10.0, 12.0, 16.0, 13.0, 23.0, 28.0, 41.0, 75.0, 98.0, 153.0, 235.0, 346.0, 561.0, 951.0, 1585.0, 2881.0, 5353.0, 10922.0, 27774.0, 124063.0, 3846040.0, 120945.0, 28392.0, 11319.0, 5446.0, 2889.0, 1616.0, 958.0, 551.0, 338.0, 204.0, 134.0, 94.0, 63.0, 39.0, 19.0, 17.0, 13.0, 14.0, 12.0, 6.0, 6.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-125.0, -121.267578125, -117.53515625, -113.802734375, -110.0703125, -106.337890625, -102.60546875, -98.873046875, -95.140625, -91.408203125, -87.67578125, -83.943359375, -80.2109375, -76.478515625, -72.74609375, -69.013671875, -65.28125, -61.548828125, -57.81640625, -54.083984375, -50.3515625, -46.619140625, -42.88671875, -39.154296875, -35.421875, -31.689453125, -27.95703125, -24.224609375, -20.4921875, -16.759765625, -13.02734375, -9.294921875, -5.5625, -1.830078125, 1.90234375, 5.634765625, 9.3671875, 13.099609375, 16.83203125, 20.564453125, 24.296875, 28.029296875, 31.76171875, 35.494140625, 39.2265625, 42.958984375, 46.69140625, 50.423828125, 54.15625, 57.888671875, 61.62109375, 65.353515625, 69.0859375, 72.818359375, 76.55078125, 80.283203125, 84.015625, 87.748046875, 91.48046875, 95.212890625, 98.9453125, 102.677734375, 106.41015625, 110.142578125, 113.875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 8.0, 4.0, 4.0, 7.0, 17.0, 8.0, 19.0, 21.0, 29.0, 27.0, 37.0, 49.0, 28.0, 41.0, 52.0, 35.0, 50.0, 57.0, 54.0, 58.0, 46.0, 55.0, 34.0, 37.0, 38.0, 26.0, 26.0, 29.0, 30.0, 18.0, 16.0, 8.0, 9.0, 9.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3984375, -13.8973388671875, -13.396240234375, -12.8951416015625, -12.39404296875, -11.8929443359375, -11.391845703125, -10.8907470703125, -10.3896484375, -9.8885498046875, -9.387451171875, -8.8863525390625, -8.38525390625, -7.8841552734375, -7.383056640625, -6.8819580078125, -6.380859375, -5.8797607421875, -5.378662109375, -4.8775634765625, -4.37646484375, -3.8753662109375, -3.374267578125, -2.8731689453125, -2.3720703125, -1.8709716796875, -1.369873046875, -0.8687744140625, -0.36767578125, 0.1334228515625, 0.634521484375, 1.1356201171875, 1.63671875, 2.1378173828125, 2.638916015625, 3.1400146484375, 3.64111328125, 4.1422119140625, 4.643310546875, 5.1444091796875, 5.6455078125, 6.1466064453125, 6.647705078125, 7.1488037109375, 7.64990234375, 8.1510009765625, 8.652099609375, 9.1531982421875, 9.654296875, 10.1553955078125, 10.656494140625, 11.1575927734375, 11.65869140625, 12.1597900390625, 12.660888671875, 13.1619873046875, 13.6630859375, 14.1641845703125, 14.665283203125, 15.1663818359375, 15.66748046875, 16.1685791015625, 16.669677734375, 17.1707763671875, 17.671875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 2.0, 1.0, 4.0, 7.0, 7.0, 5.0, 6.0, 19.0, 11.0, 13.0, 30.0, 42.0, 57.0, 50.0, 95.0, 144.0, 252.0, 469.0, 1164.0, 3313.0, 11148.0, 56985.0, 3969535.0, 126579.0, 16778.0, 4539.0, 1569.0, 615.0, 311.0, 173.0, 104.0, 68.0, 46.0, 30.0, 18.0, 18.0, 18.0, 16.0, 2.0, 11.0, 11.0, 9.0, 6.0, 1.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-309.0, -300.08203125, -291.1640625, -282.24609375, -273.328125, -264.41015625, -255.4921875, -246.57421875, -237.65625, -228.73828125, -219.8203125, -210.90234375, -201.984375, -193.06640625, -184.1484375, -175.23046875, -166.3125, -157.39453125, -148.4765625, -139.55859375, -130.640625, -121.72265625, -112.8046875, -103.88671875, -94.96875, -86.05078125, -77.1328125, -68.21484375, -59.296875, -50.37890625, -41.4609375, -32.54296875, -23.625, -14.70703125, -5.7890625, 3.12890625, 12.046875, 20.96484375, 29.8828125, 38.80078125, 47.71875, 56.63671875, 65.5546875, 74.47265625, 83.390625, 92.30859375, 101.2265625, 110.14453125, 119.0625, 127.98046875, 136.8984375, 145.81640625, 154.734375, 163.65234375, 172.5703125, 181.48828125, 190.40625, 199.32421875, 208.2421875, 217.16015625, 226.078125, 234.99609375, 243.9140625, 252.83203125, 261.75]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 6.0, 9.0, 14.0, 31.0, 66.0, 222.0, 3269.0, 296.0, 63.0, 35.0, 18.0, 21.0, 10.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-178.875, -174.669921875, -170.46484375, -166.259765625, -162.0546875, -157.849609375, -153.64453125, -149.439453125, -145.234375, -141.029296875, -136.82421875, -132.619140625, -128.4140625, -124.208984375, -120.00390625, -115.798828125, -111.59375, -107.388671875, -103.18359375, -98.978515625, -94.7734375, -90.568359375, -86.36328125, -82.158203125, -77.953125, -73.748046875, -69.54296875, -65.337890625, -61.1328125, -56.927734375, -52.72265625, -48.517578125, -44.3125, -40.107421875, -35.90234375, -31.697265625, -27.4921875, -23.287109375, -19.08203125, -14.876953125, -10.671875, -6.466796875, -2.26171875, 1.943359375, 6.1484375, 10.353515625, 14.55859375, 18.763671875, 22.96875, 27.173828125, 31.37890625, 35.583984375, 39.7890625, 43.994140625, 48.19921875, 52.404296875, 56.609375, 60.814453125, 65.01953125, 69.224609375, 73.4296875, 77.634765625, 81.83984375, 86.044921875, 90.25]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 15.0, 19.0, 32.0, 66.0, 149.0, 245.0, 243.0, 116.0, 72.0, 27.0, 12.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-434.6964111328125, -414.8282470703125, -394.9600830078125, -375.0919189453125, -355.2237548828125, -335.3555908203125, -315.4874267578125, -295.6192626953125, -275.7510986328125, -255.8829345703125, -236.0147705078125, -216.1466064453125, -196.2784423828125, -176.4102783203125, -156.5421142578125, -136.6739501953125, -116.8057861328125, -96.9376220703125, -77.0694580078125, -57.2012939453125, -37.3331298828125, -17.4649658203125, 2.4031982421875, 22.2713623046875, 42.1395263671875, 62.0076904296875, 81.8758544921875, 101.7440185546875, 121.6121826171875, 141.4803466796875, 161.3485107421875, 181.2166748046875, 201.08489990234375, 220.95306396484375, 240.82122802734375, 260.68939208984375, 280.55755615234375, 300.42572021484375, 320.29388427734375, 340.16204833984375, 360.03021240234375, 379.89837646484375, 399.76654052734375, 419.63470458984375, 439.50286865234375, 459.37103271484375, 479.23919677734375, 499.10736083984375, 518.9755249023438, 538.8436889648438, 558.7118530273438, 578.5800170898438, 598.4481811523438, 618.3163452148438, 638.1845092773438, 658.0526733398438, 677.9208374023438, 697.7890014648438, 717.6571655273438, 737.5253295898438, 757.3934936523438, 777.2616577148438, 797.1298217773438, 816.9979858398438, 836.8661499023438]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 6.0, 5.0, 7.0, 5.0, 10.0, 15.0, 19.0, 31.0, 23.0, 17.0, 25.0, 38.0, 33.0, 28.0, 34.0, 40.0, 40.0, 39.0, 36.0, 47.0, 48.0, 41.0, 49.0, 33.0, 45.0, 24.0, 31.0, 36.0, 27.0, 21.0, 13.0, 24.0, 16.0, 7.0, 13.0, 9.0, 16.0, 13.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-171.8367919921875, -166.40737915039062, -160.9779510498047, -155.5485382080078, -150.11912536621094, -144.689697265625, -139.26028442382812, -133.83087158203125, -128.40145874023438, -122.97203826904297, -117.5426254272461, -112.11320495605469, -106.68379211425781, -101.2543716430664, -95.824951171875, -90.39553833007812, -84.96611022949219, -79.53668975830078, -74.1072769165039, -68.6778564453125, -63.24843978881836, -57.81902313232422, -52.38960266113281, -46.96018600463867, -41.53076934814453, -36.10135269165039, -30.671934127807617, -25.242515563964844, -19.813098907470703, -14.383682250976562, -8.954261779785156, -3.5248451232910156, 1.904571533203125, 7.333989143371582, 12.763406753540039, 18.192825317382812, 23.622241973876953, 29.051658630371094, 34.4810791015625, 39.91049575805664, 45.33991241455078, 50.76932907104492, 56.19874572753906, 61.62816619873047, 67.05758666992188, 72.48699951171875, 77.91641998291016, 83.34584045410156, 88.77525329589844, 94.20467376708984, 99.63408660888672, 105.06350708007812, 110.492919921875, 115.9223403930664, 121.35176086425781, 126.78117370605469, 132.21060180664062, 137.6400146484375, 143.06944274902344, 148.4988555908203, 153.9282684326172, 159.35769653320312, 164.787109375, 170.21652221679688, 175.64593505859375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 3.0, 9.0, 8.0, 15.0, 18.0, 37.0, 46.0, 66.0, 98.0, 127.0, 210.0, 275.0, 465.0, 730.0, 1109.0, 1716.0, 2797.0, 4905.0, 8768.0, 16878.0, 34589.0, 77865.0, 204060.0, 402828.0, 162832.0, 64729.0, 29602.0, 14679.0, 7768.0, 4411.0, 2613.0, 1569.0, 976.0, 560.0, 409.0, 254.0, 159.0, 126.0, 74.0, 52.0, 35.0, 24.0, 16.0, 15.0, 9.0, 5.0, 9.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.34375, -52.35986328125, -50.3759765625, -48.39208984375, -46.408203125, -44.42431640625, -42.4404296875, -40.45654296875, -38.47265625, -36.48876953125, -34.5048828125, -32.52099609375, -30.537109375, -28.55322265625, -26.5693359375, -24.58544921875, -22.6015625, -20.61767578125, -18.6337890625, -16.64990234375, -14.666015625, -12.68212890625, -10.6982421875, -8.71435546875, -6.73046875, -4.74658203125, -2.7626953125, -0.77880859375, 1.205078125, 3.18896484375, 5.1728515625, 7.15673828125, 9.140625, 11.12451171875, 13.1083984375, 15.09228515625, 17.076171875, 19.06005859375, 21.0439453125, 23.02783203125, 25.01171875, 26.99560546875, 28.9794921875, 30.96337890625, 32.947265625, 34.93115234375, 36.9150390625, 38.89892578125, 40.8828125, 42.86669921875, 44.8505859375, 46.83447265625, 48.818359375, 50.80224609375, 52.7861328125, 54.77001953125, 56.75390625, 58.73779296875, 60.7216796875, 62.70556640625, 64.689453125, 66.67333984375, 68.6572265625, 70.64111328125, 72.625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 3.0, 5.0, 5.0, 11.0, 7.0, 9.0, 20.0, 20.0, 23.0, 20.0, 25.0, 22.0, 38.0, 29.0, 27.0, 43.0, 46.0, 49.0, 44.0, 44.0, 36.0, 40.0, 46.0, 41.0, 29.0, 27.0, 27.0, 38.0, 24.0, 26.0, 29.0, 20.0, 20.0, 20.0, 18.0, 15.0, 9.0, 10.0, 6.0, 7.0, 2.0, 3.0, 0.0, 5.0, 1.0, 2.0, 3.0], "bins": [-19.515625, -18.988037109375, -18.46044921875, -17.932861328125, -17.4052734375, -16.877685546875, -16.35009765625, -15.822509765625, -15.294921875, -14.767333984375, -14.23974609375, -13.712158203125, -13.1845703125, -12.656982421875, -12.12939453125, -11.601806640625, -11.07421875, -10.546630859375, -10.01904296875, -9.491455078125, -8.9638671875, -8.436279296875, -7.90869140625, -7.381103515625, -6.853515625, -6.325927734375, -5.79833984375, -5.270751953125, -4.7431640625, -4.215576171875, -3.68798828125, -3.160400390625, -2.6328125, -2.105224609375, -1.57763671875, -1.050048828125, -0.5224609375, 0.005126953125, 0.53271484375, 1.060302734375, 1.587890625, 2.115478515625, 2.64306640625, 3.170654296875, 3.6982421875, 4.225830078125, 4.75341796875, 5.281005859375, 5.80859375, 6.336181640625, 6.86376953125, 7.391357421875, 7.9189453125, 8.446533203125, 8.97412109375, 9.501708984375, 10.029296875, 10.556884765625, 11.08447265625, 11.612060546875, 12.1396484375, 12.667236328125, 13.19482421875, 13.722412109375, 14.25]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 4.0, 6.0, 2.0, 13.0, 9.0, 11.0, 8.0, 18.0, 26.0, 33.0, 43.0, 57.0, 86.0, 116.0, 194.0, 294.0, 421.0, 805.0, 1466.0, 2733.0, 5793.0, 14011.0, 40264.0, 163782.0, 613386.0, 143840.0, 36502.0, 13107.0, 5488.0, 2628.0, 1303.0, 781.0, 456.0, 259.0, 187.0, 114.0, 92.0, 49.0, 43.0, 22.0, 22.0, 24.0, 17.0, 12.0, 11.0, 8.0, 4.0, 3.0, 1.0, 0.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-83.9375, -80.880859375, -77.82421875, -74.767578125, -71.7109375, -68.654296875, -65.59765625, -62.541015625, -59.484375, -56.427734375, -53.37109375, -50.314453125, -47.2578125, -44.201171875, -41.14453125, -38.087890625, -35.03125, -31.974609375, -28.91796875, -25.861328125, -22.8046875, -19.748046875, -16.69140625, -13.634765625, -10.578125, -7.521484375, -4.46484375, -1.408203125, 1.6484375, 4.705078125, 7.76171875, 10.818359375, 13.875, 16.931640625, 19.98828125, 23.044921875, 26.1015625, 29.158203125, 32.21484375, 35.271484375, 38.328125, 41.384765625, 44.44140625, 47.498046875, 50.5546875, 53.611328125, 56.66796875, 59.724609375, 62.78125, 65.837890625, 68.89453125, 71.951171875, 75.0078125, 78.064453125, 81.12109375, 84.177734375, 87.234375, 90.291015625, 93.34765625, 96.404296875, 99.4609375, 102.517578125, 105.57421875, 108.630859375, 111.6875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 4.0, 4.0, 2.0, 7.0, 7.0, 2.0, 5.0, 11.0, 9.0, 12.0, 19.0, 13.0, 20.0, 15.0, 20.0, 28.0, 28.0, 38.0, 36.0, 33.0, 33.0, 32.0, 39.0, 43.0, 59.0, 55.0, 44.0, 56.0, 41.0, 38.0, 34.0, 37.0, 38.0, 26.0, 12.0, 14.0, 16.0, 15.0, 16.0, 6.0, 9.0, 9.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-73.3125, -70.6162109375, -67.919921875, -65.2236328125, -62.52734375, -59.8310546875, -57.134765625, -54.4384765625, -51.7421875, -49.0458984375, -46.349609375, -43.6533203125, -40.95703125, -38.2607421875, -35.564453125, -32.8681640625, -30.171875, -27.4755859375, -24.779296875, -22.0830078125, -19.38671875, -16.6904296875, -13.994140625, -11.2978515625, -8.6015625, -5.9052734375, -3.208984375, -0.5126953125, 2.18359375, 4.8798828125, 7.576171875, 10.2724609375, 12.96875, 15.6650390625, 18.361328125, 21.0576171875, 23.75390625, 26.4501953125, 29.146484375, 31.8427734375, 34.5390625, 37.2353515625, 39.931640625, 42.6279296875, 45.32421875, 48.0205078125, 50.716796875, 53.4130859375, 56.109375, 58.8056640625, 61.501953125, 64.1982421875, 66.89453125, 69.5908203125, 72.287109375, 74.9833984375, 77.6796875, 80.3759765625, 83.072265625, 85.7685546875, 88.46484375, 91.1611328125, 93.857421875, 96.5537109375, 99.25]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 11.0, 7.0, 25.0, 19.0, 24.0, 45.0, 69.0, 118.0, 201.0, 313.0, 609.0, 1175.0, 2437.0, 5216.0, 14411.0, 51789.0, 415748.0, 474016.0, 56296.0, 15223.0, 5737.0, 2416.0, 1180.0, 588.0, 336.0, 228.0, 110.0, 56.0, 39.0, 30.0, 28.0, 17.0, 13.0, 6.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.0625, -46.2841796875, -44.505859375, -42.7275390625, -40.94921875, -39.1708984375, -37.392578125, -35.6142578125, -33.8359375, -32.0576171875, -30.279296875, -28.5009765625, -26.72265625, -24.9443359375, -23.166015625, -21.3876953125, -19.609375, -17.8310546875, -16.052734375, -14.2744140625, -12.49609375, -10.7177734375, -8.939453125, -7.1611328125, -5.3828125, -3.6044921875, -1.826171875, -0.0478515625, 1.73046875, 3.5087890625, 5.287109375, 7.0654296875, 8.84375, 10.6220703125, 12.400390625, 14.1787109375, 15.95703125, 17.7353515625, 19.513671875, 21.2919921875, 23.0703125, 24.8486328125, 26.626953125, 28.4052734375, 30.18359375, 31.9619140625, 33.740234375, 35.5185546875, 37.296875, 39.0751953125, 40.853515625, 42.6318359375, 44.41015625, 46.1884765625, 47.966796875, 49.7451171875, 51.5234375, 53.3017578125, 55.080078125, 56.8583984375, 58.63671875, 60.4150390625, 62.193359375, 63.9716796875, 65.75]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 7.0, 7.0, 9.0, 10.0, 9.0, 20.0, 20.0, 36.0, 48.0, 86.0, 141.0, 201.0, 141.0, 77.0, 55.0, 29.0, 27.0, 21.0, 9.0, 10.0, 13.0, 7.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0164337158203125, -0.01594412326812744, -0.015454530715942383, -0.014964938163757324, -0.014475345611572266, -0.013985753059387207, -0.013496160507202148, -0.01300656795501709, -0.012516975402832031, -0.012027382850646973, -0.011537790298461914, -0.011048197746276855, -0.010558605194091797, -0.010069012641906738, -0.00957942008972168, -0.009089827537536621, -0.008600234985351562, -0.008110642433166504, -0.007621049880981445, -0.007131457328796387, -0.006641864776611328, -0.0061522722244262695, -0.005662679672241211, -0.005173087120056152, -0.004683494567871094, -0.004193902015686035, -0.0037043094635009766, -0.003214716911315918, -0.0027251243591308594, -0.0022355318069458008, -0.0017459392547607422, -0.0012563467025756836, -0.000766754150390625, -0.0002771615982055664, 0.0002124309539794922, 0.0007020235061645508, 0.0011916160583496094, 0.001681208610534668, 0.0021708011627197266, 0.002660393714904785, 0.0031499862670898438, 0.0036395788192749023, 0.004129171371459961, 0.0046187639236450195, 0.005108356475830078, 0.005597949028015137, 0.006087541580200195, 0.006577134132385254, 0.0070667266845703125, 0.007556319236755371, 0.00804591178894043, 0.008535504341125488, 0.009025096893310547, 0.009514689445495605, 0.010004281997680664, 0.010493874549865723, 0.010983467102050781, 0.01147305965423584, 0.011962652206420898, 0.012452244758605957, 0.012941837310791016, 0.013431429862976074, 0.013921022415161133, 0.014410614967346191, 0.01490020751953125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 1.0, 5.0, 8.0, 11.0, 20.0, 25.0, 33.0, 47.0, 74.0, 101.0, 196.0, 315.0, 607.0, 1253.0, 2730.0, 7874.0, 28155.0, 176411.0, 680226.0, 117810.0, 21686.0, 6143.0, 2440.0, 1091.0, 542.0, 263.0, 176.0, 100.0, 67.0, 32.0, 32.0, 23.0, 8.0, 15.0, 7.0, 2.0, 10.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-53.3125, -51.3671875, -49.421875, -47.4765625, -45.53125, -43.5859375, -41.640625, -39.6953125, -37.75, -35.8046875, -33.859375, -31.9140625, -29.96875, -28.0234375, -26.078125, -24.1328125, -22.1875, -20.2421875, -18.296875, -16.3515625, -14.40625, -12.4609375, -10.515625, -8.5703125, -6.625, -4.6796875, -2.734375, -0.7890625, 1.15625, 3.1015625, 5.046875, 6.9921875, 8.9375, 10.8828125, 12.828125, 14.7734375, 16.71875, 18.6640625, 20.609375, 22.5546875, 24.5, 26.4453125, 28.390625, 30.3359375, 32.28125, 34.2265625, 36.171875, 38.1171875, 40.0625, 42.0078125, 43.953125, 45.8984375, 47.84375, 49.7890625, 51.734375, 53.6796875, 55.625, 57.5703125, 59.515625, 61.4609375, 63.40625, 65.3515625, 67.296875, 69.2421875, 71.1875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 14.0, 8.0, 12.0, 11.0, 12.0, 29.0, 33.0, 46.0, 52.0, 76.0, 127.0, 130.0, 133.0, 93.0, 59.0, 34.0, 36.0, 22.0, 20.0, 12.0, 7.0, 5.0, 9.0, 5.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.375, -39.61328125, -37.8515625, -36.08984375, -34.328125, -32.56640625, -30.8046875, -29.04296875, -27.28125, -25.51953125, -23.7578125, -21.99609375, -20.234375, -18.47265625, -16.7109375, -14.94921875, -13.1875, -11.42578125, -9.6640625, -7.90234375, -6.140625, -4.37890625, -2.6171875, -0.85546875, 0.90625, 2.66796875, 4.4296875, 6.19140625, 7.953125, 9.71484375, 11.4765625, 13.23828125, 15.0, 16.76171875, 18.5234375, 20.28515625, 22.046875, 23.80859375, 25.5703125, 27.33203125, 29.09375, 30.85546875, 32.6171875, 34.37890625, 36.140625, 37.90234375, 39.6640625, 41.42578125, 43.1875, 44.94921875, 46.7109375, 48.47265625, 50.234375, 51.99609375, 53.7578125, 55.51953125, 57.28125, 59.04296875, 60.8046875, 62.56640625, 64.328125, 66.08984375, 67.8515625, 69.61328125, 71.375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 10.0, 23.0, 49.0, 78.0, 149.0, 193.0, 220.0, 136.0, 74.0, 35.0, 24.0, 8.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1474.6683349609375, -1435.7587890625, -1396.84912109375, -1357.9395751953125, -1319.030029296875, -1280.120361328125, -1241.2108154296875, -1202.30126953125, -1163.3916015625, -1124.4820556640625, -1085.5723876953125, -1046.662841796875, -1007.7532348632812, -968.8436279296875, -929.93408203125, -891.0244750976562, -852.1148681640625, -813.2052612304688, -774.295654296875, -735.3861083984375, -696.4765014648438, -657.56689453125, -618.6573486328125, -579.7477416992188, -540.838134765625, -501.92852783203125, -463.0189514160156, -424.109375, -385.19976806640625, -346.2901611328125, -307.3805847167969, -268.47100830078125, -229.56134033203125, -190.65174865722656, -151.74215698242188, -112.83256530761719, -73.9229736328125, -35.01338195800781, 3.896209716796875, 42.8057861328125, 81.71539306640625, 120.62498474121094, 159.53457641601562, 198.4441680908203, 237.353759765625, 276.26336669921875, 315.1729431152344, 354.08251953125, 392.99212646484375, 431.9017333984375, 470.8113098144531, 509.72088623046875, 548.6304931640625, 587.5401000976562, 626.44970703125, 665.3592529296875, 704.2688598632812, 743.178466796875, 782.0880126953125, 820.9976196289062, 859.9072265625, 898.8168334960938, 937.7264404296875, 976.635986328125, 1015.5455932617188]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 0.0, 1.0, 3.0, 6.0, 3.0, 5.0, 9.0, 10.0, 9.0, 6.0, 9.0, 6.0, 15.0, 18.0, 21.0, 32.0, 26.0, 19.0, 25.0, 29.0, 32.0, 40.0, 44.0, 39.0, 35.0, 39.0, 34.0, 31.0, 39.0, 33.0, 43.0, 35.0, 24.0, 39.0, 35.0, 34.0, 19.0, 19.0, 23.0, 16.0, 15.0, 9.0, 11.0, 13.0, 6.0, 5.0, 11.0, 8.0, 10.0, 2.0, 1.0, 5.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-383.0623474121094, -371.3676452636719, -359.6729431152344, -347.9782409667969, -336.28350830078125, -324.58880615234375, -312.89410400390625, -301.19940185546875, -289.50469970703125, -277.80999755859375, -266.11529541015625, -254.4205780029297, -242.7258758544922, -231.0311737060547, -219.33645629882812, -207.64175415039062, -195.94705200195312, -184.25234985351562, -172.55764770507812, -160.86293029785156, -149.16822814941406, -137.47352600097656, -125.77881622314453, -114.0841064453125, -102.389404296875, -90.6947021484375, -78.99999237060547, -67.30528259277344, -55.61058044433594, -43.91587448120117, -32.221168518066406, -20.526458740234375, -8.831787109375, 2.8629188537597656, 14.557624816894531, 26.252330780029297, 37.94703674316406, 49.64174270629883, 61.336448669433594, 73.03115844726562, 84.72586059570312, 96.42056274414062, 108.11527252197266, 119.80998229980469, 131.5046844482422, 143.1993865966797, 154.89410400390625, 166.58880615234375, 178.28350830078125, 189.97821044921875, 201.67291259765625, 213.3676300048828, 225.0623321533203, 236.7570343017578, 248.45175170898438, 260.1464538574219, 271.8411560058594, 283.5358581542969, 295.2305603027344, 306.9252624511719, 318.6199951171875, 330.314697265625, 342.0093994140625, 353.7041015625, 365.3988037109375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 7.0, 5.0, 11.0, 10.0, 16.0, 12.0, 22.0, 32.0, 37.0, 72.0, 91.0, 98.0, 174.0, 218.0, 345.0, 484.0, 718.0, 1109.0, 1585.0, 2468.0, 4165.0, 7472.0, 15608.0, 37174.0, 127705.0, 3694992.0, 209546.0, 48352.0, 18838.0, 9207.0, 5053.0, 2972.0, 1926.0, 1229.0, 808.0, 543.0, 382.0, 260.0, 180.0, 123.0, 70.0, 56.0, 37.0, 26.0, 22.0, 10.0, 7.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-96.0625, -93.3662109375, -90.669921875, -87.9736328125, -85.27734375, -82.5810546875, -79.884765625, -77.1884765625, -74.4921875, -71.7958984375, -69.099609375, -66.4033203125, -63.70703125, -61.0107421875, -58.314453125, -55.6181640625, -52.921875, -50.2255859375, -47.529296875, -44.8330078125, -42.13671875, -39.4404296875, -36.744140625, -34.0478515625, -31.3515625, -28.6552734375, -25.958984375, -23.2626953125, -20.56640625, -17.8701171875, -15.173828125, -12.4775390625, -9.78125, -7.0849609375, -4.388671875, -1.6923828125, 1.00390625, 3.7001953125, 6.396484375, 9.0927734375, 11.7890625, 14.4853515625, 17.181640625, 19.8779296875, 22.57421875, 25.2705078125, 27.966796875, 30.6630859375, 33.359375, 36.0556640625, 38.751953125, 41.4482421875, 44.14453125, 46.8408203125, 49.537109375, 52.2333984375, 54.9296875, 57.6259765625, 60.322265625, 63.0185546875, 65.71484375, 68.4111328125, 71.107421875, 73.8037109375, 76.5]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 4.0, 4.0, 8.0, 7.0, 6.0, 11.0, 16.0, 17.0, 22.0, 26.0, 19.0, 27.0, 28.0, 34.0, 36.0, 41.0, 42.0, 52.0, 49.0, 46.0, 37.0, 59.0, 37.0, 46.0, 38.0, 37.0, 33.0, 33.0, 33.0, 26.0, 20.0, 18.0, 16.0, 16.0, 17.0, 11.0, 10.0, 5.0, 3.0, 7.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.171875, -19.6126708984375, -19.053466796875, -18.4942626953125, -17.93505859375, -17.3758544921875, -16.816650390625, -16.2574462890625, -15.6982421875, -15.1390380859375, -14.579833984375, -14.0206298828125, -13.46142578125, -12.9022216796875, -12.343017578125, -11.7838134765625, -11.224609375, -10.6654052734375, -10.106201171875, -9.5469970703125, -8.98779296875, -8.4285888671875, -7.869384765625, -7.3101806640625, -6.7509765625, -6.1917724609375, -5.632568359375, -5.0733642578125, -4.51416015625, -3.9549560546875, -3.395751953125, -2.8365478515625, -2.27734375, -1.7181396484375, -1.158935546875, -0.5997314453125, -0.04052734375, 0.5186767578125, 1.077880859375, 1.6370849609375, 2.1962890625, 2.7554931640625, 3.314697265625, 3.8739013671875, 4.43310546875, 4.9923095703125, 5.551513671875, 6.1107177734375, 6.669921875, 7.2291259765625, 7.788330078125, 8.3475341796875, 8.90673828125, 9.4659423828125, 10.025146484375, 10.5843505859375, 11.1435546875, 11.7027587890625, 12.261962890625, 12.8211669921875, 13.38037109375, 13.9395751953125, 14.498779296875, 15.0579833984375, 15.6171875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 8.0, 13.0, 13.0, 14.0, 26.0, 30.0, 30.0, 50.0, 55.0, 100.0, 157.0, 218.0, 441.0, 840.0, 1720.0, 3879.0, 10436.0, 35914.0, 285796.0, 3744019.0, 80746.0, 18296.0, 6266.0, 2525.0, 1163.0, 557.0, 310.0, 183.0, 134.0, 75.0, 57.0, 46.0, 33.0, 16.0, 22.0, 24.0, 11.0, 7.0, 11.0, 5.0, 4.0, 8.0, 3.0, 5.0, 2.0, 2.0], "bins": [-253.0, -246.20703125, -239.4140625, -232.62109375, -225.828125, -219.03515625, -212.2421875, -205.44921875, -198.65625, -191.86328125, -185.0703125, -178.27734375, -171.484375, -164.69140625, -157.8984375, -151.10546875, -144.3125, -137.51953125, -130.7265625, -123.93359375, -117.140625, -110.34765625, -103.5546875, -96.76171875, -89.96875, -83.17578125, -76.3828125, -69.58984375, -62.796875, -56.00390625, -49.2109375, -42.41796875, -35.625, -28.83203125, -22.0390625, -15.24609375, -8.453125, -1.66015625, 5.1328125, 11.92578125, 18.71875, 25.51171875, 32.3046875, 39.09765625, 45.890625, 52.68359375, 59.4765625, 66.26953125, 73.0625, 79.85546875, 86.6484375, 93.44140625, 100.234375, 107.02734375, 113.8203125, 120.61328125, 127.40625, 134.19921875, 140.9921875, 147.78515625, 154.578125, 161.37109375, 168.1640625, 174.95703125, 181.75]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 11.0, 9.0, 9.0, 21.0, 28.0, 28.0, 56.0, 131.0, 518.0, 2784.0, 233.0, 104.0, 46.0, 32.0, 20.0, 17.0, 7.0, 7.0, 6.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-166.25, -162.576171875, -158.90234375, -155.228515625, -151.5546875, -147.880859375, -144.20703125, -140.533203125, -136.859375, -133.185546875, -129.51171875, -125.837890625, -122.1640625, -118.490234375, -114.81640625, -111.142578125, -107.46875, -103.794921875, -100.12109375, -96.447265625, -92.7734375, -89.099609375, -85.42578125, -81.751953125, -78.078125, -74.404296875, -70.73046875, -67.056640625, -63.3828125, -59.708984375, -56.03515625, -52.361328125, -48.6875, -45.013671875, -41.33984375, -37.666015625, -33.9921875, -30.318359375, -26.64453125, -22.970703125, -19.296875, -15.623046875, -11.94921875, -8.275390625, -4.6015625, -0.927734375, 2.74609375, 6.419921875, 10.09375, 13.767578125, 17.44140625, 21.115234375, 24.7890625, 28.462890625, 32.13671875, 35.810546875, 39.484375, 43.158203125, 46.83203125, 50.505859375, 54.1796875, 57.853515625, 61.52734375, 65.201171875, 68.875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 8.0, 16.0, 41.0, 82.0, 202.0, 246.0, 243.0, 99.0, 41.0, 12.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-880.707275390625, -847.4222412109375, -814.13720703125, -780.8521118164062, -747.5670776367188, -714.2820434570312, -680.9969482421875, -647.7119140625, -614.4268798828125, -581.141845703125, -547.8568115234375, -514.5717163085938, -481.28668212890625, -448.00164794921875, -414.7165832519531, -381.4315185546875, -348.146484375, -314.8614501953125, -281.5763854980469, -248.2913360595703, -215.00628662109375, -181.7212371826172, -148.43618774414062, -115.15113830566406, -81.8660888671875, -48.58103942871094, -15.295989990234375, 17.989059448242188, 51.27410888671875, 84.55915832519531, 117.84420776367188, 151.12925720214844, 184.414306640625, 217.69935607910156, 250.98440551757812, 284.26947021484375, 317.55450439453125, 350.83953857421875, 384.1246032714844, 417.40966796875, 450.6947021484375, 483.979736328125, 517.2647705078125, 550.5498657226562, 583.8348999023438, 617.1199340820312, 650.405029296875, 683.6900634765625, 716.97509765625, 750.2601318359375, 783.545166015625, 816.8302612304688, 850.1152954101562, 883.4003295898438, 916.6854248046875, 949.970458984375, 983.2554931640625, 1016.54052734375, 1049.8255615234375, 1083.110595703125, 1116.395751953125, 1149.6807861328125, 1182.9658203125, 1216.2508544921875, 1249.535888671875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 8.0, 6.0, 12.0, 5.0, 12.0, 16.0, 15.0, 21.0, 15.0, 19.0, 29.0, 24.0, 22.0, 38.0, 42.0, 43.0, 39.0, 37.0, 44.0, 43.0, 41.0, 40.0, 49.0, 40.0, 50.0, 42.0, 35.0, 37.0, 20.0, 30.0, 25.0, 18.0, 14.0, 18.0, 8.0, 13.0, 6.0, 5.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-230.9420623779297, -223.25466918945312, -215.56727600097656, -207.8798828125, -200.19248962402344, -192.50509643554688, -184.81771850585938, -177.13031005859375, -169.44293212890625, -161.7555389404297, -154.06814575195312, -146.38075256347656, -138.693359375, -131.00596618652344, -123.3185806274414, -115.63118743896484, -107.94378662109375, -100.25639343261719, -92.56900024414062, -84.88160705566406, -77.1942138671875, -69.50682067871094, -61.819435119628906, -54.132041931152344, -46.44464874267578, -38.75725555419922, -31.06986427307129, -23.38247299194336, -15.695079803466797, -8.007686614990234, -0.3202972412109375, 7.367095947265625, 15.05450439453125, 22.741897583007812, 30.429288864135742, 38.11668014526367, 45.804073333740234, 53.4914665222168, 61.178855895996094, 68.86624908447266, 76.55364227294922, 84.24103546142578, 91.92842864990234, 99.61581420898438, 107.30320739746094, 114.9906005859375, 122.67799377441406, 130.36538696289062, 138.0527801513672, 145.74017333984375, 153.4275665283203, 161.11495971679688, 168.80235290527344, 176.48974609375, 184.1771240234375, 191.86453247070312, 199.55191040039062, 207.2393035888672, 214.92669677734375, 222.6140899658203, 230.30148315429688, 237.98887634277344, 245.67626953125, 253.3636474609375, 261.0510559082031]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 5.0, 1.0, 5.0, 11.0, 15.0, 21.0, 17.0, 31.0, 51.0, 62.0, 105.0, 127.0, 185.0, 280.0, 430.0, 670.0, 1106.0, 2085.0, 4254.0, 9491.0, 24525.0, 78861.0, 345640.0, 431039.0, 98292.0, 29675.0, 10991.0, 4834.0, 2421.0, 1212.0, 700.0, 429.0, 301.0, 224.0, 115.0, 81.0, 73.0, 52.0, 32.0, 28.0, 22.0, 24.0, 12.0, 7.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0], "bins": [-115.4375, -112.23828125, -109.0390625, -105.83984375, -102.640625, -99.44140625, -96.2421875, -93.04296875, -89.84375, -86.64453125, -83.4453125, -80.24609375, -77.046875, -73.84765625, -70.6484375, -67.44921875, -64.25, -61.05078125, -57.8515625, -54.65234375, -51.453125, -48.25390625, -45.0546875, -41.85546875, -38.65625, -35.45703125, -32.2578125, -29.05859375, -25.859375, -22.66015625, -19.4609375, -16.26171875, -13.0625, -9.86328125, -6.6640625, -3.46484375, -0.265625, 2.93359375, 6.1328125, 9.33203125, 12.53125, 15.73046875, 18.9296875, 22.12890625, 25.328125, 28.52734375, 31.7265625, 34.92578125, 38.125, 41.32421875, 44.5234375, 47.72265625, 50.921875, 54.12109375, 57.3203125, 60.51953125, 63.71875, 66.91796875, 70.1171875, 73.31640625, 76.515625, 79.71484375, 82.9140625, 86.11328125, 89.3125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 11.0, 6.0, 8.0, 15.0, 13.0, 9.0, 14.0, 22.0, 28.0, 24.0, 33.0, 38.0, 46.0, 40.0, 50.0, 49.0, 50.0, 38.0, 57.0, 54.0, 46.0, 39.0, 40.0, 50.0, 32.0, 25.0, 31.0, 28.0, 22.0, 9.0, 20.0, 14.0, 8.0, 7.0, 5.0, 9.0, 3.0, 4.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.140625, -24.349853515625, -23.55908203125, -22.768310546875, -21.9775390625, -21.186767578125, -20.39599609375, -19.605224609375, -18.814453125, -18.023681640625, -17.23291015625, -16.442138671875, -15.6513671875, -14.860595703125, -14.06982421875, -13.279052734375, -12.48828125, -11.697509765625, -10.90673828125, -10.115966796875, -9.3251953125, -8.534423828125, -7.74365234375, -6.952880859375, -6.162109375, -5.371337890625, -4.58056640625, -3.789794921875, -2.9990234375, -2.208251953125, -1.41748046875, -0.626708984375, 0.1640625, 0.954833984375, 1.74560546875, 2.536376953125, 3.3271484375, 4.117919921875, 4.90869140625, 5.699462890625, 6.490234375, 7.281005859375, 8.07177734375, 8.862548828125, 9.6533203125, 10.444091796875, 11.23486328125, 12.025634765625, 12.81640625, 13.607177734375, 14.39794921875, 15.188720703125, 15.9794921875, 16.770263671875, 17.56103515625, 18.351806640625, 19.142578125, 19.933349609375, 20.72412109375, 21.514892578125, 22.3056640625, 23.096435546875, 23.88720703125, 24.677978515625, 25.46875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 7.0, 5.0, 3.0, 12.0, 27.0, 32.0, 45.0, 86.0, 124.0, 199.0, 329.0, 594.0, 1040.0, 1925.0, 4242.0, 12956.0, 72892.0, 746505.0, 174035.0, 21908.0, 6038.0, 2467.0, 1304.0, 706.0, 418.0, 247.0, 170.0, 88.0, 60.0, 30.0, 23.0, 12.0, 9.0, 11.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.125, -172.87890625, -166.6328125, -160.38671875, -154.140625, -147.89453125, -141.6484375, -135.40234375, -129.15625, -122.91015625, -116.6640625, -110.41796875, -104.171875, -97.92578125, -91.6796875, -85.43359375, -79.1875, -72.94140625, -66.6953125, -60.44921875, -54.203125, -47.95703125, -41.7109375, -35.46484375, -29.21875, -22.97265625, -16.7265625, -10.48046875, -4.234375, 2.01171875, 8.2578125, 14.50390625, 20.75, 26.99609375, 33.2421875, 39.48828125, 45.734375, 51.98046875, 58.2265625, 64.47265625, 70.71875, 76.96484375, 83.2109375, 89.45703125, 95.703125, 101.94921875, 108.1953125, 114.44140625, 120.6875, 126.93359375, 133.1796875, 139.42578125, 145.671875, 151.91796875, 158.1640625, 164.41015625, 170.65625, 176.90234375, 183.1484375, 189.39453125, 195.640625, 201.88671875, 208.1328125, 214.37890625, 220.625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 5.0, 6.0, 12.0, 12.0, 14.0, 15.0, 15.0, 25.0, 17.0, 33.0, 43.0, 59.0, 46.0, 59.0, 55.0, 56.0, 41.0, 48.0, 49.0, 47.0, 61.0, 45.0, 28.0, 28.0, 27.0, 23.0, 26.0, 21.0, 19.0, 8.0, 14.0, 10.0, 8.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-124.9375, -120.4228515625, -115.908203125, -111.3935546875, -106.87890625, -102.3642578125, -97.849609375, -93.3349609375, -88.8203125, -84.3056640625, -79.791015625, -75.2763671875, -70.76171875, -66.2470703125, -61.732421875, -57.2177734375, -52.703125, -48.1884765625, -43.673828125, -39.1591796875, -34.64453125, -30.1298828125, -25.615234375, -21.1005859375, -16.5859375, -12.0712890625, -7.556640625, -3.0419921875, 1.47265625, 5.9873046875, 10.501953125, 15.0166015625, 19.53125, 24.0458984375, 28.560546875, 33.0751953125, 37.58984375, 42.1044921875, 46.619140625, 51.1337890625, 55.6484375, 60.1630859375, 64.677734375, 69.1923828125, 73.70703125, 78.2216796875, 82.736328125, 87.2509765625, 91.765625, 96.2802734375, 100.794921875, 105.3095703125, 109.82421875, 114.3388671875, 118.853515625, 123.3681640625, 127.8828125, 132.3974609375, 136.912109375, 141.4267578125, 145.94140625, 150.4560546875, 154.970703125, 159.4853515625, 164.0]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 8.0, 0.0, 11.0, 10.0, 9.0, 19.0, 15.0, 28.0, 24.0, 47.0, 56.0, 73.0, 108.0, 162.0, 245.0, 274.0, 400.0, 515.0, 751.0, 1032.0, 1562.0, 2398.0, 4408.0, 15316.0, 661375.0, 335975.0, 12283.0, 4126.0, 2248.0, 1456.0, 1012.0, 672.0, 535.0, 373.0, 274.0, 184.0, 159.0, 98.0, 95.0, 53.0, 51.0, 33.0, 24.0, 13.0, 16.0, 10.0, 9.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-213.0, -206.115234375, -199.23046875, -192.345703125, -185.4609375, -178.576171875, -171.69140625, -164.806640625, -157.921875, -151.037109375, -144.15234375, -137.267578125, -130.3828125, -123.498046875, -116.61328125, -109.728515625, -102.84375, -95.958984375, -89.07421875, -82.189453125, -75.3046875, -68.419921875, -61.53515625, -54.650390625, -47.765625, -40.880859375, -33.99609375, -27.111328125, -20.2265625, -13.341796875, -6.45703125, 0.427734375, 7.3125, 14.197265625, 21.08203125, 27.966796875, 34.8515625, 41.736328125, 48.62109375, 55.505859375, 62.390625, 69.275390625, 76.16015625, 83.044921875, 89.9296875, 96.814453125, 103.69921875, 110.583984375, 117.46875, 124.353515625, 131.23828125, 138.123046875, 145.0078125, 151.892578125, 158.77734375, 165.662109375, 172.546875, 179.431640625, 186.31640625, 193.201171875, 200.0859375, 206.970703125, 213.85546875, 220.740234375, 227.625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 12.0, 26.0, 113.0, 594.0, 165.0, 43.0, 20.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.097412109375, -0.09401321411132812, -0.09061431884765625, -0.08721542358398438, -0.0838165283203125, -0.08041763305664062, -0.07701873779296875, -0.07361984252929688, -0.070220947265625, -0.06682205200195312, -0.06342315673828125, -0.060024261474609375, -0.0566253662109375, -0.053226470947265625, -0.04982757568359375, -0.046428680419921875, -0.04302978515625, -0.039630889892578125, -0.03623199462890625, -0.032833099365234375, -0.0294342041015625, -0.026035308837890625, -0.02263641357421875, -0.019237518310546875, -0.015838623046875, -0.012439727783203125, -0.00904083251953125, -0.005641937255859375, -0.0022430419921875, 0.001155853271484375, 0.00455474853515625, 0.007953643798828125, 0.0113525390625, 0.014751434326171875, 0.01815032958984375, 0.021549224853515625, 0.0249481201171875, 0.028347015380859375, 0.03174591064453125, 0.035144805908203125, 0.038543701171875, 0.041942596435546875, 0.04534149169921875, 0.048740386962890625, 0.0521392822265625, 0.055538177490234375, 0.05893707275390625, 0.062335968017578125, 0.06573486328125, 0.06913375854492188, 0.07253265380859375, 0.07593154907226562, 0.0793304443359375, 0.08272933959960938, 0.08612823486328125, 0.08952713012695312, 0.092926025390625, 0.09632492065429688, 0.09972381591796875, 0.10312271118164062, 0.1065216064453125, 0.10992050170898438, 0.11331939697265625, 0.11671829223632812, 0.1201171875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 0.0, 0.0, 9.0, 11.0, 10.0, 17.0, 28.0, 49.0, 52.0, 96.0, 148.0, 264.0, 464.0, 916.0, 2024.0, 5040.0, 24008.0, 988400.0, 18538.0, 4589.0, 1902.0, 910.0, 428.0, 256.0, 149.0, 80.0, 44.0, 36.0, 22.0, 14.0, 12.0, 11.0, 9.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-346.5, -333.87890625, -321.2578125, -308.63671875, -296.015625, -283.39453125, -270.7734375, -258.15234375, -245.53125, -232.91015625, -220.2890625, -207.66796875, -195.046875, -182.42578125, -169.8046875, -157.18359375, -144.5625, -131.94140625, -119.3203125, -106.69921875, -94.078125, -81.45703125, -68.8359375, -56.21484375, -43.59375, -30.97265625, -18.3515625, -5.73046875, 6.890625, 19.51171875, 32.1328125, 44.75390625, 57.375, 69.99609375, 82.6171875, 95.23828125, 107.859375, 120.48046875, 133.1015625, 145.72265625, 158.34375, 170.96484375, 183.5859375, 196.20703125, 208.828125, 221.44921875, 234.0703125, 246.69140625, 259.3125, 271.93359375, 284.5546875, 297.17578125, 309.796875, 322.41796875, 335.0390625, 347.66015625, 360.28125, 372.90234375, 385.5234375, 398.14453125, 410.765625, 423.38671875, 436.0078125, 448.62890625, 461.25]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 14.0, 45.0, 295.0, 474.0, 101.0, 21.0, 9.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-298.5, -287.93359375, -277.3671875, -266.80078125, -256.234375, -245.66796875, -235.1015625, -224.53515625, -213.96875, -203.40234375, -192.8359375, -182.26953125, -171.703125, -161.13671875, -150.5703125, -140.00390625, -129.4375, -118.87109375, -108.3046875, -97.73828125, -87.171875, -76.60546875, -66.0390625, -55.47265625, -44.90625, -34.33984375, -23.7734375, -13.20703125, -2.640625, 7.92578125, 18.4921875, 29.05859375, 39.625, 50.19140625, 60.7578125, 71.32421875, 81.890625, 92.45703125, 103.0234375, 113.58984375, 124.15625, 134.72265625, 145.2890625, 155.85546875, 166.421875, 176.98828125, 187.5546875, 198.12109375, 208.6875, 219.25390625, 229.8203125, 240.38671875, 250.953125, 261.51953125, 272.0859375, 282.65234375, 293.21875, 303.78515625, 314.3515625, 324.91796875, 335.484375, 346.05078125, 356.6171875, 367.18359375, 377.75]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 13.0, 18.0, 16.0, 31.0, 25.0, 51.0, 54.0, 77.0, 86.0, 120.0, 106.0, 104.0, 82.0, 57.0, 48.0, 40.0, 19.0, 9.0, 9.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1795.10498046875, -1750.699462890625, -1706.2939453125, -1661.888427734375, -1617.48291015625, -1573.077392578125, -1528.671875, -1484.2662353515625, -1439.8607177734375, -1395.4552001953125, -1351.0496826171875, -1306.6441650390625, -1262.2386474609375, -1217.8330078125, -1173.427490234375, -1129.02197265625, -1084.616455078125, -1040.2109375, -995.805419921875, -951.39990234375, -906.9943237304688, -862.5888061523438, -818.1832885742188, -773.7777099609375, -729.372314453125, -684.966796875, -640.561279296875, -596.15576171875, -551.7501831054688, -507.34466552734375, -462.93914794921875, -418.5335998535156, -374.1280517578125, -329.7225341796875, -285.3169860839844, -240.91146850585938, -196.5059356689453, -152.10040283203125, -107.69488525390625, -63.289337158203125, -18.883819580078125, 25.521709442138672, 69.92723846435547, 114.332763671875, 158.73829650878906, 203.14382934570312, 247.54934692382812, 291.95489501953125, 336.36041259765625, 380.76593017578125, 425.1714782714844, 469.5769958496094, 513.9825439453125, 558.3880615234375, 602.7935791015625, 647.1990966796875, 691.6046142578125, 736.0101318359375, 780.4156494140625, 824.8211669921875, 869.2267456054688, 913.6322631835938, 958.0377807617188, 1002.443359375, 1046.848876953125]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 11.0, 11.0, 9.0, 7.0, 13.0, 14.0, 27.0, 23.0, 33.0, 25.0, 23.0, 29.0, 31.0, 46.0, 35.0, 45.0, 54.0, 43.0, 39.0, 38.0, 49.0, 38.0, 44.0, 44.0, 34.0, 26.0, 32.0, 28.0, 33.0, 18.0, 20.0, 19.0, 9.0, 13.0, 11.0, 5.0, 9.0, 6.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-966.2689208984375, -938.384521484375, -910.5001831054688, -882.6157836914062, -854.7314453125, -826.8470458984375, -798.9627075195312, -771.0783081054688, -743.1939697265625, -715.3095703125, -687.4252319335938, -659.5408325195312, -631.656494140625, -603.7720947265625, -575.8877563476562, -548.0033569335938, -520.1190185546875, -492.2346496582031, -464.35028076171875, -436.4659118652344, -408.58154296875, -380.6971435546875, -352.81280517578125, -324.92840576171875, -297.04400634765625, -269.1596374511719, -241.2752685546875, -213.39089965820312, -185.50653076171875, -157.6221466064453, -129.73777770996094, -101.85340881347656, -73.96905517578125, -46.084686279296875, -18.200313568115234, 9.684059143066406, 37.56842803955078, 65.45280456542969, 93.33717346191406, 121.22154235839844, 149.1059112548828, 176.9902801513672, 204.87464904785156, 232.759033203125, 260.6434020996094, 288.52777099609375, 316.4121398925781, 344.2965087890625, 372.1808776855469, 400.06524658203125, 427.9496154785156, 455.833984375, 483.7183532714844, 511.60272216796875, 539.4871215820312, 567.3714599609375, 595.255859375, 623.1402587890625, 651.0245971679688, 678.9089965820312, 706.7933349609375, 734.677734375, 762.5620727539062, 790.4464721679688, 818.330810546875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 10.0, 2.0, 4.0, 7.0, 8.0, 7.0, 20.0, 19.0, 33.0, 49.0, 42.0, 77.0, 115.0, 160.0, 261.0, 450.0, 707.0, 1330.0, 3114.0, 11585.0, 4154649.0, 14592.0, 3471.0, 1425.0, 743.0, 455.0, 319.0, 186.0, 130.0, 85.0, 51.0, 42.0, 36.0, 23.0, 20.0, 14.0, 13.0, 7.0, 10.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-318.0, -307.59375, -297.1875, -286.78125, -276.375, -265.96875, -255.5625, -245.15625, -234.75, -224.34375, -213.9375, -203.53125, -193.125, -182.71875, -172.3125, -161.90625, -151.5, -141.09375, -130.6875, -120.28125, -109.875, -99.46875, -89.0625, -78.65625, -68.25, -57.84375, -47.4375, -37.03125, -26.625, -16.21875, -5.8125, 4.59375, 15.0, 25.40625, 35.8125, 46.21875, 56.625, 67.03125, 77.4375, 87.84375, 98.25, 108.65625, 119.0625, 129.46875, 139.875, 150.28125, 160.6875, 171.09375, 181.5, 191.90625, 202.3125, 212.71875, 223.125, 233.53125, 243.9375, 254.34375, 264.75, 275.15625, 285.5625, 295.96875, 306.375, 316.78125, 327.1875, 337.59375, 348.0]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 5.0, 7.0, 6.0, 19.0, 14.0, 18.0, 24.0, 20.0, 31.0, 21.0, 37.0, 42.0, 43.0, 44.0, 54.0, 64.0, 52.0, 54.0, 46.0, 48.0, 35.0, 48.0, 33.0, 40.0, 29.0, 24.0, 23.0, 14.0, 12.0, 18.0, 17.0, 11.0, 10.0, 9.0, 4.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.015625, -29.906982421875, -28.79833984375, -27.689697265625, -26.5810546875, -25.472412109375, -24.36376953125, -23.255126953125, -22.146484375, -21.037841796875, -19.92919921875, -18.820556640625, -17.7119140625, -16.603271484375, -15.49462890625, -14.385986328125, -13.27734375, -12.168701171875, -11.06005859375, -9.951416015625, -8.8427734375, -7.734130859375, -6.62548828125, -5.516845703125, -4.408203125, -3.299560546875, -2.19091796875, -1.082275390625, 0.0263671875, 1.135009765625, 2.24365234375, 3.352294921875, 4.4609375, 5.569580078125, 6.67822265625, 7.786865234375, 8.8955078125, 10.004150390625, 11.11279296875, 12.221435546875, 13.330078125, 14.438720703125, 15.54736328125, 16.656005859375, 17.7646484375, 18.873291015625, 19.98193359375, 21.090576171875, 22.19921875, 23.307861328125, 24.41650390625, 25.525146484375, 26.6337890625, 27.742431640625, 28.85107421875, 29.959716796875, 31.068359375, 32.177001953125, 33.28564453125, 34.394287109375, 35.5029296875, 36.611572265625, 37.72021484375, 38.828857421875, 39.9375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 8.0, 4.0, 15.0, 19.0, 25.0, 39.0, 49.0, 79.0, 151.0, 205.0, 297.0, 481.0, 712.0, 1169.0, 1825.0, 3136.0, 6654.0, 38889.0, 4116437.0, 12889.0, 4443.0, 2423.0, 1473.0, 957.0, 645.0, 438.0, 271.0, 185.0, 115.0, 85.0, 54.0, 49.0, 15.0, 21.0, 9.0, 10.0, 7.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-227.375, -216.681640625, -205.98828125, -195.294921875, -184.6015625, -173.908203125, -163.21484375, -152.521484375, -141.828125, -131.134765625, -120.44140625, -109.748046875, -99.0546875, -88.361328125, -77.66796875, -66.974609375, -56.28125, -45.587890625, -34.89453125, -24.201171875, -13.5078125, -2.814453125, 7.87890625, 18.572265625, 29.265625, 39.958984375, 50.65234375, 61.345703125, 72.0390625, 82.732421875, 93.42578125, 104.119140625, 114.8125, 125.505859375, 136.19921875, 146.892578125, 157.5859375, 168.279296875, 178.97265625, 189.666015625, 200.359375, 211.052734375, 221.74609375, 232.439453125, 243.1328125, 253.826171875, 264.51953125, 275.212890625, 285.90625, 296.599609375, 307.29296875, 317.986328125, 328.6796875, 339.373046875, 350.06640625, 360.759765625, 371.453125, 382.146484375, 392.83984375, 403.533203125, 414.2265625, 424.919921875, 435.61328125, 446.306640625, 457.0]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 5.0, 9.0, 29.0, 69.0, 3852.0, 41.0, 20.0, 11.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.34375, -43.62939453125, -41.9150390625, -40.20068359375, -38.486328125, -36.77197265625, -35.0576171875, -33.34326171875, -31.62890625, -29.91455078125, -28.2001953125, -26.48583984375, -24.771484375, -23.05712890625, -21.3427734375, -19.62841796875, -17.9140625, -16.19970703125, -14.4853515625, -12.77099609375, -11.056640625, -9.34228515625, -7.6279296875, -5.91357421875, -4.19921875, -2.48486328125, -0.7705078125, 0.94384765625, 2.658203125, 4.37255859375, 6.0869140625, 7.80126953125, 9.515625, 11.22998046875, 12.9443359375, 14.65869140625, 16.373046875, 18.08740234375, 19.8017578125, 21.51611328125, 23.23046875, 24.94482421875, 26.6591796875, 28.37353515625, 30.087890625, 31.80224609375, 33.5166015625, 35.23095703125, 36.9453125, 38.65966796875, 40.3740234375, 42.08837890625, 43.802734375, 45.51708984375, 47.2314453125, 48.94580078125, 50.66015625, 52.37451171875, 54.0888671875, 55.80322265625, 57.517578125, 59.23193359375, 60.9462890625, 62.66064453125, 64.375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 10.0, 15.0, 26.0, 44.0, 65.0, 67.0, 116.0, 117.0, 108.0, 108.0, 87.0, 52.0, 45.0, 23.0, 31.0, 24.0, 12.0, 10.0, 9.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-150.50454711914062, -144.19775390625, -137.89096069335938, -131.5841827392578, -125.27738952636719, -118.97059631347656, -112.66381072998047, -106.35702514648438, -100.05023193359375, -93.74343872070312, -87.43665313720703, -81.12986755371094, -74.82307434082031, -68.51628112792969, -62.209495544433594, -55.902706146240234, -49.595916748046875, -43.289127349853516, -36.982337951660156, -30.675548553466797, -24.368759155273438, -18.061969757080078, -11.755180358886719, -5.448390960693359, 0.8583984375, 7.165187835693359, 13.471977233886719, 19.778766632080078, 26.085556030273438, 32.3923454284668, 38.699134826660156, 45.005924224853516, 51.31272888183594, 57.6195182800293, 63.926307678222656, 70.23309326171875, 76.53988647460938, 82.8466796875, 89.1534652709961, 95.46025085449219, 101.76704406738281, 108.07383728027344, 114.38062286376953, 120.68740844726562, 126.99420166015625, 133.30099487304688, 139.6077880859375, 145.91456604003906, 152.2213592529297, 158.5281524658203, 164.83493041992188, 171.1417236328125, 177.44851684570312, 183.75531005859375, 190.06210327148438, 196.36888122558594, 202.67567443847656, 208.9824676513672, 215.28924560546875, 221.59603881835938, 227.90283203125, 234.20962524414062, 240.51641845703125, 246.8231964111328, 253.12998962402344]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 2.0, 8.0, 7.0, 11.0, 11.0, 16.0, 24.0, 20.0, 26.0, 27.0, 20.0, 25.0, 28.0, 28.0, 40.0, 38.0, 40.0, 51.0, 34.0, 40.0, 49.0, 42.0, 38.0, 27.0, 33.0, 34.0, 41.0, 40.0, 26.0, 20.0, 25.0, 20.0, 23.0, 13.0, 11.0, 14.0, 9.0, 9.0, 11.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-100.87227630615234, -97.64218139648438, -94.41209411621094, -91.18199920654297, -87.951904296875, -84.72180938720703, -81.49171447753906, -78.26162719726562, -75.03153228759766, -71.80143737792969, -68.57135009765625, -65.34125518798828, -62.11116027832031, -58.881065368652344, -55.65097427368164, -52.42088317871094, -49.19078826904297, -45.960693359375, -42.7306022644043, -39.500511169433594, -36.270416259765625, -33.040321350097656, -29.810230255126953, -26.580137252807617, -23.35004425048828, -20.119951248168945, -16.88985824584961, -13.659765243530273, -10.429672241210938, -7.199579238891602, -3.9694862365722656, -0.7393932342529297, 2.490692138671875, 5.720785140991211, 8.950878143310547, 12.180971145629883, 15.411064147949219, 18.641157150268555, 21.87125015258789, 25.101343154907227, 28.331436157226562, 31.5615291595459, 34.791622161865234, 38.02171325683594, 41.251808166503906, 44.481903076171875, 47.71199417114258, 50.94208526611328, 54.17218017578125, 57.40227508544922, 60.63236618041992, 63.862457275390625, 67.0925521850586, 70.32264709472656, 73.552734375, 76.78282928466797, 80.01292419433594, 83.2430191040039, 86.47311401367188, 89.70320129394531, 92.93329620361328, 96.16339111328125, 99.39347839355469, 102.62357330322266, 105.85366821289062]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 4.0, 9.0, 10.0, 11.0, 23.0, 37.0, 53.0, 78.0, 116.0, 186.0, 275.0, 435.0, 647.0, 1011.0, 1502.0, 2555.0, 4066.0, 7461.0, 12906.0, 24162.0, 49217.0, 111254.0, 278614.0, 309605.0, 128408.0, 55104.0, 26688.0, 13985.0, 7844.0, 4664.0, 2861.0, 1760.0, 1121.0, 652.0, 399.0, 284.0, 172.0, 147.0, 71.0, 50.0, 35.0, 26.0, 16.0, 12.0, 7.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-80.125, -77.4609375, -74.796875, -72.1328125, -69.46875, -66.8046875, -64.140625, -61.4765625, -58.8125, -56.1484375, -53.484375, -50.8203125, -48.15625, -45.4921875, -42.828125, -40.1640625, -37.5, -34.8359375, -32.171875, -29.5078125, -26.84375, -24.1796875, -21.515625, -18.8515625, -16.1875, -13.5234375, -10.859375, -8.1953125, -5.53125, -2.8671875, -0.203125, 2.4609375, 5.125, 7.7890625, 10.453125, 13.1171875, 15.78125, 18.4453125, 21.109375, 23.7734375, 26.4375, 29.1015625, 31.765625, 34.4296875, 37.09375, 39.7578125, 42.421875, 45.0859375, 47.75, 50.4140625, 53.078125, 55.7421875, 58.40625, 61.0703125, 63.734375, 66.3984375, 69.0625, 71.7265625, 74.390625, 77.0546875, 79.71875, 82.3828125, 85.046875, 87.7109375, 90.375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 4.0, 4.0, 6.0, 6.0, 9.0, 8.0, 12.0, 12.0, 25.0, 15.0, 22.0, 23.0, 20.0, 29.0, 30.0, 35.0, 24.0, 39.0, 47.0, 54.0, 53.0, 39.0, 37.0, 41.0, 26.0, 40.0, 39.0, 54.0, 36.0, 22.0, 26.0, 17.0, 28.0, 17.0, 13.0, 17.0, 17.0, 8.0, 13.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-31.25, -30.19287109375, -29.1357421875, -28.07861328125, -27.021484375, -25.96435546875, -24.9072265625, -23.85009765625, -22.79296875, -21.73583984375, -20.6787109375, -19.62158203125, -18.564453125, -17.50732421875, -16.4501953125, -15.39306640625, -14.3359375, -13.27880859375, -12.2216796875, -11.16455078125, -10.107421875, -9.05029296875, -7.9931640625, -6.93603515625, -5.87890625, -4.82177734375, -3.7646484375, -2.70751953125, -1.650390625, -0.59326171875, 0.4638671875, 1.52099609375, 2.578125, 3.63525390625, 4.6923828125, 5.74951171875, 6.806640625, 7.86376953125, 8.9208984375, 9.97802734375, 11.03515625, 12.09228515625, 13.1494140625, 14.20654296875, 15.263671875, 16.32080078125, 17.3779296875, 18.43505859375, 19.4921875, 20.54931640625, 21.6064453125, 22.66357421875, 23.720703125, 24.77783203125, 25.8349609375, 26.89208984375, 27.94921875, 29.00634765625, 30.0634765625, 31.12060546875, 32.177734375, 33.23486328125, 34.2919921875, 35.34912109375, 36.40625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 6.0, 21.0, 20.0, 23.0, 30.0, 40.0, 59.0, 104.0, 140.0, 239.0, 429.0, 780.0, 1531.0, 3426.0, 8090.0, 22827.0, 79323.0, 453133.0, 374092.0, 69664.0, 20596.0, 7511.0, 3178.0, 1457.0, 775.0, 407.0, 228.0, 139.0, 85.0, 58.0, 38.0, 26.0, 18.0, 12.0, 15.0, 4.0, 9.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-168.625, -163.34765625, -158.0703125, -152.79296875, -147.515625, -142.23828125, -136.9609375, -131.68359375, -126.40625, -121.12890625, -115.8515625, -110.57421875, -105.296875, -100.01953125, -94.7421875, -89.46484375, -84.1875, -78.91015625, -73.6328125, -68.35546875, -63.078125, -57.80078125, -52.5234375, -47.24609375, -41.96875, -36.69140625, -31.4140625, -26.13671875, -20.859375, -15.58203125, -10.3046875, -5.02734375, 0.25, 5.52734375, 10.8046875, 16.08203125, 21.359375, 26.63671875, 31.9140625, 37.19140625, 42.46875, 47.74609375, 53.0234375, 58.30078125, 63.578125, 68.85546875, 74.1328125, 79.41015625, 84.6875, 89.96484375, 95.2421875, 100.51953125, 105.796875, 111.07421875, 116.3515625, 121.62890625, 126.90625, 132.18359375, 137.4609375, 142.73828125, 148.015625, 153.29296875, 158.5703125, 163.84765625, 169.125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 9.0, 14.0, 13.0, 22.0, 15.0, 19.0, 19.0, 27.0, 36.0, 32.0, 50.0, 33.0, 39.0, 50.0, 41.0, 48.0, 50.0, 50.0, 61.0, 53.0, 31.0, 51.0, 31.0, 33.0, 23.0, 27.0, 30.0, 14.0, 11.0, 9.0, 12.0, 11.0, 6.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-213.375, -206.7890625, -200.203125, -193.6171875, -187.03125, -180.4453125, -173.859375, -167.2734375, -160.6875, -154.1015625, -147.515625, -140.9296875, -134.34375, -127.7578125, -121.171875, -114.5859375, -108.0, -101.4140625, -94.828125, -88.2421875, -81.65625, -75.0703125, -68.484375, -61.8984375, -55.3125, -48.7265625, -42.140625, -35.5546875, -28.96875, -22.3828125, -15.796875, -9.2109375, -2.625, 3.9609375, 10.546875, 17.1328125, 23.71875, 30.3046875, 36.890625, 43.4765625, 50.0625, 56.6484375, 63.234375, 69.8203125, 76.40625, 82.9921875, 89.578125, 96.1640625, 102.75, 109.3359375, 115.921875, 122.5078125, 129.09375, 135.6796875, 142.265625, 148.8515625, 155.4375, 162.0234375, 168.609375, 175.1953125, 181.78125, 188.3671875, 194.953125, 201.5390625, 208.125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 1.0, 7.0, 10.0, 10.0, 15.0, 25.0, 25.0, 37.0, 55.0, 78.0, 99.0, 173.0, 223.0, 310.0, 531.0, 836.0, 1504.0, 2930.0, 6198.0, 16139.0, 54503.0, 285710.0, 538866.0, 97652.0, 24944.0, 8820.0, 3886.0, 1900.0, 1141.0, 631.0, 396.0, 258.0, 195.0, 136.0, 75.0, 65.0, 50.0, 30.0, 26.0, 18.0, 10.0, 4.0, 3.0, 9.0, 3.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-68.9375, -66.86083984375, -64.7841796875, -62.70751953125, -60.630859375, -58.55419921875, -56.4775390625, -54.40087890625, -52.32421875, -50.24755859375, -48.1708984375, -46.09423828125, -44.017578125, -41.94091796875, -39.8642578125, -37.78759765625, -35.7109375, -33.63427734375, -31.5576171875, -29.48095703125, -27.404296875, -25.32763671875, -23.2509765625, -21.17431640625, -19.09765625, -17.02099609375, -14.9443359375, -12.86767578125, -10.791015625, -8.71435546875, -6.6376953125, -4.56103515625, -2.484375, -0.40771484375, 1.6689453125, 3.74560546875, 5.822265625, 7.89892578125, 9.9755859375, 12.05224609375, 14.12890625, 16.20556640625, 18.2822265625, 20.35888671875, 22.435546875, 24.51220703125, 26.5888671875, 28.66552734375, 30.7421875, 32.81884765625, 34.8955078125, 36.97216796875, 39.048828125, 41.12548828125, 43.2021484375, 45.27880859375, 47.35546875, 49.43212890625, 51.5087890625, 53.58544921875, 55.662109375, 57.73876953125, 59.8154296875, 61.89208984375, 63.96875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 5.0, 6.0, 4.0, 11.0, 15.0, 16.0, 21.0, 37.0, 64.0, 106.0, 148.0, 155.0, 133.0, 84.0, 61.0, 43.0, 29.0, 21.0, 12.0, 9.0, 5.0, 8.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0347900390625, -0.0339512825012207, -0.033112525939941406, -0.03227376937866211, -0.03143501281738281, -0.030596256256103516, -0.02975749969482422, -0.028918743133544922, -0.028079986572265625, -0.027241230010986328, -0.02640247344970703, -0.025563716888427734, -0.024724960327148438, -0.02388620376586914, -0.023047447204589844, -0.022208690643310547, -0.02136993408203125, -0.020531177520751953, -0.019692420959472656, -0.01885366439819336, -0.018014907836914062, -0.017176151275634766, -0.01633739471435547, -0.015498638153076172, -0.014659881591796875, -0.013821125030517578, -0.012982368469238281, -0.012143611907958984, -0.011304855346679688, -0.01046609878540039, -0.009627342224121094, -0.008788585662841797, -0.0079498291015625, -0.007111072540283203, -0.006272315979003906, -0.005433559417724609, -0.0045948028564453125, -0.0037560462951660156, -0.0029172897338867188, -0.002078533172607422, -0.001239776611328125, -0.0004010200500488281, 0.00043773651123046875, 0.0012764930725097656, 0.0021152496337890625, 0.0029540061950683594, 0.0037927627563476562, 0.004631519317626953, 0.00547027587890625, 0.006309032440185547, 0.007147789001464844, 0.00798654556274414, 0.008825302124023438, 0.009664058685302734, 0.010502815246582031, 0.011341571807861328, 0.012180328369140625, 0.013019084930419922, 0.013857841491699219, 0.014696598052978516, 0.015535354614257812, 0.01637411117553711, 0.017212867736816406, 0.018051624298095703, 0.018890380859375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 5.0, 4.0, 8.0, 22.0, 15.0, 18.0, 39.0, 72.0, 87.0, 138.0, 234.0, 365.0, 758.0, 1400.0, 3233.0, 8347.0, 27587.0, 129008.0, 588806.0, 225319.0, 43034.0, 11940.0, 4170.0, 1848.0, 875.0, 486.0, 260.0, 157.0, 115.0, 65.0, 37.0, 22.0, 28.0, 13.0, 8.0, 8.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.5, -65.14453125, -62.7890625, -60.43359375, -58.078125, -55.72265625, -53.3671875, -51.01171875, -48.65625, -46.30078125, -43.9453125, -41.58984375, -39.234375, -36.87890625, -34.5234375, -32.16796875, -29.8125, -27.45703125, -25.1015625, -22.74609375, -20.390625, -18.03515625, -15.6796875, -13.32421875, -10.96875, -8.61328125, -6.2578125, -3.90234375, -1.546875, 0.80859375, 3.1640625, 5.51953125, 7.875, 10.23046875, 12.5859375, 14.94140625, 17.296875, 19.65234375, 22.0078125, 24.36328125, 26.71875, 29.07421875, 31.4296875, 33.78515625, 36.140625, 38.49609375, 40.8515625, 43.20703125, 45.5625, 47.91796875, 50.2734375, 52.62890625, 54.984375, 57.33984375, 59.6953125, 62.05078125, 64.40625, 66.76171875, 69.1171875, 71.47265625, 73.828125, 76.18359375, 78.5390625, 80.89453125, 83.25]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 3.0, 4.0, 5.0, 11.0, 12.0, 25.0, 40.0, 46.0, 49.0, 66.0, 77.0, 89.0, 114.0, 111.0, 78.0, 61.0, 48.0, 49.0, 24.0, 20.0, 18.0, 13.0, 10.0, 5.0, 2.0, 6.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.96875, -60.56494140625, -58.1611328125, -55.75732421875, -53.353515625, -50.94970703125, -48.5458984375, -46.14208984375, -43.73828125, -41.33447265625, -38.9306640625, -36.52685546875, -34.123046875, -31.71923828125, -29.3154296875, -26.91162109375, -24.5078125, -22.10400390625, -19.7001953125, -17.29638671875, -14.892578125, -12.48876953125, -10.0849609375, -7.68115234375, -5.27734375, -2.87353515625, -0.4697265625, 1.93408203125, 4.337890625, 6.74169921875, 9.1455078125, 11.54931640625, 13.953125, 16.35693359375, 18.7607421875, 21.16455078125, 23.568359375, 25.97216796875, 28.3759765625, 30.77978515625, 33.18359375, 35.58740234375, 37.9912109375, 40.39501953125, 42.798828125, 45.20263671875, 47.6064453125, 50.01025390625, 52.4140625, 54.81787109375, 57.2216796875, 59.62548828125, 62.029296875, 64.43310546875, 66.8369140625, 69.24072265625, 71.64453125, 74.04833984375, 76.4521484375, 78.85595703125, 81.259765625, 83.66357421875, 86.0673828125, 88.47119140625, 90.875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 6.0, 11.0, 12.0, 18.0, 56.0, 53.0, 90.0, 149.0, 169.0, 139.0, 112.0, 79.0, 42.0, 17.0, 18.0, 11.0, 12.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-801.0159912109375, -749.6306762695312, -698.245361328125, -646.8599853515625, -595.4747314453125, -544.08935546875, -492.70404052734375, -441.3187255859375, -389.93341064453125, -338.548095703125, -287.16278076171875, -235.77743530273438, -184.39212036132812, -133.00680541992188, -81.6214599609375, -30.23614501953125, 21.149169921875, 72.53449249267578, 123.91981506347656, 175.30514526367188, 226.69046020507812, 278.0757751464844, 329.46112060546875, 380.846435546875, 432.23175048828125, 483.6170654296875, 535.0023803710938, 586.3876953125, 637.7730712890625, 689.1583251953125, 740.543701171875, 791.9290161132812, 843.314453125, 894.6997680664062, 946.0850830078125, 997.470458984375, 1048.855712890625, 1100.2410888671875, 1151.62646484375, 1203.01171875, 1254.39697265625, 1305.7823486328125, 1357.1676025390625, 1408.552978515625, 1459.938232421875, 1511.3236083984375, 1562.708984375, 1614.09423828125, 1665.4796142578125, 1716.864990234375, 1768.250244140625, 1819.6356201171875, 1871.0208740234375, 1922.40625, 1973.79150390625, 2025.1768798828125, 2076.562255859375, 2127.947509765625, 2179.3330078125, 2230.71826171875, 2282.103515625, 2333.48876953125, 2384.874267578125, 2436.259521484375, 2487.644775390625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 7.0, 4.0, 6.0, 7.0, 4.0, 8.0, 12.0, 9.0, 6.0, 16.0, 26.0, 27.0, 23.0, 24.0, 31.0, 39.0, 52.0, 50.0, 50.0, 50.0, 59.0, 55.0, 63.0, 57.0, 58.0, 38.0, 33.0, 29.0, 30.0, 25.0, 23.0, 16.0, 12.0, 13.0, 13.0, 11.0, 4.0, 3.0, 3.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1346.954345703125, -1311.202880859375, -1275.451416015625, -1239.699951171875, -1203.948486328125, -1168.197021484375, -1132.445556640625, -1096.694091796875, -1060.942626953125, -1025.191162109375, -989.439697265625, -953.688232421875, -917.936767578125, -882.185302734375, -846.433837890625, -810.682373046875, -774.930908203125, -739.179443359375, -703.427978515625, -667.676513671875, -631.925048828125, -596.173583984375, -560.422119140625, -524.670654296875, -488.919189453125, -453.167724609375, -417.416259765625, -381.664794921875, -345.913330078125, -310.161865234375, -274.410400390625, -238.658935546875, -202.9073486328125, -167.1558837890625, -131.4044189453125, -95.6529541015625, -59.9014892578125, -24.1500244140625, 11.6014404296875, 47.3529052734375, 83.1043701171875, 118.8558349609375, 154.6072998046875, 190.3587646484375, 226.1102294921875, 261.8616943359375, 297.6131591796875, 333.3646240234375, 369.1160888671875, 404.8675537109375, 440.6190185546875, 476.3704833984375, 512.1219482421875, 547.8734130859375, 583.6248779296875, 619.3763427734375, 655.1278076171875, 690.8792724609375, 726.6307373046875, 762.3822021484375, 798.1336669921875, 833.8851318359375, 869.6365966796875, 905.3880615234375, 941.1395263671875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 1.0, 6.0, 3.0, 6.0, 4.0, 10.0, 8.0, 19.0, 22.0, 29.0, 45.0, 70.0, 98.0, 118.0, 191.0, 231.0, 328.0, 516.0, 757.0, 1114.0, 2186.0, 5519.0, 4043915.0, 128159.0, 5259.0, 2094.0, 1212.0, 698.0, 473.0, 317.0, 239.0, 192.0, 108.0, 96.0, 57.0, 49.0, 42.0, 26.0, 16.0, 14.0, 10.0, 7.0, 11.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-348.75, -338.17578125, -327.6015625, -317.02734375, -306.453125, -295.87890625, -285.3046875, -274.73046875, -264.15625, -253.58203125, -243.0078125, -232.43359375, -221.859375, -211.28515625, -200.7109375, -190.13671875, -179.5625, -168.98828125, -158.4140625, -147.83984375, -137.265625, -126.69140625, -116.1171875, -105.54296875, -94.96875, -84.39453125, -73.8203125, -63.24609375, -52.671875, -42.09765625, -31.5234375, -20.94921875, -10.375, 0.19921875, 10.7734375, 21.34765625, 31.921875, 42.49609375, 53.0703125, 63.64453125, 74.21875, 84.79296875, 95.3671875, 105.94140625, 116.515625, 127.08984375, 137.6640625, 148.23828125, 158.8125, 169.38671875, 179.9609375, 190.53515625, 201.109375, 211.68359375, 222.2578125, 232.83203125, 243.40625, 253.98046875, 264.5546875, 275.12890625, 285.703125, 296.27734375, 306.8515625, 317.42578125, 328.0]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 6.0, 6.0, 2.0, 3.0, 9.0, 4.0, 7.0, 12.0, 9.0, 12.0, 9.0, 15.0, 22.0, 21.0, 22.0, 30.0, 33.0, 22.0, 38.0, 28.0, 45.0, 41.0, 51.0, 47.0, 51.0, 54.0, 42.0, 36.0, 32.0, 39.0, 28.0, 25.0, 29.0, 28.0, 20.0, 26.0, 14.0, 15.0, 12.0, 7.0, 9.0, 9.0, 10.0, 5.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-31.421875, -30.412841796875, -29.40380859375, -28.394775390625, -27.3857421875, -26.376708984375, -25.36767578125, -24.358642578125, -23.349609375, -22.340576171875, -21.33154296875, -20.322509765625, -19.3134765625, -18.304443359375, -17.29541015625, -16.286376953125, -15.27734375, -14.268310546875, -13.25927734375, -12.250244140625, -11.2412109375, -10.232177734375, -9.22314453125, -8.214111328125, -7.205078125, -6.196044921875, -5.18701171875, -4.177978515625, -3.1689453125, -2.159912109375, -1.15087890625, -0.141845703125, 0.8671875, 1.876220703125, 2.88525390625, 3.894287109375, 4.9033203125, 5.912353515625, 6.92138671875, 7.930419921875, 8.939453125, 9.948486328125, 10.95751953125, 11.966552734375, 12.9755859375, 13.984619140625, 14.99365234375, 16.002685546875, 17.01171875, 18.020751953125, 19.02978515625, 20.038818359375, 21.0478515625, 22.056884765625, 23.06591796875, 24.074951171875, 25.083984375, 26.093017578125, 27.10205078125, 28.111083984375, 29.1201171875, 30.129150390625, 31.13818359375, 32.147216796875, 33.15625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 1.0, 4.0, 9.0, 2.0, 3.0, 7.0, 9.0, 6.0, 17.0, 13.0, 29.0, 31.0, 55.0, 86.0, 97.0, 165.0, 234.0, 398.0, 669.0, 1087.0, 2170.0, 8104.0, 4139805.0, 33759.0, 3664.0, 1510.0, 891.0, 527.0, 308.0, 172.0, 135.0, 87.0, 47.0, 50.0, 24.0, 23.0, 21.0, 24.0, 11.0, 9.0, 9.0, 4.0, 6.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-519.0, -502.125, -485.25, -468.375, -451.5, -434.625, -417.75, -400.875, -384.0, -367.125, -350.25, -333.375, -316.5, -299.625, -282.75, -265.875, -249.0, -232.125, -215.25, -198.375, -181.5, -164.625, -147.75, -130.875, -114.0, -97.125, -80.25, -63.375, -46.5, -29.625, -12.75, 4.125, 21.0, 37.875, 54.75, 71.625, 88.5, 105.375, 122.25, 139.125, 156.0, 172.875, 189.75, 206.625, 223.5, 240.375, 257.25, 274.125, 291.0, 307.875, 324.75, 341.625, 358.5, 375.375, 392.25, 409.125, 426.0, 442.875, 459.75, 476.625, 493.5, 510.375, 527.25, 544.125, 561.0]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 7.0, 21.0, 49.0, 3905.0, 70.0, 18.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.75, -167.5263671875, -163.302734375, -159.0791015625, -154.85546875, -150.6318359375, -146.408203125, -142.1845703125, -137.9609375, -133.7373046875, -129.513671875, -125.2900390625, -121.06640625, -116.8427734375, -112.619140625, -108.3955078125, -104.171875, -99.9482421875, -95.724609375, -91.5009765625, -87.27734375, -83.0537109375, -78.830078125, -74.6064453125, -70.3828125, -66.1591796875, -61.935546875, -57.7119140625, -53.48828125, -49.2646484375, -45.041015625, -40.8173828125, -36.59375, -32.3701171875, -28.146484375, -23.9228515625, -19.69921875, -15.4755859375, -11.251953125, -7.0283203125, -2.8046875, 1.4189453125, 5.642578125, 9.8662109375, 14.08984375, 18.3134765625, 22.537109375, 26.7607421875, 30.984375, 35.2080078125, 39.431640625, 43.6552734375, 47.87890625, 52.1025390625, 56.326171875, 60.5498046875, 64.7734375, 68.9970703125, 73.220703125, 77.4443359375, 81.66796875, 85.8916015625, 90.115234375, 94.3388671875, 98.5625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 7.0, 10.0, 11.0, 14.0, 11.0, 20.0, 18.0, 27.0, 35.0, 41.0, 45.0, 73.0, 87.0, 84.0, 80.0, 92.0, 73.0, 67.0, 44.0, 40.0, 30.0, 15.0, 10.0, 14.0, 9.0, 10.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-243.32638549804688, -237.09654235839844, -230.86669921875, -224.63685607910156, -218.40701293945312, -212.1771697998047, -205.94732666015625, -199.71746826171875, -193.48764038085938, -187.25779724121094, -181.0279541015625, -174.79811096191406, -168.56826782226562, -162.3384246826172, -156.10858154296875, -149.87872314453125, -143.6488800048828, -137.41903686523438, -131.18919372558594, -124.9593505859375, -118.72950744628906, -112.49966430664062, -106.26981353759766, -100.03997039794922, -93.81012725830078, -87.58028411865234, -81.3504409790039, -75.12059020996094, -68.8907470703125, -62.66090774536133, -56.431060791015625, -50.20121765136719, -43.97135925292969, -37.74151611328125, -31.51167106628418, -25.28182601928711, -19.051982879638672, -12.822139739990234, -6.592292785644531, -0.36244964599609375, 5.867393493652344, 12.097237586975098, 18.32708168029785, 24.556926727294922, 30.78676986694336, 37.0166130065918, 43.2464599609375, 49.47630310058594, 55.706146240234375, 61.93598937988281, 68.16583251953125, 74.39567565917969, 80.62551879882812, 86.85536193847656, 93.08521270751953, 99.31505584716797, 105.5448989868164, 111.77474212646484, 118.00458526611328, 124.23443603515625, 130.4642791748047, 136.69412231445312, 142.92396545410156, 149.15380859375, 155.38365173339844]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 7.0, 7.0, 8.0, 7.0, 13.0, 17.0, 17.0, 12.0, 25.0, 31.0, 31.0, 31.0, 30.0, 40.0, 30.0, 33.0, 52.0, 44.0, 50.0, 55.0, 34.0, 44.0, 48.0, 41.0, 35.0, 35.0, 31.0, 30.0, 25.0, 18.0, 19.0, 16.0, 14.0, 15.0, 4.0, 8.0, 6.0, 11.0, 7.0, 4.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.7794952392578, -164.78338623046875, -159.78729248046875, -154.7911834716797, -149.79507446289062, -144.79896545410156, -139.8028564453125, -134.8067626953125, -129.81065368652344, -124.81454467773438, -119.81844329833984, -114.82234191894531, -109.82623291015625, -104.83012390136719, -99.83402252197266, -94.83792114257812, -89.84181213378906, -84.845703125, -79.84960174560547, -74.85350036621094, -69.85739135742188, -64.86128234863281, -59.86518096923828, -54.869075775146484, -49.87297058105469, -44.87686538696289, -39.880760192871094, -34.8846549987793, -29.8885498046875, -24.892444610595703, -19.896339416503906, -14.90023422241211, -9.904144287109375, -4.908039093017578, 0.08806610107421875, 5.084171295166016, 10.080276489257812, 15.07638168334961, 20.072486877441406, 25.068592071533203, 30.064697265625, 35.0608024597168, 40.056907653808594, 45.05301284790039, 50.04911804199219, 55.045223236083984, 60.04132843017578, 65.03742980957031, 70.03353881835938, 75.02964782714844, 80.02574920654297, 85.0218505859375, 90.01795959472656, 95.01406860351562, 100.01016998291016, 105.00627136230469, 110.00238037109375, 114.99848937988281, 119.99459075927734, 124.99069213867188, 129.98680114746094, 134.98291015625, 139.97900390625, 144.97511291503906, 149.97122192382812]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 0.0, 5.0, 9.0, 19.0, 17.0, 36.0, 58.0, 64.0, 86.0, 152.0, 272.0, 437.0, 699.0, 1219.0, 2161.0, 3951.0, 7097.0, 14550.0, 30791.0, 70494.0, 181620.0, 378698.0, 207841.0, 79922.0, 34469.0, 15934.0, 8056.0, 4348.0, 2294.0, 1323.0, 763.0, 451.0, 267.0, 172.0, 80.0, 54.0, 44.0, 39.0, 24.0, 18.0, 12.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-106.0, -102.93359375, -99.8671875, -96.80078125, -93.734375, -90.66796875, -87.6015625, -84.53515625, -81.46875, -78.40234375, -75.3359375, -72.26953125, -69.203125, -66.13671875, -63.0703125, -60.00390625, -56.9375, -53.87109375, -50.8046875, -47.73828125, -44.671875, -41.60546875, -38.5390625, -35.47265625, -32.40625, -29.33984375, -26.2734375, -23.20703125, -20.140625, -17.07421875, -14.0078125, -10.94140625, -7.875, -4.80859375, -1.7421875, 1.32421875, 4.390625, 7.45703125, 10.5234375, 13.58984375, 16.65625, 19.72265625, 22.7890625, 25.85546875, 28.921875, 31.98828125, 35.0546875, 38.12109375, 41.1875, 44.25390625, 47.3203125, 50.38671875, 53.453125, 56.51953125, 59.5859375, 62.65234375, 65.71875, 68.78515625, 71.8515625, 74.91796875, 77.984375, 81.05078125, 84.1171875, 87.18359375, 90.25]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 6.0, 4.0, 4.0, 5.0, 5.0, 8.0, 10.0, 13.0, 14.0, 16.0, 17.0, 18.0, 28.0, 22.0, 24.0, 31.0, 34.0, 28.0, 29.0, 37.0, 43.0, 44.0, 40.0, 47.0, 48.0, 36.0, 47.0, 35.0, 33.0, 25.0, 30.0, 28.0, 25.0, 28.0, 21.0, 17.0, 16.0, 16.0, 14.0, 11.0, 5.0, 14.0, 9.0, 5.0, 3.0, 2.0, 3.0, 5.0, 1.0, 1.0], "bins": [-41.9375, -40.8017578125, -39.666015625, -38.5302734375, -37.39453125, -36.2587890625, -35.123046875, -33.9873046875, -32.8515625, -31.7158203125, -30.580078125, -29.4443359375, -28.30859375, -27.1728515625, -26.037109375, -24.9013671875, -23.765625, -22.6298828125, -21.494140625, -20.3583984375, -19.22265625, -18.0869140625, -16.951171875, -15.8154296875, -14.6796875, -13.5439453125, -12.408203125, -11.2724609375, -10.13671875, -9.0009765625, -7.865234375, -6.7294921875, -5.59375, -4.4580078125, -3.322265625, -2.1865234375, -1.05078125, 0.0849609375, 1.220703125, 2.3564453125, 3.4921875, 4.6279296875, 5.763671875, 6.8994140625, 8.03515625, 9.1708984375, 10.306640625, 11.4423828125, 12.578125, 13.7138671875, 14.849609375, 15.9853515625, 17.12109375, 18.2568359375, 19.392578125, 20.5283203125, 21.6640625, 22.7998046875, 23.935546875, 25.0712890625, 26.20703125, 27.3427734375, 28.478515625, 29.6142578125, 30.75]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 5.0, 7.0, 7.0, 10.0, 18.0, 20.0, 45.0, 74.0, 86.0, 166.0, 278.0, 526.0, 1009.0, 2288.0, 6385.0, 21885.0, 124794.0, 718002.0, 137959.0, 23607.0, 6683.0, 2404.0, 1086.0, 496.0, 274.0, 151.0, 102.0, 55.0, 40.0, 23.0, 15.0, 13.0, 9.0, 12.0, 6.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-181.75, -175.146484375, -168.54296875, -161.939453125, -155.3359375, -148.732421875, -142.12890625, -135.525390625, -128.921875, -122.318359375, -115.71484375, -109.111328125, -102.5078125, -95.904296875, -89.30078125, -82.697265625, -76.09375, -69.490234375, -62.88671875, -56.283203125, -49.6796875, -43.076171875, -36.47265625, -29.869140625, -23.265625, -16.662109375, -10.05859375, -3.455078125, 3.1484375, 9.751953125, 16.35546875, 22.958984375, 29.5625, 36.166015625, 42.76953125, 49.373046875, 55.9765625, 62.580078125, 69.18359375, 75.787109375, 82.390625, 88.994140625, 95.59765625, 102.201171875, 108.8046875, 115.408203125, 122.01171875, 128.615234375, 135.21875, 141.822265625, 148.42578125, 155.029296875, 161.6328125, 168.236328125, 174.83984375, 181.443359375, 188.046875, 194.650390625, 201.25390625, 207.857421875, 214.4609375, 221.064453125, 227.66796875, 234.271484375, 240.875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 10.0, 11.0, 8.0, 12.0, 18.0, 27.0, 17.0, 24.0, 26.0, 32.0, 40.0, 36.0, 34.0, 52.0, 43.0, 46.0, 41.0, 50.0, 54.0, 45.0, 38.0, 50.0, 33.0, 29.0, 36.0, 28.0, 27.0, 19.0, 18.0, 13.0, 6.0, 15.0, 13.0, 3.0, 5.0, 10.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-195.875, -190.046875, -184.21875, -178.390625, -172.5625, -166.734375, -160.90625, -155.078125, -149.25, -143.421875, -137.59375, -131.765625, -125.9375, -120.109375, -114.28125, -108.453125, -102.625, -96.796875, -90.96875, -85.140625, -79.3125, -73.484375, -67.65625, -61.828125, -56.0, -50.171875, -44.34375, -38.515625, -32.6875, -26.859375, -21.03125, -15.203125, -9.375, -3.546875, 2.28125, 8.109375, 13.9375, 19.765625, 25.59375, 31.421875, 37.25, 43.078125, 48.90625, 54.734375, 60.5625, 66.390625, 72.21875, 78.046875, 83.875, 89.703125, 95.53125, 101.359375, 107.1875, 113.015625, 118.84375, 124.671875, 130.5, 136.328125, 142.15625, 147.984375, 153.8125, 159.640625, 165.46875, 171.296875, 177.125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 7.0, 9.0, 11.0, 24.0, 28.0, 39.0, 72.0, 89.0, 189.0, 335.0, 675.0, 1368.0, 3252.0, 8967.0, 36706.0, 463821.0, 480612.0, 37553.0, 8658.0, 3123.0, 1340.0, 702.0, 389.0, 246.0, 126.0, 71.0, 56.0, 23.0, 18.0, 16.0, 8.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-103.625, -100.4853515625, -97.345703125, -94.2060546875, -91.06640625, -87.9267578125, -84.787109375, -81.6474609375, -78.5078125, -75.3681640625, -72.228515625, -69.0888671875, -65.94921875, -62.8095703125, -59.669921875, -56.5302734375, -53.390625, -50.2509765625, -47.111328125, -43.9716796875, -40.83203125, -37.6923828125, -34.552734375, -31.4130859375, -28.2734375, -25.1337890625, -21.994140625, -18.8544921875, -15.71484375, -12.5751953125, -9.435546875, -6.2958984375, -3.15625, -0.0166015625, 3.123046875, 6.2626953125, 9.40234375, 12.5419921875, 15.681640625, 18.8212890625, 21.9609375, 25.1005859375, 28.240234375, 31.3798828125, 34.51953125, 37.6591796875, 40.798828125, 43.9384765625, 47.078125, 50.2177734375, 53.357421875, 56.4970703125, 59.63671875, 62.7763671875, 65.916015625, 69.0556640625, 72.1953125, 75.3349609375, 78.474609375, 81.6142578125, 84.75390625, 87.8935546875, 91.033203125, 94.1728515625, 97.3125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 13.0, 21.0, 28.0, 48.0, 82.0, 156.0, 228.0, 182.0, 114.0, 60.0, 30.0, 9.0, 7.0, 9.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022216796875, -0.020956993103027344, -0.019697189331054688, -0.01843738555908203, -0.017177581787109375, -0.01591777801513672, -0.014657974243164062, -0.013398170471191406, -0.01213836669921875, -0.010878562927246094, -0.009618759155273438, -0.008358955383300781, -0.007099151611328125, -0.005839347839355469, -0.0045795440673828125, -0.0033197402954101562, -0.0020599365234375, -0.0008001327514648438, 0.0004596710205078125, 0.0017194747924804688, 0.002979278564453125, 0.004239082336425781, 0.0054988861083984375, 0.006758689880371094, 0.00801849365234375, 0.009278297424316406, 0.010538101196289062, 0.011797904968261719, 0.013057708740234375, 0.014317512512207031, 0.015577316284179688, 0.016837120056152344, 0.018096923828125, 0.019356727600097656, 0.020616531372070312, 0.02187633514404297, 0.023136138916015625, 0.02439594268798828, 0.025655746459960938, 0.026915550231933594, 0.02817535400390625, 0.029435157775878906, 0.030694961547851562, 0.03195476531982422, 0.033214569091796875, 0.03447437286376953, 0.03573417663574219, 0.036993980407714844, 0.0382537841796875, 0.039513587951660156, 0.04077339172363281, 0.04203319549560547, 0.043292999267578125, 0.04455280303955078, 0.04581260681152344, 0.047072410583496094, 0.04833221435546875, 0.049592018127441406, 0.05085182189941406, 0.05211162567138672, 0.053371429443359375, 0.05463123321533203, 0.05589103698730469, 0.057150840759277344, 0.05841064453125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 5.0, 6.0, 13.0, 17.0, 27.0, 34.0, 70.0, 109.0, 154.0, 361.0, 752.0, 1953.0, 6387.0, 41782.0, 778075.0, 198024.0, 15166.0, 3355.0, 1092.0, 503.0, 295.0, 127.0, 87.0, 47.0, 24.0, 20.0, 14.0, 19.0, 6.0, 10.0, 6.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-134.5, -129.98046875, -125.4609375, -120.94140625, -116.421875, -111.90234375, -107.3828125, -102.86328125, -98.34375, -93.82421875, -89.3046875, -84.78515625, -80.265625, -75.74609375, -71.2265625, -66.70703125, -62.1875, -57.66796875, -53.1484375, -48.62890625, -44.109375, -39.58984375, -35.0703125, -30.55078125, -26.03125, -21.51171875, -16.9921875, -12.47265625, -7.953125, -3.43359375, 1.0859375, 5.60546875, 10.125, 14.64453125, 19.1640625, 23.68359375, 28.203125, 32.72265625, 37.2421875, 41.76171875, 46.28125, 50.80078125, 55.3203125, 59.83984375, 64.359375, 68.87890625, 73.3984375, 77.91796875, 82.4375, 86.95703125, 91.4765625, 95.99609375, 100.515625, 105.03515625, 109.5546875, 114.07421875, 118.59375, 123.11328125, 127.6328125, 132.15234375, 136.671875, 141.19140625, 145.7109375, 150.23046875, 154.75]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 5.0, 8.0, 15.0, 8.0, 23.0, 34.0, 60.0, 63.0, 120.0, 118.0, 128.0, 135.0, 92.0, 63.0, 33.0, 33.0, 16.0, 11.0, 8.0, 9.0, 7.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.28125, -52.42529296875, -49.5693359375, -46.71337890625, -43.857421875, -41.00146484375, -38.1455078125, -35.28955078125, -32.43359375, -29.57763671875, -26.7216796875, -23.86572265625, -21.009765625, -18.15380859375, -15.2978515625, -12.44189453125, -9.5859375, -6.72998046875, -3.8740234375, -1.01806640625, 1.837890625, 4.69384765625, 7.5498046875, 10.40576171875, 13.26171875, 16.11767578125, 18.9736328125, 21.82958984375, 24.685546875, 27.54150390625, 30.3974609375, 33.25341796875, 36.109375, 38.96533203125, 41.8212890625, 44.67724609375, 47.533203125, 50.38916015625, 53.2451171875, 56.10107421875, 58.95703125, 61.81298828125, 64.6689453125, 67.52490234375, 70.380859375, 73.23681640625, 76.0927734375, 78.94873046875, 81.8046875, 84.66064453125, 87.5166015625, 90.37255859375, 93.228515625, 96.08447265625, 98.9404296875, 101.79638671875, 104.65234375, 107.50830078125, 110.3642578125, 113.22021484375, 116.076171875, 118.93212890625, 121.7880859375, 124.64404296875, 127.5]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 5.0, 5.0, 12.0, 22.0, 59.0, 108.0, 207.0, 242.0, 176.0, 78.0, 47.0, 23.0, 17.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3731.10546875, -3645.3759765625, -3559.646484375, -3473.9169921875, -3388.1875, -3302.458251953125, -3216.728759765625, -3130.999267578125, -3045.269775390625, -2959.540283203125, -2873.810791015625, -2788.081298828125, -2702.35205078125, -2616.62255859375, -2530.89306640625, -2445.16357421875, -2359.43408203125, -2273.70458984375, -2187.97509765625, -2102.24560546875, -2016.5162353515625, -1930.7867431640625, -1845.057373046875, -1759.327880859375, -1673.598388671875, -1587.868896484375, -1502.139404296875, -1416.4100341796875, -1330.6805419921875, -1244.9510498046875, -1159.2216796875, -1073.4921875, -987.7628173828125, -902.0333251953125, -816.3038940429688, -730.574462890625, -644.844970703125, -559.115478515625, -473.38604736328125, -387.6566162109375, -301.9271240234375, -216.19766235351562, -130.46820068359375, -44.738739013671875, 40.99072265625, 126.72018432617188, 212.44964599609375, 298.1790771484375, 383.9085693359375, 469.6380310058594, 555.3674926757812, 641.096923828125, 726.826416015625, 812.555908203125, 898.2853393554688, 984.0147705078125, 1069.7442626953125, 1155.4737548828125, 1241.203125, 1326.9326171875, 1412.662109375, 1498.3916015625, 1584.12109375, 1669.8504638671875, 1755.5799560546875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 7.0, 10.0, 8.0, 13.0, 19.0, 17.0, 21.0, 15.0, 19.0, 31.0, 37.0, 38.0, 46.0, 54.0, 69.0, 54.0, 58.0, 59.0, 47.0, 50.0, 59.0, 37.0, 42.0, 35.0, 34.0, 34.0, 18.0, 20.0, 13.0, 13.0, 4.0, 6.0, 7.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1028.7578125, -993.9733276367188, -959.1888427734375, -924.4044189453125, -889.6199340820312, -854.83544921875, -820.051025390625, -785.2665405273438, -750.4820556640625, -715.6975708007812, -680.9130859375, -646.128662109375, -611.3441772460938, -576.5596923828125, -541.7752685546875, -506.99078369140625, -472.206298828125, -437.42181396484375, -402.6373596191406, -367.8529052734375, -333.06842041015625, -298.283935546875, -263.4994812011719, -228.7150115966797, -193.9305419921875, -159.1460723876953, -124.36160278320312, -89.57713317871094, -54.79266357421875, -20.008193969726562, 14.776275634765625, 49.56074523925781, 84.3453369140625, 119.12980651855469, 153.91427612304688, 188.69874572753906, 223.48321533203125, 258.2677001953125, 293.0521545410156, 327.83660888671875, 362.62109375, 397.40557861328125, 432.1900329589844, 466.9744873046875, 501.75897216796875, 536.54345703125, 571.327880859375, 606.1123657226562, 640.8968505859375, 675.6813354492188, 710.4658203125, 745.250244140625, 780.0347290039062, 814.8192138671875, 849.6036376953125, 884.3881225585938, 919.172607421875, 953.9570922851562, 988.7415771484375, 1023.5260009765625, 1058.310546875, 1093.094970703125, 1127.87939453125, 1162.6639404296875, 1197.4483642578125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 6.0, 5.0, 9.0, 5.0, 12.0, 19.0, 16.0, 27.0, 24.0, 35.0, 42.0, 76.0, 64.0, 112.0, 128.0, 181.0, 209.0, 283.0, 393.0, 600.0, 915.0, 1767.0, 5137.0, 4165384.0, 12410.0, 2703.0, 1206.0, 662.0, 416.0, 348.0, 249.0, 173.0, 161.0, 112.0, 91.0, 65.0, 64.0, 41.0, 26.0, 27.0, 18.0, 18.0, 15.0, 7.0, 3.0, 7.0, 5.0, 3.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-291.5, -282.58984375, -273.6796875, -264.76953125, -255.859375, -246.94921875, -238.0390625, -229.12890625, -220.21875, -211.30859375, -202.3984375, -193.48828125, -184.578125, -175.66796875, -166.7578125, -157.84765625, -148.9375, -140.02734375, -131.1171875, -122.20703125, -113.296875, -104.38671875, -95.4765625, -86.56640625, -77.65625, -68.74609375, -59.8359375, -50.92578125, -42.015625, -33.10546875, -24.1953125, -15.28515625, -6.375, 2.53515625, 11.4453125, 20.35546875, 29.265625, 38.17578125, 47.0859375, 55.99609375, 64.90625, 73.81640625, 82.7265625, 91.63671875, 100.546875, 109.45703125, 118.3671875, 127.27734375, 136.1875, 145.09765625, 154.0078125, 162.91796875, 171.828125, 180.73828125, 189.6484375, 198.55859375, 207.46875, 216.37890625, 225.2890625, 234.19921875, 243.109375, 252.01953125, 260.9296875, 269.83984375, 278.75]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 12.0, 9.0, 17.0, 12.0, 13.0, 27.0, 19.0, 28.0, 35.0, 38.0, 39.0, 46.0, 36.0, 52.0, 54.0, 57.0, 53.0, 46.0, 51.0, 54.0, 42.0, 48.0, 37.0, 32.0, 18.0, 15.0, 14.0, 18.0, 18.0, 11.0, 11.0, 6.0, 8.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.75, -44.26318359375, -42.7763671875, -41.28955078125, -39.802734375, -38.31591796875, -36.8291015625, -35.34228515625, -33.85546875, -32.36865234375, -30.8818359375, -29.39501953125, -27.908203125, -26.42138671875, -24.9345703125, -23.44775390625, -21.9609375, -20.47412109375, -18.9873046875, -17.50048828125, -16.013671875, -14.52685546875, -13.0400390625, -11.55322265625, -10.06640625, -8.57958984375, -7.0927734375, -5.60595703125, -4.119140625, -2.63232421875, -1.1455078125, 0.34130859375, 1.828125, 3.31494140625, 4.8017578125, 6.28857421875, 7.775390625, 9.26220703125, 10.7490234375, 12.23583984375, 13.72265625, 15.20947265625, 16.6962890625, 18.18310546875, 19.669921875, 21.15673828125, 22.6435546875, 24.13037109375, 25.6171875, 27.10400390625, 28.5908203125, 30.07763671875, 31.564453125, 33.05126953125, 34.5380859375, 36.02490234375, 37.51171875, 38.99853515625, 40.4853515625, 41.97216796875, 43.458984375, 44.94580078125, 46.4326171875, 47.91943359375, 49.40625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 6.0, 4.0, 14.0, 20.0, 17.0, 26.0, 38.0, 40.0, 51.0, 72.0, 103.0, 120.0, 204.0, 260.0, 427.0, 655.0, 1186.0, 2632.0, 10167.0, 4155381.0, 15990.0, 3249.0, 1374.0, 731.0, 435.0, 306.0, 217.0, 144.0, 107.0, 92.0, 50.0, 39.0, 20.0, 24.0, 18.0, 22.0, 9.0, 12.0, 5.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-380.75, -368.69921875, -356.6484375, -344.59765625, -332.546875, -320.49609375, -308.4453125, -296.39453125, -284.34375, -272.29296875, -260.2421875, -248.19140625, -236.140625, -224.08984375, -212.0390625, -199.98828125, -187.9375, -175.88671875, -163.8359375, -151.78515625, -139.734375, -127.68359375, -115.6328125, -103.58203125, -91.53125, -79.48046875, -67.4296875, -55.37890625, -43.328125, -31.27734375, -19.2265625, -7.17578125, 4.875, 16.92578125, 28.9765625, 41.02734375, 53.078125, 65.12890625, 77.1796875, 89.23046875, 101.28125, 113.33203125, 125.3828125, 137.43359375, 149.484375, 161.53515625, 173.5859375, 185.63671875, 197.6875, 209.73828125, 221.7890625, 233.83984375, 245.890625, 257.94140625, 269.9921875, 282.04296875, 294.09375, 306.14453125, 318.1953125, 330.24609375, 342.296875, 354.34765625, 366.3984375, 378.44921875, 390.5]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 7.0, 16.0, 3904.0, 102.0, 19.0, 9.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.3125, -79.7314453125, -77.150390625, -74.5693359375, -71.98828125, -69.4072265625, -66.826171875, -64.2451171875, -61.6640625, -59.0830078125, -56.501953125, -53.9208984375, -51.33984375, -48.7587890625, -46.177734375, -43.5966796875, -41.015625, -38.4345703125, -35.853515625, -33.2724609375, -30.69140625, -28.1103515625, -25.529296875, -22.9482421875, -20.3671875, -17.7861328125, -15.205078125, -12.6240234375, -10.04296875, -7.4619140625, -4.880859375, -2.2998046875, 0.28125, 2.8623046875, 5.443359375, 8.0244140625, 10.60546875, 13.1865234375, 15.767578125, 18.3486328125, 20.9296875, 23.5107421875, 26.091796875, 28.6728515625, 31.25390625, 33.8349609375, 36.416015625, 38.9970703125, 41.578125, 44.1591796875, 46.740234375, 49.3212890625, 51.90234375, 54.4833984375, 57.064453125, 59.6455078125, 62.2265625, 64.8076171875, 67.388671875, 69.9697265625, 72.55078125, 75.1318359375, 77.712890625, 80.2939453125, 82.875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 5.0, 5.0, 8.0, 10.0, 19.0, 11.0, 22.0, 41.0, 63.0, 76.0, 78.0, 85.0, 115.0, 94.0, 100.0, 76.0, 47.0, 43.0, 26.0, 21.0, 15.0, 8.0, 8.0, 8.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.56581115722656, -161.5968017578125, -156.6278076171875, -151.6588134765625, -146.68980407714844, -141.72079467773438, -136.75180053710938, -131.78280639648438, -126.81379699707031, -121.84479522705078, -116.87579345703125, -111.90679168701172, -106.93778991699219, -101.96878814697266, -96.99978637695312, -92.0307846069336, -87.06178283691406, -82.09278106689453, -77.123779296875, -72.15477752685547, -67.18577575683594, -62.216773986816406, -57.247772216796875, -52.278770446777344, -47.30976867675781, -42.34076690673828, -37.37176513671875, -32.40276336669922, -27.433761596679688, -22.464759826660156, -17.495758056640625, -12.526756286621094, -7.5577392578125, -2.5887374877929688, 2.3802642822265625, 7.349266052246094, 12.318267822265625, 17.287269592285156, 22.256271362304688, 27.22527313232422, 32.19427490234375, 37.16327667236328, 42.13227844238281, 47.101280212402344, 52.070281982421875, 57.039283752441406, 62.00828552246094, 66.97728729248047, 71.9462890625, 76.91529083251953, 81.88429260253906, 86.8532943725586, 91.82229614257812, 96.79129791259766, 101.76029968261719, 106.72930145263672, 111.69830322265625, 116.66730499267578, 121.63630676269531, 126.60530853271484, 131.57431030273438, 136.54330444335938, 141.51231384277344, 146.4813232421875, 151.4503173828125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 11.0, 17.0, 9.0, 16.0, 13.0, 22.0, 16.0, 22.0, 28.0, 37.0, 25.0, 40.0, 29.0, 35.0, 49.0, 44.0, 47.0, 40.0, 47.0, 31.0, 34.0, 42.0, 37.0, 29.0, 37.0, 20.0, 33.0, 25.0, 26.0, 23.0, 13.0, 14.0, 19.0, 7.0, 9.0, 7.0, 8.0, 4.0, 6.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-76.51296997070312, -74.08256530761719, -71.65216064453125, -69.22174835205078, -66.79134368896484, -64.3609390258789, -61.93053436279297, -59.500125885009766, -57.06971740722656, -54.639312744140625, -52.20890426635742, -49.778499603271484, -47.34809112548828, -44.917686462402344, -42.487281799316406, -40.0568733215332, -37.626468658447266, -35.19606399536133, -32.765655517578125, -30.335250854492188, -27.904842376708984, -25.474437713623047, -23.044031143188477, -20.613624572753906, -18.183218002319336, -15.752811431884766, -13.322404861450195, -10.891999244689941, -8.461592674255371, -6.031186103820801, -3.600780487060547, -1.1703739166259766, 1.2600326538085938, 3.690438985824585, 6.120845317840576, 8.551251411437988, 10.981657981872559, 13.412064552307129, 15.842470169067383, 18.272876739501953, 20.703283309936523, 23.133689880371094, 25.564096450805664, 27.994503021240234, 30.424907684326172, 32.855316162109375, 35.28572082519531, 37.71612548828125, 40.14653396606445, 42.57693862915039, 45.007347106933594, 47.43775177001953, 49.868160247802734, 52.29856491088867, 54.728973388671875, 57.15937805175781, 59.58978271484375, 62.02018737792969, 64.45059204101562, 66.8810043334961, 69.31140899658203, 71.74181365966797, 74.1722183227539, 76.60263061523438, 79.03303527832031]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 8.0, 9.0, 13.0, 17.0, 18.0, 28.0, 50.0, 63.0, 93.0, 145.0, 226.0, 292.0, 510.0, 727.0, 1228.0, 2205.0, 4259.0, 9036.0, 22181.0, 63455.0, 233213.0, 496910.0, 140574.0, 42745.0, 15744.0, 6734.0, 3303.0, 1810.0, 1061.0, 655.0, 411.0, 250.0, 203.0, 113.0, 83.0, 50.0, 46.0, 22.0, 19.0, 18.0, 13.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-132.5, -128.400390625, -124.30078125, -120.201171875, -116.1015625, -112.001953125, -107.90234375, -103.802734375, -99.703125, -95.603515625, -91.50390625, -87.404296875, -83.3046875, -79.205078125, -75.10546875, -71.005859375, -66.90625, -62.806640625, -58.70703125, -54.607421875, -50.5078125, -46.408203125, -42.30859375, -38.208984375, -34.109375, -30.009765625, -25.91015625, -21.810546875, -17.7109375, -13.611328125, -9.51171875, -5.412109375, -1.3125, 2.787109375, 6.88671875, 10.986328125, 15.0859375, 19.185546875, 23.28515625, 27.384765625, 31.484375, 35.583984375, 39.68359375, 43.783203125, 47.8828125, 51.982421875, 56.08203125, 60.181640625, 64.28125, 68.380859375, 72.48046875, 76.580078125, 80.6796875, 84.779296875, 88.87890625, 92.978515625, 97.078125, 101.177734375, 105.27734375, 109.376953125, 113.4765625, 117.576171875, 121.67578125, 125.775390625, 129.875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 10.0, 7.0, 6.0, 19.0, 8.0, 15.0, 22.0, 16.0, 32.0, 36.0, 38.0, 43.0, 36.0, 49.0, 53.0, 53.0, 51.0, 39.0, 54.0, 42.0, 47.0, 31.0, 48.0, 51.0, 34.0, 25.0, 23.0, 18.0, 17.0, 14.0, 10.0, 11.0, 6.0, 7.0, 1.0, 9.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-49.78125, -48.2314453125, -46.681640625, -45.1318359375, -43.58203125, -42.0322265625, -40.482421875, -38.9326171875, -37.3828125, -35.8330078125, -34.283203125, -32.7333984375, -31.18359375, -29.6337890625, -28.083984375, -26.5341796875, -24.984375, -23.4345703125, -21.884765625, -20.3349609375, -18.78515625, -17.2353515625, -15.685546875, -14.1357421875, -12.5859375, -11.0361328125, -9.486328125, -7.9365234375, -6.38671875, -4.8369140625, -3.287109375, -1.7373046875, -0.1875, 1.3623046875, 2.912109375, 4.4619140625, 6.01171875, 7.5615234375, 9.111328125, 10.6611328125, 12.2109375, 13.7607421875, 15.310546875, 16.8603515625, 18.41015625, 19.9599609375, 21.509765625, 23.0595703125, 24.609375, 26.1591796875, 27.708984375, 29.2587890625, 30.80859375, 32.3583984375, 33.908203125, 35.4580078125, 37.0078125, 38.5576171875, 40.107421875, 41.6572265625, 43.20703125, 44.7568359375, 46.306640625, 47.8564453125, 49.40625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 7.0, 9.0, 7.0, 15.0, 22.0, 23.0, 43.0, 61.0, 77.0, 145.0, 219.0, 350.0, 622.0, 1250.0, 2873.0, 7816.0, 27196.0, 148564.0, 689299.0, 132217.0, 25100.0, 7295.0, 2611.0, 1165.0, 610.0, 336.0, 199.0, 125.0, 90.0, 41.0, 41.0, 26.0, 22.0, 19.0, 19.0, 7.0, 6.0, 5.0, 1.0, 3.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-176.125, -171.015625, -165.90625, -160.796875, -155.6875, -150.578125, -145.46875, -140.359375, -135.25, -130.140625, -125.03125, -119.921875, -114.8125, -109.703125, -104.59375, -99.484375, -94.375, -89.265625, -84.15625, -79.046875, -73.9375, -68.828125, -63.71875, -58.609375, -53.5, -48.390625, -43.28125, -38.171875, -33.0625, -27.953125, -22.84375, -17.734375, -12.625, -7.515625, -2.40625, 2.703125, 7.8125, 12.921875, 18.03125, 23.140625, 28.25, 33.359375, 38.46875, 43.578125, 48.6875, 53.796875, 58.90625, 64.015625, 69.125, 74.234375, 79.34375, 84.453125, 89.5625, 94.671875, 99.78125, 104.890625, 110.0, 115.109375, 120.21875, 125.328125, 130.4375, 135.546875, 140.65625, 145.765625, 150.875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 10.0, 5.0, 17.0, 13.0, 21.0, 17.0, 34.0, 29.0, 29.0, 33.0, 43.0, 39.0, 35.0, 50.0, 62.0, 52.0, 56.0, 57.0, 55.0, 54.0, 46.0, 30.0, 32.0, 34.0, 28.0, 27.0, 16.0, 15.0, 12.0, 10.0, 13.0, 7.0, 4.0, 6.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-190.375, -183.169921875, -175.96484375, -168.759765625, -161.5546875, -154.349609375, -147.14453125, -139.939453125, -132.734375, -125.529296875, -118.32421875, -111.119140625, -103.9140625, -96.708984375, -89.50390625, -82.298828125, -75.09375, -67.888671875, -60.68359375, -53.478515625, -46.2734375, -39.068359375, -31.86328125, -24.658203125, -17.453125, -10.248046875, -3.04296875, 4.162109375, 11.3671875, 18.572265625, 25.77734375, 32.982421875, 40.1875, 47.392578125, 54.59765625, 61.802734375, 69.0078125, 76.212890625, 83.41796875, 90.623046875, 97.828125, 105.033203125, 112.23828125, 119.443359375, 126.6484375, 133.853515625, 141.05859375, 148.263671875, 155.46875, 162.673828125, 169.87890625, 177.083984375, 184.2890625, 191.494140625, 198.69921875, 205.904296875, 213.109375, 220.314453125, 227.51953125, 234.724609375, 241.9296875, 249.134765625, 256.33984375, 263.544921875, 270.75]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 11.0, 14.0, 16.0, 36.0, 64.0, 163.0, 449.0, 1240.0, 4621.0, 36494.0, 915505.0, 80618.0, 6809.0, 1616.0, 525.0, 184.0, 84.0, 41.0, 24.0, 15.0, 4.0, 9.0, 1.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-209.25, -203.83203125, -198.4140625, -192.99609375, -187.578125, -182.16015625, -176.7421875, -171.32421875, -165.90625, -160.48828125, -155.0703125, -149.65234375, -144.234375, -138.81640625, -133.3984375, -127.98046875, -122.5625, -117.14453125, -111.7265625, -106.30859375, -100.890625, -95.47265625, -90.0546875, -84.63671875, -79.21875, -73.80078125, -68.3828125, -62.96484375, -57.546875, -52.12890625, -46.7109375, -41.29296875, -35.875, -30.45703125, -25.0390625, -19.62109375, -14.203125, -8.78515625, -3.3671875, 2.05078125, 7.46875, 12.88671875, 18.3046875, 23.72265625, 29.140625, 34.55859375, 39.9765625, 45.39453125, 50.8125, 56.23046875, 61.6484375, 67.06640625, 72.484375, 77.90234375, 83.3203125, 88.73828125, 94.15625, 99.57421875, 104.9921875, 110.41015625, 115.828125, 121.24609375, 126.6640625, 132.08203125, 137.5]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 9.0, 3.0, 11.0, 8.0, 9.0, 18.0, 26.0, 24.0, 36.0, 52.0, 81.0, 153.0, 151.0, 126.0, 83.0, 60.0, 39.0, 28.0, 21.0, 18.0, 10.0, 10.0, 9.0, 8.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01995849609375, -0.019141197204589844, -0.018323898315429688, -0.01750659942626953, -0.016689300537109375, -0.01587200164794922, -0.015054702758789062, -0.014237403869628906, -0.01342010498046875, -0.012602806091308594, -0.011785507202148438, -0.010968208312988281, -0.010150909423828125, -0.009333610534667969, -0.008516311645507812, -0.007699012756347656, -0.0068817138671875, -0.006064414978027344, -0.0052471160888671875, -0.004429817199707031, -0.003612518310546875, -0.0027952194213867188, -0.0019779205322265625, -0.0011606216430664062, -0.00034332275390625, 0.00047397613525390625, 0.0012912750244140625, 0.0021085739135742188, 0.002925872802734375, 0.0037431716918945312, 0.0045604705810546875, 0.005377769470214844, 0.006195068359375, 0.007012367248535156, 0.007829666137695312, 0.008646965026855469, 0.009464263916015625, 0.010281562805175781, 0.011098861694335938, 0.011916160583496094, 0.01273345947265625, 0.013550758361816406, 0.014368057250976562, 0.015185356140136719, 0.016002655029296875, 0.01681995391845703, 0.017637252807617188, 0.018454551696777344, 0.0192718505859375, 0.020089149475097656, 0.020906448364257812, 0.02172374725341797, 0.022541046142578125, 0.02335834503173828, 0.024175643920898438, 0.024992942810058594, 0.02581024169921875, 0.026627540588378906, 0.027444839477539062, 0.02826213836669922, 0.029079437255859375, 0.02989673614501953, 0.030714035034179688, 0.031531333923339844, 0.0323486328125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 7.0, 15.0, 7.0, 10.0, 23.0, 40.0, 87.0, 106.0, 255.0, 658.0, 3243.0, 46045.0, 951014.0, 42775.0, 3096.0, 648.0, 248.0, 111.0, 62.0, 38.0, 26.0, 15.0, 12.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-178.375, -171.376953125, -164.37890625, -157.380859375, -150.3828125, -143.384765625, -136.38671875, -129.388671875, -122.390625, -115.392578125, -108.39453125, -101.396484375, -94.3984375, -87.400390625, -80.40234375, -73.404296875, -66.40625, -59.408203125, -52.41015625, -45.412109375, -38.4140625, -31.416015625, -24.41796875, -17.419921875, -10.421875, -3.423828125, 3.57421875, 10.572265625, 17.5703125, 24.568359375, 31.56640625, 38.564453125, 45.5625, 52.560546875, 59.55859375, 66.556640625, 73.5546875, 80.552734375, 87.55078125, 94.548828125, 101.546875, 108.544921875, 115.54296875, 122.541015625, 129.5390625, 136.537109375, 143.53515625, 150.533203125, 157.53125, 164.529296875, 171.52734375, 178.525390625, 185.5234375, 192.521484375, 199.51953125, 206.517578125, 213.515625, 220.513671875, 227.51171875, 234.509765625, 241.5078125, 248.505859375, 255.50390625, 262.501953125, 269.5]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 9.0, 9.0, 25.0, 43.0, 110.0, 216.0, 314.0, 154.0, 59.0, 33.0, 21.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.25, -102.11328125, -94.9765625, -87.83984375, -80.703125, -73.56640625, -66.4296875, -59.29296875, -52.15625, -45.01953125, -37.8828125, -30.74609375, -23.609375, -16.47265625, -9.3359375, -2.19921875, 4.9375, 12.07421875, 19.2109375, 26.34765625, 33.484375, 40.62109375, 47.7578125, 54.89453125, 62.03125, 69.16796875, 76.3046875, 83.44140625, 90.578125, 97.71484375, 104.8515625, 111.98828125, 119.125, 126.26171875, 133.3984375, 140.53515625, 147.671875, 154.80859375, 161.9453125, 169.08203125, 176.21875, 183.35546875, 190.4921875, 197.62890625, 204.765625, 211.90234375, 219.0390625, 226.17578125, 233.3125, 240.44921875, 247.5859375, 254.72265625, 261.859375, 268.99609375, 276.1328125, 283.26953125, 290.40625, 297.54296875, 304.6796875, 311.81640625, 318.953125, 326.08984375, 333.2265625, 340.36328125, 347.5]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 26.0, 77.0, 188.0, 304.0, 244.0, 104.0, 35.0, 10.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2995.394287109375, -2897.577392578125, -2799.760498046875, -2701.943359375, -2604.12646484375, -2506.3095703125, -2408.49267578125, -2310.67578125, -2212.85888671875, -2115.0419921875, -2017.2249755859375, -1919.4080810546875, -1821.591064453125, -1723.774169921875, -1625.957275390625, -1528.140380859375, -1430.3232421875, -1332.50634765625, -1234.6893310546875, -1136.8724365234375, -1039.055419921875, -941.238525390625, -843.421630859375, -745.6046752929688, -647.7877197265625, -549.9707641601562, -452.1538391113281, -354.3369140625, -256.51995849609375, -158.7030029296875, -60.8861083984375, 36.93084716796875, 134.747802734375, 232.5647430419922, 330.3816833496094, 428.1986083984375, 526.0155639648438, 623.83251953125, 721.6494140625, 819.4663696289062, 917.2833251953125, 1015.1002807617188, 1112.917236328125, 1210.734130859375, 1308.551025390625, 1406.3680419921875, 1504.1849365234375, 1602.001953125, 1699.81884765625, 1797.6357421875, 1895.4527587890625, 1993.2696533203125, 2091.086669921875, 2188.903564453125, 2286.720458984375, 2384.537353515625, 2482.3544921875, 2580.17138671875, 2677.98828125, 2775.80517578125, 2873.622314453125, 2971.439208984375, 3069.256103515625, 3167.072998046875, 3264.889892578125]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 4.0, 8.0, 7.0, 7.0, 12.0, 9.0, 12.0, 14.0, 14.0, 15.0, 17.0, 19.0, 23.0, 26.0, 29.0, 33.0, 30.0, 39.0, 45.0, 50.0, 50.0, 39.0, 47.0, 56.0, 50.0, 47.0, 37.0, 25.0, 32.0, 25.0, 23.0, 23.0, 21.0, 14.0, 19.0, 10.0, 16.0, 9.0, 7.0, 4.0, 3.0, 1.0, 8.0, 5.0, 4.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-890.6057739257812, -863.0966796875, -835.587646484375, -808.0785522460938, -780.5695190429688, -753.0604248046875, -725.5513916015625, -698.0422973632812, -670.533203125, -643.0241088867188, -615.5150756835938, -588.0059814453125, -560.4969482421875, -532.9878540039062, -505.4787902832031, -477.9697265625, -450.460693359375, -422.9516296386719, -395.44256591796875, -367.9334716796875, -340.4244384765625, -312.91534423828125, -285.4062805175781, -257.897216796875, -230.38815307617188, -202.87908935546875, -175.37002563476562, -147.86094665527344, -120.35188293457031, -92.84281921386719, -65.333740234375, -37.824676513671875, -10.3155517578125, 17.19351577758789, 44.70258331298828, 72.21165466308594, 99.72071838378906, 127.22978210449219, 154.73886108398438, 182.2479248046875, 209.75698852539062, 237.26605224609375, 264.7751159667969, 292.2841796875, 319.79327392578125, 347.30230712890625, 374.8114013671875, 402.3204650878906, 429.82952880859375, 457.3385925292969, 484.84765625, 512.3567504882812, 539.8657836914062, 567.3748779296875, 594.8839111328125, 622.3930053710938, 649.902099609375, 677.4111938476562, 704.9202270507812, 732.4293212890625, 759.9383544921875, 787.4474487304688, 814.95654296875, 842.465576171875, 869.974609375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 8.0, 8.0, 17.0, 15.0, 15.0, 36.0, 36.0, 46.0, 55.0, 74.0, 95.0, 116.0, 218.0, 281.0, 435.0, 709.0, 1223.0, 2188.0, 4830.0, 15213.0, 4094330.0, 58181.0, 8412.0, 3318.0, 1690.0, 883.0, 569.0, 378.0, 229.0, 170.0, 115.0, 89.0, 52.0, 61.0, 43.0, 32.0, 25.0, 17.0, 15.0, 13.0, 14.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0], "bins": [-258.5, -250.3671875, -242.234375, -234.1015625, -225.96875, -217.8359375, -209.703125, -201.5703125, -193.4375, -185.3046875, -177.171875, -169.0390625, -160.90625, -152.7734375, -144.640625, -136.5078125, -128.375, -120.2421875, -112.109375, -103.9765625, -95.84375, -87.7109375, -79.578125, -71.4453125, -63.3125, -55.1796875, -47.046875, -38.9140625, -30.78125, -22.6484375, -14.515625, -6.3828125, 1.75, 9.8828125, 18.015625, 26.1484375, 34.28125, 42.4140625, 50.546875, 58.6796875, 66.8125, 74.9453125, 83.078125, 91.2109375, 99.34375, 107.4765625, 115.609375, 123.7421875, 131.875, 140.0078125, 148.140625, 156.2734375, 164.40625, 172.5390625, 180.671875, 188.8046875, 196.9375, 205.0703125, 213.203125, 221.3359375, 229.46875, 237.6015625, 245.734375, 253.8671875, 262.0]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 11.0, 5.0, 11.0, 6.0, 12.0, 14.0, 18.0, 24.0, 23.0, 37.0, 33.0, 33.0, 36.0, 44.0, 56.0, 43.0, 46.0, 50.0, 57.0, 49.0, 43.0, 32.0, 51.0, 39.0, 33.0, 43.0, 17.0, 19.0, 15.0, 18.0, 12.0, 7.0, 13.0, 9.0, 8.0, 8.0, 5.0, 3.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-47.0, -45.47607421875, -43.9521484375, -42.42822265625, -40.904296875, -39.38037109375, -37.8564453125, -36.33251953125, -34.80859375, -33.28466796875, -31.7607421875, -30.23681640625, -28.712890625, -27.18896484375, -25.6650390625, -24.14111328125, -22.6171875, -21.09326171875, -19.5693359375, -18.04541015625, -16.521484375, -14.99755859375, -13.4736328125, -11.94970703125, -10.42578125, -8.90185546875, -7.3779296875, -5.85400390625, -4.330078125, -2.80615234375, -1.2822265625, 0.24169921875, 1.765625, 3.28955078125, 4.8134765625, 6.33740234375, 7.861328125, 9.38525390625, 10.9091796875, 12.43310546875, 13.95703125, 15.48095703125, 17.0048828125, 18.52880859375, 20.052734375, 21.57666015625, 23.1005859375, 24.62451171875, 26.1484375, 27.67236328125, 29.1962890625, 30.72021484375, 32.244140625, 33.76806640625, 35.2919921875, 36.81591796875, 38.33984375, 39.86376953125, 41.3876953125, 42.91162109375, 44.435546875, 45.95947265625, 47.4833984375, 49.00732421875, 50.53125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 8.0, 11.0, 20.0, 22.0, 48.0, 49.0, 85.0, 159.0, 222.0, 423.0, 696.0, 1305.0, 2630.0, 5881.0, 19027.0, 3952864.0, 185909.0, 14756.0, 5080.0, 2264.0, 1215.0, 626.0, 370.0, 202.0, 151.0, 86.0, 62.0, 29.0, 21.0, 17.0, 10.0, 15.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-318.75, -308.76171875, -298.7734375, -288.78515625, -278.796875, -268.80859375, -258.8203125, -248.83203125, -238.84375, -228.85546875, -218.8671875, -208.87890625, -198.890625, -188.90234375, -178.9140625, -168.92578125, -158.9375, -148.94921875, -138.9609375, -128.97265625, -118.984375, -108.99609375, -99.0078125, -89.01953125, -79.03125, -69.04296875, -59.0546875, -49.06640625, -39.078125, -29.08984375, -19.1015625, -9.11328125, 0.875, 10.86328125, 20.8515625, 30.83984375, 40.828125, 50.81640625, 60.8046875, 70.79296875, 80.78125, 90.76953125, 100.7578125, 110.74609375, 120.734375, 130.72265625, 140.7109375, 150.69921875, 160.6875, 170.67578125, 180.6640625, 190.65234375, 200.640625, 210.62890625, 220.6171875, 230.60546875, 240.59375, 250.58203125, 260.5703125, 270.55859375, 280.546875, 290.53515625, 300.5234375, 310.51171875, 320.5]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 7.0, 7.0, 13.0, 23.0, 43.0, 125.0, 3644.0, 98.0, 46.0, 12.0, 12.0, 12.0, 6.0, 7.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.25, -106.37890625, -102.5078125, -98.63671875, -94.765625, -90.89453125, -87.0234375, -83.15234375, -79.28125, -75.41015625, -71.5390625, -67.66796875, -63.796875, -59.92578125, -56.0546875, -52.18359375, -48.3125, -44.44140625, -40.5703125, -36.69921875, -32.828125, -28.95703125, -25.0859375, -21.21484375, -17.34375, -13.47265625, -9.6015625, -5.73046875, -1.859375, 2.01171875, 5.8828125, 9.75390625, 13.625, 17.49609375, 21.3671875, 25.23828125, 29.109375, 32.98046875, 36.8515625, 40.72265625, 44.59375, 48.46484375, 52.3359375, 56.20703125, 60.078125, 63.94921875, 67.8203125, 71.69140625, 75.5625, 79.43359375, 83.3046875, 87.17578125, 91.046875, 94.91796875, 98.7890625, 102.66015625, 106.53125, 110.40234375, 114.2734375, 118.14453125, 122.015625, 125.88671875, 129.7578125, 133.62890625, 137.5]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 2.0, 2.0, 8.0, 4.0, 10.0, 15.0, 30.0, 42.0, 58.0, 86.0, 117.0, 136.0, 144.0, 104.0, 76.0, 46.0, 43.0, 28.0, 18.0, 5.0, 6.0, 4.0, 12.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-458.49542236328125, -444.99444580078125, -431.4934387207031, -417.9924621582031, -404.491455078125, -390.990478515625, -377.489501953125, -363.988525390625, -350.4875183105469, -336.9865417480469, -323.48553466796875, -309.98455810546875, -296.48358154296875, -282.9825744628906, -269.4815979003906, -255.98060607910156, -242.4796142578125, -228.97862243652344, -215.47763061523438, -201.97665405273438, -188.4756622314453, -174.97467041015625, -161.47369384765625, -147.9727020263672, -134.47171020507812, -120.97071838378906, -107.46973419189453, -93.96875, -80.46775817871094, -66.96676635742188, -53.465782165527344, -39.96479797363281, -26.463775634765625, -12.962787628173828, 0.5382003784179688, 14.039188385009766, 27.540176391601562, 41.041168212890625, 54.542152404785156, 68.04313659667969, 81.54412841796875, 95.04512023925781, 108.54610443115234, 122.04708862304688, 135.54808044433594, 149.049072265625, 162.550048828125, 176.05104064941406, 189.55203247070312, 203.0530242919922, 216.55401611328125, 230.05499267578125, 243.5559844970703, 257.0569763183594, 270.5579528808594, 284.0589599609375, 297.5599365234375, 311.0609130859375, 324.5619201660156, 338.0628967285156, 351.56390380859375, 365.06488037109375, 378.56585693359375, 392.06683349609375, 405.5678405761719]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 1.0, 1.0, 4.0, 6.0, 4.0, 7.0, 9.0, 9.0, 22.0, 10.0, 17.0, 20.0, 20.0, 30.0, 32.0, 28.0, 41.0, 42.0, 43.0, 47.0, 51.0, 45.0, 60.0, 55.0, 38.0, 44.0, 39.0, 33.0, 29.0, 36.0, 20.0, 22.0, 19.0, 23.0, 16.0, 16.0, 16.0, 10.0, 6.0, 6.0, 4.0, 7.0, 4.0, 4.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-227.385498046875, -220.46206665039062, -213.5386505126953, -206.61521911621094, -199.69180297851562, -192.76837158203125, -185.84494018554688, -178.9215087890625, -171.9980926513672, -165.0746612548828, -158.1512451171875, -151.22781372070312, -144.30438232421875, -137.38096618652344, -130.45753479003906, -123.53411102294922, -116.61068725585938, -109.68726348876953, -102.76383972167969, -95.84040832519531, -88.91698455810547, -81.99356079101562, -75.07012939453125, -68.1467056274414, -61.22328186035156, -54.29985809326172, -47.37643051147461, -40.4530029296875, -33.529579162597656, -26.606155395507812, -19.682727813720703, -12.759300231933594, -5.8358917236328125, 1.087533950805664, 8.01095962524414, 14.934385299682617, 21.857810974121094, 28.781234741210938, 35.70466232299805, 42.628089904785156, 49.551513671875, 56.474937438964844, 63.39836502075195, 70.32179260253906, 77.2452163696289, 84.16864013671875, 91.09207153320312, 98.01549530029297, 104.93891906738281, 111.86234283447266, 118.7857666015625, 125.70919799804688, 132.63262939453125, 139.55604553222656, 146.47947692871094, 153.40289306640625, 160.32632446289062, 167.249755859375, 174.1731719970703, 181.0966033935547, 188.02001953125, 194.94345092773438, 201.86688232421875, 208.79031372070312, 215.71372985839844]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 10.0, 11.0, 21.0, 43.0, 41.0, 73.0, 112.0, 165.0, 319.0, 468.0, 897.0, 1678.0, 3198.0, 6688.0, 14824.0, 36220.0, 98647.0, 334594.0, 372618.0, 108152.0, 39625.0, 15820.0, 7106.0, 3462.0, 1634.0, 810.0, 512.0, 275.0, 177.0, 104.0, 59.0, 52.0, 43.0, 35.0, 16.0, 13.0, 5.0, 2.0, 4.0, 8.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.125, -128.541015625, -123.95703125, -119.373046875, -114.7890625, -110.205078125, -105.62109375, -101.037109375, -96.453125, -91.869140625, -87.28515625, -82.701171875, -78.1171875, -73.533203125, -68.94921875, -64.365234375, -59.78125, -55.197265625, -50.61328125, -46.029296875, -41.4453125, -36.861328125, -32.27734375, -27.693359375, -23.109375, -18.525390625, -13.94140625, -9.357421875, -4.7734375, -0.189453125, 4.39453125, 8.978515625, 13.5625, 18.146484375, 22.73046875, 27.314453125, 31.8984375, 36.482421875, 41.06640625, 45.650390625, 50.234375, 54.818359375, 59.40234375, 63.986328125, 68.5703125, 73.154296875, 77.73828125, 82.322265625, 86.90625, 91.490234375, 96.07421875, 100.658203125, 105.2421875, 109.826171875, 114.41015625, 118.994140625, 123.578125, 128.162109375, 132.74609375, 137.330078125, 141.9140625, 146.498046875, 151.08203125, 155.666015625, 160.25]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 4.0, 4.0, 10.0, 12.0, 10.0, 14.0, 22.0, 21.0, 36.0, 31.0, 44.0, 45.0, 48.0, 47.0, 67.0, 75.0, 65.0, 55.0, 48.0, 47.0, 55.0, 38.0, 41.0, 32.0, 28.0, 14.0, 11.0, 20.0, 11.0, 11.0, 9.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.25, -63.27880859375, -61.3076171875, -59.33642578125, -57.365234375, -55.39404296875, -53.4228515625, -51.45166015625, -49.48046875, -47.50927734375, -45.5380859375, -43.56689453125, -41.595703125, -39.62451171875, -37.6533203125, -35.68212890625, -33.7109375, -31.73974609375, -29.7685546875, -27.79736328125, -25.826171875, -23.85498046875, -21.8837890625, -19.91259765625, -17.94140625, -15.97021484375, -13.9990234375, -12.02783203125, -10.056640625, -8.08544921875, -6.1142578125, -4.14306640625, -2.171875, -0.20068359375, 1.7705078125, 3.74169921875, 5.712890625, 7.68408203125, 9.6552734375, 11.62646484375, 13.59765625, 15.56884765625, 17.5400390625, 19.51123046875, 21.482421875, 23.45361328125, 25.4248046875, 27.39599609375, 29.3671875, 31.33837890625, 33.3095703125, 35.28076171875, 37.251953125, 39.22314453125, 41.1943359375, 43.16552734375, 45.13671875, 47.10791015625, 49.0791015625, 51.05029296875, 53.021484375, 54.99267578125, 56.9638671875, 58.93505859375, 60.90625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 7.0, 4.0, 3.0, 11.0, 20.0, 21.0, 40.0, 41.0, 59.0, 99.0, 110.0, 173.0, 264.0, 390.0, 590.0, 1028.0, 1847.0, 3608.0, 8797.0, 25701.0, 101468.0, 577890.0, 249482.0, 50221.0, 14922.0, 5637.0, 2519.0, 1347.0, 813.0, 460.0, 270.0, 200.0, 152.0, 92.0, 71.0, 55.0, 35.0, 30.0, 14.0, 12.0, 15.0, 11.0, 6.0, 5.0, 0.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-160.875, -155.46875, -150.0625, -144.65625, -139.25, -133.84375, -128.4375, -123.03125, -117.625, -112.21875, -106.8125, -101.40625, -96.0, -90.59375, -85.1875, -79.78125, -74.375, -68.96875, -63.5625, -58.15625, -52.75, -47.34375, -41.9375, -36.53125, -31.125, -25.71875, -20.3125, -14.90625, -9.5, -4.09375, 1.3125, 6.71875, 12.125, 17.53125, 22.9375, 28.34375, 33.75, 39.15625, 44.5625, 49.96875, 55.375, 60.78125, 66.1875, 71.59375, 77.0, 82.40625, 87.8125, 93.21875, 98.625, 104.03125, 109.4375, 114.84375, 120.25, 125.65625, 131.0625, 136.46875, 141.875, 147.28125, 152.6875, 158.09375, 163.5, 168.90625, 174.3125, 179.71875, 185.125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 2.0, 3.0, 7.0, 10.0, 13.0, 13.0, 22.0, 27.0, 28.0, 29.0, 39.0, 40.0, 48.0, 50.0, 52.0, 40.0, 45.0, 58.0, 64.0, 45.0, 52.0, 39.0, 41.0, 40.0, 38.0, 29.0, 22.0, 25.0, 16.0, 13.0, 11.0, 7.0, 9.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-198.625, -191.095703125, -183.56640625, -176.037109375, -168.5078125, -160.978515625, -153.44921875, -145.919921875, -138.390625, -130.861328125, -123.33203125, -115.802734375, -108.2734375, -100.744140625, -93.21484375, -85.685546875, -78.15625, -70.626953125, -63.09765625, -55.568359375, -48.0390625, -40.509765625, -32.98046875, -25.451171875, -17.921875, -10.392578125, -2.86328125, 4.666015625, 12.1953125, 19.724609375, 27.25390625, 34.783203125, 42.3125, 49.841796875, 57.37109375, 64.900390625, 72.4296875, 79.958984375, 87.48828125, 95.017578125, 102.546875, 110.076171875, 117.60546875, 125.134765625, 132.6640625, 140.193359375, 147.72265625, 155.251953125, 162.78125, 170.310546875, 177.83984375, 185.369140625, 192.8984375, 200.427734375, 207.95703125, 215.486328125, 223.015625, 230.544921875, 238.07421875, 245.603515625, 253.1328125, 260.662109375, 268.19140625, 275.720703125, 283.25]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 8.0, 17.0, 14.0, 23.0, 39.0, 79.0, 150.0, 380.0, 953.0, 2970.0, 11800.0, 88416.0, 769582.0, 151107.0, 17012.0, 3863.0, 1206.0, 468.0, 230.0, 91.0, 52.0, 30.0, 21.0, 11.0, 9.0, 10.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.125, -95.369140625, -92.61328125, -89.857421875, -87.1015625, -84.345703125, -81.58984375, -78.833984375, -76.078125, -73.322265625, -70.56640625, -67.810546875, -65.0546875, -62.298828125, -59.54296875, -56.787109375, -54.03125, -51.275390625, -48.51953125, -45.763671875, -43.0078125, -40.251953125, -37.49609375, -34.740234375, -31.984375, -29.228515625, -26.47265625, -23.716796875, -20.9609375, -18.205078125, -15.44921875, -12.693359375, -9.9375, -7.181640625, -4.42578125, -1.669921875, 1.0859375, 3.841796875, 6.59765625, 9.353515625, 12.109375, 14.865234375, 17.62109375, 20.376953125, 23.1328125, 25.888671875, 28.64453125, 31.400390625, 34.15625, 36.912109375, 39.66796875, 42.423828125, 45.1796875, 47.935546875, 50.69140625, 53.447265625, 56.203125, 58.958984375, 61.71484375, 64.470703125, 67.2265625, 69.982421875, 72.73828125, 75.494140625, 78.25]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 4.0, 3.0, 8.0, 13.0, 12.0, 18.0, 19.0, 34.0, 34.0, 36.0, 29.0, 45.0, 54.0, 73.0, 115.0, 81.0, 86.0, 72.0, 44.0, 40.0, 26.0, 27.0, 20.0, 14.0, 14.0, 8.0, 11.0, 14.0, 4.0, 9.0, 3.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01447296142578125, -0.01399219036102295, -0.013511419296264648, -0.013030648231506348, -0.012549877166748047, -0.012069106101989746, -0.011588335037231445, -0.011107563972473145, -0.010626792907714844, -0.010146021842956543, -0.009665250778198242, -0.009184479713439941, -0.00870370864868164, -0.00822293758392334, -0.007742166519165039, -0.007261395454406738, -0.0067806243896484375, -0.006299853324890137, -0.005819082260131836, -0.005338311195373535, -0.004857540130615234, -0.004376769065856934, -0.003895998001098633, -0.003415226936340332, -0.0029344558715820312, -0.0024536848068237305, -0.0019729137420654297, -0.001492142677307129, -0.0010113716125488281, -0.0005306005477905273, -4.982948303222656e-05, 0.0004309415817260742, 0.000911712646484375, 0.0013924837112426758, 0.0018732547760009766, 0.0023540258407592773, 0.002834796905517578, 0.003315567970275879, 0.0037963390350341797, 0.0042771100997924805, 0.004757881164550781, 0.005238652229309082, 0.005719423294067383, 0.006200194358825684, 0.006680965423583984, 0.007161736488342285, 0.007642507553100586, 0.008123278617858887, 0.008604049682617188, 0.009084820747375488, 0.009565591812133789, 0.01004636287689209, 0.01052713394165039, 0.011007905006408691, 0.011488676071166992, 0.011969447135925293, 0.012450218200683594, 0.012930989265441895, 0.013411760330200195, 0.013892531394958496, 0.014373302459716797, 0.014854073524475098, 0.015334844589233398, 0.0158156156539917, 0.01629638671875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 1.0, 9.0, 9.0, 13.0, 19.0, 24.0, 32.0, 50.0, 77.0, 131.0, 160.0, 314.0, 511.0, 932.0, 1806.0, 4027.0, 10690.0, 39369.0, 221504.0, 606561.0, 122940.0, 25362.0, 7612.0, 2988.0, 1479.0, 755.0, 410.0, 252.0, 159.0, 92.0, 71.0, 57.0, 33.0, 25.0, 20.0, 13.0, 15.0, 5.0, 4.0, 8.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-69.875, -67.84033203125, -65.8056640625, -63.77099609375, -61.736328125, -59.70166015625, -57.6669921875, -55.63232421875, -53.59765625, -51.56298828125, -49.5283203125, -47.49365234375, -45.458984375, -43.42431640625, -41.3896484375, -39.35498046875, -37.3203125, -35.28564453125, -33.2509765625, -31.21630859375, -29.181640625, -27.14697265625, -25.1123046875, -23.07763671875, -21.04296875, -19.00830078125, -16.9736328125, -14.93896484375, -12.904296875, -10.86962890625, -8.8349609375, -6.80029296875, -4.765625, -2.73095703125, -0.6962890625, 1.33837890625, 3.373046875, 5.40771484375, 7.4423828125, 9.47705078125, 11.51171875, 13.54638671875, 15.5810546875, 17.61572265625, 19.650390625, 21.68505859375, 23.7197265625, 25.75439453125, 27.7890625, 29.82373046875, 31.8583984375, 33.89306640625, 35.927734375, 37.96240234375, 39.9970703125, 42.03173828125, 44.06640625, 46.10107421875, 48.1357421875, 50.17041015625, 52.205078125, 54.23974609375, 56.2744140625, 58.30908203125, 60.34375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 8.0, 9.0, 20.0, 31.0, 42.0, 86.0, 93.0, 129.0, 178.0, 113.0, 103.0, 79.0, 34.0, 24.0, 15.0, 8.0, 3.0, 11.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.75, -114.3232421875, -110.896484375, -107.4697265625, -104.04296875, -100.6162109375, -97.189453125, -93.7626953125, -90.3359375, -86.9091796875, -83.482421875, -80.0556640625, -76.62890625, -73.2021484375, -69.775390625, -66.3486328125, -62.921875, -59.4951171875, -56.068359375, -52.6416015625, -49.21484375, -45.7880859375, -42.361328125, -38.9345703125, -35.5078125, -32.0810546875, -28.654296875, -25.2275390625, -21.80078125, -18.3740234375, -14.947265625, -11.5205078125, -8.09375, -4.6669921875, -1.240234375, 2.1865234375, 5.61328125, 9.0400390625, 12.466796875, 15.8935546875, 19.3203125, 22.7470703125, 26.173828125, 29.6005859375, 33.02734375, 36.4541015625, 39.880859375, 43.3076171875, 46.734375, 50.1611328125, 53.587890625, 57.0146484375, 60.44140625, 63.8681640625, 67.294921875, 70.7216796875, 74.1484375, 77.5751953125, 81.001953125, 84.4287109375, 87.85546875, 91.2822265625, 94.708984375, 98.1357421875, 101.5625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 5.0, 13.0, 13.0, 29.0, 49.0, 66.0, 113.0, 124.0, 161.0, 136.0, 105.0, 62.0, 37.0, 25.0, 16.0, 14.0, 8.0, 5.0, 3.0, 0.0, 4.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1657.6605224609375, -1606.6939697265625, -1555.727294921875, -1504.7607421875, -1453.794189453125, -1402.8275146484375, -1351.8609619140625, -1300.894287109375, -1249.927734375, -1198.961181640625, -1147.9945068359375, -1097.0279541015625, -1046.061279296875, -995.0947265625, -944.128173828125, -893.1615600585938, -842.1949462890625, -791.2283325195312, -740.26171875, -689.295166015625, -638.3285522460938, -587.3619384765625, -536.3953857421875, -485.42877197265625, -434.462158203125, -383.49554443359375, -332.5289611816406, -281.5623779296875, -230.59576416015625, -179.62916564941406, -128.66256713867188, -77.69598388671875, -26.7294921875, 24.237106323242188, 75.20370483398438, 126.17030334472656, 177.13690185546875, 228.10350036621094, 279.0700988769531, 330.03668212890625, 381.0032958984375, 431.96990966796875, 482.9364929199219, 533.903076171875, 584.8696899414062, 635.8363037109375, 686.8028564453125, 737.7694702148438, 788.736083984375, 839.7026977539062, 890.6693115234375, 941.6358642578125, 992.6024780273438, 1043.569091796875, 1094.53564453125, 1145.502197265625, 1196.4688720703125, 1247.4354248046875, 1298.402099609375, 1349.36865234375, 1400.335205078125, 1451.3018798828125, 1502.2684326171875, 1553.235107421875, 1604.20166015625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 4.0, 4.0, 6.0, 9.0, 12.0, 10.0, 16.0, 20.0, 25.0, 28.0, 20.0, 33.0, 34.0, 39.0, 53.0, 41.0, 47.0, 49.0, 41.0, 49.0, 39.0, 38.0, 48.0, 47.0, 28.0, 44.0, 27.0, 37.0, 20.0, 28.0, 20.0, 15.0, 13.0, 13.0, 9.0, 13.0, 9.0, 3.0, 3.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1066.38671875, -1032.3743896484375, -998.3619995117188, -964.349609375, -930.3372802734375, -896.3248901367188, -862.3125, -828.3001708984375, -794.2877807617188, -760.275390625, -726.2630615234375, -692.2506713867188, -658.23828125, -624.2259521484375, -590.2135620117188, -556.201171875, -522.1888427734375, -488.1764831542969, -454.16412353515625, -420.1517333984375, -386.1393737792969, -352.12701416015625, -318.1146240234375, -284.1022644042969, -250.08990478515625, -216.07754516601562, -182.06517028808594, -148.05279541015625, -114.04043579101562, -80.028076171875, -46.01570129394531, -12.003326416015625, 22.0089111328125, 56.021278381347656, 90.03364562988281, 124.04601287841797, 158.05838012695312, 192.07073974609375, 226.08311462402344, 260.0954895019531, 294.10784912109375, 328.1202087402344, 362.132568359375, 396.14495849609375, 430.1573181152344, 464.169677734375, 498.18206787109375, 532.1944580078125, 566.206787109375, 600.2191772460938, 634.2315063476562, 668.243896484375, 702.2562255859375, 736.2686157226562, 770.281005859375, 804.2933349609375, 838.3057250976562, 872.318115234375, 906.3304443359375, 940.3428344726562, 974.355224609375, 1008.3675537109375, 1042.3798828125, 1076.392333984375, 1110.4046630859375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 8.0, 7.0, 6.0, 18.0, 14.0, 36.0, 20.0, 38.0, 56.0, 81.0, 112.0, 190.0, 344.0, 505.0, 802.0, 1448.0, 2357.0, 4321.0, 8306.0, 18402.0, 53158.0, 451295.0, 3372747.0, 210470.0, 39314.0, 14818.0, 6843.0, 3548.0, 1950.0, 1148.0, 707.0, 408.0, 256.0, 162.0, 129.0, 72.0, 46.0, 39.0, 25.0, 22.0, 15.0, 11.0, 12.0, 10.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.0, -120.744140625, -116.48828125, -112.232421875, -107.9765625, -103.720703125, -99.46484375, -95.208984375, -90.953125, -86.697265625, -82.44140625, -78.185546875, -73.9296875, -69.673828125, -65.41796875, -61.162109375, -56.90625, -52.650390625, -48.39453125, -44.138671875, -39.8828125, -35.626953125, -31.37109375, -27.115234375, -22.859375, -18.603515625, -14.34765625, -10.091796875, -5.8359375, -1.580078125, 2.67578125, 6.931640625, 11.1875, 15.443359375, 19.69921875, 23.955078125, 28.2109375, 32.466796875, 36.72265625, 40.978515625, 45.234375, 49.490234375, 53.74609375, 58.001953125, 62.2578125, 66.513671875, 70.76953125, 75.025390625, 79.28125, 83.537109375, 87.79296875, 92.048828125, 96.3046875, 100.560546875, 104.81640625, 109.072265625, 113.328125, 117.583984375, 121.83984375, 126.095703125, 130.3515625, 134.607421875, 138.86328125, 143.119140625, 147.375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 7.0, 10.0, 9.0, 15.0, 14.0, 16.0, 22.0, 33.0, 24.0, 36.0, 24.0, 27.0, 42.0, 44.0, 54.0, 55.0, 52.0, 50.0, 44.0, 50.0, 32.0, 33.0, 41.0, 50.0, 31.0, 32.0, 24.0, 17.0, 20.0, 13.0, 19.0, 16.0, 4.0, 7.0, 9.0, 7.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.21875, -47.68359375, -46.1484375, -44.61328125, -43.078125, -41.54296875, -40.0078125, -38.47265625, -36.9375, -35.40234375, -33.8671875, -32.33203125, -30.796875, -29.26171875, -27.7265625, -26.19140625, -24.65625, -23.12109375, -21.5859375, -20.05078125, -18.515625, -16.98046875, -15.4453125, -13.91015625, -12.375, -10.83984375, -9.3046875, -7.76953125, -6.234375, -4.69921875, -3.1640625, -1.62890625, -0.09375, 1.44140625, 2.9765625, 4.51171875, 6.046875, 7.58203125, 9.1171875, 10.65234375, 12.1875, 13.72265625, 15.2578125, 16.79296875, 18.328125, 19.86328125, 21.3984375, 22.93359375, 24.46875, 26.00390625, 27.5390625, 29.07421875, 30.609375, 32.14453125, 33.6796875, 35.21484375, 36.75, 38.28515625, 39.8203125, 41.35546875, 42.890625, 44.42578125, 45.9609375, 47.49609375, 49.03125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 16.0, 11.0, 21.0, 28.0, 38.0, 55.0, 73.0, 118.0, 206.0, 356.0, 710.0, 1394.0, 3027.0, 6668.0, 16900.0, 52043.0, 277419.0, 3492503.0, 263150.0, 50845.0, 16558.0, 6534.0, 2712.0, 1365.0, 625.0, 348.0, 216.0, 111.0, 65.0, 50.0, 34.0, 21.0, 17.0, 14.0, 9.0, 8.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-174.375, -169.0078125, -163.640625, -158.2734375, -152.90625, -147.5390625, -142.171875, -136.8046875, -131.4375, -126.0703125, -120.703125, -115.3359375, -109.96875, -104.6015625, -99.234375, -93.8671875, -88.5, -83.1328125, -77.765625, -72.3984375, -67.03125, -61.6640625, -56.296875, -50.9296875, -45.5625, -40.1953125, -34.828125, -29.4609375, -24.09375, -18.7265625, -13.359375, -7.9921875, -2.625, 2.7421875, 8.109375, 13.4765625, 18.84375, 24.2109375, 29.578125, 34.9453125, 40.3125, 45.6796875, 51.046875, 56.4140625, 61.78125, 67.1484375, 72.515625, 77.8828125, 83.25, 88.6171875, 93.984375, 99.3515625, 104.71875, 110.0859375, 115.453125, 120.8203125, 126.1875, 131.5546875, 136.921875, 142.2890625, 147.65625, 153.0234375, 158.390625, 163.7578125, 169.125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 11.0, 4.0, 4.0, 9.0, 11.0, 9.0, 16.0, 18.0, 18.0, 19.0, 30.0, 58.0, 67.0, 83.0, 171.0, 370.0, 953.0, 1060.0, 478.0, 236.0, 134.0, 74.0, 54.0, 48.0, 25.0, 25.0, 25.0, 14.0, 7.0, 5.0, 5.0, 4.0, 7.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-194.5, -189.1328125, -183.765625, -178.3984375, -173.03125, -167.6640625, -162.296875, -156.9296875, -151.5625, -146.1953125, -140.828125, -135.4609375, -130.09375, -124.7265625, -119.359375, -113.9921875, -108.625, -103.2578125, -97.890625, -92.5234375, -87.15625, -81.7890625, -76.421875, -71.0546875, -65.6875, -60.3203125, -54.953125, -49.5859375, -44.21875, -38.8515625, -33.484375, -28.1171875, -22.75, -17.3828125, -12.015625, -6.6484375, -1.28125, 4.0859375, 9.453125, 14.8203125, 20.1875, 25.5546875, 30.921875, 36.2890625, 41.65625, 47.0234375, 52.390625, 57.7578125, 63.125, 68.4921875, 73.859375, 79.2265625, 84.59375, 89.9609375, 95.328125, 100.6953125, 106.0625, 111.4296875, 116.796875, 122.1640625, 127.53125, 132.8984375, 138.265625, 143.6328125, 149.0]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 9.0, 14.0, 30.0, 78.0, 190.0, 284.0, 237.0, 84.0, 37.0, 21.0, 4.0, 3.0, 3.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2384.1220703125, -2290.970458984375, -2197.818603515625, -2104.6669921875, -2011.51513671875, -1918.363525390625, -1825.2117919921875, -1732.06005859375, -1638.9083251953125, -1545.756591796875, -1452.6048583984375, -1359.453125, -1266.301513671875, -1173.149658203125, -1079.998046875, -986.8463134765625, -893.694580078125, -800.5428466796875, -707.39111328125, -614.2394409179688, -521.0877075195312, -427.93597412109375, -334.7843017578125, -241.632568359375, -148.4808349609375, -55.32911682128906, 37.822601318359375, 130.97430419921875, 224.12603759765625, 317.27777099609375, 410.429443359375, 503.5811767578125, 596.73291015625, 689.8846435546875, 783.036376953125, 876.1880493164062, 969.3397827148438, 1062.491455078125, 1155.6431884765625, 1248.794921875, 1341.9466552734375, 1435.098388671875, 1528.2501220703125, 1621.40185546875, 1714.553466796875, 1807.705322265625, 1900.85693359375, 1994.0086669921875, 2087.160400390625, 2180.31201171875, 2273.4638671875, 2366.615478515625, 2459.767333984375, 2552.9189453125, 2646.07080078125, 2739.222412109375, 2832.3740234375, 2925.525634765625, 3018.677490234375, 3111.8291015625, 3204.98095703125, 3298.132568359375, 3391.2841796875, 3484.43603515625, 3577.587890625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 6.0, 10.0, 9.0, 8.0, 12.0, 13.0, 15.0, 12.0, 16.0, 26.0, 23.0, 28.0, 28.0, 38.0, 30.0, 27.0, 37.0, 43.0, 44.0, 49.0, 31.0, 42.0, 30.0, 36.0, 36.0, 46.0, 35.0, 39.0, 29.0, 23.0, 12.0, 21.0, 17.0, 17.0, 16.0, 17.0, 7.0, 7.0, 11.0, 4.0, 7.0, 5.0, 9.0, 9.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-557.974853515625, -538.8375854492188, -519.7003784179688, -500.5631103515625, -481.4258728027344, -462.28863525390625, -443.1513671875, -424.0141296386719, -404.87689208984375, -385.7396545410156, -366.6024169921875, -347.46514892578125, -328.3279113769531, -309.190673828125, -290.05340576171875, -270.9161682128906, -251.7789306640625, -232.64169311523438, -213.5044403076172, -194.3671875, -175.22994995117188, -156.09271240234375, -136.95545959472656, -117.81820678710938, -98.68096923828125, -79.5437240600586, -60.40647888183594, -41.26923370361328, -22.131988525390625, -2.9947433471679688, 16.142501831054688, 35.279754638671875, 54.4169921875, 73.55423736572266, 92.69148254394531, 111.82872772216797, 130.96597290039062, 150.10321044921875, 169.24046325683594, 188.37771606445312, 207.51495361328125, 226.65219116210938, 245.78944396972656, 264.92669677734375, 284.0639343261719, 303.201171875, 322.33843994140625, 341.4756774902344, 360.6129150390625, 379.7501525878906, 398.88739013671875, 418.024658203125, 437.1618957519531, 456.29913330078125, 475.4364013671875, 494.5736389160156, 513.7108764648438, 532.84814453125, 551.9853515625, 571.1226196289062, 590.2598876953125, 609.3970947265625, 628.5343627929688, 647.671630859375, 666.808837890625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 5.0, 17.0, 18.0, 30.0, 28.0, 59.0, 84.0, 110.0, 159.0, 221.0, 360.0, 564.0, 839.0, 1230.0, 1988.0, 3156.0, 5460.0, 9110.0, 16596.0, 32566.0, 68115.0, 161287.0, 357832.0, 214596.0, 86745.0, 39651.0, 20294.0, 10987.0, 6175.0, 3746.0, 2263.0, 1456.0, 944.0, 613.0, 405.0, 301.0, 183.0, 132.0, 74.0, 44.0, 39.0, 23.0, 16.0, 11.0, 7.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.3125, -101.0166015625, -97.720703125, -94.4248046875, -91.12890625, -87.8330078125, -84.537109375, -81.2412109375, -77.9453125, -74.6494140625, -71.353515625, -68.0576171875, -64.76171875, -61.4658203125, -58.169921875, -54.8740234375, -51.578125, -48.2822265625, -44.986328125, -41.6904296875, -38.39453125, -35.0986328125, -31.802734375, -28.5068359375, -25.2109375, -21.9150390625, -18.619140625, -15.3232421875, -12.02734375, -8.7314453125, -5.435546875, -2.1396484375, 1.15625, 4.4521484375, 7.748046875, 11.0439453125, 14.33984375, 17.6357421875, 20.931640625, 24.2275390625, 27.5234375, 30.8193359375, 34.115234375, 37.4111328125, 40.70703125, 44.0029296875, 47.298828125, 50.5947265625, 53.890625, 57.1865234375, 60.482421875, 63.7783203125, 67.07421875, 70.3701171875, 73.666015625, 76.9619140625, 80.2578125, 83.5537109375, 86.849609375, 90.1455078125, 93.44140625, 96.7373046875, 100.033203125, 103.3291015625, 106.625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 4.0, 6.0, 6.0, 6.0, 9.0, 9.0, 11.0, 14.0, 16.0, 12.0, 18.0, 24.0, 25.0, 28.0, 33.0, 27.0, 36.0, 40.0, 45.0, 34.0, 34.0, 53.0, 62.0, 37.0, 43.0, 36.0, 36.0, 44.0, 27.0, 32.0, 28.0, 26.0, 17.0, 20.0, 16.0, 19.0, 10.0, 16.0, 6.0, 7.0, 3.0, 6.0, 1.0, 4.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-42.03125, -40.61279296875, -39.1943359375, -37.77587890625, -36.357421875, -34.93896484375, -33.5205078125, -32.10205078125, -30.68359375, -29.26513671875, -27.8466796875, -26.42822265625, -25.009765625, -23.59130859375, -22.1728515625, -20.75439453125, -19.3359375, -17.91748046875, -16.4990234375, -15.08056640625, -13.662109375, -12.24365234375, -10.8251953125, -9.40673828125, -7.98828125, -6.56982421875, -5.1513671875, -3.73291015625, -2.314453125, -0.89599609375, 0.5224609375, 1.94091796875, 3.359375, 4.77783203125, 6.1962890625, 7.61474609375, 9.033203125, 10.45166015625, 11.8701171875, 13.28857421875, 14.70703125, 16.12548828125, 17.5439453125, 18.96240234375, 20.380859375, 21.79931640625, 23.2177734375, 24.63623046875, 26.0546875, 27.47314453125, 28.8916015625, 30.31005859375, 31.728515625, 33.14697265625, 34.5654296875, 35.98388671875, 37.40234375, 38.82080078125, 40.2392578125, 41.65771484375, 43.076171875, 44.49462890625, 45.9130859375, 47.33154296875, 48.75]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 11.0, 17.0, 24.0, 20.0, 44.0, 56.0, 90.0, 110.0, 219.0, 320.0, 569.0, 1005.0, 2190.0, 5506.0, 19753.0, 132081.0, 765317.0, 96064.0, 16237.0, 4687.0, 1963.0, 915.0, 495.0, 299.0, 171.0, 124.0, 83.0, 56.0, 35.0, 26.0, 19.0, 12.0, 8.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-270.25, -262.166015625, -254.08203125, -245.998046875, -237.9140625, -229.830078125, -221.74609375, -213.662109375, -205.578125, -197.494140625, -189.41015625, -181.326171875, -173.2421875, -165.158203125, -157.07421875, -148.990234375, -140.90625, -132.822265625, -124.73828125, -116.654296875, -108.5703125, -100.486328125, -92.40234375, -84.318359375, -76.234375, -68.150390625, -60.06640625, -51.982421875, -43.8984375, -35.814453125, -27.73046875, -19.646484375, -11.5625, -3.478515625, 4.60546875, 12.689453125, 20.7734375, 28.857421875, 36.94140625, 45.025390625, 53.109375, 61.193359375, 69.27734375, 77.361328125, 85.4453125, 93.529296875, 101.61328125, 109.697265625, 117.78125, 125.865234375, 133.94921875, 142.033203125, 150.1171875, 158.201171875, 166.28515625, 174.369140625, 182.453125, 190.537109375, 198.62109375, 206.705078125, 214.7890625, 222.873046875, 230.95703125, 239.041015625, 247.125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 5.0, 13.0, 6.0, 13.0, 14.0, 25.0, 25.0, 34.0, 39.0, 30.0, 46.0, 62.0, 44.0, 46.0, 49.0, 64.0, 69.0, 59.0, 58.0, 49.0, 40.0, 40.0, 23.0, 31.0, 28.0, 20.0, 17.0, 20.0, 5.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.5, -227.9921875, -219.484375, -210.9765625, -202.46875, -193.9609375, -185.453125, -176.9453125, -168.4375, -159.9296875, -151.421875, -142.9140625, -134.40625, -125.8984375, -117.390625, -108.8828125, -100.375, -91.8671875, -83.359375, -74.8515625, -66.34375, -57.8359375, -49.328125, -40.8203125, -32.3125, -23.8046875, -15.296875, -6.7890625, 1.71875, 10.2265625, 18.734375, 27.2421875, 35.75, 44.2578125, 52.765625, 61.2734375, 69.78125, 78.2890625, 86.796875, 95.3046875, 103.8125, 112.3203125, 120.828125, 129.3359375, 137.84375, 146.3515625, 154.859375, 163.3671875, 171.875, 180.3828125, 188.890625, 197.3984375, 205.90625, 214.4140625, 222.921875, 231.4296875, 239.9375, 248.4453125, 256.953125, 265.4609375, 273.96875, 282.4765625, 290.984375, 299.4921875, 308.0]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 8.0, 7.0, 10.0, 19.0, 18.0, 31.0, 40.0, 87.0, 141.0, 284.0, 609.0, 1572.0, 4842.0, 23406.0, 442921.0, 541631.0, 24884.0, 5148.0, 1632.0, 605.0, 295.0, 157.0, 76.0, 37.0, 32.0, 23.0, 12.0, 8.0, 9.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.125, -132.556640625, -127.98828125, -123.419921875, -118.8515625, -114.283203125, -109.71484375, -105.146484375, -100.578125, -96.009765625, -91.44140625, -86.873046875, -82.3046875, -77.736328125, -73.16796875, -68.599609375, -64.03125, -59.462890625, -54.89453125, -50.326171875, -45.7578125, -41.189453125, -36.62109375, -32.052734375, -27.484375, -22.916015625, -18.34765625, -13.779296875, -9.2109375, -4.642578125, -0.07421875, 4.494140625, 9.0625, 13.630859375, 18.19921875, 22.767578125, 27.3359375, 31.904296875, 36.47265625, 41.041015625, 45.609375, 50.177734375, 54.74609375, 59.314453125, 63.8828125, 68.451171875, 73.01953125, 77.587890625, 82.15625, 86.724609375, 91.29296875, 95.861328125, 100.4296875, 104.998046875, 109.56640625, 114.134765625, 118.703125, 123.271484375, 127.83984375, 132.408203125, 136.9765625, 141.544921875, 146.11328125, 150.681640625, 155.25]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 3.0, 6.0, 5.0, 21.0, 25.0, 46.0, 68.0, 105.0, 182.0, 191.0, 132.0, 85.0, 39.0, 30.0, 20.0, 10.0, 7.0, 4.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0301513671875, -0.028729915618896484, -0.02730846405029297, -0.025887012481689453, -0.024465560913085938, -0.023044109344482422, -0.021622657775878906, -0.02020120620727539, -0.018779754638671875, -0.01735830307006836, -0.015936851501464844, -0.014515399932861328, -0.013093948364257812, -0.011672496795654297, -0.010251045227050781, -0.008829593658447266, -0.00740814208984375, -0.005986690521240234, -0.004565238952636719, -0.003143787384033203, -0.0017223358154296875, -0.0003008842468261719, 0.0011205673217773438, 0.0025420188903808594, 0.003963470458984375, 0.005384922027587891, 0.006806373596191406, 0.008227825164794922, 0.009649276733398438, 0.011070728302001953, 0.012492179870605469, 0.013913631439208984, 0.0153350830078125, 0.016756534576416016, 0.01817798614501953, 0.019599437713623047, 0.021020889282226562, 0.022442340850830078, 0.023863792419433594, 0.02528524398803711, 0.026706695556640625, 0.02812814712524414, 0.029549598693847656, 0.030971050262451172, 0.03239250183105469, 0.0338139533996582, 0.03523540496826172, 0.036656856536865234, 0.03807830810546875, 0.039499759674072266, 0.04092121124267578, 0.0423426628112793, 0.04376411437988281, 0.04518556594848633, 0.046607017517089844, 0.04802846908569336, 0.049449920654296875, 0.05087137222290039, 0.052292823791503906, 0.05371427536010742, 0.05513572692871094, 0.05655717849731445, 0.05797863006591797, 0.059400081634521484, 0.060821533203125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 10.0, 21.0, 19.0, 29.0, 50.0, 70.0, 109.0, 179.0, 323.0, 643.0, 1464.0, 3709.0, 13035.0, 79852.0, 758144.0, 161857.0, 20291.0, 5145.0, 1840.0, 824.0, 383.0, 208.0, 123.0, 77.0, 47.0, 23.0, 13.0, 16.0, 14.0, 13.0, 9.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-103.8125, -100.4248046875, -97.037109375, -93.6494140625, -90.26171875, -86.8740234375, -83.486328125, -80.0986328125, -76.7109375, -73.3232421875, -69.935546875, -66.5478515625, -63.16015625, -59.7724609375, -56.384765625, -52.9970703125, -49.609375, -46.2216796875, -42.833984375, -39.4462890625, -36.05859375, -32.6708984375, -29.283203125, -25.8955078125, -22.5078125, -19.1201171875, -15.732421875, -12.3447265625, -8.95703125, -5.5693359375, -2.181640625, 1.2060546875, 4.59375, 7.9814453125, 11.369140625, 14.7568359375, 18.14453125, 21.5322265625, 24.919921875, 28.3076171875, 31.6953125, 35.0830078125, 38.470703125, 41.8583984375, 45.24609375, 48.6337890625, 52.021484375, 55.4091796875, 58.796875, 62.1845703125, 65.572265625, 68.9599609375, 72.34765625, 75.7353515625, 79.123046875, 82.5107421875, 85.8984375, 89.2861328125, 92.673828125, 96.0615234375, 99.44921875, 102.8369140625, 106.224609375, 109.6123046875, 113.0]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 7.0, 6.0, 11.0, 10.0, 15.0, 18.0, 21.0, 53.0, 54.0, 80.0, 71.0, 128.0, 99.0, 101.0, 82.0, 62.0, 38.0, 35.0, 24.0, 17.0, 10.0, 17.0, 7.0, 7.0, 10.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-105.3125, -102.490234375, -99.66796875, -96.845703125, -94.0234375, -91.201171875, -88.37890625, -85.556640625, -82.734375, -79.912109375, -77.08984375, -74.267578125, -71.4453125, -68.623046875, -65.80078125, -62.978515625, -60.15625, -57.333984375, -54.51171875, -51.689453125, -48.8671875, -46.044921875, -43.22265625, -40.400390625, -37.578125, -34.755859375, -31.93359375, -29.111328125, -26.2890625, -23.466796875, -20.64453125, -17.822265625, -15.0, -12.177734375, -9.35546875, -6.533203125, -3.7109375, -0.888671875, 1.93359375, 4.755859375, 7.578125, 10.400390625, 13.22265625, 16.044921875, 18.8671875, 21.689453125, 24.51171875, 27.333984375, 30.15625, 32.978515625, 35.80078125, 38.623046875, 41.4453125, 44.267578125, 47.08984375, 49.912109375, 52.734375, 55.556640625, 58.37890625, 61.201171875, 64.0234375, 66.845703125, 69.66796875, 72.490234375, 75.3125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 6.0, 7.0, 11.0, 19.0, 32.0, 52.0, 98.0, 144.0, 179.0, 137.0, 102.0, 73.0, 62.0, 28.0, 15.0, 6.0, 10.0, 3.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-938.35693359375, -884.2062377929688, -830.0555419921875, -775.9049072265625, -721.754150390625, -667.603515625, -613.4528198242188, -559.3021240234375, -505.15142822265625, -451.000732421875, -396.85003662109375, -342.6993713378906, -288.5486755371094, -234.39797973632812, -180.247314453125, -126.09661865234375, -71.9459228515625, -17.79523468017578, 36.35545349121094, 90.50613403320312, 144.65682983398438, 198.80752563476562, 252.95819091796875, 307.10888671875, 361.25958251953125, 415.4102783203125, 469.56097412109375, 523.711669921875, 577.8623046875, 632.0130615234375, 686.1636962890625, 740.3143920898438, 794.465087890625, 848.6157836914062, 902.7664794921875, 956.9171142578125, 1011.06787109375, 1065.218505859375, 1119.369140625, 1173.5198974609375, 1227.670654296875, 1281.8212890625, 1335.9720458984375, 1390.1226806640625, 1444.2734375, 1498.424072265625, 1552.57470703125, 1606.7254638671875, 1660.8760986328125, 1715.0267333984375, 1769.177490234375, 1823.328125, 1877.4788818359375, 1931.6295166015625, 1985.7802734375, 2039.930908203125, 2094.08154296875, 2148.232177734375, 2202.3828125, 2256.53369140625, 2310.684326171875, 2364.8349609375, 2418.985595703125, 2473.13623046875, 2527.287109375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 11.0, 7.0, 14.0, 11.0, 24.0, 27.0, 31.0, 29.0, 32.0, 28.0, 34.0, 44.0, 39.0, 49.0, 55.0, 35.0, 52.0, 41.0, 51.0, 45.0, 56.0, 36.0, 31.0, 20.0, 28.0, 29.0, 21.0, 16.0, 11.0, 9.0, 9.0, 13.0, 1.0, 8.0, 5.0, 7.0, 5.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-763.8731689453125, -736.0970458984375, -708.3209228515625, -680.5447998046875, -652.7686767578125, -624.9925537109375, -597.2164306640625, -569.4403076171875, -541.6641845703125, -513.8880615234375, -486.1119384765625, -458.3358154296875, -430.5596923828125, -402.7835693359375, -375.0074768066406, -347.2313537597656, -319.45526123046875, -291.67913818359375, -263.90301513671875, -236.1269073486328, -208.3507843017578, -180.5746612548828, -152.79855346679688, -125.02243041992188, -97.24630737304688, -69.47018432617188, -41.694068908691406, -13.917953491210938, 13.858169555664062, 41.63429260253906, 69.410400390625, 97.1865234375, 124.96258544921875, 152.73870849609375, 180.51483154296875, 208.2909393310547, 236.0670623779297, 263.84320068359375, 291.6192932128906, 319.3954162597656, 347.1715393066406, 374.9476623535156, 402.7237854003906, 430.4998779296875, 458.2760009765625, 486.0521240234375, 513.8282470703125, 541.6043701171875, 569.3804931640625, 597.1566162109375, 624.9327392578125, 652.7088623046875, 680.4849853515625, 708.2611083984375, 736.0372314453125, 763.8133544921875, 791.5894775390625, 819.3656005859375, 847.1417236328125, 874.9178466796875, 902.6939697265625, 930.4700927734375, 958.2462158203125, 986.0223388671875, 1013.7984008789062]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 6.0, 7.0, 9.0, 18.0, 21.0, 36.0, 52.0, 88.0, 174.0, 524.0, 3412.0, 61314.0, 4090829.0, 34984.0, 2101.0, 380.0, 133.0, 58.0, 40.0, 22.0, 27.0, 10.0, 13.0, 5.0, 5.0, 11.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-277.25, -263.67578125, -250.1015625, -236.52734375, -222.953125, -209.37890625, -195.8046875, -182.23046875, -168.65625, -155.08203125, -141.5078125, -127.93359375, -114.359375, -100.78515625, -87.2109375, -73.63671875, -60.0625, -46.48828125, -32.9140625, -19.33984375, -5.765625, 7.80859375, 21.3828125, 34.95703125, 48.53125, 62.10546875, 75.6796875, 89.25390625, 102.828125, 116.40234375, 129.9765625, 143.55078125, 157.125, 170.69921875, 184.2734375, 197.84765625, 211.421875, 224.99609375, 238.5703125, 252.14453125, 265.71875, 279.29296875, 292.8671875, 306.44140625, 320.015625, 333.58984375, 347.1640625, 360.73828125, 374.3125, 387.88671875, 401.4609375, 415.03515625, 428.609375, 442.18359375, 455.7578125, 469.33203125, 482.90625, 496.48046875, 510.0546875, 523.62890625, 537.203125, 550.77734375, 564.3515625, 577.92578125, 591.5]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 4.0, 10.0, 6.0, 9.0, 7.0, 6.0, 13.0, 16.0, 9.0, 16.0, 20.0, 26.0, 21.0, 23.0, 32.0, 39.0, 31.0, 25.0, 37.0, 36.0, 39.0, 54.0, 43.0, 40.0, 36.0, 37.0, 53.0, 42.0, 35.0, 33.0, 22.0, 27.0, 26.0, 28.0, 11.0, 21.0, 11.0, 5.0, 10.0, 5.0, 7.0, 4.0, 5.0, 3.0, 5.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-42.71875, -41.41943359375, -40.1201171875, -38.82080078125, -37.521484375, -36.22216796875, -34.9228515625, -33.62353515625, -32.32421875, -31.02490234375, -29.7255859375, -28.42626953125, -27.126953125, -25.82763671875, -24.5283203125, -23.22900390625, -21.9296875, -20.63037109375, -19.3310546875, -18.03173828125, -16.732421875, -15.43310546875, -14.1337890625, -12.83447265625, -11.53515625, -10.23583984375, -8.9365234375, -7.63720703125, -6.337890625, -5.03857421875, -3.7392578125, -2.43994140625, -1.140625, 0.15869140625, 1.4580078125, 2.75732421875, 4.056640625, 5.35595703125, 6.6552734375, 7.95458984375, 9.25390625, 10.55322265625, 11.8525390625, 13.15185546875, 14.451171875, 15.75048828125, 17.0498046875, 18.34912109375, 19.6484375, 20.94775390625, 22.2470703125, 23.54638671875, 24.845703125, 26.14501953125, 27.4443359375, 28.74365234375, 30.04296875, 31.34228515625, 32.6416015625, 33.94091796875, 35.240234375, 36.53955078125, 37.8388671875, 39.13818359375, 40.4375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 0.0, 6.0, 8.0, 10.0, 27.0, 20.0, 33.0, 39.0, 63.0, 102.0, 147.0, 245.0, 376.0, 665.0, 1166.0, 2217.0, 4285.0, 9233.0, 21702.0, 60860.0, 299699.0, 3234669.0, 438710.0, 74071.0, 25149.0, 10453.0, 4735.0, 2472.0, 1295.0, 699.0, 420.0, 236.0, 160.0, 101.0, 57.0, 52.0, 22.0, 22.0, 19.0, 9.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-149.375, -144.7890625, -140.203125, -135.6171875, -131.03125, -126.4453125, -121.859375, -117.2734375, -112.6875, -108.1015625, -103.515625, -98.9296875, -94.34375, -89.7578125, -85.171875, -80.5859375, -76.0, -71.4140625, -66.828125, -62.2421875, -57.65625, -53.0703125, -48.484375, -43.8984375, -39.3125, -34.7265625, -30.140625, -25.5546875, -20.96875, -16.3828125, -11.796875, -7.2109375, -2.625, 1.9609375, 6.546875, 11.1328125, 15.71875, 20.3046875, 24.890625, 29.4765625, 34.0625, 38.6484375, 43.234375, 47.8203125, 52.40625, 56.9921875, 61.578125, 66.1640625, 70.75, 75.3359375, 79.921875, 84.5078125, 89.09375, 93.6796875, 98.265625, 102.8515625, 107.4375, 112.0234375, 116.609375, 121.1953125, 125.78125, 130.3671875, 134.953125, 139.5390625, 144.125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 4.0, 6.0, 5.0, 11.0, 18.0, 22.0, 22.0, 41.0, 32.0, 54.0, 83.0, 167.0, 363.0, 768.0, 1135.0, 614.0, 249.0, 154.0, 80.0, 53.0, 44.0, 32.0, 21.0, 24.0, 11.0, 9.0, 12.0, 9.0, 5.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-208.0, -202.26953125, -196.5390625, -190.80859375, -185.078125, -179.34765625, -173.6171875, -167.88671875, -162.15625, -156.42578125, -150.6953125, -144.96484375, -139.234375, -133.50390625, -127.7734375, -122.04296875, -116.3125, -110.58203125, -104.8515625, -99.12109375, -93.390625, -87.66015625, -81.9296875, -76.19921875, -70.46875, -64.73828125, -59.0078125, -53.27734375, -47.546875, -41.81640625, -36.0859375, -30.35546875, -24.625, -18.89453125, -13.1640625, -7.43359375, -1.703125, 4.02734375, 9.7578125, 15.48828125, 21.21875, 26.94921875, 32.6796875, 38.41015625, 44.140625, 49.87109375, 55.6015625, 61.33203125, 67.0625, 72.79296875, 78.5234375, 84.25390625, 89.984375, 95.71484375, 101.4453125, 107.17578125, 112.90625, 118.63671875, 124.3671875, 130.09765625, 135.828125, 141.55859375, 147.2890625, 153.01953125, 158.75]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 7.0, 9.0, 19.0, 46.0, 82.0, 167.0, 199.0, 205.0, 106.0, 66.0, 28.0, 20.0, 13.0, 7.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1288.7979736328125, -1225.997802734375, -1163.1976318359375, -1100.3974609375, -1037.597412109375, -974.7972412109375, -911.9970703125, -849.1968994140625, -786.3967895507812, -723.5966186523438, -660.7965087890625, -597.996337890625, -535.1961669921875, -472.39605712890625, -409.59588623046875, -346.7957458496094, -283.99560546875, -221.19546508789062, -158.3953094482422, -95.59515380859375, -32.795013427734375, 30.005126953125, 92.8052978515625, 155.60543823242188, 218.40557861328125, 281.2057189941406, 344.005859375, 406.8060302734375, 469.6061706542969, 532.4063110351562, 595.2064819335938, 658.006591796875, 720.806640625, 783.6068115234375, 846.4069213867188, 909.2070922851562, 972.0072021484375, 1034.807373046875, 1097.6075439453125, 1160.40771484375, 1223.207763671875, 1286.0079345703125, 1348.80810546875, 1411.608154296875, 1474.4083251953125, 1537.20849609375, 1600.0086669921875, 1662.808837890625, 1725.6090087890625, 1788.4091796875, 1851.2093505859375, 1914.009521484375, 1976.8095703125, 2039.6097412109375, 2102.409912109375, 2165.2099609375, 2228.01025390625, 2290.810302734375, 2353.610595703125, 2416.41064453125, 2479.2109375, 2542.010986328125, 2604.81103515625, 2667.611328125, 2730.411376953125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 3.0, 4.0, 4.0, 7.0, 4.0, 8.0, 15.0, 12.0, 21.0, 17.0, 25.0, 33.0, 25.0, 39.0, 38.0, 41.0, 32.0, 44.0, 51.0, 44.0, 55.0, 60.0, 55.0, 40.0, 46.0, 23.0, 34.0, 34.0, 29.0, 24.0, 34.0, 15.0, 21.0, 18.0, 9.0, 8.0, 7.0, 7.0, 9.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-759.8634033203125, -734.7206420898438, -709.577880859375, -684.4351196289062, -659.2923583984375, -634.1495971679688, -609.0068359375, -583.8640747070312, -558.7213134765625, -533.5785522460938, -508.435791015625, -483.29302978515625, -458.1502685546875, -433.00750732421875, -407.86474609375, -382.72198486328125, -357.5792236328125, -332.43646240234375, -307.293701171875, -282.15093994140625, -257.0081787109375, -231.86541748046875, -206.72265625, -181.57989501953125, -156.4371337890625, -131.29437255859375, -106.151611328125, -81.00885009765625, -55.8660888671875, -30.72332763671875, -5.58056640625, 19.56219482421875, 44.7049560546875, 69.84771728515625, 94.990478515625, 120.13323974609375, 145.2760009765625, 170.41876220703125, 195.5615234375, 220.70428466796875, 245.8470458984375, 270.98980712890625, 296.132568359375, 321.27532958984375, 346.4180908203125, 371.56085205078125, 396.70361328125, 421.84637451171875, 446.9891357421875, 472.13189697265625, 497.274658203125, 522.4174194335938, 547.5601806640625, 572.7029418945312, 597.845703125, 622.9884643554688, 648.1312255859375, 673.2739868164062, 698.416748046875, 723.5595092773438, 748.7022705078125, 773.8450317382812, 798.98779296875, 824.1305541992188, 849.2733154296875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 2.0, 5.0, 5.0, 7.0, 14.0, 19.0, 30.0, 32.0, 44.0, 62.0, 114.0, 158.0, 221.0, 314.0, 475.0, 790.0, 1214.0, 1994.0, 3372.0, 5948.0, 11091.0, 21933.0, 46881.0, 111505.0, 296807.0, 320822.0, 122825.0, 50899.0, 23572.0, 11875.0, 6234.0, 3548.0, 2083.0, 1289.0, 756.0, 532.0, 367.0, 204.0, 142.0, 98.0, 84.0, 62.0, 37.0, 32.0, 22.0, 17.0, 6.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-102.0625, -98.775390625, -95.48828125, -92.201171875, -88.9140625, -85.626953125, -82.33984375, -79.052734375, -75.765625, -72.478515625, -69.19140625, -65.904296875, -62.6171875, -59.330078125, -56.04296875, -52.755859375, -49.46875, -46.181640625, -42.89453125, -39.607421875, -36.3203125, -33.033203125, -29.74609375, -26.458984375, -23.171875, -19.884765625, -16.59765625, -13.310546875, -10.0234375, -6.736328125, -3.44921875, -0.162109375, 3.125, 6.412109375, 9.69921875, 12.986328125, 16.2734375, 19.560546875, 22.84765625, 26.134765625, 29.421875, 32.708984375, 35.99609375, 39.283203125, 42.5703125, 45.857421875, 49.14453125, 52.431640625, 55.71875, 59.005859375, 62.29296875, 65.580078125, 68.8671875, 72.154296875, 75.44140625, 78.728515625, 82.015625, 85.302734375, 88.58984375, 91.876953125, 95.1640625, 98.451171875, 101.73828125, 105.025390625, 108.3125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 3.0, 8.0, 6.0, 9.0, 16.0, 15.0, 24.0, 18.0, 28.0, 21.0, 36.0, 38.0, 49.0, 43.0, 54.0, 61.0, 63.0, 59.0, 64.0, 53.0, 39.0, 52.0, 31.0, 32.0, 25.0, 27.0, 22.0, 27.0, 16.0, 19.0, 12.0, 9.0, 8.0, 6.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.6875, -57.646484375, -55.60546875, -53.564453125, -51.5234375, -49.482421875, -47.44140625, -45.400390625, -43.359375, -41.318359375, -39.27734375, -37.236328125, -35.1953125, -33.154296875, -31.11328125, -29.072265625, -27.03125, -24.990234375, -22.94921875, -20.908203125, -18.8671875, -16.826171875, -14.78515625, -12.744140625, -10.703125, -8.662109375, -6.62109375, -4.580078125, -2.5390625, -0.498046875, 1.54296875, 3.583984375, 5.625, 7.666015625, 9.70703125, 11.748046875, 13.7890625, 15.830078125, 17.87109375, 19.912109375, 21.953125, 23.994140625, 26.03515625, 28.076171875, 30.1171875, 32.158203125, 34.19921875, 36.240234375, 38.28125, 40.322265625, 42.36328125, 44.404296875, 46.4453125, 48.486328125, 50.52734375, 52.568359375, 54.609375, 56.650390625, 58.69140625, 60.732421875, 62.7734375, 64.814453125, 66.85546875, 68.896484375, 70.9375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 10.0, 10.0, 9.0, 9.0, 19.0, 26.0, 53.0, 76.0, 116.0, 227.0, 459.0, 925.0, 2273.0, 7239.0, 36011.0, 421492.0, 528496.0, 38892.0, 7834.0, 2331.0, 983.0, 455.0, 236.0, 141.0, 73.0, 45.0, 31.0, 30.0, 16.0, 9.0, 5.0, 9.0, 5.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-352.0, -341.94921875, -331.8984375, -321.84765625, -311.796875, -301.74609375, -291.6953125, -281.64453125, -271.59375, -261.54296875, -251.4921875, -241.44140625, -231.390625, -221.33984375, -211.2890625, -201.23828125, -191.1875, -181.13671875, -171.0859375, -161.03515625, -150.984375, -140.93359375, -130.8828125, -120.83203125, -110.78125, -100.73046875, -90.6796875, -80.62890625, -70.578125, -60.52734375, -50.4765625, -40.42578125, -30.375, -20.32421875, -10.2734375, -0.22265625, 9.828125, 19.87890625, 29.9296875, 39.98046875, 50.03125, 60.08203125, 70.1328125, 80.18359375, 90.234375, 100.28515625, 110.3359375, 120.38671875, 130.4375, 140.48828125, 150.5390625, 160.58984375, 170.640625, 180.69140625, 190.7421875, 200.79296875, 210.84375, 220.89453125, 230.9453125, 240.99609375, 251.046875, 261.09765625, 271.1484375, 281.19921875, 291.25]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 13.0, 6.0, 9.0, 26.0, 26.0, 31.0, 40.0, 46.0, 55.0, 67.0, 63.0, 84.0, 65.0, 69.0, 61.0, 64.0, 44.0, 48.0, 35.0, 33.0, 25.0, 23.0, 19.0, 14.0, 9.0, 9.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-371.25, -359.87109375, -348.4921875, -337.11328125, -325.734375, -314.35546875, -302.9765625, -291.59765625, -280.21875, -268.83984375, -257.4609375, -246.08203125, -234.703125, -223.32421875, -211.9453125, -200.56640625, -189.1875, -177.80859375, -166.4296875, -155.05078125, -143.671875, -132.29296875, -120.9140625, -109.53515625, -98.15625, -86.77734375, -75.3984375, -64.01953125, -52.640625, -41.26171875, -29.8828125, -18.50390625, -7.125, 4.25390625, 15.6328125, 27.01171875, 38.390625, 49.76953125, 61.1484375, 72.52734375, 83.90625, 95.28515625, 106.6640625, 118.04296875, 129.421875, 140.80078125, 152.1796875, 163.55859375, 174.9375, 186.31640625, 197.6953125, 209.07421875, 220.453125, 231.83203125, 243.2109375, 254.58984375, 265.96875, 277.34765625, 288.7265625, 300.10546875, 311.484375, 322.86328125, 334.2421875, 345.62109375, 357.0]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 5.0, 4.0, 10.0, 17.0, 22.0, 43.0, 86.0, 217.0, 572.0, 1817.0, 9337.0, 98324.0, 860616.0, 67617.0, 7392.0, 1578.0, 503.0, 186.0, 85.0, 41.0, 21.0, 10.0, 14.0, 10.0, 6.0, 3.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-208.375, -202.80859375, -197.2421875, -191.67578125, -186.109375, -180.54296875, -174.9765625, -169.41015625, -163.84375, -158.27734375, -152.7109375, -147.14453125, -141.578125, -136.01171875, -130.4453125, -124.87890625, -119.3125, -113.74609375, -108.1796875, -102.61328125, -97.046875, -91.48046875, -85.9140625, -80.34765625, -74.78125, -69.21484375, -63.6484375, -58.08203125, -52.515625, -46.94921875, -41.3828125, -35.81640625, -30.25, -24.68359375, -19.1171875, -13.55078125, -7.984375, -2.41796875, 3.1484375, 8.71484375, 14.28125, 19.84765625, 25.4140625, 30.98046875, 36.546875, 42.11328125, 47.6796875, 53.24609375, 58.8125, 64.37890625, 69.9453125, 75.51171875, 81.078125, 86.64453125, 92.2109375, 97.77734375, 103.34375, 108.91015625, 114.4765625, 120.04296875, 125.609375, 131.17578125, 136.7421875, 142.30859375, 147.875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 7.0, 5.0, 14.0, 8.0, 20.0, 30.0, 47.0, 75.0, 94.0, 171.0, 184.0, 127.0, 66.0, 48.0, 29.0, 29.0, 16.0, 10.0, 9.0, 4.0, 7.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032684326171875, -0.03133201599121094, -0.029979705810546875, -0.028627395629882812, -0.02727508544921875, -0.025922775268554688, -0.024570465087890625, -0.023218154907226562, -0.0218658447265625, -0.020513534545898438, -0.019161224365234375, -0.017808914184570312, -0.01645660400390625, -0.015104293823242188, -0.013751983642578125, -0.012399673461914062, -0.01104736328125, -0.009695053100585938, -0.008342742919921875, -0.0069904327392578125, -0.00563812255859375, -0.0042858123779296875, -0.002933502197265625, -0.0015811920166015625, -0.0002288818359375, 0.0011234283447265625, 0.002475738525390625, 0.0038280487060546875, 0.00518035888671875, 0.0065326690673828125, 0.007884979248046875, 0.009237289428710938, 0.010589599609375, 0.011941909790039062, 0.013294219970703125, 0.014646530151367188, 0.01599884033203125, 0.017351150512695312, 0.018703460693359375, 0.020055770874023438, 0.0214080810546875, 0.022760391235351562, 0.024112701416015625, 0.025465011596679688, 0.02681732177734375, 0.028169631958007812, 0.029521942138671875, 0.030874252319335938, 0.0322265625, 0.03357887268066406, 0.034931182861328125, 0.03628349304199219, 0.03763580322265625, 0.03898811340332031, 0.040340423583984375, 0.04169273376464844, 0.0430450439453125, 0.04439735412597656, 0.045749664306640625, 0.04710197448730469, 0.04845428466796875, 0.04980659484863281, 0.051158905029296875, 0.05251121520996094, 0.053863525390625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 11.0, 14.0, 28.0, 18.0, 46.0, 88.0, 142.0, 279.0, 700.0, 2174.0, 8455.0, 53260.0, 747428.0, 209796.0, 19820.0, 4053.0, 1282.0, 473.0, 213.0, 101.0, 62.0, 42.0, 16.0, 13.0, 8.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-142.0, -137.529296875, -133.05859375, -128.587890625, -124.1171875, -119.646484375, -115.17578125, -110.705078125, -106.234375, -101.763671875, -97.29296875, -92.822265625, -88.3515625, -83.880859375, -79.41015625, -74.939453125, -70.46875, -65.998046875, -61.52734375, -57.056640625, -52.5859375, -48.115234375, -43.64453125, -39.173828125, -34.703125, -30.232421875, -25.76171875, -21.291015625, -16.8203125, -12.349609375, -7.87890625, -3.408203125, 1.0625, 5.533203125, 10.00390625, 14.474609375, 18.9453125, 23.416015625, 27.88671875, 32.357421875, 36.828125, 41.298828125, 45.76953125, 50.240234375, 54.7109375, 59.181640625, 63.65234375, 68.123046875, 72.59375, 77.064453125, 81.53515625, 86.005859375, 90.4765625, 94.947265625, 99.41796875, 103.888671875, 108.359375, 112.830078125, 117.30078125, 121.771484375, 126.2421875, 130.712890625, 135.18359375, 139.654296875, 144.125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 6.0, 7.0, 9.0, 17.0, 16.0, 17.0, 22.0, 46.0, 37.0, 59.0, 56.0, 100.0, 105.0, 88.0, 94.0, 61.0, 57.0, 47.0, 25.0, 23.0, 22.0, 23.0, 12.0, 9.0, 7.0, 11.0, 5.0, 5.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.9375, -84.0390625, -81.140625, -78.2421875, -75.34375, -72.4453125, -69.546875, -66.6484375, -63.75, -60.8515625, -57.953125, -55.0546875, -52.15625, -49.2578125, -46.359375, -43.4609375, -40.5625, -37.6640625, -34.765625, -31.8671875, -28.96875, -26.0703125, -23.171875, -20.2734375, -17.375, -14.4765625, -11.578125, -8.6796875, -5.78125, -2.8828125, 0.015625, 2.9140625, 5.8125, 8.7109375, 11.609375, 14.5078125, 17.40625, 20.3046875, 23.203125, 26.1015625, 29.0, 31.8984375, 34.796875, 37.6953125, 40.59375, 43.4921875, 46.390625, 49.2890625, 52.1875, 55.0859375, 57.984375, 60.8828125, 63.78125, 66.6796875, 69.578125, 72.4765625, 75.375, 78.2734375, 81.171875, 84.0703125, 86.96875, 89.8671875, 92.765625, 95.6640625, 98.5625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 11.0, 10.0, 26.0, 67.0, 134.0, 229.0, 255.0, 145.0, 69.0, 23.0, 16.0, 6.0, 8.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1734.6851806640625, -1652.6103515625, -1570.53564453125, -1488.4609375, -1406.3861083984375, -1324.311279296875, -1242.236572265625, -1160.161865234375, -1078.0870361328125, -996.0122680664062, -913.9375, -831.8627319335938, -749.7879638671875, -667.7131958007812, -585.638427734375, -503.56365966796875, -421.4888916015625, -339.41412353515625, -257.33935546875, -175.26458740234375, -93.1898193359375, -11.11505126953125, 70.959716796875, 153.03448486328125, 235.1092529296875, 317.18402099609375, 399.2587890625, 481.33355712890625, 563.4083251953125, 645.4830932617188, 727.557861328125, 809.6326293945312, 891.70751953125, 973.7822875976562, 1055.8570556640625, 1137.931884765625, 1220.006591796875, 1302.081298828125, 1384.1561279296875, 1466.23095703125, 1548.3056640625, 1630.38037109375, 1712.4552001953125, 1794.530029296875, 1876.604736328125, 1958.679443359375, 2040.7542724609375, 2122.8291015625, 2204.90380859375, 2286.978515625, 2369.05322265625, 2451.128173828125, 2533.202880859375, 2615.277587890625, 2697.3525390625, 2779.42724609375, 2861.501953125, 2943.57666015625, 3025.6513671875, 3107.726318359375, 3189.801025390625, 3271.875732421875, 3353.95068359375, 3436.025390625, 3518.10009765625]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 8.0, 8.0, 8.0, 11.0, 14.0, 11.0, 15.0, 11.0, 14.0, 16.0, 28.0, 26.0, 34.0, 45.0, 49.0, 50.0, 56.0, 64.0, 66.0, 60.0, 55.0, 43.0, 43.0, 40.0, 35.0, 32.0, 35.0, 18.0, 11.0, 17.0, 16.0, 12.0, 11.0, 11.0, 4.0, 9.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1078.020751953125, -1043.714599609375, -1009.4083251953125, -975.1021118164062, -940.7958984375, -906.4896850585938, -872.1834716796875, -837.8772583007812, -803.571044921875, -769.2648315429688, -734.9586181640625, -700.6524047851562, -666.34619140625, -632.0399780273438, -597.7337646484375, -563.4275512695312, -529.121337890625, -494.81512451171875, -460.5089111328125, -426.20269775390625, -391.896484375, -357.59027099609375, -323.2840576171875, -288.97784423828125, -254.671630859375, -220.36541748046875, -186.0592041015625, -151.75299072265625, -117.44677734375, -83.14056396484375, -48.8343505859375, -14.52813720703125, 19.778076171875, 54.08428955078125, 88.3905029296875, 122.69671630859375, 157.0029296875, 191.30914306640625, 225.6153564453125, 259.92156982421875, 294.227783203125, 328.53399658203125, 362.8402099609375, 397.14642333984375, 431.45263671875, 465.75885009765625, 500.0650634765625, 534.3712768554688, 568.677490234375, 602.9837036132812, 637.2899169921875, 671.5961303710938, 705.90234375, 740.2085571289062, 774.5147705078125, 808.8209838867188, 843.127197265625, 877.4334106445312, 911.7396240234375, 946.0458374023438, 980.35205078125, 1014.6582641601562, 1048.9644775390625, 1083.270751953125, 1117.576904296875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 9.0, 9.0, 12.0, 19.0, 21.0, 35.0, 51.0, 65.0, 115.0, 179.0, 219.0, 394.0, 615.0, 951.0, 1672.0, 2748.0, 4701.0, 8298.0, 15384.0, 32885.0, 85752.0, 320626.0, 1339522.0, 1729423.0, 455544.0, 113433.0, 40213.0, 18555.0, 9664.0, 5367.0, 3000.0, 1786.0, 1106.0, 650.0, 420.0, 274.0, 174.0, 118.0, 100.0, 46.0, 33.0, 25.0, 22.0, 13.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-70.9375, -68.7958984375, -66.654296875, -64.5126953125, -62.37109375, -60.2294921875, -58.087890625, -55.9462890625, -53.8046875, -51.6630859375, -49.521484375, -47.3798828125, -45.23828125, -43.0966796875, -40.955078125, -38.8134765625, -36.671875, -34.5302734375, -32.388671875, -30.2470703125, -28.10546875, -25.9638671875, -23.822265625, -21.6806640625, -19.5390625, -17.3974609375, -15.255859375, -13.1142578125, -10.97265625, -8.8310546875, -6.689453125, -4.5478515625, -2.40625, -0.2646484375, 1.876953125, 4.0185546875, 6.16015625, 8.3017578125, 10.443359375, 12.5849609375, 14.7265625, 16.8681640625, 19.009765625, 21.1513671875, 23.29296875, 25.4345703125, 27.576171875, 29.7177734375, 31.859375, 34.0009765625, 36.142578125, 38.2841796875, 40.42578125, 42.5673828125, 44.708984375, 46.8505859375, 48.9921875, 51.1337890625, 53.275390625, 55.4169921875, 57.55859375, 59.7001953125, 61.841796875, 63.9833984375, 66.125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 5.0, 9.0, 1.0, 6.0, 11.0, 15.0, 10.0, 21.0, 23.0, 32.0, 34.0, 30.0, 33.0, 32.0, 42.0, 47.0, 41.0, 48.0, 45.0, 66.0, 52.0, 43.0, 51.0, 26.0, 36.0, 44.0, 31.0, 29.0, 24.0, 19.0, 18.0, 8.0, 11.0, 8.0, 6.0, 12.0, 9.0, 7.0, 2.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.25, -48.56640625, -46.8828125, -45.19921875, -43.515625, -41.83203125, -40.1484375, -38.46484375, -36.78125, -35.09765625, -33.4140625, -31.73046875, -30.046875, -28.36328125, -26.6796875, -24.99609375, -23.3125, -21.62890625, -19.9453125, -18.26171875, -16.578125, -14.89453125, -13.2109375, -11.52734375, -9.84375, -8.16015625, -6.4765625, -4.79296875, -3.109375, -1.42578125, 0.2578125, 1.94140625, 3.625, 5.30859375, 6.9921875, 8.67578125, 10.359375, 12.04296875, 13.7265625, 15.41015625, 17.09375, 18.77734375, 20.4609375, 22.14453125, 23.828125, 25.51171875, 27.1953125, 28.87890625, 30.5625, 32.24609375, 33.9296875, 35.61328125, 37.296875, 38.98046875, 40.6640625, 42.34765625, 44.03125, 45.71484375, 47.3984375, 49.08203125, 50.765625, 52.44921875, 54.1328125, 55.81640625, 57.5]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 7.0, 5.0, 11.0, 17.0, 25.0, 32.0, 73.0, 100.0, 204.0, 477.0, 1070.0, 3308.0, 12926.0, 75528.0, 1882966.0, 2122861.0, 76770.0, 12793.0, 3282.0, 1038.0, 459.0, 164.0, 78.0, 40.0, 20.0, 17.0, 7.0, 6.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-267.25, -258.6328125, -250.015625, -241.3984375, -232.78125, -224.1640625, -215.546875, -206.9296875, -198.3125, -189.6953125, -181.078125, -172.4609375, -163.84375, -155.2265625, -146.609375, -137.9921875, -129.375, -120.7578125, -112.140625, -103.5234375, -94.90625, -86.2890625, -77.671875, -69.0546875, -60.4375, -51.8203125, -43.203125, -34.5859375, -25.96875, -17.3515625, -8.734375, -0.1171875, 8.5, 17.1171875, 25.734375, 34.3515625, 42.96875, 51.5859375, 60.203125, 68.8203125, 77.4375, 86.0546875, 94.671875, 103.2890625, 111.90625, 120.5234375, 129.140625, 137.7578125, 146.375, 154.9921875, 163.609375, 172.2265625, 180.84375, 189.4609375, 198.078125, 206.6953125, 215.3125, 223.9296875, 232.546875, 241.1640625, 249.78125, 258.3984375, 267.015625, 275.6328125, 284.25]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 9.0, 9.0, 9.0, 16.0, 24.0, 27.0, 42.0, 77.0, 88.0, 142.0, 218.0, 436.0, 781.0, 920.0, 522.0, 279.0, 143.0, 108.0, 65.0, 50.0, 36.0, 20.0, 9.0, 15.0, 12.0, 10.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-338.0, -329.99609375, -321.9921875, -313.98828125, -305.984375, -297.98046875, -289.9765625, -281.97265625, -273.96875, -265.96484375, -257.9609375, -249.95703125, -241.953125, -233.94921875, -225.9453125, -217.94140625, -209.9375, -201.93359375, -193.9296875, -185.92578125, -177.921875, -169.91796875, -161.9140625, -153.91015625, -145.90625, -137.90234375, -129.8984375, -121.89453125, -113.890625, -105.88671875, -97.8828125, -89.87890625, -81.875, -73.87109375, -65.8671875, -57.86328125, -49.859375, -41.85546875, -33.8515625, -25.84765625, -17.84375, -9.83984375, -1.8359375, 6.16796875, 14.171875, 22.17578125, 30.1796875, 38.18359375, 46.1875, 54.19140625, 62.1953125, 70.19921875, 78.203125, 86.20703125, 94.2109375, 102.21484375, 110.21875, 118.22265625, 126.2265625, 134.23046875, 142.234375, 150.23828125, 158.2421875, 166.24609375, 174.25]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 8.0, 17.0, 51.0, 276.0, 473.0, 137.0, 29.0, 8.0, 3.0, 2.0, 3.0], "bins": [-11731.53515625, -11526.765625, -11321.99609375, -11117.2265625, -10912.45703125, -10707.6875, -10502.91796875, -10298.1494140625, -10093.3798828125, -9888.6103515625, -9683.8408203125, -9479.0712890625, -9274.3017578125, -9069.533203125, -8864.763671875, -8659.994140625, -8455.224609375, -8250.455078125, -8045.685546875, -7840.916015625, -7636.14697265625, -7431.37744140625, -7226.60791015625, -7021.83837890625, -6817.068359375, -6612.298828125, -6407.529296875, -6202.759765625, -5997.99072265625, -5793.22119140625, -5588.45166015625, -5383.68212890625, -5178.91259765625, -4974.14306640625, -4769.37353515625, -4564.6044921875, -4359.8349609375, -4155.0654296875, -3950.2958984375, -3745.5263671875, -3540.75732421875, -3335.98779296875, -3131.218505859375, -2926.448974609375, -2721.6796875, -2516.91015625, -2312.140625, -2107.37109375, -1902.6016845703125, -1697.832275390625, -1493.062744140625, -1288.2933349609375, -1083.52392578125, -878.7545166015625, -673.9849853515625, -469.215576171875, -264.4461669921875, -59.676727294921875, 145.09271240234375, 349.8621826171875, 554.631591796875, 759.4010009765625, 964.1705322265625, 1168.93994140625, 1373.7093505859375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 5.0, 7.0, 11.0, 16.0, 21.0, 21.0, 26.0, 22.0, 30.0, 32.0, 43.0, 35.0, 36.0, 33.0, 40.0, 48.0, 53.0, 51.0, 52.0, 58.0, 42.0, 38.0, 38.0, 33.0, 29.0, 32.0, 24.0, 20.0, 21.0, 17.0, 7.0, 12.0, 8.0, 7.0, 7.0, 7.0, 2.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-930.379638671875, -898.8958740234375, -867.4120483398438, -835.9282836914062, -804.4445190429688, -772.960693359375, -741.4769287109375, -709.9931640625, -678.5093383789062, -647.0255737304688, -615.541748046875, -584.0579833984375, -552.57421875, -521.0903930664062, -489.60662841796875, -458.1228332519531, -426.6390686035156, -395.1552734375, -363.6715087890625, -332.1877136230469, -300.70391845703125, -269.22015380859375, -237.73635864257812, -206.2525634765625, -174.76878356933594, -143.28500366210938, -111.80120849609375, -80.31742858886719, -48.833641052246094, -17.349853515625, 14.133926391601562, 45.61772155761719, 77.10150146484375, 108.58528900146484, 140.06907653808594, 171.5528564453125, 203.03665161132812, 234.5204315185547, 266.00421142578125, 297.4880065917969, 328.9718017578125, 360.4555969238281, 391.9393615722656, 423.42315673828125, 454.9069519042969, 486.3907470703125, 517.87451171875, 549.3582763671875, 580.842041015625, 612.3258056640625, 643.8096313476562, 675.2933959960938, 706.7771606445312, 738.260986328125, 769.7447509765625, 801.228515625, 832.7123413085938, 864.1961059570312, 895.679931640625, 927.1636962890625, 958.6474609375, 990.1312866210938, 1021.6150512695312, 1053.098876953125, 1084.5826416015625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 13.0, 9.0, 25.0, 26.0, 49.0, 57.0, 117.0, 156.0, 227.0, 403.0, 634.0, 1181.0, 2114.0, 3798.0, 7205.0, 14470.0, 29633.0, 63901.0, 144496.0, 337707.0, 246964.0, 103539.0, 46764.0, 21883.0, 10621.0, 5540.0, 3043.0, 1624.0, 889.0, 536.0, 330.0, 207.0, 124.0, 92.0, 55.0, 30.0, 32.0, 13.0, 9.0, 10.0, 4.0, 10.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-131.125, -127.4619140625, -123.798828125, -120.1357421875, -116.47265625, -112.8095703125, -109.146484375, -105.4833984375, -101.8203125, -98.1572265625, -94.494140625, -90.8310546875, -87.16796875, -83.5048828125, -79.841796875, -76.1787109375, -72.515625, -68.8525390625, -65.189453125, -61.5263671875, -57.86328125, -54.2001953125, -50.537109375, -46.8740234375, -43.2109375, -39.5478515625, -35.884765625, -32.2216796875, -28.55859375, -24.8955078125, -21.232421875, -17.5693359375, -13.90625, -10.2431640625, -6.580078125, -2.9169921875, 0.74609375, 4.4091796875, 8.072265625, 11.7353515625, 15.3984375, 19.0615234375, 22.724609375, 26.3876953125, 30.05078125, 33.7138671875, 37.376953125, 41.0400390625, 44.703125, 48.3662109375, 52.029296875, 55.6923828125, 59.35546875, 63.0185546875, 66.681640625, 70.3447265625, 74.0078125, 77.6708984375, 81.333984375, 84.9970703125, 88.66015625, 92.3232421875, 95.986328125, 99.6494140625, 103.3125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 6.0, 9.0, 3.0, 5.0, 9.0, 5.0, 8.0, 10.0, 16.0, 20.0, 21.0, 17.0, 29.0, 31.0, 33.0, 28.0, 30.0, 50.0, 42.0, 35.0, 43.0, 43.0, 31.0, 51.0, 44.0, 33.0, 36.0, 27.0, 30.0, 33.0, 26.0, 25.0, 21.0, 21.0, 16.0, 17.0, 16.0, 12.0, 10.0, 9.0, 8.0, 9.0, 9.0, 3.0, 4.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-48.96875, -47.32470703125, -45.6806640625, -44.03662109375, -42.392578125, -40.74853515625, -39.1044921875, -37.46044921875, -35.81640625, -34.17236328125, -32.5283203125, -30.88427734375, -29.240234375, -27.59619140625, -25.9521484375, -24.30810546875, -22.6640625, -21.02001953125, -19.3759765625, -17.73193359375, -16.087890625, -14.44384765625, -12.7998046875, -11.15576171875, -9.51171875, -7.86767578125, -6.2236328125, -4.57958984375, -2.935546875, -1.29150390625, 0.3525390625, 1.99658203125, 3.640625, 5.28466796875, 6.9287109375, 8.57275390625, 10.216796875, 11.86083984375, 13.5048828125, 15.14892578125, 16.79296875, 18.43701171875, 20.0810546875, 21.72509765625, 23.369140625, 25.01318359375, 26.6572265625, 28.30126953125, 29.9453125, 31.58935546875, 33.2333984375, 34.87744140625, 36.521484375, 38.16552734375, 39.8095703125, 41.45361328125, 43.09765625, 44.74169921875, 46.3857421875, 48.02978515625, 49.673828125, 51.31787109375, 52.9619140625, 54.60595703125, 56.25]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 10.0, 10.0, 13.0, 9.0, 17.0, 28.0, 38.0, 50.0, 63.0, 103.0, 135.0, 191.0, 245.0, 453.0, 674.0, 1134.0, 2150.0, 4855.0, 14821.0, 71937.0, 674960.0, 227161.0, 33499.0, 8629.0, 3092.0, 1638.0, 897.0, 536.0, 379.0, 241.0, 142.0, 119.0, 86.0, 53.0, 51.0, 31.0, 23.0, 19.0, 19.0, 11.0, 5.0, 7.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 4.0], "bins": [-322.5, -313.486328125, -304.47265625, -295.458984375, -286.4453125, -277.431640625, -268.41796875, -259.404296875, -250.390625, -241.376953125, -232.36328125, -223.349609375, -214.3359375, -205.322265625, -196.30859375, -187.294921875, -178.28125, -169.267578125, -160.25390625, -151.240234375, -142.2265625, -133.212890625, -124.19921875, -115.185546875, -106.171875, -97.158203125, -88.14453125, -79.130859375, -70.1171875, -61.103515625, -52.08984375, -43.076171875, -34.0625, -25.048828125, -16.03515625, -7.021484375, 1.9921875, 11.005859375, 20.01953125, 29.033203125, 38.046875, 47.060546875, 56.07421875, 65.087890625, 74.1015625, 83.115234375, 92.12890625, 101.142578125, 110.15625, 119.169921875, 128.18359375, 137.197265625, 146.2109375, 155.224609375, 164.23828125, 173.251953125, 182.265625, 191.279296875, 200.29296875, 209.306640625, 218.3203125, 227.333984375, 236.34765625, 245.361328125, 254.375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 10.0, 11.0, 13.0, 15.0, 18.0, 19.0, 19.0, 33.0, 33.0, 43.0, 48.0, 54.0, 56.0, 59.0, 72.0, 54.0, 55.0, 81.0, 60.0, 41.0, 31.0, 45.0, 23.0, 29.0, 13.0, 11.0, 17.0, 14.0, 7.0, 5.0, 2.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-451.0, -438.36328125, -425.7265625, -413.08984375, -400.453125, -387.81640625, -375.1796875, -362.54296875, -349.90625, -337.26953125, -324.6328125, -311.99609375, -299.359375, -286.72265625, -274.0859375, -261.44921875, -248.8125, -236.17578125, -223.5390625, -210.90234375, -198.265625, -185.62890625, -172.9921875, -160.35546875, -147.71875, -135.08203125, -122.4453125, -109.80859375, -97.171875, -84.53515625, -71.8984375, -59.26171875, -46.625, -33.98828125, -21.3515625, -8.71484375, 3.921875, 16.55859375, 29.1953125, 41.83203125, 54.46875, 67.10546875, 79.7421875, 92.37890625, 105.015625, 117.65234375, 130.2890625, 142.92578125, 155.5625, 168.19921875, 180.8359375, 193.47265625, 206.109375, 218.74609375, 231.3828125, 244.01953125, 256.65625, 269.29296875, 281.9296875, 294.56640625, 307.203125, 319.83984375, 332.4765625, 345.11328125, 357.75]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 2.0, 15.0, 12.0, 18.0, 27.0, 53.0, 98.0, 202.0, 358.0, 854.0, 2220.0, 8217.0, 50764.0, 676035.0, 274764.0, 26792.0, 5227.0, 1638.0, 633.0, 280.0, 159.0, 74.0, 39.0, 21.0, 20.0, 13.0, 6.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.4375, -101.0517578125, -97.666015625, -94.2802734375, -90.89453125, -87.5087890625, -84.123046875, -80.7373046875, -77.3515625, -73.9658203125, -70.580078125, -67.1943359375, -63.80859375, -60.4228515625, -57.037109375, -53.6513671875, -50.265625, -46.8798828125, -43.494140625, -40.1083984375, -36.72265625, -33.3369140625, -29.951171875, -26.5654296875, -23.1796875, -19.7939453125, -16.408203125, -13.0224609375, -9.63671875, -6.2509765625, -2.865234375, 0.5205078125, 3.90625, 7.2919921875, 10.677734375, 14.0634765625, 17.44921875, 20.8349609375, 24.220703125, 27.6064453125, 30.9921875, 34.3779296875, 37.763671875, 41.1494140625, 44.53515625, 47.9208984375, 51.306640625, 54.6923828125, 58.078125, 61.4638671875, 64.849609375, 68.2353515625, 71.62109375, 75.0068359375, 78.392578125, 81.7783203125, 85.1640625, 88.5498046875, 91.935546875, 95.3212890625, 98.70703125, 102.0927734375, 105.478515625, 108.8642578125, 112.25]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 5.0, 8.0, 14.0, 7.0, 16.0, 17.0, 23.0, 22.0, 29.0, 35.0, 19.0, 39.0, 48.0, 58.0, 80.0, 87.0, 82.0, 65.0, 55.0, 33.0, 34.0, 43.0, 35.0, 22.0, 24.0, 16.0, 14.0, 18.0, 11.0, 5.0, 6.0, 6.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0222320556640625, -0.021589994430541992, -0.020947933197021484, -0.020305871963500977, -0.01966381072998047, -0.01902174949645996, -0.018379688262939453, -0.017737627029418945, -0.017095565795898438, -0.01645350456237793, -0.015811443328857422, -0.015169382095336914, -0.014527320861816406, -0.013885259628295898, -0.01324319839477539, -0.012601137161254883, -0.011959075927734375, -0.011317014694213867, -0.01067495346069336, -0.010032892227172852, -0.009390830993652344, -0.008748769760131836, -0.008106708526611328, -0.00746464729309082, -0.0068225860595703125, -0.006180524826049805, -0.005538463592529297, -0.004896402359008789, -0.004254341125488281, -0.0036122798919677734, -0.0029702186584472656, -0.002328157424926758, -0.00168609619140625, -0.0010440349578857422, -0.0004019737243652344, 0.00024008750915527344, 0.0008821487426757812, 0.001524209976196289, 0.002166271209716797, 0.0028083324432373047, 0.0034503936767578125, 0.00409245491027832, 0.004734516143798828, 0.005376577377319336, 0.006018638610839844, 0.0066606998443603516, 0.007302761077880859, 0.007944822311401367, 0.008586883544921875, 0.009228944778442383, 0.00987100601196289, 0.010513067245483398, 0.011155128479003906, 0.011797189712524414, 0.012439250946044922, 0.01308131217956543, 0.013723373413085938, 0.014365434646606445, 0.015007495880126953, 0.01564955711364746, 0.01629161834716797, 0.016933679580688477, 0.017575740814208984, 0.018217802047729492, 0.01885986328125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 9.0, 8.0, 6.0, 23.0, 26.0, 59.0, 72.0, 164.0, 322.0, 683.0, 1599.0, 5201.0, 28431.0, 427687.0, 545665.0, 30232.0, 5266.0, 1653.0, 681.0, 347.0, 192.0, 90.0, 59.0, 42.0, 20.0, 12.0, 11.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-161.75, -158.0751953125, -154.400390625, -150.7255859375, -147.05078125, -143.3759765625, -139.701171875, -136.0263671875, -132.3515625, -128.6767578125, -125.001953125, -121.3271484375, -117.65234375, -113.9775390625, -110.302734375, -106.6279296875, -102.953125, -99.2783203125, -95.603515625, -91.9287109375, -88.25390625, -84.5791015625, -80.904296875, -77.2294921875, -73.5546875, -69.8798828125, -66.205078125, -62.5302734375, -58.85546875, -55.1806640625, -51.505859375, -47.8310546875, -44.15625, -40.4814453125, -36.806640625, -33.1318359375, -29.45703125, -25.7822265625, -22.107421875, -18.4326171875, -14.7578125, -11.0830078125, -7.408203125, -3.7333984375, -0.05859375, 3.6162109375, 7.291015625, 10.9658203125, 14.640625, 18.3154296875, 21.990234375, 25.6650390625, 29.33984375, 33.0146484375, 36.689453125, 40.3642578125, 44.0390625, 47.7138671875, 51.388671875, 55.0634765625, 58.73828125, 62.4130859375, 66.087890625, 69.7626953125, 73.4375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 2.0, 5.0, 6.0, 3.0, 3.0, 11.0, 7.0, 18.0, 12.0, 11.0, 18.0, 20.0, 25.0, 32.0, 34.0, 36.0, 39.0, 44.0, 43.0, 45.0, 45.0, 50.0, 50.0, 55.0, 56.0, 38.0, 51.0, 33.0, 34.0, 21.0, 24.0, 24.0, 14.0, 20.0, 10.0, 12.0, 9.0, 9.0, 6.0, 6.0, 4.0, 5.0, 3.0, 6.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-53.875, -52.10791015625, -50.3408203125, -48.57373046875, -46.806640625, -45.03955078125, -43.2724609375, -41.50537109375, -39.73828125, -37.97119140625, -36.2041015625, -34.43701171875, -32.669921875, -30.90283203125, -29.1357421875, -27.36865234375, -25.6015625, -23.83447265625, -22.0673828125, -20.30029296875, -18.533203125, -16.76611328125, -14.9990234375, -13.23193359375, -11.46484375, -9.69775390625, -7.9306640625, -6.16357421875, -4.396484375, -2.62939453125, -0.8623046875, 0.90478515625, 2.671875, 4.43896484375, 6.2060546875, 7.97314453125, 9.740234375, 11.50732421875, 13.2744140625, 15.04150390625, 16.80859375, 18.57568359375, 20.3427734375, 22.10986328125, 23.876953125, 25.64404296875, 27.4111328125, 29.17822265625, 30.9453125, 32.71240234375, 34.4794921875, 36.24658203125, 38.013671875, 39.78076171875, 41.5478515625, 43.31494140625, 45.08203125, 46.84912109375, 48.6162109375, 50.38330078125, 52.150390625, 53.91748046875, 55.6845703125, 57.45166015625, 59.21875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 6.0, 7.0, 8.0, 18.0, 21.0, 77.0, 160.0, 278.0, 203.0, 114.0, 62.0, 26.0, 13.0, 9.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2113.28076171875, -2031.3466796875, -1949.4127197265625, -1867.478759765625, -1785.544677734375, -1703.610595703125, -1621.6766357421875, -1539.74267578125, -1457.80859375, -1375.87451171875, -1293.9405517578125, -1212.006591796875, -1130.072509765625, -1048.138427734375, -966.2044677734375, -884.2704467773438, -802.33642578125, -720.4024047851562, -638.4683837890625, -556.5343627929688, -474.600341796875, -392.66632080078125, -310.7322998046875, -228.79827880859375, -146.8642578125, -64.93023681640625, 17.0037841796875, 98.93780517578125, 180.871826171875, 262.80584716796875, 344.7398681640625, 426.67388916015625, 508.60791015625, 590.5419311523438, 672.4759521484375, 754.4099731445312, 836.343994140625, 918.2780151367188, 1000.2120361328125, 1082.14599609375, 1164.080078125, 1246.01416015625, 1327.9481201171875, 1409.882080078125, 1491.816162109375, 1573.750244140625, 1655.6842041015625, 1737.6181640625, 1819.55224609375, 1901.486328125, 1983.4202880859375, 2065.354248046875, 2147.288330078125, 2229.222412109375, 2311.15625, 2393.09033203125, 2475.0244140625, 2556.95849609375, 2638.892578125, 2720.826416015625, 2802.760498046875, 2884.694580078125, 2966.62841796875, 3048.5625, 3130.49658203125]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 4.0, 9.0, 8.0, 11.0, 14.0, 11.0, 22.0, 18.0, 22.0, 24.0, 22.0, 36.0, 30.0, 43.0, 37.0, 55.0, 76.0, 68.0, 76.0, 61.0, 52.0, 36.0, 38.0, 43.0, 33.0, 25.0, 25.0, 13.0, 16.0, 15.0, 11.0, 9.0, 5.0, 8.0, 5.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1455.0361328125, -1411.7655029296875, -1368.4949951171875, -1325.224365234375, -1281.953857421875, -1238.6832275390625, -1195.41259765625, -1152.14208984375, -1108.8714599609375, -1065.600830078125, -1022.330322265625, -979.0596923828125, -935.7891235351562, -892.5185546875, -849.2479248046875, -805.9773559570312, -762.706787109375, -719.4362182617188, -676.1656494140625, -632.89501953125, -589.6244506835938, -546.3538818359375, -503.0832824707031, -459.81268310546875, -416.5421142578125, -373.27154541015625, -330.0009460449219, -286.7303466796875, -243.45977783203125, -200.18919372558594, -156.91860961914062, -113.64801025390625, -70.3773193359375, -27.106735229492188, 16.163848876953125, 59.43443298339844, 102.70501708984375, 145.97560119628906, 189.24618530273438, 232.51678466796875, 275.787353515625, 319.05792236328125, 362.3285217285156, 405.59912109375, 448.86968994140625, 492.1402587890625, 535.410888671875, 578.6814575195312, 621.9520263671875, 665.2225952148438, 708.4931640625, 751.7637939453125, 795.0343627929688, 838.304931640625, 881.5755615234375, 924.8461303710938, 968.11669921875, 1011.3872680664062, 1054.6578369140625, 1097.928466796875, 1141.198974609375, 1184.4696044921875, 1227.740234375, 1271.0107421875, 1314.2813720703125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 10.0, 15.0, 34.0, 40.0, 57.0, 86.0, 150.0, 240.0, 436.0, 701.0, 1196.0, 2104.0, 3890.0, 7216.0, 14909.0, 36036.0, 116678.0, 493805.0, 1742292.0, 1326649.0, 319126.0, 77136.0, 26521.0, 11622.0, 5715.0, 3136.0, 1821.0, 991.0, 614.0, 362.0, 243.0, 139.0, 99.0, 57.0, 48.0, 35.0, 21.0, 19.0, 13.0, 2.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.40625, -52.21728515625, -50.0283203125, -47.83935546875, -45.650390625, -43.46142578125, -41.2724609375, -39.08349609375, -36.89453125, -34.70556640625, -32.5166015625, -30.32763671875, -28.138671875, -25.94970703125, -23.7607421875, -21.57177734375, -19.3828125, -17.19384765625, -15.0048828125, -12.81591796875, -10.626953125, -8.43798828125, -6.2490234375, -4.06005859375, -1.87109375, 0.31787109375, 2.5068359375, 4.69580078125, 6.884765625, 9.07373046875, 11.2626953125, 13.45166015625, 15.640625, 17.82958984375, 20.0185546875, 22.20751953125, 24.396484375, 26.58544921875, 28.7744140625, 30.96337890625, 33.15234375, 35.34130859375, 37.5302734375, 39.71923828125, 41.908203125, 44.09716796875, 46.2861328125, 48.47509765625, 50.6640625, 52.85302734375, 55.0419921875, 57.23095703125, 59.419921875, 61.60888671875, 63.7978515625, 65.98681640625, 68.17578125, 70.36474609375, 72.5537109375, 74.74267578125, 76.931640625, 79.12060546875, 81.3095703125, 83.49853515625, 85.6875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 10.0, 7.0, 5.0, 14.0, 12.0, 19.0, 26.0, 22.0, 48.0, 42.0, 44.0, 67.0, 51.0, 70.0, 66.0, 60.0, 60.0, 57.0, 51.0, 51.0, 46.0, 34.0, 41.0, 26.0, 17.0, 18.0, 12.0, 14.0, 1.0, 8.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.8125, -74.1767578125, -71.541015625, -68.9052734375, -66.26953125, -63.6337890625, -60.998046875, -58.3623046875, -55.7265625, -53.0908203125, -50.455078125, -47.8193359375, -45.18359375, -42.5478515625, -39.912109375, -37.2763671875, -34.640625, -32.0048828125, -29.369140625, -26.7333984375, -24.09765625, -21.4619140625, -18.826171875, -16.1904296875, -13.5546875, -10.9189453125, -8.283203125, -5.6474609375, -3.01171875, -0.3759765625, 2.259765625, 4.8955078125, 7.53125, 10.1669921875, 12.802734375, 15.4384765625, 18.07421875, 20.7099609375, 23.345703125, 25.9814453125, 28.6171875, 31.2529296875, 33.888671875, 36.5244140625, 39.16015625, 41.7958984375, 44.431640625, 47.0673828125, 49.703125, 52.3388671875, 54.974609375, 57.6103515625, 60.24609375, 62.8818359375, 65.517578125, 68.1533203125, 70.7890625, 73.4248046875, 76.060546875, 78.6962890625, 81.33203125, 83.9677734375, 86.603515625, 89.2392578125, 91.875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 5.0, 8.0, 12.0, 12.0, 14.0, 27.0, 27.0, 62.0, 107.0, 144.0, 262.0, 524.0, 1083.0, 2562.0, 6578.0, 19987.0, 73282.0, 457305.0, 3117858.0, 413408.0, 69165.0, 19935.0, 6817.0, 2677.0, 1129.0, 559.0, 269.0, 146.0, 103.0, 59.0, 46.0, 34.0, 16.0, 26.0, 10.0, 4.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-136.875, -132.232421875, -127.58984375, -122.947265625, -118.3046875, -113.662109375, -109.01953125, -104.376953125, -99.734375, -95.091796875, -90.44921875, -85.806640625, -81.1640625, -76.521484375, -71.87890625, -67.236328125, -62.59375, -57.951171875, -53.30859375, -48.666015625, -44.0234375, -39.380859375, -34.73828125, -30.095703125, -25.453125, -20.810546875, -16.16796875, -11.525390625, -6.8828125, -2.240234375, 2.40234375, 7.044921875, 11.6875, 16.330078125, 20.97265625, 25.615234375, 30.2578125, 34.900390625, 39.54296875, 44.185546875, 48.828125, 53.470703125, 58.11328125, 62.755859375, 67.3984375, 72.041015625, 76.68359375, 81.326171875, 85.96875, 90.611328125, 95.25390625, 99.896484375, 104.5390625, 109.181640625, 113.82421875, 118.466796875, 123.109375, 127.751953125, 132.39453125, 137.037109375, 141.6796875, 146.322265625, 150.96484375, 155.607421875, 160.25]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 5.0, 5.0, 8.0, 10.0, 5.0, 8.0, 15.0, 12.0, 15.0, 33.0, 35.0, 35.0, 57.0, 70.0, 87.0, 118.0, 151.0, 226.0, 359.0, 443.0, 531.0, 515.0, 357.0, 261.0, 175.0, 127.0, 83.0, 67.0, 45.0, 42.0, 29.0, 27.0, 19.0, 20.0, 16.0, 10.0, 9.0, 7.0, 10.0, 4.0, 3.0, 9.0, 1.0, 7.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-131.875, -127.5703125, -123.265625, -118.9609375, -114.65625, -110.3515625, -106.046875, -101.7421875, -97.4375, -93.1328125, -88.828125, -84.5234375, -80.21875, -75.9140625, -71.609375, -67.3046875, -63.0, -58.6953125, -54.390625, -50.0859375, -45.78125, -41.4765625, -37.171875, -32.8671875, -28.5625, -24.2578125, -19.953125, -15.6484375, -11.34375, -7.0390625, -2.734375, 1.5703125, 5.875, 10.1796875, 14.484375, 18.7890625, 23.09375, 27.3984375, 31.703125, 36.0078125, 40.3125, 44.6171875, 48.921875, 53.2265625, 57.53125, 61.8359375, 66.140625, 70.4453125, 74.75, 79.0546875, 83.359375, 87.6640625, 91.96875, 96.2734375, 100.578125, 104.8828125, 109.1875, 113.4921875, 117.796875, 122.1015625, 126.40625, 130.7109375, 135.015625, 139.3203125, 143.625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 10.0, 56.0, 349.0, 439.0, 113.0, 20.0, 10.0, 4.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1325.0260009765625, -1164.0267333984375, -1003.027587890625, -842.0283203125, -681.0291137695312, -520.0299072265625, -359.0306396484375, -198.031494140625, -37.0322265625, 123.96699523925781, 284.9662170410156, 445.9654541015625, 606.9646606445312, 767.9638671875, 928.963134765625, 1089.9622802734375, 1250.9615478515625, 1411.9608154296875, 1572.9599609375, 1733.959228515625, 1894.95849609375, 2055.95751953125, 2216.95703125, 2377.9560546875, 2538.955322265625, 2699.95458984375, 2860.953857421875, 3021.953125, 3182.9521484375, 3343.951416015625, 3504.95068359375, 3665.94970703125, 3826.94873046875, 3987.947998046875, 4148.947265625, 4309.9462890625, 4470.94580078125, 4631.94482421875, 4792.9443359375, 4953.943359375, 5114.9423828125, 5275.94140625, 5436.94091796875, 5597.93994140625, 5758.939453125, 5919.9384765625, 6080.9375, 6241.93701171875, 6402.9365234375, 6563.935546875, 6724.93505859375, 6885.93408203125, 7046.93359375, 7207.9326171875, 7368.931640625, 7529.93115234375, 7690.93017578125, 7851.92919921875, 8012.9287109375, 8173.927734375, 8334.9267578125, 8495.92578125, 8656.92578125, 8817.9248046875, 8978.923828125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 11.0, 4.0, 5.0, 4.0, 7.0, 9.0, 17.0, 8.0, 18.0, 19.0, 19.0, 25.0, 25.0, 32.0, 24.0, 27.0, 34.0, 39.0, 50.0, 34.0, 57.0, 52.0, 50.0, 51.0, 41.0, 44.0, 40.0, 24.0, 38.0, 25.0, 35.0, 23.0, 13.0, 24.0, 16.0, 8.0, 9.0, 7.0, 7.0, 9.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-795.8304443359375, -770.4745483398438, -745.1187133789062, -719.7628173828125, -694.406982421875, -669.0510864257812, -643.6952514648438, -618.33935546875, -592.9835205078125, -567.6276245117188, -542.2717895507812, -516.9158935546875, -491.56005859375, -466.2041931152344, -440.84832763671875, -415.492431640625, -390.1365661621094, -364.78070068359375, -339.4248352050781, -314.0689697265625, -288.7131042480469, -263.35723876953125, -238.00135803222656, -212.64549255371094, -187.2896270751953, -161.9337615966797, -136.57789611816406, -111.2220230102539, -85.86615753173828, -60.510292053222656, -35.1544189453125, -9.798553466796875, 15.55731201171875, 40.913177490234375, 66.26904296875, 91.62491607666016, 116.98078155517578, 142.33663940429688, 167.69252014160156, 193.0483856201172, 218.4042510986328, 243.76011657714844, 269.1159973144531, 294.47186279296875, 319.8277282714844, 345.18359375, 370.5394592285156, 395.89532470703125, 421.2511901855469, 446.6070556640625, 471.9629211425781, 497.31878662109375, 522.6746826171875, 548.030517578125, 573.3864135742188, 598.7422485351562, 624.09814453125, 649.4540405273438, 674.8098754882812, 700.165771484375, 725.5216064453125, 750.8775024414062, 776.2333374023438, 801.5892333984375, 826.945068359375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 9.0, 18.0, 19.0, 33.0, 37.0, 61.0, 109.0, 145.0, 217.0, 345.0, 543.0, 887.0, 1516.0, 2699.0, 5034.0, 9780.0, 19612.0, 41800.0, 93534.0, 237262.0, 357681.0, 152782.0, 64383.0, 29486.0, 14233.0, 7151.0, 3899.0, 2121.0, 1202.0, 706.0, 441.0, 258.0, 182.0, 124.0, 77.0, 69.0, 31.0, 19.0, 19.0, 9.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-104.8125, -101.4609375, -98.109375, -94.7578125, -91.40625, -88.0546875, -84.703125, -81.3515625, -78.0, -74.6484375, -71.296875, -67.9453125, -64.59375, -61.2421875, -57.890625, -54.5390625, -51.1875, -47.8359375, -44.484375, -41.1328125, -37.78125, -34.4296875, -31.078125, -27.7265625, -24.375, -21.0234375, -17.671875, -14.3203125, -10.96875, -7.6171875, -4.265625, -0.9140625, 2.4375, 5.7890625, 9.140625, 12.4921875, 15.84375, 19.1953125, 22.546875, 25.8984375, 29.25, 32.6015625, 35.953125, 39.3046875, 42.65625, 46.0078125, 49.359375, 52.7109375, 56.0625, 59.4140625, 62.765625, 66.1171875, 69.46875, 72.8203125, 76.171875, 79.5234375, 82.875, 86.2265625, 89.578125, 92.9296875, 96.28125, 99.6328125, 102.984375, 106.3359375, 109.6875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 9.0, 3.0, 15.0, 13.0, 21.0, 20.0, 23.0, 28.0, 46.0, 31.0, 48.0, 50.0, 54.0, 52.0, 57.0, 53.0, 54.0, 49.0, 49.0, 46.0, 47.0, 44.0, 39.0, 24.0, 23.0, 24.0, 17.0, 9.0, 13.0, 10.0, 10.0, 5.0, 9.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.25, -65.7763671875, -63.302734375, -60.8291015625, -58.35546875, -55.8818359375, -53.408203125, -50.9345703125, -48.4609375, -45.9873046875, -43.513671875, -41.0400390625, -38.56640625, -36.0927734375, -33.619140625, -31.1455078125, -28.671875, -26.1982421875, -23.724609375, -21.2509765625, -18.77734375, -16.3037109375, -13.830078125, -11.3564453125, -8.8828125, -6.4091796875, -3.935546875, -1.4619140625, 1.01171875, 3.4853515625, 5.958984375, 8.4326171875, 10.90625, 13.3798828125, 15.853515625, 18.3271484375, 20.80078125, 23.2744140625, 25.748046875, 28.2216796875, 30.6953125, 33.1689453125, 35.642578125, 38.1162109375, 40.58984375, 43.0634765625, 45.537109375, 48.0107421875, 50.484375, 52.9580078125, 55.431640625, 57.9052734375, 60.37890625, 62.8525390625, 65.326171875, 67.7998046875, 70.2734375, 72.7470703125, 75.220703125, 77.6943359375, 80.16796875, 82.6416015625, 85.115234375, 87.5888671875, 90.0625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 6.0, 13.0, 11.0, 28.0, 32.0, 40.0, 70.0, 109.0, 185.0, 284.0, 445.0, 871.0, 1825.0, 5308.0, 24887.0, 236698.0, 708712.0, 54884.0, 8888.0, 2598.0, 1095.0, 601.0, 344.0, 208.0, 134.0, 97.0, 64.0, 38.0, 20.0, 18.0, 11.0, 8.0, 5.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-331.0, -321.3203125, -311.640625, -301.9609375, -292.28125, -282.6015625, -272.921875, -263.2421875, -253.5625, -243.8828125, -234.203125, -224.5234375, -214.84375, -205.1640625, -195.484375, -185.8046875, -176.125, -166.4453125, -156.765625, -147.0859375, -137.40625, -127.7265625, -118.046875, -108.3671875, -98.6875, -89.0078125, -79.328125, -69.6484375, -59.96875, -50.2890625, -40.609375, -30.9296875, -21.25, -11.5703125, -1.890625, 7.7890625, 17.46875, 27.1484375, 36.828125, 46.5078125, 56.1875, 65.8671875, 75.546875, 85.2265625, 94.90625, 104.5859375, 114.265625, 123.9453125, 133.625, 143.3046875, 152.984375, 162.6640625, 172.34375, 182.0234375, 191.703125, 201.3828125, 211.0625, 220.7421875, 230.421875, 240.1015625, 249.78125, 259.4609375, 269.140625, 278.8203125, 288.5]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 9.0, 19.0, 25.0, 21.0, 37.0, 46.0, 45.0, 47.0, 68.0, 48.0, 68.0, 64.0, 60.0, 60.0, 69.0, 55.0, 41.0, 44.0, 39.0, 21.0, 24.0, 28.0, 17.0, 16.0, 10.0, 4.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-299.75, -287.78125, -275.8125, -263.84375, -251.875, -239.90625, -227.9375, -215.96875, -204.0, -192.03125, -180.0625, -168.09375, -156.125, -144.15625, -132.1875, -120.21875, -108.25, -96.28125, -84.3125, -72.34375, -60.375, -48.40625, -36.4375, -24.46875, -12.5, -0.53125, 11.4375, 23.40625, 35.375, 47.34375, 59.3125, 71.28125, 83.25, 95.21875, 107.1875, 119.15625, 131.125, 143.09375, 155.0625, 167.03125, 179.0, 190.96875, 202.9375, 214.90625, 226.875, 238.84375, 250.8125, 262.78125, 274.75, 286.71875, 298.6875, 310.65625, 322.625, 334.59375, 346.5625, 358.53125, 370.5, 382.46875, 394.4375, 406.40625, 418.375, 430.34375, 442.3125, 454.28125, 466.25]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 8.0, 6.0, 4.0, 8.0, 12.0, 21.0, 19.0, 29.0, 42.0, 73.0, 117.0, 181.0, 307.0, 489.0, 1037.0, 2349.0, 5822.0, 18135.0, 82304.0, 583264.0, 283092.0, 50661.0, 12485.0, 4330.0, 1777.0, 820.0, 444.0, 257.0, 148.0, 96.0, 59.0, 38.0, 23.0, 24.0, 21.0, 10.0, 8.0, 5.0, 10.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-63.3125, -61.38525390625, -59.4580078125, -57.53076171875, -55.603515625, -53.67626953125, -51.7490234375, -49.82177734375, -47.89453125, -45.96728515625, -44.0400390625, -42.11279296875, -40.185546875, -38.25830078125, -36.3310546875, -34.40380859375, -32.4765625, -30.54931640625, -28.6220703125, -26.69482421875, -24.767578125, -22.84033203125, -20.9130859375, -18.98583984375, -17.05859375, -15.13134765625, -13.2041015625, -11.27685546875, -9.349609375, -7.42236328125, -5.4951171875, -3.56787109375, -1.640625, 0.28662109375, 2.2138671875, 4.14111328125, 6.068359375, 7.99560546875, 9.9228515625, 11.85009765625, 13.77734375, 15.70458984375, 17.6318359375, 19.55908203125, 21.486328125, 23.41357421875, 25.3408203125, 27.26806640625, 29.1953125, 31.12255859375, 33.0498046875, 34.97705078125, 36.904296875, 38.83154296875, 40.7587890625, 42.68603515625, 44.61328125, 46.54052734375, 48.4677734375, 50.39501953125, 52.322265625, 54.24951171875, 56.1767578125, 58.10400390625, 60.03125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 3.0, 6.0, 8.0, 8.0, 9.0, 17.0, 34.0, 37.0, 52.0, 74.0, 96.0, 116.0, 142.0, 109.0, 72.0, 66.0, 54.0, 24.0, 19.0, 12.0, 9.0, 5.0, 9.0, 4.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.0390625, -0.038178443908691406, -0.03729438781738281, -0.03641033172607422, -0.035526275634765625, -0.03464221954345703, -0.03375816345214844, -0.032874107360839844, -0.03199005126953125, -0.031105995178222656, -0.030221939086914062, -0.02933788299560547, -0.028453826904296875, -0.02756977081298828, -0.026685714721679688, -0.025801658630371094, -0.0249176025390625, -0.024033546447753906, -0.023149490356445312, -0.02226543426513672, -0.021381378173828125, -0.02049732208251953, -0.019613265991210938, -0.018729209899902344, -0.01784515380859375, -0.016961097717285156, -0.016077041625976562, -0.015192985534667969, -0.014308929443359375, -0.013424873352050781, -0.012540817260742188, -0.011656761169433594, -0.010772705078125, -0.009888648986816406, -0.009004592895507812, -0.008120536804199219, -0.007236480712890625, -0.006352424621582031, -0.0054683685302734375, -0.004584312438964844, -0.00370025634765625, -0.0028162002563476562, -0.0019321441650390625, -0.0010480880737304688, -0.000164031982421875, 0.0007200241088867188, 0.0016040802001953125, 0.0024881362915039062, 0.0033721923828125, 0.004256248474121094, 0.0051403045654296875, 0.006024360656738281, 0.006908416748046875, 0.007792472839355469, 0.008676528930664062, 0.009560585021972656, 0.01044464111328125, 0.011328697204589844, 0.012212753295898438, 0.013096809387207031, 0.013980865478515625, 0.014864921569824219, 0.015748977661132812, 0.016633033752441406, 0.01751708984375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 6.0, 12.0, 16.0, 16.0, 41.0, 76.0, 188.0, 471.0, 1364.0, 6576.0, 119533.0, 881243.0, 34024.0, 3517.0, 890.0, 294.0, 148.0, 59.0, 26.0, 20.0, 14.0, 14.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.625, -96.48828125, -92.3515625, -88.21484375, -84.078125, -79.94140625, -75.8046875, -71.66796875, -67.53125, -63.39453125, -59.2578125, -55.12109375, -50.984375, -46.84765625, -42.7109375, -38.57421875, -34.4375, -30.30078125, -26.1640625, -22.02734375, -17.890625, -13.75390625, -9.6171875, -5.48046875, -1.34375, 2.79296875, 6.9296875, 11.06640625, 15.203125, 19.33984375, 23.4765625, 27.61328125, 31.75, 35.88671875, 40.0234375, 44.16015625, 48.296875, 52.43359375, 56.5703125, 60.70703125, 64.84375, 68.98046875, 73.1171875, 77.25390625, 81.390625, 85.52734375, 89.6640625, 93.80078125, 97.9375, 102.07421875, 106.2109375, 110.34765625, 114.484375, 118.62109375, 122.7578125, 126.89453125, 131.03125, 135.16796875, 139.3046875, 143.44140625, 147.578125, 151.71484375, 155.8515625, 159.98828125, 164.125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 8.0, 14.0, 17.0, 22.0, 31.0, 27.0, 46.0, 45.0, 52.0, 48.0, 66.0, 77.0, 75.0, 74.0, 64.0, 57.0, 57.0, 40.0, 42.0, 41.0, 28.0, 15.0, 15.0, 9.0, 7.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.1875, -58.33935546875, -56.4912109375, -54.64306640625, -52.794921875, -50.94677734375, -49.0986328125, -47.25048828125, -45.40234375, -43.55419921875, -41.7060546875, -39.85791015625, -38.009765625, -36.16162109375, -34.3134765625, -32.46533203125, -30.6171875, -28.76904296875, -26.9208984375, -25.07275390625, -23.224609375, -21.37646484375, -19.5283203125, -17.68017578125, -15.83203125, -13.98388671875, -12.1357421875, -10.28759765625, -8.439453125, -6.59130859375, -4.7431640625, -2.89501953125, -1.046875, 0.80126953125, 2.6494140625, 4.49755859375, 6.345703125, 8.19384765625, 10.0419921875, 11.89013671875, 13.73828125, 15.58642578125, 17.4345703125, 19.28271484375, 21.130859375, 22.97900390625, 24.8271484375, 26.67529296875, 28.5234375, 30.37158203125, 32.2197265625, 34.06787109375, 35.916015625, 37.76416015625, 39.6123046875, 41.46044921875, 43.30859375, 45.15673828125, 47.0048828125, 48.85302734375, 50.701171875, 52.54931640625, 54.3974609375, 56.24560546875, 58.09375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 8.0, 29.0, 58.0, 157.0, 324.0, 244.0, 95.0, 50.0, 14.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2960.052978515625, -2874.81982421875, -2789.586669921875, -2704.353515625, -2619.120361328125, -2533.88720703125, -2448.654052734375, -2363.4208984375, -2278.187744140625, -2192.95458984375, -2107.721435546875, -2022.48828125, -1937.255126953125, -1852.02197265625, -1766.788818359375, -1681.5556640625, -1596.322509765625, -1511.08935546875, -1425.856201171875, -1340.623046875, -1255.389892578125, -1170.15673828125, -1084.923583984375, -999.6904296875, -914.457275390625, -829.22412109375, -743.990966796875, -658.7578125, -573.524658203125, -488.29150390625, -403.058349609375, -317.8251953125, -232.592041015625, -147.35888671875, -62.125732421875, 23.107421875, 108.340576171875, 193.57373046875, 278.806884765625, 364.0400390625, 449.273193359375, 534.50634765625, 619.739501953125, 704.97265625, 790.205810546875, 875.43896484375, 960.672119140625, 1045.9052734375, 1131.138427734375, 1216.37158203125, 1301.604736328125, 1386.837890625, 1472.071044921875, 1557.30419921875, 1642.537353515625, 1727.7705078125, 1813.003662109375, 1898.23681640625, 1983.469970703125, 2068.703125, 2153.936279296875, 2239.16943359375, 2324.402587890625, 2409.6357421875, 2494.868896484375]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 5.0, 6.0, 12.0, 9.0, 13.0, 12.0, 14.0, 12.0, 14.0, 14.0, 26.0, 32.0, 32.0, 38.0, 30.0, 33.0, 47.0, 51.0, 57.0, 82.0, 61.0, 47.0, 39.0, 29.0, 30.0, 23.0, 33.0, 22.0, 35.0, 21.0, 21.0, 15.0, 9.0, 13.0, 14.0, 9.0, 7.0, 5.0, 5.0, 7.0, 1.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1181.378662109375, -1148.8143310546875, -1116.25, -1083.685791015625, -1051.1214599609375, -1018.55712890625, -985.9927978515625, -953.428466796875, -920.8641967773438, -888.2998657226562, -855.735595703125, -823.1712646484375, -790.60693359375, -758.0426635742188, -725.4783325195312, -692.9140625, -660.3497314453125, -627.785400390625, -595.2211303710938, -562.6567993164062, -530.092529296875, -497.5281982421875, -464.9638671875, -432.3995666503906, -399.83526611328125, -367.2709655761719, -334.7066650390625, -302.142333984375, -269.5780334472656, -237.01373291015625, -204.4494171142578, -171.88510131835938, -139.32086181640625, -106.75655364990234, -74.19224548339844, -41.62793731689453, -9.063629150390625, 23.50067138671875, 56.06498718261719, 88.62930297851562, 121.193603515625, 153.75790405273438, 186.3222198486328, 218.88653564453125, 251.45083618164062, 284.01513671875, 316.5794677734375, 349.1437683105469, 381.70806884765625, 414.2723693847656, 446.836669921875, 479.4010009765625, 511.9653015136719, 544.5296020507812, 577.0939331054688, 609.658203125, 642.2225341796875, 674.786865234375, 707.3511352539062, 739.9154663085938, 772.479736328125, 805.0440673828125, 837.6083984375, 870.1727294921875, 902.7369995117188]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 11.0, 9.0, 22.0, 33.0, 46.0, 60.0, 78.0, 146.0, 228.0, 406.0, 697.0, 1339.0, 2702.0, 6160.0, 16755.0, 69253.0, 536323.0, 2578308.0, 847198.0, 98720.0, 21584.0, 7502.0, 3215.0, 1529.0, 789.0, 438.0, 244.0, 149.0, 83.0, 77.0, 44.0, 32.0, 25.0, 18.0, 15.0, 7.0, 5.0, 6.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.5625, -97.380859375, -94.19921875, -91.017578125, -87.8359375, -84.654296875, -81.47265625, -78.291015625, -75.109375, -71.927734375, -68.74609375, -65.564453125, -62.3828125, -59.201171875, -56.01953125, -52.837890625, -49.65625, -46.474609375, -43.29296875, -40.111328125, -36.9296875, -33.748046875, -30.56640625, -27.384765625, -24.203125, -21.021484375, -17.83984375, -14.658203125, -11.4765625, -8.294921875, -5.11328125, -1.931640625, 1.25, 4.431640625, 7.61328125, 10.794921875, 13.9765625, 17.158203125, 20.33984375, 23.521484375, 26.703125, 29.884765625, 33.06640625, 36.248046875, 39.4296875, 42.611328125, 45.79296875, 48.974609375, 52.15625, 55.337890625, 58.51953125, 61.701171875, 64.8828125, 68.064453125, 71.24609375, 74.427734375, 77.609375, 80.791015625, 83.97265625, 87.154296875, 90.3359375, 93.517578125, 96.69921875, 99.880859375, 103.0625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 7.0, 6.0, 8.0, 14.0, 16.0, 18.0, 26.0, 29.0, 35.0, 28.0, 30.0, 40.0, 30.0, 35.0, 44.0, 50.0, 42.0, 57.0, 52.0, 36.0, 46.0, 41.0, 35.0, 35.0, 29.0, 32.0, 34.0, 23.0, 21.0, 21.0, 12.0, 16.0, 10.0, 7.0, 4.0, 11.0, 9.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.90625, -61.87841796875, -59.8505859375, -57.82275390625, -55.794921875, -53.76708984375, -51.7392578125, -49.71142578125, -47.68359375, -45.65576171875, -43.6279296875, -41.60009765625, -39.572265625, -37.54443359375, -35.5166015625, -33.48876953125, -31.4609375, -29.43310546875, -27.4052734375, -25.37744140625, -23.349609375, -21.32177734375, -19.2939453125, -17.26611328125, -15.23828125, -13.21044921875, -11.1826171875, -9.15478515625, -7.126953125, -5.09912109375, -3.0712890625, -1.04345703125, 0.984375, 3.01220703125, 5.0400390625, 7.06787109375, 9.095703125, 11.12353515625, 13.1513671875, 15.17919921875, 17.20703125, 19.23486328125, 21.2626953125, 23.29052734375, 25.318359375, 27.34619140625, 29.3740234375, 31.40185546875, 33.4296875, 35.45751953125, 37.4853515625, 39.51318359375, 41.541015625, 43.56884765625, 45.5966796875, 47.62451171875, 49.65234375, 51.68017578125, 53.7080078125, 55.73583984375, 57.763671875, 59.79150390625, 61.8193359375, 63.84716796875, 65.875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 7.0, 17.0, 24.0, 27.0, 53.0, 78.0, 114.0, 220.0, 532.0, 1393.0, 4674.0, 22882.0, 278022.0, 3724162.0, 140391.0, 16005.0, 3623.0, 1148.0, 460.0, 181.0, 108.0, 47.0, 37.0, 18.0, 13.0, 7.0, 9.0, 6.0, 7.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-275.0, -267.23046875, -259.4609375, -251.69140625, -243.921875, -236.15234375, -228.3828125, -220.61328125, -212.84375, -205.07421875, -197.3046875, -189.53515625, -181.765625, -173.99609375, -166.2265625, -158.45703125, -150.6875, -142.91796875, -135.1484375, -127.37890625, -119.609375, -111.83984375, -104.0703125, -96.30078125, -88.53125, -80.76171875, -72.9921875, -65.22265625, -57.453125, -49.68359375, -41.9140625, -34.14453125, -26.375, -18.60546875, -10.8359375, -3.06640625, 4.703125, 12.47265625, 20.2421875, 28.01171875, 35.78125, 43.55078125, 51.3203125, 59.08984375, 66.859375, 74.62890625, 82.3984375, 90.16796875, 97.9375, 105.70703125, 113.4765625, 121.24609375, 129.015625, 136.78515625, 144.5546875, 152.32421875, 160.09375, 167.86328125, 175.6328125, 183.40234375, 191.171875, 198.94140625, 206.7109375, 214.48046875, 222.25]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 7.0, 13.0, 16.0, 13.0, 17.0, 28.0, 36.0, 49.0, 82.0, 136.0, 217.0, 428.0, 651.0, 800.0, 598.0, 369.0, 189.0, 129.0, 70.0, 60.0, 35.0, 22.0, 22.0, 13.0, 12.0, 11.0, 11.0, 14.0, 3.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-208.625, -203.05078125, -197.4765625, -191.90234375, -186.328125, -180.75390625, -175.1796875, -169.60546875, -164.03125, -158.45703125, -152.8828125, -147.30859375, -141.734375, -136.16015625, -130.5859375, -125.01171875, -119.4375, -113.86328125, -108.2890625, -102.71484375, -97.140625, -91.56640625, -85.9921875, -80.41796875, -74.84375, -69.26953125, -63.6953125, -58.12109375, -52.546875, -46.97265625, -41.3984375, -35.82421875, -30.25, -24.67578125, -19.1015625, -13.52734375, -7.953125, -2.37890625, 3.1953125, 8.76953125, 14.34375, 19.91796875, 25.4921875, 31.06640625, 36.640625, 42.21484375, 47.7890625, 53.36328125, 58.9375, 64.51171875, 70.0859375, 75.66015625, 81.234375, 86.80859375, 92.3828125, 97.95703125, 103.53125, 109.10546875, 114.6796875, 120.25390625, 125.828125, 131.40234375, 136.9765625, 142.55078125, 148.125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 6.0, 4.0, 5.0, 14.0, 33.0, 62.0, 166.0, 259.0, 198.0, 133.0, 55.0, 26.0, 20.0, 8.0, 1.0, 1.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1606.7406005859375, -1539.2440185546875, -1471.74755859375, -1404.2509765625, -1336.75439453125, -1269.2578125, -1201.7613525390625, -1134.2647705078125, -1066.768310546875, -999.2717895507812, -931.7752075195312, -864.2786865234375, -796.7821044921875, -729.2855834960938, -661.7890625, -594.29248046875, -526.7958984375, -459.2993469238281, -391.80279541015625, -324.3062744140625, -256.8097229003906, -189.31317138671875, -121.816650390625, -54.320098876953125, 13.17645263671875, 80.6729965209961, 148.16954040527344, 215.66607666015625, 283.1626281738281, 350.6591796875, 418.15570068359375, 485.6522521972656, 553.148681640625, 620.6452026367188, 688.1417846679688, 755.6383056640625, 823.1348876953125, 890.6314086914062, 958.1279296875, 1025.62451171875, 1093.12109375, 1160.61767578125, 1228.1141357421875, 1295.6107177734375, 1363.1072998046875, 1430.603759765625, 1498.100341796875, 1565.596923828125, 1633.0933837890625, 1700.5899658203125, 1768.08642578125, 1835.5830078125, 1903.07958984375, 1970.576171875, 2038.0726318359375, 2105.569091796875, 2173.065673828125, 2240.562255859375, 2308.058837890625, 2375.55517578125, 2443.0517578125, 2510.54833984375, 2578.044921875, 2645.54150390625, 2713.0380859375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 14.0, 10.0, 16.0, 15.0, 18.0, 23.0, 23.0, 26.0, 35.0, 33.0, 29.0, 50.0, 36.0, 50.0, 46.0, 44.0, 55.0, 51.0, 52.0, 47.0, 49.0, 35.0, 39.0, 29.0, 33.0, 21.0, 23.0, 16.0, 18.0, 12.0, 13.0, 11.0, 5.0, 3.0, 8.0, 1.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-986.668701171875, -959.8295288085938, -932.9903564453125, -906.1511840820312, -879.31201171875, -852.472900390625, -825.6337280273438, -798.7945556640625, -771.9553833007812, -745.1162109375, -718.2770385742188, -691.4378662109375, -664.5987548828125, -637.759521484375, -610.92041015625, -584.0812377929688, -557.2420654296875, -530.4028930664062, -503.563720703125, -476.7245788574219, -449.8854064941406, -423.0462341308594, -396.20709228515625, -369.367919921875, -342.52874755859375, -315.6895751953125, -288.85040283203125, -262.0112609863281, -235.17208862304688, -208.33291625976562, -181.49375915527344, -154.65460205078125, -127.81549072265625, -100.97632598876953, -74.13716125488281, -47.297996520996094, -20.458831787109375, 6.380340576171875, 33.21949768066406, 60.05865478515625, 86.8978271484375, 113.73699188232422, 140.57615661621094, 167.41531372070312, 194.25448608398438, 221.09365844726562, 247.9328155517578, 274.77197265625, 301.61114501953125, 328.4503173828125, 355.28948974609375, 382.1286315917969, 408.9678039550781, 435.8069763183594, 462.6461181640625, 489.48529052734375, 516.324462890625, 543.1636352539062, 570.0028076171875, 596.8419799804688, 623.68115234375, 650.520263671875, 677.3594360351562, 704.1986083984375, 731.0377807617188]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 11.0, 15.0, 23.0, 39.0, 36.0, 92.0, 131.0, 232.0, 414.0, 704.0, 1363.0, 2469.0, 5103.0, 10753.0, 24717.0, 61592.0, 163224.0, 352961.0, 256356.0, 99008.0, 38369.0, 16187.0, 7175.0, 3538.0, 1733.0, 981.0, 539.0, 314.0, 170.0, 112.0, 83.0, 47.0, 23.0, 10.0, 14.0, 7.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-68.4375, -65.779296875, -63.12109375, -60.462890625, -57.8046875, -55.146484375, -52.48828125, -49.830078125, -47.171875, -44.513671875, -41.85546875, -39.197265625, -36.5390625, -33.880859375, -31.22265625, -28.564453125, -25.90625, -23.248046875, -20.58984375, -17.931640625, -15.2734375, -12.615234375, -9.95703125, -7.298828125, -4.640625, -1.982421875, 0.67578125, 3.333984375, 5.9921875, 8.650390625, 11.30859375, 13.966796875, 16.625, 19.283203125, 21.94140625, 24.599609375, 27.2578125, 29.916015625, 32.57421875, 35.232421875, 37.890625, 40.548828125, 43.20703125, 45.865234375, 48.5234375, 51.181640625, 53.83984375, 56.498046875, 59.15625, 61.814453125, 64.47265625, 67.130859375, 69.7890625, 72.447265625, 75.10546875, 77.763671875, 80.421875, 83.080078125, 85.73828125, 88.396484375, 91.0546875, 93.712890625, 96.37109375, 99.029296875, 101.6875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 5.0, 7.0, 7.0, 10.0, 17.0, 19.0, 27.0, 17.0, 27.0, 31.0, 30.0, 35.0, 35.0, 43.0, 46.0, 53.0, 43.0, 62.0, 47.0, 47.0, 49.0, 44.0, 38.0, 30.0, 38.0, 23.0, 27.0, 19.0, 25.0, 16.0, 14.0, 18.0, 12.0, 11.0, 7.0, 5.0, 6.0, 2.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.125, -71.9541015625, -69.783203125, -67.6123046875, -65.44140625, -63.2705078125, -61.099609375, -58.9287109375, -56.7578125, -54.5869140625, -52.416015625, -50.2451171875, -48.07421875, -45.9033203125, -43.732421875, -41.5615234375, -39.390625, -37.2197265625, -35.048828125, -32.8779296875, -30.70703125, -28.5361328125, -26.365234375, -24.1943359375, -22.0234375, -19.8525390625, -17.681640625, -15.5107421875, -13.33984375, -11.1689453125, -8.998046875, -6.8271484375, -4.65625, -2.4853515625, -0.314453125, 1.8564453125, 4.02734375, 6.1982421875, 8.369140625, 10.5400390625, 12.7109375, 14.8818359375, 17.052734375, 19.2236328125, 21.39453125, 23.5654296875, 25.736328125, 27.9072265625, 30.078125, 32.2490234375, 34.419921875, 36.5908203125, 38.76171875, 40.9326171875, 43.103515625, 45.2744140625, 47.4453125, 49.6162109375, 51.787109375, 53.9580078125, 56.12890625, 58.2998046875, 60.470703125, 62.6416015625, 64.8125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 3.0, 8.0, 12.0, 24.0, 38.0, 65.0, 155.0, 481.0, 1544.0, 9270.0, 166689.0, 834431.0, 31023.0, 3473.0, 835.0, 281.0, 94.0, 64.0, 27.0, 13.0, 14.0, 8.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-267.25, -256.2265625, -245.203125, -234.1796875, -223.15625, -212.1328125, -201.109375, -190.0859375, -179.0625, -168.0390625, -157.015625, -145.9921875, -134.96875, -123.9453125, -112.921875, -101.8984375, -90.875, -79.8515625, -68.828125, -57.8046875, -46.78125, -35.7578125, -24.734375, -13.7109375, -2.6875, 8.3359375, 19.359375, 30.3828125, 41.40625, 52.4296875, 63.453125, 74.4765625, 85.5, 96.5234375, 107.546875, 118.5703125, 129.59375, 140.6171875, 151.640625, 162.6640625, 173.6875, 184.7109375, 195.734375, 206.7578125, 217.78125, 228.8046875, 239.828125, 250.8515625, 261.875, 272.8984375, 283.921875, 294.9453125, 305.96875, 316.9921875, 328.015625, 339.0390625, 350.0625, 361.0859375, 372.109375, 383.1328125, 394.15625, 405.1796875, 416.203125, 427.2265625, 438.25]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 11.0, 9.0, 23.0, 21.0, 44.0, 59.0, 72.0, 73.0, 80.0, 88.0, 80.0, 87.0, 60.0, 60.0, 48.0, 42.0, 40.0, 41.0, 17.0, 14.0, 6.0, 11.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-467.0, -454.046875, -441.09375, -428.140625, -415.1875, -402.234375, -389.28125, -376.328125, -363.375, -350.421875, -337.46875, -324.515625, -311.5625, -298.609375, -285.65625, -272.703125, -259.75, -246.796875, -233.84375, -220.890625, -207.9375, -194.984375, -182.03125, -169.078125, -156.125, -143.171875, -130.21875, -117.265625, -104.3125, -91.359375, -78.40625, -65.453125, -52.5, -39.546875, -26.59375, -13.640625, -0.6875, 12.265625, 25.21875, 38.171875, 51.125, 64.078125, 77.03125, 89.984375, 102.9375, 115.890625, 128.84375, 141.796875, 154.75, 167.703125, 180.65625, 193.609375, 206.5625, 219.515625, 232.46875, 245.421875, 258.375, 271.328125, 284.28125, 297.234375, 310.1875, 323.140625, 336.09375, 349.046875, 362.0]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 8.0, 17.0, 18.0, 35.0, 70.0, 106.0, 229.0, 414.0, 907.0, 2309.0, 6156.0, 21591.0, 96446.0, 596482.0, 253661.0, 50463.0, 12662.0, 4040.0, 1513.0, 692.0, 326.0, 173.0, 77.0, 54.0, 25.0, 27.0, 18.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.125, -45.5947265625, -44.064453125, -42.5341796875, -41.00390625, -39.4736328125, -37.943359375, -36.4130859375, -34.8828125, -33.3525390625, -31.822265625, -30.2919921875, -28.76171875, -27.2314453125, -25.701171875, -24.1708984375, -22.640625, -21.1103515625, -19.580078125, -18.0498046875, -16.51953125, -14.9892578125, -13.458984375, -11.9287109375, -10.3984375, -8.8681640625, -7.337890625, -5.8076171875, -4.27734375, -2.7470703125, -1.216796875, 0.3134765625, 1.84375, 3.3740234375, 4.904296875, 6.4345703125, 7.96484375, 9.4951171875, 11.025390625, 12.5556640625, 14.0859375, 15.6162109375, 17.146484375, 18.6767578125, 20.20703125, 21.7373046875, 23.267578125, 24.7978515625, 26.328125, 27.8583984375, 29.388671875, 30.9189453125, 32.44921875, 33.9794921875, 35.509765625, 37.0400390625, 38.5703125, 40.1005859375, 41.630859375, 43.1611328125, 44.69140625, 46.2216796875, 47.751953125, 49.2822265625, 50.8125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 3.0, 8.0, 11.0, 10.0, 17.0, 36.0, 29.0, 46.0, 67.0, 90.0, 115.0, 109.0, 92.0, 81.0, 75.0, 59.0, 36.0, 30.0, 23.0, 19.0, 12.0, 12.0, 7.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0142059326171875, -0.013648748397827148, -0.013091564178466797, -0.012534379959106445, -0.011977195739746094, -0.011420011520385742, -0.01086282730102539, -0.010305643081665039, -0.009748458862304688, -0.009191274642944336, -0.008634090423583984, -0.008076906204223633, -0.007519721984863281, -0.00696253776550293, -0.006405353546142578, -0.0058481693267822266, -0.005290985107421875, -0.0047338008880615234, -0.004176616668701172, -0.0036194324493408203, -0.0030622482299804688, -0.002505064010620117, -0.0019478797912597656, -0.001390695571899414, -0.0008335113525390625, -0.00027632713317871094, 0.0002808570861816406, 0.0008380413055419922, 0.0013952255249023438, 0.0019524097442626953, 0.002509593963623047, 0.0030667781829833984, 0.00362396240234375, 0.0041811466217041016, 0.004738330841064453, 0.005295515060424805, 0.005852699279785156, 0.006409883499145508, 0.006967067718505859, 0.007524251937866211, 0.008081436157226562, 0.008638620376586914, 0.009195804595947266, 0.009752988815307617, 0.010310173034667969, 0.01086735725402832, 0.011424541473388672, 0.011981725692749023, 0.012538909912109375, 0.013096094131469727, 0.013653278350830078, 0.01421046257019043, 0.014767646789550781, 0.015324831008911133, 0.015882015228271484, 0.016439199447631836, 0.016996383666992188, 0.01755356788635254, 0.01811075210571289, 0.018667936325073242, 0.019225120544433594, 0.019782304763793945, 0.020339488983154297, 0.02089667320251465, 0.021453857421875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 6.0, 4.0, 3.0, 7.0, 19.0, 13.0, 25.0, 30.0, 50.0, 96.0, 172.0, 307.0, 710.0, 1808.0, 5350.0, 18402.0, 85722.0, 576002.0, 285429.0, 55109.0, 12882.0, 3807.0, 1420.0, 584.0, 253.0, 117.0, 64.0, 48.0, 39.0, 29.0, 10.0, 9.0, 9.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-54.0, -52.4052734375, -50.810546875, -49.2158203125, -47.62109375, -46.0263671875, -44.431640625, -42.8369140625, -41.2421875, -39.6474609375, -38.052734375, -36.4580078125, -34.86328125, -33.2685546875, -31.673828125, -30.0791015625, -28.484375, -26.8896484375, -25.294921875, -23.7001953125, -22.10546875, -20.5107421875, -18.916015625, -17.3212890625, -15.7265625, -14.1318359375, -12.537109375, -10.9423828125, -9.34765625, -7.7529296875, -6.158203125, -4.5634765625, -2.96875, -1.3740234375, 0.220703125, 1.8154296875, 3.41015625, 5.0048828125, 6.599609375, 8.1943359375, 9.7890625, 11.3837890625, 12.978515625, 14.5732421875, 16.16796875, 17.7626953125, 19.357421875, 20.9521484375, 22.546875, 24.1416015625, 25.736328125, 27.3310546875, 28.92578125, 30.5205078125, 32.115234375, 33.7099609375, 35.3046875, 36.8994140625, 38.494140625, 40.0888671875, 41.68359375, 43.2783203125, 44.873046875, 46.4677734375, 48.0625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 9.0, 12.0, 11.0, 19.0, 13.0, 29.0, 33.0, 43.0, 44.0, 43.0, 51.0, 73.0, 89.0, 67.0, 58.0, 67.0, 61.0, 58.0, 42.0, 40.0, 28.0, 29.0, 11.0, 15.0, 11.0, 8.0, 7.0, 8.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-47.625, -46.1416015625, -44.658203125, -43.1748046875, -41.69140625, -40.2080078125, -38.724609375, -37.2412109375, -35.7578125, -34.2744140625, -32.791015625, -31.3076171875, -29.82421875, -28.3408203125, -26.857421875, -25.3740234375, -23.890625, -22.4072265625, -20.923828125, -19.4404296875, -17.95703125, -16.4736328125, -14.990234375, -13.5068359375, -12.0234375, -10.5400390625, -9.056640625, -7.5732421875, -6.08984375, -4.6064453125, -3.123046875, -1.6396484375, -0.15625, 1.3271484375, 2.810546875, 4.2939453125, 5.77734375, 7.2607421875, 8.744140625, 10.2275390625, 11.7109375, 13.1943359375, 14.677734375, 16.1611328125, 17.64453125, 19.1279296875, 20.611328125, 22.0947265625, 23.578125, 25.0615234375, 26.544921875, 28.0283203125, 29.51171875, 30.9951171875, 32.478515625, 33.9619140625, 35.4453125, 36.9287109375, 38.412109375, 39.8955078125, 41.37890625, 42.8623046875, 44.345703125, 45.8291015625, 47.3125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 9.0, 19.0, 43.0, 70.0, 113.0, 199.0, 238.0, 120.0, 82.0, 40.0, 20.0, 15.0, 11.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1245.5618896484375, -1204.123779296875, -1162.6856689453125, -1121.24755859375, -1079.8094482421875, -1038.371337890625, -996.9331665039062, -955.4950561523438, -914.0569458007812, -872.6188354492188, -831.1807250976562, -789.7426147460938, -748.304443359375, -706.8663330078125, -665.42822265625, -623.9901123046875, -582.552001953125, -541.1138916015625, -499.67578125, -458.2376403808594, -416.7995300292969, -375.3614196777344, -333.92327880859375, -292.48516845703125, -251.04705810546875, -209.60894775390625, -168.1708221435547, -126.73270416259766, -85.29458618164062, -43.856475830078125, -2.4183502197265625, 39.019775390625, 80.457763671875, 121.89588165283203, 163.33399963378906, 204.77212524414062, 246.21023559570312, 287.6483459472656, 329.08648681640625, 370.52459716796875, 411.96270751953125, 453.40081787109375, 494.83892822265625, 536.2770385742188, 577.7152099609375, 619.1533203125, 660.5914306640625, 702.029541015625, 743.4676513671875, 784.90576171875, 826.3438720703125, 867.781982421875, 909.2200927734375, 950.658203125, 992.0963745117188, 1033.534423828125, 1074.97265625, 1116.4107666015625, 1157.848876953125, 1199.2869873046875, 1240.72509765625, 1282.1632080078125, 1323.601318359375, 1365.03955078125, 1406.4775390625]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 7.0, 15.0, 9.0, 8.0, 6.0, 16.0, 22.0, 15.0, 29.0, 27.0, 28.0, 33.0, 32.0, 32.0, 52.0, 66.0, 94.0, 76.0, 69.0, 56.0, 41.0, 35.0, 31.0, 16.0, 26.0, 26.0, 27.0, 23.0, 12.0, 9.0, 19.0, 7.0, 11.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1107.3682861328125, -1075.04150390625, -1042.7147216796875, -1010.3878784179688, -978.0610961914062, -945.7343139648438, -913.407470703125, -881.0806884765625, -848.75390625, -816.4271240234375, -784.100341796875, -751.7734985351562, -719.4467163085938, -687.1199340820312, -654.7930908203125, -622.46630859375, -590.1395263671875, -557.812744140625, -525.4859619140625, -493.15911865234375, -460.83233642578125, -428.50555419921875, -396.1787414550781, -363.8519287109375, -331.525146484375, -299.1983642578125, -266.8715515136719, -234.5447540283203, -202.21795654296875, -169.8911590576172, -137.56436157226562, -105.23756408691406, -72.9107666015625, -40.58396911621094, -8.257171630859375, 24.069625854492188, 56.39642333984375, 88.72322082519531, 121.05001831054688, 153.37681579589844, 185.70361328125, 218.03041076660156, 250.35720825195312, 282.68402099609375, 315.01080322265625, 347.33758544921875, 379.6643981933594, 411.9912109375, 444.3179931640625, 476.644775390625, 508.9715881347656, 541.2984008789062, 573.6251831054688, 605.9519653320312, 638.27880859375, 670.6055908203125, 702.932373046875, 735.2591552734375, 767.5859375, 799.9127807617188, 832.2395629882812, 864.5663452148438, 896.8931884765625, 929.219970703125, 961.5467529296875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 3.0, 8.0, 16.0, 13.0, 23.0, 24.0, 27.0, 34.0, 51.0, 83.0, 243.0, 818.0, 3523.0, 28514.0, 1314904.0, 2782705.0, 55767.0, 5619.0, 1155.0, 365.0, 123.0, 81.0, 35.0, 35.0, 28.0, 18.0, 16.0, 6.0, 14.0, 5.0, 7.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-243.0, -236.625, -230.25, -223.875, -217.5, -211.125, -204.75, -198.375, -192.0, -185.625, -179.25, -172.875, -166.5, -160.125, -153.75, -147.375, -141.0, -134.625, -128.25, -121.875, -115.5, -109.125, -102.75, -96.375, -90.0, -83.625, -77.25, -70.875, -64.5, -58.125, -51.75, -45.375, -39.0, -32.625, -26.25, -19.875, -13.5, -7.125, -0.75, 5.625, 12.0, 18.375, 24.75, 31.125, 37.5, 43.875, 50.25, 56.625, 63.0, 69.375, 75.75, 82.125, 88.5, 94.875, 101.25, 107.625, 114.0, 120.375, 126.75, 133.125, 139.5, 145.875, 152.25, 158.625, 165.0]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 11.0, 4.0, 9.0, 12.0, 18.0, 13.0, 25.0, 29.0, 29.0, 29.0, 44.0, 39.0, 44.0, 55.0, 59.0, 61.0, 48.0, 44.0, 61.0, 45.0, 40.0, 47.0, 38.0, 43.0, 37.0, 24.0, 20.0, 19.0, 15.0, 8.0, 9.0, 7.0, 5.0, 5.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-90.875, -88.3798828125, -85.884765625, -83.3896484375, -80.89453125, -78.3994140625, -75.904296875, -73.4091796875, -70.9140625, -68.4189453125, -65.923828125, -63.4287109375, -60.93359375, -58.4384765625, -55.943359375, -53.4482421875, -50.953125, -48.4580078125, -45.962890625, -43.4677734375, -40.97265625, -38.4775390625, -35.982421875, -33.4873046875, -30.9921875, -28.4970703125, -26.001953125, -23.5068359375, -21.01171875, -18.5166015625, -16.021484375, -13.5263671875, -11.03125, -8.5361328125, -6.041015625, -3.5458984375, -1.05078125, 1.4443359375, 3.939453125, 6.4345703125, 8.9296875, 11.4248046875, 13.919921875, 16.4150390625, 18.91015625, 21.4052734375, 23.900390625, 26.3955078125, 28.890625, 31.3857421875, 33.880859375, 36.3759765625, 38.87109375, 41.3662109375, 43.861328125, 46.3564453125, 48.8515625, 51.3466796875, 53.841796875, 56.3369140625, 58.83203125, 61.3271484375, 63.822265625, 66.3173828125, 68.8125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 6.0, 4.0, 13.0, 16.0, 33.0, 58.0, 111.0, 298.0, 1074.0, 8215.0, 318352.0, 3833625.0, 29207.0, 2361.0, 525.0, 198.0, 84.0, 30.0, 20.0, 20.0, 7.0, 5.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-207.875, -196.470703125, -185.06640625, -173.662109375, -162.2578125, -150.853515625, -139.44921875, -128.044921875, -116.640625, -105.236328125, -93.83203125, -82.427734375, -71.0234375, -59.619140625, -48.21484375, -36.810546875, -25.40625, -14.001953125, -2.59765625, 8.806640625, 20.2109375, 31.615234375, 43.01953125, 54.423828125, 65.828125, 77.232421875, 88.63671875, 100.041015625, 111.4453125, 122.849609375, 134.25390625, 145.658203125, 157.0625, 168.466796875, 179.87109375, 191.275390625, 202.6796875, 214.083984375, 225.48828125, 236.892578125, 248.296875, 259.701171875, 271.10546875, 282.509765625, 293.9140625, 305.318359375, 316.72265625, 328.126953125, 339.53125, 350.935546875, 362.33984375, 373.744140625, 385.1484375, 396.552734375, 407.95703125, 419.361328125, 430.765625, 442.169921875, 453.57421875, 464.978515625, 476.3828125, 487.787109375, 499.19140625, 510.595703125, 522.0]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 1.0, 3.0, 12.0, 5.0, 11.0, 18.0, 20.0, 32.0, 60.0, 75.0, 152.0, 258.0, 529.0, 867.0, 861.0, 524.0, 273.0, 147.0, 69.0, 56.0, 27.0, 21.0, 16.0, 16.0, 7.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.5, -155.294921875, -149.08984375, -142.884765625, -136.6796875, -130.474609375, -124.26953125, -118.064453125, -111.859375, -105.654296875, -99.44921875, -93.244140625, -87.0390625, -80.833984375, -74.62890625, -68.423828125, -62.21875, -56.013671875, -49.80859375, -43.603515625, -37.3984375, -31.193359375, -24.98828125, -18.783203125, -12.578125, -6.373046875, -0.16796875, 6.037109375, 12.2421875, 18.447265625, 24.65234375, 30.857421875, 37.0625, 43.267578125, 49.47265625, 55.677734375, 61.8828125, 68.087890625, 74.29296875, 80.498046875, 86.703125, 92.908203125, 99.11328125, 105.318359375, 111.5234375, 117.728515625, 123.93359375, 130.138671875, 136.34375, 142.548828125, 148.75390625, 154.958984375, 161.1640625, 167.369140625, 173.57421875, 179.779296875, 185.984375, 192.189453125, 198.39453125, 204.599609375, 210.8046875, 217.009765625, 223.21484375, 229.419921875, 235.625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 13.0, 62.0, 173.0, 349.0, 258.0, 95.0, 35.0, 12.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4054.216064453125, -3972.801513671875, -3891.38671875, -3809.97216796875, -3728.5576171875, -3647.14306640625, -3565.728271484375, -3484.313720703125, -3402.89892578125, -3321.484375, -3240.069580078125, -3158.655029296875, -3077.240478515625, -2995.82568359375, -2914.4111328125, -2832.99658203125, -2751.58203125, -2670.16748046875, -2588.752685546875, -2507.338134765625, -2425.923583984375, -2344.5087890625, -2263.09423828125, -2181.6796875, -2100.26513671875, -2018.8504638671875, -1937.4359130859375, -1856.021240234375, -1774.606689453125, -1693.1920166015625, -1611.77734375, -1530.36279296875, -1448.947998046875, -1367.5333251953125, -1286.1187744140625, -1204.7041015625, -1123.28955078125, -1041.8748779296875, -960.460205078125, -879.0455932617188, -797.6309814453125, -716.2163696289062, -634.8017578125, -553.3870849609375, -471.97247314453125, -390.557861328125, -309.1432189941406, -227.72857666015625, -146.31396484375, -64.89933776855469, 16.515289306640625, 97.92991638183594, 179.34454345703125, 260.7591552734375, 342.1737976074219, 423.58843994140625, 505.0030517578125, 586.4176635742188, 667.832275390625, 749.2469482421875, 830.6615600585938, 912.076171875, 993.4908447265625, 1074.905517578125, 1156.320068359375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 5.0, 6.0, 4.0, 5.0, 8.0, 7.0, 9.0, 10.0, 16.0, 22.0, 20.0, 17.0, 30.0, 32.0, 37.0, 25.0, 41.0, 35.0, 38.0, 41.0, 34.0, 29.0, 37.0, 40.0, 40.0, 49.0, 32.0, 40.0, 38.0, 30.0, 35.0, 28.0, 22.0, 21.0, 23.0, 17.0, 10.0, 18.0, 13.0, 10.0, 9.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-566.1646118164062, -547.57373046875, -528.9827880859375, -510.39190673828125, -491.8009948730469, -473.2100830078125, -454.61920166015625, -436.0282897949219, -417.4373779296875, -398.8464660644531, -380.25555419921875, -361.6646728515625, -343.0737609863281, -324.48284912109375, -305.8919677734375, -287.3010559082031, -268.71014404296875, -250.11923217773438, -231.52833557128906, -212.93743896484375, -194.34652709960938, -175.755615234375, -157.1647186279297, -138.57382202148438, -119.98291015625, -101.39200592041016, -82.80110168457031, -64.21019744873047, -45.619293212890625, -27.02838897705078, -8.437484741210938, 10.153411865234375, 28.7442626953125, 47.335166931152344, 65.92607116699219, 84.51697540283203, 103.10787963867188, 121.69878387451172, 140.28968811035156, 158.88058471679688, 177.47149658203125, 196.06240844726562, 214.65330505371094, 233.24420166015625, 251.83511352539062, 270.426025390625, 289.01690673828125, 307.6078186035156, 326.19873046875, 344.7896423339844, 363.38055419921875, 381.971435546875, 400.5623474121094, 419.15325927734375, 437.744140625, 456.3350524902344, 474.92596435546875, 493.5168762207031, 512.1077880859375, 530.6986694335938, 549.28955078125, 567.8804931640625, 586.4713745117188, 605.062255859375, 623.6531982421875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 12.0, 8.0, 23.0, 16.0, 28.0, 67.0, 90.0, 145.0, 194.0, 333.0, 544.0, 928.0, 1480.0, 2787.0, 5027.0, 9733.0, 18793.0, 39736.0, 87738.0, 204591.0, 331554.0, 188855.0, 81194.0, 36934.0, 17896.0, 8915.0, 4702.0, 2480.0, 1436.0, 877.0, 539.0, 341.0, 218.0, 135.0, 67.0, 44.0, 27.0, 26.0, 19.0, 10.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-79.4375, -77.19677734375, -74.9560546875, -72.71533203125, -70.474609375, -68.23388671875, -65.9931640625, -63.75244140625, -61.51171875, -59.27099609375, -57.0302734375, -54.78955078125, -52.548828125, -50.30810546875, -48.0673828125, -45.82666015625, -43.5859375, -41.34521484375, -39.1044921875, -36.86376953125, -34.623046875, -32.38232421875, -30.1416015625, -27.90087890625, -25.66015625, -23.41943359375, -21.1787109375, -18.93798828125, -16.697265625, -14.45654296875, -12.2158203125, -9.97509765625, -7.734375, -5.49365234375, -3.2529296875, -1.01220703125, 1.228515625, 3.46923828125, 5.7099609375, 7.95068359375, 10.19140625, 12.43212890625, 14.6728515625, 16.91357421875, 19.154296875, 21.39501953125, 23.6357421875, 25.87646484375, 28.1171875, 30.35791015625, 32.5986328125, 34.83935546875, 37.080078125, 39.32080078125, 41.5615234375, 43.80224609375, 46.04296875, 48.28369140625, 50.5244140625, 52.76513671875, 55.005859375, 57.24658203125, 59.4873046875, 61.72802734375, 63.96875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 7.0, 6.0, 10.0, 7.0, 7.0, 11.0, 19.0, 19.0, 24.0, 19.0, 31.0, 38.0, 30.0, 35.0, 42.0, 51.0, 47.0, 42.0, 49.0, 40.0, 50.0, 52.0, 47.0, 43.0, 36.0, 27.0, 35.0, 32.0, 21.0, 17.0, 22.0, 14.0, 13.0, 8.0, 10.0, 5.0, 7.0, 10.0, 6.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-71.75, -69.5888671875, -67.427734375, -65.2666015625, -63.10546875, -60.9443359375, -58.783203125, -56.6220703125, -54.4609375, -52.2998046875, -50.138671875, -47.9775390625, -45.81640625, -43.6552734375, -41.494140625, -39.3330078125, -37.171875, -35.0107421875, -32.849609375, -30.6884765625, -28.52734375, -26.3662109375, -24.205078125, -22.0439453125, -19.8828125, -17.7216796875, -15.560546875, -13.3994140625, -11.23828125, -9.0771484375, -6.916015625, -4.7548828125, -2.59375, -0.4326171875, 1.728515625, 3.8896484375, 6.05078125, 8.2119140625, 10.373046875, 12.5341796875, 14.6953125, 16.8564453125, 19.017578125, 21.1787109375, 23.33984375, 25.5009765625, 27.662109375, 29.8232421875, 31.984375, 34.1455078125, 36.306640625, 38.4677734375, 40.62890625, 42.7900390625, 44.951171875, 47.1123046875, 49.2734375, 51.4345703125, 53.595703125, 55.7568359375, 57.91796875, 60.0791015625, 62.240234375, 64.4013671875, 66.5625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 7.0, 4.0, 4.0, 2.0, 5.0, 10.0, 13.0, 16.0, 23.0, 25.0, 49.0, 45.0, 90.0, 123.0, 213.0, 363.0, 679.0, 1400.0, 3719.0, 13234.0, 77974.0, 765463.0, 154751.0, 21104.0, 5387.0, 1947.0, 797.0, 423.0, 225.0, 135.0, 94.0, 66.0, 34.0, 22.0, 21.0, 20.0, 15.0, 13.0, 5.0, 9.0, 6.0, 7.0, 7.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.375, -202.962890625, -196.55078125, -190.138671875, -183.7265625, -177.314453125, -170.90234375, -164.490234375, -158.078125, -151.666015625, -145.25390625, -138.841796875, -132.4296875, -126.017578125, -119.60546875, -113.193359375, -106.78125, -100.369140625, -93.95703125, -87.544921875, -81.1328125, -74.720703125, -68.30859375, -61.896484375, -55.484375, -49.072265625, -42.66015625, -36.248046875, -29.8359375, -23.423828125, -17.01171875, -10.599609375, -4.1875, 2.224609375, 8.63671875, 15.048828125, 21.4609375, 27.873046875, 34.28515625, 40.697265625, 47.109375, 53.521484375, 59.93359375, 66.345703125, 72.7578125, 79.169921875, 85.58203125, 91.994140625, 98.40625, 104.818359375, 111.23046875, 117.642578125, 124.0546875, 130.466796875, 136.87890625, 143.291015625, 149.703125, 156.115234375, 162.52734375, 168.939453125, 175.3515625, 181.763671875, 188.17578125, 194.587890625, 201.0]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 1.0, 2.0, 10.0, 8.0, 11.0, 14.0, 32.0, 40.0, 33.0, 36.0, 47.0, 56.0, 70.0, 84.0, 86.0, 81.0, 71.0, 48.0, 69.0, 44.0, 50.0, 28.0, 18.0, 12.0, 14.0, 7.0, 6.0, 3.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-435.75, -423.56640625, -411.3828125, -399.19921875, -387.015625, -374.83203125, -362.6484375, -350.46484375, -338.28125, -326.09765625, -313.9140625, -301.73046875, -289.546875, -277.36328125, -265.1796875, -252.99609375, -240.8125, -228.62890625, -216.4453125, -204.26171875, -192.078125, -179.89453125, -167.7109375, -155.52734375, -143.34375, -131.16015625, -118.9765625, -106.79296875, -94.609375, -82.42578125, -70.2421875, -58.05859375, -45.875, -33.69140625, -21.5078125, -9.32421875, 2.859375, 15.04296875, 27.2265625, 39.41015625, 51.59375, 63.77734375, 75.9609375, 88.14453125, 100.328125, 112.51171875, 124.6953125, 136.87890625, 149.0625, 161.24609375, 173.4296875, 185.61328125, 197.796875, 209.98046875, 222.1640625, 234.34765625, 246.53125, 258.71484375, 270.8984375, 283.08203125, 295.265625, 307.44921875, 319.6328125, 331.81640625, 344.0]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 9.0, 7.0, 15.0, 20.0, 20.0, 43.0, 45.0, 78.0, 137.0, 224.0, 326.0, 603.0, 1142.0, 2304.0, 5096.0, 13131.0, 40058.0, 157232.0, 651623.0, 123544.0, 32657.0, 11319.0, 4386.0, 2092.0, 1009.0, 560.0, 350.0, 176.0, 98.0, 74.0, 55.0, 29.0, 25.0, 22.0, 18.0, 7.0, 4.0, 9.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.65625, -33.29296875, -31.9296875, -30.56640625, -29.203125, -27.83984375, -26.4765625, -25.11328125, -23.75, -22.38671875, -21.0234375, -19.66015625, -18.296875, -16.93359375, -15.5703125, -14.20703125, -12.84375, -11.48046875, -10.1171875, -8.75390625, -7.390625, -6.02734375, -4.6640625, -3.30078125, -1.9375, -0.57421875, 0.7890625, 2.15234375, 3.515625, 4.87890625, 6.2421875, 7.60546875, 8.96875, 10.33203125, 11.6953125, 13.05859375, 14.421875, 15.78515625, 17.1484375, 18.51171875, 19.875, 21.23828125, 22.6015625, 23.96484375, 25.328125, 26.69140625, 28.0546875, 29.41796875, 30.78125, 32.14453125, 33.5078125, 34.87109375, 36.234375, 37.59765625, 38.9609375, 40.32421875, 41.6875, 43.05078125, 44.4140625, 45.77734375, 47.140625, 48.50390625, 49.8671875, 51.23046875, 52.59375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 7.0, 7.0, 11.0, 13.0, 18.0, 25.0, 23.0, 63.0, 72.0, 76.0, 107.0, 157.0, 113.0, 83.0, 55.0, 46.0, 32.0, 23.0, 23.0, 11.0, 7.0, 3.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0198516845703125, -0.019176006317138672, -0.018500328063964844, -0.017824649810791016, -0.017148971557617188, -0.01647329330444336, -0.01579761505126953, -0.015121936798095703, -0.014446258544921875, -0.013770580291748047, -0.013094902038574219, -0.01241922378540039, -0.011743545532226562, -0.011067867279052734, -0.010392189025878906, -0.009716510772705078, -0.00904083251953125, -0.008365154266357422, -0.007689476013183594, -0.007013797760009766, -0.0063381195068359375, -0.005662441253662109, -0.004986763000488281, -0.004311084747314453, -0.003635406494140625, -0.002959728240966797, -0.0022840499877929688, -0.0016083717346191406, -0.0009326934814453125, -0.0002570152282714844, 0.00041866302490234375, 0.0010943412780761719, 0.00177001953125, 0.002445697784423828, 0.0031213760375976562, 0.0037970542907714844, 0.0044727325439453125, 0.005148410797119141, 0.005824089050292969, 0.006499767303466797, 0.007175445556640625, 0.007851123809814453, 0.008526802062988281, 0.00920248031616211, 0.009878158569335938, 0.010553836822509766, 0.011229515075683594, 0.011905193328857422, 0.01258087158203125, 0.013256549835205078, 0.013932228088378906, 0.014607906341552734, 0.015283584594726562, 0.01595926284790039, 0.01663494110107422, 0.017310619354248047, 0.017986297607421875, 0.018661975860595703, 0.01933765411376953, 0.02001333236694336, 0.020689010620117188, 0.021364688873291016, 0.022040367126464844, 0.022716045379638672, 0.0233917236328125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 6.0, 4.0, 12.0, 10.0, 13.0, 21.0, 43.0, 53.0, 63.0, 136.0, 236.0, 371.0, 868.0, 1953.0, 5273.0, 18780.0, 97322.0, 742570.0, 144898.0, 24830.0, 6705.0, 2275.0, 947.0, 498.0, 273.0, 117.0, 81.0, 70.0, 39.0, 22.0, 16.0, 10.0, 6.0, 9.0, 11.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-60.4375, -58.58349609375, -56.7294921875, -54.87548828125, -53.021484375, -51.16748046875, -49.3134765625, -47.45947265625, -45.60546875, -43.75146484375, -41.8974609375, -40.04345703125, -38.189453125, -36.33544921875, -34.4814453125, -32.62744140625, -30.7734375, -28.91943359375, -27.0654296875, -25.21142578125, -23.357421875, -21.50341796875, -19.6494140625, -17.79541015625, -15.94140625, -14.08740234375, -12.2333984375, -10.37939453125, -8.525390625, -6.67138671875, -4.8173828125, -2.96337890625, -1.109375, 0.74462890625, 2.5986328125, 4.45263671875, 6.306640625, 8.16064453125, 10.0146484375, 11.86865234375, 13.72265625, 15.57666015625, 17.4306640625, 19.28466796875, 21.138671875, 22.99267578125, 24.8466796875, 26.70068359375, 28.5546875, 30.40869140625, 32.2626953125, 34.11669921875, 35.970703125, 37.82470703125, 39.6787109375, 41.53271484375, 43.38671875, 45.24072265625, 47.0947265625, 48.94873046875, 50.802734375, 52.65673828125, 54.5107421875, 56.36474609375, 58.21875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 8.0, 8.0, 4.0, 8.0, 14.0, 10.0, 14.0, 18.0, 24.0, 29.0, 25.0, 49.0, 58.0, 55.0, 56.0, 93.0, 71.0, 67.0, 66.0, 58.0, 45.0, 31.0, 33.0, 28.0, 21.0, 12.0, 16.0, 8.0, 8.0, 11.0, 10.0, 8.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0], "bins": [-42.25, -41.017578125, -39.78515625, -38.552734375, -37.3203125, -36.087890625, -34.85546875, -33.623046875, -32.390625, -31.158203125, -29.92578125, -28.693359375, -27.4609375, -26.228515625, -24.99609375, -23.763671875, -22.53125, -21.298828125, -20.06640625, -18.833984375, -17.6015625, -16.369140625, -15.13671875, -13.904296875, -12.671875, -11.439453125, -10.20703125, -8.974609375, -7.7421875, -6.509765625, -5.27734375, -4.044921875, -2.8125, -1.580078125, -0.34765625, 0.884765625, 2.1171875, 3.349609375, 4.58203125, 5.814453125, 7.046875, 8.279296875, 9.51171875, 10.744140625, 11.9765625, 13.208984375, 14.44140625, 15.673828125, 16.90625, 18.138671875, 19.37109375, 20.603515625, 21.8359375, 23.068359375, 24.30078125, 25.533203125, 26.765625, 27.998046875, 29.23046875, 30.462890625, 31.6953125, 32.927734375, 34.16015625, 35.392578125, 36.625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 4.0, 12.0, 5.0, 11.0, 16.0, 27.0, 60.0, 82.0, 140.0, 268.0, 136.0, 101.0, 55.0, 38.0, 12.0, 7.0, 9.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1242.4111328125, -1208.351806640625, -1174.29248046875, -1140.233154296875, -1106.173828125, -1072.114501953125, -1038.05517578125, -1003.9957885742188, -969.9364624023438, -935.8771362304688, -901.8178100585938, -867.7584838867188, -833.6990966796875, -799.6397705078125, -765.5804443359375, -731.5211181640625, -697.4617919921875, -663.4024658203125, -629.3431396484375, -595.2838134765625, -561.2244873046875, -527.1651611328125, -493.10577392578125, -459.04644775390625, -424.98712158203125, -390.92779541015625, -356.86846923828125, -322.8091125488281, -288.7497863769531, -254.69046020507812, -220.63111877441406, -186.57177734375, -152.5123291015625, -118.45299530029297, -84.39366149902344, -50.334327697753906, -16.274993896484375, 17.784332275390625, 51.84367370605469, 85.90301513671875, 119.96234130859375, 154.02166748046875, 188.0810089111328, 222.14035034179688, 256.1996765136719, 290.2590026855469, 324.318359375, 358.377685546875, 392.43701171875, 426.496337890625, 460.5556640625, 494.6150207519531, 528.67431640625, 562.733642578125, 596.7930297851562, 630.8523559570312, 664.9116821289062, 698.9710083007812, 733.0303344726562, 767.0896606445312, 801.1490478515625, 835.2083740234375, 869.2677001953125, 903.3270263671875, 937.3863525390625]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 6.0, 3.0, 5.0, 3.0, 4.0, 2.0, 10.0, 5.0, 9.0, 12.0, 12.0, 14.0, 13.0, 18.0, 18.0, 25.0, 31.0, 26.0, 38.0, 34.0, 53.0, 69.0, 92.0, 98.0, 77.0, 48.0, 42.0, 30.0, 28.0, 28.0, 21.0, 21.0, 24.0, 15.0, 16.0, 9.0, 11.0, 12.0, 4.0, 6.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-854.59912109375, -822.7855224609375, -790.971923828125, -759.1583251953125, -727.3446655273438, -695.5310668945312, -663.7174682617188, -631.9038696289062, -600.0902709960938, -568.2766723632812, -536.4630737304688, -504.6494445800781, -472.8358459472656, -441.022216796875, -409.2086181640625, -377.39501953125, -345.5813903808594, -313.7677917480469, -281.95416259765625, -250.14056396484375, -218.32696533203125, -186.5133514404297, -154.69973754882812, -122.88613891601562, -91.07252502441406, -59.25891876220703, -27.445308685302734, 4.3683013916015625, 36.181907653808594, 67.99551391601562, 99.80912780761719, 131.6227264404297, 163.43634033203125, 195.2499542236328, 227.0635528564453, 258.8771667480469, 290.6907653808594, 322.50439453125, 354.3179931640625, 386.131591796875, 417.9451904296875, 449.7587890625, 481.5724182128906, 513.385986328125, 545.1996459960938, 577.0132446289062, 608.8268432617188, 640.6404418945312, 672.4541015625, 704.2677001953125, 736.081298828125, 767.8948974609375, 799.7085571289062, 831.5221557617188, 863.3357543945312, 895.1493530273438, 926.9629516601562, 958.7765502929688, 990.5901489257812, 1022.40380859375, 1054.2174072265625, 1086.031005859375, 1117.8446044921875, 1149.658203125, 1181.4718017578125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 6.0, 8.0, 12.0, 22.0, 46.0, 71.0, 115.0, 180.0, 318.0, 575.0, 1184.0, 2464.0, 5941.0, 17941.0, 76239.0, 454744.0, 2179492.0, 1188717.0, 207356.0, 40038.0, 10766.0, 4077.0, 1853.0, 942.0, 513.0, 250.0, 166.0, 89.0, 59.0, 32.0, 19.0, 20.0, 9.0, 3.0, 5.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.78125, -57.15673828125, -54.5322265625, -51.90771484375, -49.283203125, -46.65869140625, -44.0341796875, -41.40966796875, -38.78515625, -36.16064453125, -33.5361328125, -30.91162109375, -28.287109375, -25.66259765625, -23.0380859375, -20.41357421875, -17.7890625, -15.16455078125, -12.5400390625, -9.91552734375, -7.291015625, -4.66650390625, -2.0419921875, 0.58251953125, 3.20703125, 5.83154296875, 8.4560546875, 11.08056640625, 13.705078125, 16.32958984375, 18.9541015625, 21.57861328125, 24.203125, 26.82763671875, 29.4521484375, 32.07666015625, 34.701171875, 37.32568359375, 39.9501953125, 42.57470703125, 45.19921875, 47.82373046875, 50.4482421875, 53.07275390625, 55.697265625, 58.32177734375, 60.9462890625, 63.57080078125, 66.1953125, 68.81982421875, 71.4443359375, 74.06884765625, 76.693359375, 79.31787109375, 81.9423828125, 84.56689453125, 87.19140625, 89.81591796875, 92.4404296875, 95.06494140625, 97.689453125, 100.31396484375, 102.9384765625, 105.56298828125, 108.1875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 5.0, 4.0, 6.0, 3.0, 9.0, 6.0, 11.0, 12.0, 26.0, 23.0, 19.0, 22.0, 22.0, 30.0, 37.0, 41.0, 41.0, 35.0, 38.0, 49.0, 59.0, 60.0, 57.0, 36.0, 40.0, 38.0, 36.0, 26.0, 35.0, 33.0, 29.0, 27.0, 15.0, 14.0, 15.0, 6.0, 5.0, 5.0, 7.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.0625, -65.84765625, -63.6328125, -61.41796875, -59.203125, -56.98828125, -54.7734375, -52.55859375, -50.34375, -48.12890625, -45.9140625, -43.69921875, -41.484375, -39.26953125, -37.0546875, -34.83984375, -32.625, -30.41015625, -28.1953125, -25.98046875, -23.765625, -21.55078125, -19.3359375, -17.12109375, -14.90625, -12.69140625, -10.4765625, -8.26171875, -6.046875, -3.83203125, -1.6171875, 0.59765625, 2.8125, 5.02734375, 7.2421875, 9.45703125, 11.671875, 13.88671875, 16.1015625, 18.31640625, 20.53125, 22.74609375, 24.9609375, 27.17578125, 29.390625, 31.60546875, 33.8203125, 36.03515625, 38.25, 40.46484375, 42.6796875, 44.89453125, 47.109375, 49.32421875, 51.5390625, 53.75390625, 55.96875, 58.18359375, 60.3984375, 62.61328125, 64.828125, 67.04296875, 69.2578125, 71.47265625, 73.6875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 5.0, 4.0, 17.0, 21.0, 47.0, 102.0, 253.0, 622.0, 2577.0, 24627.0, 3639374.0, 514231.0, 9854.0, 1638.0, 503.0, 206.0, 82.0, 39.0, 24.0, 12.0, 16.0, 6.0, 1.0, 4.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-331.0, -320.6015625, -310.203125, -299.8046875, -289.40625, -279.0078125, -268.609375, -258.2109375, -247.8125, -237.4140625, -227.015625, -216.6171875, -206.21875, -195.8203125, -185.421875, -175.0234375, -164.625, -154.2265625, -143.828125, -133.4296875, -123.03125, -112.6328125, -102.234375, -91.8359375, -81.4375, -71.0390625, -60.640625, -50.2421875, -39.84375, -29.4453125, -19.046875, -8.6484375, 1.75, 12.1484375, 22.546875, 32.9453125, 43.34375, 53.7421875, 64.140625, 74.5390625, 84.9375, 95.3359375, 105.734375, 116.1328125, 126.53125, 136.9296875, 147.328125, 157.7265625, 168.125, 178.5234375, 188.921875, 199.3203125, 209.71875, 220.1171875, 230.515625, 240.9140625, 251.3125, 261.7109375, 272.109375, 282.5078125, 292.90625, 303.3046875, 313.703125, 324.1015625, 334.5]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 14.0, 12.0, 31.0, 27.0, 71.0, 83.0, 197.0, 413.0, 741.0, 1001.0, 697.0, 327.0, 181.0, 96.0, 72.0, 35.0, 27.0, 16.0, 8.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.625, -136.951171875, -130.27734375, -123.603515625, -116.9296875, -110.255859375, -103.58203125, -96.908203125, -90.234375, -83.560546875, -76.88671875, -70.212890625, -63.5390625, -56.865234375, -50.19140625, -43.517578125, -36.84375, -30.169921875, -23.49609375, -16.822265625, -10.1484375, -3.474609375, 3.19921875, 9.873046875, 16.546875, 23.220703125, 29.89453125, 36.568359375, 43.2421875, 49.916015625, 56.58984375, 63.263671875, 69.9375, 76.611328125, 83.28515625, 89.958984375, 96.6328125, 103.306640625, 109.98046875, 116.654296875, 123.328125, 130.001953125, 136.67578125, 143.349609375, 150.0234375, 156.697265625, 163.37109375, 170.044921875, 176.71875, 183.392578125, 190.06640625, 196.740234375, 203.4140625, 210.087890625, 216.76171875, 223.435546875, 230.109375, 236.783203125, 243.45703125, 250.130859375, 256.8046875, 263.478515625, 270.15234375, 276.826171875, 283.5]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 12.0, 5.0, 13.0, 23.0, 53.0, 43.0, 90.0, 150.0, 162.0, 137.0, 100.0, 70.0, 40.0, 28.0, 21.0, 11.0, 15.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1168.4798583984375, -1135.7244873046875, -1102.9691162109375, -1070.2138671875, -1037.45849609375, -1004.703125, -971.94775390625, -939.1923828125, -906.4370727539062, -873.6817016601562, -840.9263916015625, -808.1710205078125, -775.4156494140625, -742.6603393554688, -709.9049682617188, -677.149658203125, -644.394287109375, -611.638916015625, -578.8836059570312, -546.1282348632812, -513.3729248046875, -480.6175537109375, -447.8621826171875, -415.1068420410156, -382.35150146484375, -349.5961608886719, -316.8408203125, -284.08544921875, -251.33010864257812, -218.57476806640625, -185.8194122314453, -153.06405639648438, -120.30865478515625, -87.55330657958984, -54.79795837402344, -22.04261016845703, 10.712738037109375, 43.46807861328125, 76.22343444824219, 108.97879028320312, 141.734130859375, 174.48947143554688, 207.2448272705078, 240.00018310546875, 272.7555236816406, 305.5108642578125, 338.2662353515625, 371.0215759277344, 403.77691650390625, 436.5322570800781, 469.28759765625, 502.04296875, 534.79833984375, 567.5536499023438, 600.3090209960938, 633.0643310546875, 665.8197021484375, 698.5750732421875, 731.3303833007812, 764.0857543945312, 796.841064453125, 829.596435546875, 862.351806640625, 895.107177734375, 927.8624877929688]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 8.0, 4.0, 6.0, 11.0, 7.0, 17.0, 20.0, 18.0, 25.0, 30.0, 39.0, 41.0, 50.0, 75.0, 83.0, 55.0, 64.0, 58.0, 56.0, 64.0, 55.0, 33.0, 37.0, 24.0, 16.0, 25.0, 17.0, 15.0, 15.0, 2.0, 9.0, 5.0, 11.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-965.2545166015625, -937.2748413085938, -909.2951049804688, -881.3154296875, -853.335693359375, -825.3560180664062, -797.3763427734375, -769.3966064453125, -741.4168701171875, -713.4371948242188, -685.4574584960938, -657.477783203125, -629.498046875, -601.5183715820312, -573.5386962890625, -545.5589599609375, -517.5792846679688, -489.5995788574219, -461.619873046875, -433.64019775390625, -405.66046142578125, -377.6807861328125, -349.7010803222656, -321.72137451171875, -293.7416687011719, -265.761962890625, -237.78225708007812, -209.8025665283203, -181.82286071777344, -153.84315490722656, -125.86346435546875, -97.88375854492188, -69.90399169921875, -41.92428970336914, -13.944587707519531, 14.035110473632812, 42.01481628417969, 69.99452209472656, 97.97421264648438, 125.95391845703125, 153.93362426757812, 181.913330078125, 209.89303588867188, 237.8727264404297, 265.8524169921875, 293.8321533203125, 321.81182861328125, 349.7915344238281, 377.771240234375, 405.7509460449219, 433.73065185546875, 461.7103271484375, 489.6900634765625, 517.6697387695312, 545.6494140625, 573.629150390625, 601.60888671875, 629.5885620117188, 657.5682983398438, 685.5479736328125, 713.5277099609375, 741.5073852539062, 769.487060546875, 797.466796875, 825.4464721679688]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 9.0, 10.0, 22.0, 26.0, 50.0, 55.0, 114.0, 160.0, 302.0, 424.0, 775.0, 1321.0, 2372.0, 4587.0, 9057.0, 20227.0, 47293.0, 125805.0, 348342.0, 304453.0, 106614.0, 41377.0, 17624.0, 8302.0, 4219.0, 2123.0, 1161.0, 662.0, 409.0, 241.0, 157.0, 99.0, 56.0, 44.0, 22.0, 11.0, 11.0, 9.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.6875, -89.8720703125, -87.056640625, -84.2412109375, -81.42578125, -78.6103515625, -75.794921875, -72.9794921875, -70.1640625, -67.3486328125, -64.533203125, -61.7177734375, -58.90234375, -56.0869140625, -53.271484375, -50.4560546875, -47.640625, -44.8251953125, -42.009765625, -39.1943359375, -36.37890625, -33.5634765625, -30.748046875, -27.9326171875, -25.1171875, -22.3017578125, -19.486328125, -16.6708984375, -13.85546875, -11.0400390625, -8.224609375, -5.4091796875, -2.59375, 0.2216796875, 3.037109375, 5.8525390625, 8.66796875, 11.4833984375, 14.298828125, 17.1142578125, 19.9296875, 22.7451171875, 25.560546875, 28.3759765625, 31.19140625, 34.0068359375, 36.822265625, 39.6376953125, 42.453125, 45.2685546875, 48.083984375, 50.8994140625, 53.71484375, 56.5302734375, 59.345703125, 62.1611328125, 64.9765625, 67.7919921875, 70.607421875, 73.4228515625, 76.23828125, 79.0537109375, 81.869140625, 84.6845703125, 87.5]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 4.0, 7.0, 5.0, 8.0, 17.0, 15.0, 15.0, 18.0, 23.0, 15.0, 17.0, 27.0, 35.0, 33.0, 26.0, 38.0, 37.0, 38.0, 52.0, 45.0, 46.0, 53.0, 50.0, 45.0, 46.0, 29.0, 45.0, 32.0, 25.0, 28.0, 25.0, 22.0, 16.0, 9.0, 11.0, 9.0, 8.0, 7.0, 3.0, 3.0, 3.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.65625, -57.58056640625, -55.5048828125, -53.42919921875, -51.353515625, -49.27783203125, -47.2021484375, -45.12646484375, -43.05078125, -40.97509765625, -38.8994140625, -36.82373046875, -34.748046875, -32.67236328125, -30.5966796875, -28.52099609375, -26.4453125, -24.36962890625, -22.2939453125, -20.21826171875, -18.142578125, -16.06689453125, -13.9912109375, -11.91552734375, -9.83984375, -7.76416015625, -5.6884765625, -3.61279296875, -1.537109375, 0.53857421875, 2.6142578125, 4.68994140625, 6.765625, 8.84130859375, 10.9169921875, 12.99267578125, 15.068359375, 17.14404296875, 19.2197265625, 21.29541015625, 23.37109375, 25.44677734375, 27.5224609375, 29.59814453125, 31.673828125, 33.74951171875, 35.8251953125, 37.90087890625, 39.9765625, 42.05224609375, 44.1279296875, 46.20361328125, 48.279296875, 50.35498046875, 52.4306640625, 54.50634765625, 56.58203125, 58.65771484375, 60.7333984375, 62.80908203125, 64.884765625, 66.96044921875, 69.0361328125, 71.11181640625, 73.1875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 6.0, 8.0, 20.0, 27.0, 45.0, 75.0, 93.0, 136.0, 287.0, 512.0, 1048.0, 2917.0, 12828.0, 131012.0, 842090.0, 47045.0, 6710.0, 1904.0, 789.0, 398.0, 222.0, 122.0, 81.0, 53.0, 45.0, 25.0, 13.0, 13.0, 12.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-285.5, -277.4140625, -269.328125, -261.2421875, -253.15625, -245.0703125, -236.984375, -228.8984375, -220.8125, -212.7265625, -204.640625, -196.5546875, -188.46875, -180.3828125, -172.296875, -164.2109375, -156.125, -148.0390625, -139.953125, -131.8671875, -123.78125, -115.6953125, -107.609375, -99.5234375, -91.4375, -83.3515625, -75.265625, -67.1796875, -59.09375, -51.0078125, -42.921875, -34.8359375, -26.75, -18.6640625, -10.578125, -2.4921875, 5.59375, 13.6796875, 21.765625, 29.8515625, 37.9375, 46.0234375, 54.109375, 62.1953125, 70.28125, 78.3671875, 86.453125, 94.5390625, 102.625, 110.7109375, 118.796875, 126.8828125, 134.96875, 143.0546875, 151.140625, 159.2265625, 167.3125, 175.3984375, 183.484375, 191.5703125, 199.65625, 207.7421875, 215.828125, 223.9140625, 232.0]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 11.0, 16.0, 13.0, 14.0, 20.0, 21.0, 23.0, 34.0, 41.0, 51.0, 52.0, 55.0, 61.0, 66.0, 75.0, 68.0, 67.0, 49.0, 50.0, 30.0, 32.0, 28.0, 23.0, 12.0, 17.0, 15.0, 13.0, 5.0, 10.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-348.25, -338.515625, -328.78125, -319.046875, -309.3125, -299.578125, -289.84375, -280.109375, -270.375, -260.640625, -250.90625, -241.171875, -231.4375, -221.703125, -211.96875, -202.234375, -192.5, -182.765625, -173.03125, -163.296875, -153.5625, -143.828125, -134.09375, -124.359375, -114.625, -104.890625, -95.15625, -85.421875, -75.6875, -65.953125, -56.21875, -46.484375, -36.75, -27.015625, -17.28125, -7.546875, 2.1875, 11.921875, 21.65625, 31.390625, 41.125, 50.859375, 60.59375, 70.328125, 80.0625, 89.796875, 99.53125, 109.265625, 119.0, 128.734375, 138.46875, 148.203125, 157.9375, 167.671875, 177.40625, 187.140625, 196.875, 206.609375, 216.34375, 226.078125, 235.8125, 245.546875, 255.28125, 265.015625, 274.75]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 6.0, 2.0, 14.0, 22.0, 29.0, 32.0, 36.0, 65.0, 90.0, 139.0, 204.0, 364.0, 677.0, 1200.0, 2155.0, 4635.0, 10729.0, 28651.0, 101497.0, 650064.0, 176914.0, 43486.0, 15080.0, 6183.0, 2884.0, 1403.0, 770.0, 428.0, 261.0, 174.0, 96.0, 79.0, 51.0, 37.0, 29.0, 20.0, 15.0, 9.0, 3.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.0, -29.95556640625, -28.9111328125, -27.86669921875, -26.822265625, -25.77783203125, -24.7333984375, -23.68896484375, -22.64453125, -21.60009765625, -20.5556640625, -19.51123046875, -18.466796875, -17.42236328125, -16.3779296875, -15.33349609375, -14.2890625, -13.24462890625, -12.2001953125, -11.15576171875, -10.111328125, -9.06689453125, -8.0224609375, -6.97802734375, -5.93359375, -4.88916015625, -3.8447265625, -2.80029296875, -1.755859375, -0.71142578125, 0.3330078125, 1.37744140625, 2.421875, 3.46630859375, 4.5107421875, 5.55517578125, 6.599609375, 7.64404296875, 8.6884765625, 9.73291015625, 10.77734375, 11.82177734375, 12.8662109375, 13.91064453125, 14.955078125, 15.99951171875, 17.0439453125, 18.08837890625, 19.1328125, 20.17724609375, 21.2216796875, 22.26611328125, 23.310546875, 24.35498046875, 25.3994140625, 26.44384765625, 27.48828125, 28.53271484375, 29.5771484375, 30.62158203125, 31.666015625, 32.71044921875, 33.7548828125, 34.79931640625, 35.84375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 5.0, 14.0, 14.0, 18.0, 32.0, 40.0, 62.0, 76.0, 99.0, 121.0, 146.0, 101.0, 76.0, 65.0, 32.0, 26.0, 15.0, 12.0, 12.0, 10.0, 11.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0169219970703125, -0.01629638671875, -0.0156707763671875, -0.015045166015625, -0.0144195556640625, -0.0137939453125, -0.0131683349609375, -0.012542724609375, -0.0119171142578125, -0.01129150390625, -0.0106658935546875, -0.010040283203125, -0.0094146728515625, -0.0087890625, -0.0081634521484375, -0.007537841796875, -0.0069122314453125, -0.00628662109375, -0.0056610107421875, -0.005035400390625, -0.0044097900390625, -0.0037841796875, -0.0031585693359375, -0.002532958984375, -0.0019073486328125, -0.00128173828125, -0.0006561279296875, -3.0517578125e-05, 0.0005950927734375, 0.001220703125, 0.0018463134765625, 0.002471923828125, 0.0030975341796875, 0.00372314453125, 0.0043487548828125, 0.004974365234375, 0.0055999755859375, 0.0062255859375, 0.0068511962890625, 0.007476806640625, 0.0081024169921875, 0.00872802734375, 0.0093536376953125, 0.009979248046875, 0.0106048583984375, 0.01123046875, 0.0118560791015625, 0.012481689453125, 0.0131072998046875, 0.01373291015625, 0.0143585205078125, 0.014984130859375, 0.0156097412109375, 0.0162353515625, 0.0168609619140625, 0.017486572265625, 0.0181121826171875, 0.01873779296875, 0.0193634033203125, 0.019989013671875, 0.0206146240234375, 0.021240234375, 0.0218658447265625, 0.022491455078125, 0.0231170654296875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 9.0, 8.0, 11.0, 16.0, 41.0, 106.0, 201.0, 620.0, 2350.0, 20172.0, 854307.0, 161564.0, 7138.0, 1281.0, 390.0, 152.0, 84.0, 37.0, 27.0, 13.0, 11.0, 1.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-107.6875, -104.5927734375, -101.498046875, -98.4033203125, -95.30859375, -92.2138671875, -89.119140625, -86.0244140625, -82.9296875, -79.8349609375, -76.740234375, -73.6455078125, -70.55078125, -67.4560546875, -64.361328125, -61.2666015625, -58.171875, -55.0771484375, -51.982421875, -48.8876953125, -45.79296875, -42.6982421875, -39.603515625, -36.5087890625, -33.4140625, -30.3193359375, -27.224609375, -24.1298828125, -21.03515625, -17.9404296875, -14.845703125, -11.7509765625, -8.65625, -5.5615234375, -2.466796875, 0.6279296875, 3.72265625, 6.8173828125, 9.912109375, 13.0068359375, 16.1015625, 19.1962890625, 22.291015625, 25.3857421875, 28.48046875, 31.5751953125, 34.669921875, 37.7646484375, 40.859375, 43.9541015625, 47.048828125, 50.1435546875, 53.23828125, 56.3330078125, 59.427734375, 62.5224609375, 65.6171875, 68.7119140625, 71.806640625, 74.9013671875, 77.99609375, 81.0908203125, 84.185546875, 87.2802734375, 90.375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 4.0, 4.0, 12.0, 15.0, 24.0, 48.0, 79.0, 116.0, 133.0, 141.0, 120.0, 90.0, 78.0, 38.0, 31.0, 24.0, 10.0, 11.0, 8.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-87.6875, -85.2197265625, -82.751953125, -80.2841796875, -77.81640625, -75.3486328125, -72.880859375, -70.4130859375, -67.9453125, -65.4775390625, -63.009765625, -60.5419921875, -58.07421875, -55.6064453125, -53.138671875, -50.6708984375, -48.203125, -45.7353515625, -43.267578125, -40.7998046875, -38.33203125, -35.8642578125, -33.396484375, -30.9287109375, -28.4609375, -25.9931640625, -23.525390625, -21.0576171875, -18.58984375, -16.1220703125, -13.654296875, -11.1865234375, -8.71875, -6.2509765625, -3.783203125, -1.3154296875, 1.15234375, 3.6201171875, 6.087890625, 8.5556640625, 11.0234375, 13.4912109375, 15.958984375, 18.4267578125, 20.89453125, 23.3623046875, 25.830078125, 28.2978515625, 30.765625, 33.2333984375, 35.701171875, 38.1689453125, 40.63671875, 43.1044921875, 45.572265625, 48.0400390625, 50.5078125, 52.9755859375, 55.443359375, 57.9111328125, 60.37890625, 62.8466796875, 65.314453125, 67.7822265625, 70.25]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 14.0, 36.0, 68.0, 191.0, 424.0, 135.0, 67.0, 32.0, 11.0, 11.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1262.30615234375, -1202.849365234375, -1143.3924560546875, -1083.9356689453125, -1024.4788818359375, -965.02197265625, -905.565185546875, -846.1083374023438, -786.6514892578125, -727.1946411132812, -667.7378540039062, -608.281005859375, -548.8241577148438, -489.3673400878906, -429.9105224609375, -370.45367431640625, -310.99688720703125, -251.54005432128906, -192.08322143554688, -132.62640380859375, -73.16957092285156, -13.712738037109375, 45.74407958984375, 105.200927734375, 164.65774536132812, 224.1145782470703, 283.5714111328125, 343.0282287597656, 402.48504638671875, 461.94189453125, 521.398681640625, 580.8555908203125, 640.3123779296875, 699.7692260742188, 759.2260131835938, 818.682861328125, 878.1397094726562, 937.5965576171875, 997.0533447265625, 1056.51025390625, 1115.967041015625, 1175.423828125, 1234.8807373046875, 1294.3375244140625, 1353.7943115234375, 1413.251220703125, 1472.7080078125, 1532.164794921875, 1591.62158203125, 1651.078369140625, 1710.5352783203125, 1769.9920654296875, 1829.4488525390625, 1888.90576171875, 1948.362548828125, 2007.8193359375, 2067.2763671875, 2126.733154296875, 2186.18994140625, 2245.64697265625, 2305.103759765625, 2364.560546875, 2424.017333984375, 2483.47412109375, 2542.930908203125]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 5.0, 5.0, 9.0, 14.0, 9.0, 20.0, 24.0, 23.0, 22.0, 27.0, 28.0, 39.0, 46.0, 82.0, 185.0, 126.0, 71.0, 54.0, 38.0, 36.0, 25.0, 21.0, 26.0, 23.0, 10.0, 17.0, 11.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1369.1583251953125, -1328.6373291015625, -1288.1162109375, -1247.59521484375, -1207.07421875, -1166.55322265625, -1126.0321044921875, -1085.5111083984375, -1044.989990234375, -1004.4689331054688, -963.9479370117188, -923.4268798828125, -882.9058837890625, -842.3848266601562, -801.86376953125, -761.3427734375, -720.82177734375, -680.3007202148438, -639.7797241210938, -599.2586669921875, -558.7376708984375, -518.2166137695312, -477.695556640625, -437.1745300292969, -396.65350341796875, -356.1324768066406, -315.6114501953125, -275.09039306640625, -234.56936645507812, -194.04833984375, -153.5272979736328, -113.00625610351562, -72.4853515625, -31.964317321777344, 8.556716918945312, 49.07775115966797, 89.59878540039062, 130.11981201171875, 170.64085388183594, 211.16189575195312, 251.68292236328125, 292.2039489746094, 332.7249755859375, 373.24603271484375, 413.7670593261719, 454.2880859375, 494.80914306640625, 535.3302001953125, 575.8511962890625, 616.3722534179688, 656.8932495117188, 697.414306640625, 737.935302734375, 778.4563598632812, 818.9774169921875, 859.4984130859375, 900.0194702148438, 940.54052734375, 981.0615234375, 1021.5825805664062, 1062.1036376953125, 1102.6246337890625, 1143.1456298828125, 1183.666748046875, 1224.187744140625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 8.0, 8.0, 21.0, 19.0, 33.0, 33.0, 41.0, 61.0, 107.0, 151.0, 243.0, 430.0, 834.0, 1858.0, 4716.0, 13847.0, 56659.0, 426810.0, 2466978.0, 1060649.0, 124662.0, 24012.0, 7044.0, 2487.0, 1149.0, 562.0, 278.0, 187.0, 144.0, 75.0, 41.0, 48.0, 21.0, 22.0, 16.0, 13.0, 4.0, 1.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-151.625, -146.84375, -142.0625, -137.28125, -132.5, -127.71875, -122.9375, -118.15625, -113.375, -108.59375, -103.8125, -99.03125, -94.25, -89.46875, -84.6875, -79.90625, -75.125, -70.34375, -65.5625, -60.78125, -56.0, -51.21875, -46.4375, -41.65625, -36.875, -32.09375, -27.3125, -22.53125, -17.75, -12.96875, -8.1875, -3.40625, 1.375, 6.15625, 10.9375, 15.71875, 20.5, 25.28125, 30.0625, 34.84375, 39.625, 44.40625, 49.1875, 53.96875, 58.75, 63.53125, 68.3125, 73.09375, 77.875, 82.65625, 87.4375, 92.21875, 97.0, 101.78125, 106.5625, 111.34375, 116.125, 120.90625, 125.6875, 130.46875, 135.25, 140.03125, 144.8125, 149.59375, 154.375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 4.0, 10.0, 5.0, 17.0, 18.0, 15.0, 30.0, 27.0, 27.0, 28.0, 34.0, 43.0, 44.0, 50.0, 45.0, 48.0, 48.0, 49.0, 43.0, 46.0, 45.0, 39.0, 35.0, 46.0, 38.0, 26.0, 22.0, 20.0, 15.0, 22.0, 17.0, 8.0, 10.0, 5.0, 6.0, 1.0, 3.0, 2.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.5, -78.2666015625, -76.033203125, -73.7998046875, -71.56640625, -69.3330078125, -67.099609375, -64.8662109375, -62.6328125, -60.3994140625, -58.166015625, -55.9326171875, -53.69921875, -51.4658203125, -49.232421875, -46.9990234375, -44.765625, -42.5322265625, -40.298828125, -38.0654296875, -35.83203125, -33.5986328125, -31.365234375, -29.1318359375, -26.8984375, -24.6650390625, -22.431640625, -20.1982421875, -17.96484375, -15.7314453125, -13.498046875, -11.2646484375, -9.03125, -6.7978515625, -4.564453125, -2.3310546875, -0.09765625, 2.1357421875, 4.369140625, 6.6025390625, 8.8359375, 11.0693359375, 13.302734375, 15.5361328125, 17.76953125, 20.0029296875, 22.236328125, 24.4697265625, 26.703125, 28.9365234375, 31.169921875, 33.4033203125, 35.63671875, 37.8701171875, 40.103515625, 42.3369140625, 44.5703125, 46.8037109375, 49.037109375, 51.2705078125, 53.50390625, 55.7373046875, 57.970703125, 60.2041015625, 62.4375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 7.0, 12.0, 17.0, 31.0, 75.0, 266.0, 1060.0, 16194.0, 4164208.0, 11096.0, 941.0, 239.0, 75.0, 39.0, 14.0, 9.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1395.0, -1358.7265625, -1322.453125, -1286.1796875, -1249.90625, -1213.6328125, -1177.359375, -1141.0859375, -1104.8125, -1068.5390625, -1032.265625, -995.9921875, -959.71875, -923.4453125, -887.171875, -850.8984375, -814.625, -778.3515625, -742.078125, -705.8046875, -669.53125, -633.2578125, -596.984375, -560.7109375, -524.4375, -488.1640625, -451.890625, -415.6171875, -379.34375, -343.0703125, -306.796875, -270.5234375, -234.25, -197.9765625, -161.703125, -125.4296875, -89.15625, -52.8828125, -16.609375, 19.6640625, 55.9375, 92.2109375, 128.484375, 164.7578125, 201.03125, 237.3046875, 273.578125, 309.8515625, 346.125, 382.3984375, 418.671875, 454.9453125, 491.21875, 527.4921875, 563.765625, 600.0390625, 636.3125, 672.5859375, 708.859375, 745.1328125, 781.40625, 817.6796875, 853.953125, 890.2265625, 926.5]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 12.0, 26.0, 31.0, 84.0, 179.0, 428.0, 1015.0, 1367.0, 504.0, 236.0, 87.0, 58.0, 25.0, 10.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-692.0, -675.953125, -659.90625, -643.859375, -627.8125, -611.765625, -595.71875, -579.671875, -563.625, -547.578125, -531.53125, -515.484375, -499.4375, -483.390625, -467.34375, -451.296875, -435.25, -419.203125, -403.15625, -387.109375, -371.0625, -355.015625, -338.96875, -322.921875, -306.875, -290.828125, -274.78125, -258.734375, -242.6875, -226.640625, -210.59375, -194.546875, -178.5, -162.453125, -146.40625, -130.359375, -114.3125, -98.265625, -82.21875, -66.171875, -50.125, -34.078125, -18.03125, -1.984375, 14.0625, 30.109375, 46.15625, 62.203125, 78.25, 94.296875, 110.34375, 126.390625, 142.4375, 158.484375, 174.53125, 190.578125, 206.625, 222.671875, 238.71875, 254.765625, 270.8125, 286.859375, 302.90625, 318.953125, 335.0]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 7.0, 4.0, 7.0, 16.0, 32.0, 40.0, 67.0, 99.0, 138.0, 169.0, 145.0, 99.0, 67.0, 33.0, 31.0, 8.0, 10.0, 10.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2266.616943359375, -2194.469970703125, -2122.322998046875, -2050.176025390625, -1978.0291748046875, -1905.8822021484375, -1833.7353515625, -1761.58837890625, -1689.44140625, -1617.29443359375, -1545.1474609375, -1473.0006103515625, -1400.8536376953125, -1328.7066650390625, -1256.559814453125, -1184.412841796875, -1112.265869140625, -1040.118896484375, -967.9719848632812, -895.8250732421875, -823.6781005859375, -751.5311279296875, -679.3842163085938, -607.2373046875, -535.09033203125, -462.9433898925781, -390.79644775390625, -318.6495056152344, -246.5025634765625, -174.35562133789062, -102.20867919921875, -30.061737060546875, 42.085205078125, 114.23214721679688, 186.37908935546875, 258.5260314941406, 330.6729736328125, 402.8199157714844, 474.96685791015625, 547.11376953125, 619.2607421875, 691.40771484375, 763.5546264648438, 835.7015380859375, 907.8485107421875, 979.9954833984375, 1052.142333984375, 1124.289306640625, 1196.436279296875, 1268.583251953125, 1340.730224609375, 1412.8770751953125, 1485.0240478515625, 1557.1710205078125, 1629.31787109375, 1701.46484375, 1773.61181640625, 1845.7587890625, 1917.90576171875, 1990.0526123046875, 2062.19970703125, 2134.346435546875, 2206.493408203125, 2278.640380859375, 2350.787353515625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 5.0, 2.0, 4.0, 2.0, 8.0, 8.0, 7.0, 10.0, 8.0, 16.0, 12.0, 24.0, 16.0, 17.0, 25.0, 19.0, 22.0, 26.0, 31.0, 41.0, 50.0, 46.0, 42.0, 54.0, 37.0, 51.0, 43.0, 43.0, 37.0, 32.0, 36.0, 29.0, 28.0, 30.0, 21.0, 25.0, 20.0, 11.0, 12.0, 12.0, 10.0, 8.0, 9.0, 4.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-1103.2652587890625, -1070.904052734375, -1038.54296875, -1006.1817626953125, -973.820556640625, -941.4593505859375, -909.0982055664062, -876.737060546875, -844.3758544921875, -812.0146484375, -779.6535034179688, -747.2923583984375, -714.93115234375, -682.5699462890625, -650.2088012695312, -617.84765625, -585.4864501953125, -553.125244140625, -520.7640991210938, -488.4029235839844, -456.041748046875, -423.6805725097656, -391.31939697265625, -358.9582214355469, -326.5970458984375, -294.2358703613281, -261.87469482421875, -229.51351928710938, -197.15234375, -164.79116821289062, -132.42999267578125, -100.06881713867188, -67.7076416015625, -35.346466064453125, -2.98529052734375, 29.375885009765625, 61.737060546875, 94.09823608398438, 126.45941162109375, 158.82058715820312, 191.1817626953125, 223.54293823242188, 255.90411376953125, 288.2652893066406, 320.62646484375, 352.9876403808594, 385.34881591796875, 417.7099914550781, 450.0711669921875, 482.4323425292969, 514.7935180664062, 547.1546630859375, 579.515869140625, 611.8770751953125, 644.2382202148438, 676.599365234375, 708.9605712890625, 741.32177734375, 773.6829223632812, 806.0440673828125, 838.4052734375, 870.7664794921875, 903.1276245117188, 935.48876953125, 967.8499755859375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 10.0, 16.0, 16.0, 27.0, 25.0, 31.0, 47.0, 70.0, 104.0, 154.0, 258.0, 457.0, 765.0, 1356.0, 2606.0, 5341.0, 11515.0, 28246.0, 79388.0, 319286.0, 438819.0, 99121.0, 34393.0, 13667.0, 6168.0, 2956.0, 1486.0, 840.0, 505.0, 306.0, 209.0, 105.0, 67.0, 44.0, 33.0, 29.0, 19.0, 15.0, 15.0, 8.0, 9.0, 8.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-134.625, -130.6767578125, -126.728515625, -122.7802734375, -118.83203125, -114.8837890625, -110.935546875, -106.9873046875, -103.0390625, -99.0908203125, -95.142578125, -91.1943359375, -87.24609375, -83.2978515625, -79.349609375, -75.4013671875, -71.453125, -67.5048828125, -63.556640625, -59.6083984375, -55.66015625, -51.7119140625, -47.763671875, -43.8154296875, -39.8671875, -35.9189453125, -31.970703125, -28.0224609375, -24.07421875, -20.1259765625, -16.177734375, -12.2294921875, -8.28125, -4.3330078125, -0.384765625, 3.5634765625, 7.51171875, 11.4599609375, 15.408203125, 19.3564453125, 23.3046875, 27.2529296875, 31.201171875, 35.1494140625, 39.09765625, 43.0458984375, 46.994140625, 50.9423828125, 54.890625, 58.8388671875, 62.787109375, 66.7353515625, 70.68359375, 74.6318359375, 78.580078125, 82.5283203125, 86.4765625, 90.4248046875, 94.373046875, 98.3212890625, 102.26953125, 106.2177734375, 110.166015625, 114.1142578125, 118.0625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 6.0, 12.0, 14.0, 9.0, 26.0, 35.0, 47.0, 50.0, 54.0, 76.0, 76.0, 81.0, 83.0, 85.0, 79.0, 67.0, 39.0, 40.0, 35.0, 22.0, 13.0, 14.0, 15.0, 3.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-212.75, -207.6630859375, -202.576171875, -197.4892578125, -192.40234375, -187.3154296875, -182.228515625, -177.1416015625, -172.0546875, -166.9677734375, -161.880859375, -156.7939453125, -151.70703125, -146.6201171875, -141.533203125, -136.4462890625, -131.359375, -126.2724609375, -121.185546875, -116.0986328125, -111.01171875, -105.9248046875, -100.837890625, -95.7509765625, -90.6640625, -85.5771484375, -80.490234375, -75.4033203125, -70.31640625, -65.2294921875, -60.142578125, -55.0556640625, -49.96875, -44.8818359375, -39.794921875, -34.7080078125, -29.62109375, -24.5341796875, -19.447265625, -14.3603515625, -9.2734375, -4.1865234375, 0.900390625, 5.9873046875, 11.07421875, 16.1611328125, 21.248046875, 26.3349609375, 31.421875, 36.5087890625, 41.595703125, 46.6826171875, 51.76953125, 56.8564453125, 61.943359375, 67.0302734375, 72.1171875, 77.2041015625, 82.291015625, 87.3779296875, 92.46484375, 97.5517578125, 102.638671875, 107.7255859375, 112.8125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 4.0, 5.0, 10.0, 9.0, 17.0, 32.0, 35.0, 56.0, 112.0, 206.0, 388.0, 806.0, 2227.0, 8347.0, 75714.0, 919307.0, 33382.0, 5256.0, 1452.0, 560.0, 278.0, 147.0, 82.0, 37.0, 22.0, 23.0, 13.0, 11.0, 4.0, 4.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-377.5, -367.65625, -357.8125, -347.96875, -338.125, -328.28125, -318.4375, -308.59375, -298.75, -288.90625, -279.0625, -269.21875, -259.375, -249.53125, -239.6875, -229.84375, -220.0, -210.15625, -200.3125, -190.46875, -180.625, -170.78125, -160.9375, -151.09375, -141.25, -131.40625, -121.5625, -111.71875, -101.875, -92.03125, -82.1875, -72.34375, -62.5, -52.65625, -42.8125, -32.96875, -23.125, -13.28125, -3.4375, 6.40625, 16.25, 26.09375, 35.9375, 45.78125, 55.625, 65.46875, 75.3125, 85.15625, 95.0, 104.84375, 114.6875, 124.53125, 134.375, 144.21875, 154.0625, 163.90625, 173.75, 183.59375, 193.4375, 203.28125, 213.125, 222.96875, 232.8125, 242.65625, 252.5]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 6.0, 3.0, 8.0, 13.0, 16.0, 10.0, 14.0, 24.0, 28.0, 45.0, 56.0, 60.0, 89.0, 110.0, 94.0, 95.0, 65.0, 46.0, 35.0, 28.0, 24.0, 19.0, 19.0, 16.0, 12.0, 13.0, 10.0, 8.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-627.0, -609.09375, -591.1875, -573.28125, -555.375, -537.46875, -519.5625, -501.65625, -483.75, -465.84375, -447.9375, -430.03125, -412.125, -394.21875, -376.3125, -358.40625, -340.5, -322.59375, -304.6875, -286.78125, -268.875, -250.96875, -233.0625, -215.15625, -197.25, -179.34375, -161.4375, -143.53125, -125.625, -107.71875, -89.8125, -71.90625, -54.0, -36.09375, -18.1875, -0.28125, 17.625, 35.53125, 53.4375, 71.34375, 89.25, 107.15625, 125.0625, 142.96875, 160.875, 178.78125, 196.6875, 214.59375, 232.5, 250.40625, 268.3125, 286.21875, 304.125, 322.03125, 339.9375, 357.84375, 375.75, 393.65625, 411.5625, 429.46875, 447.375, 465.28125, 483.1875, 501.09375, 519.0]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 6.0, 8.0, 16.0, 26.0, 33.0, 30.0, 78.0, 118.0, 140.0, 238.0, 369.0, 525.0, 940.0, 1736.0, 3098.0, 6532.0, 14557.0, 36848.0, 125883.0, 731061.0, 78087.0, 26233.0, 11096.0, 4959.0, 2580.0, 1295.0, 757.0, 448.0, 314.0, 142.0, 105.0, 83.0, 57.0, 39.0, 36.0, 27.0, 16.0, 10.0, 10.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-32.65625, -31.73193359375, -30.8076171875, -29.88330078125, -28.958984375, -28.03466796875, -27.1103515625, -26.18603515625, -25.26171875, -24.33740234375, -23.4130859375, -22.48876953125, -21.564453125, -20.64013671875, -19.7158203125, -18.79150390625, -17.8671875, -16.94287109375, -16.0185546875, -15.09423828125, -14.169921875, -13.24560546875, -12.3212890625, -11.39697265625, -10.47265625, -9.54833984375, -8.6240234375, -7.69970703125, -6.775390625, -5.85107421875, -4.9267578125, -4.00244140625, -3.078125, -2.15380859375, -1.2294921875, -0.30517578125, 0.619140625, 1.54345703125, 2.4677734375, 3.39208984375, 4.31640625, 5.24072265625, 6.1650390625, 7.08935546875, 8.013671875, 8.93798828125, 9.8623046875, 10.78662109375, 11.7109375, 12.63525390625, 13.5595703125, 14.48388671875, 15.408203125, 16.33251953125, 17.2568359375, 18.18115234375, 19.10546875, 20.02978515625, 20.9541015625, 21.87841796875, 22.802734375, 23.72705078125, 24.6513671875, 25.57568359375, 26.5]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 10.0, 9.0, 16.0, 11.0, 17.0, 30.0, 32.0, 54.0, 60.0, 100.0, 102.0, 110.0, 114.0, 75.0, 45.0, 24.0, 18.0, 20.0, 23.0, 28.0, 10.0, 13.0, 6.0, 11.0, 6.0, 8.0, 2.0, 5.0, 9.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0151824951171875, -0.014662981033325195, -0.01414346694946289, -0.013623952865600586, -0.013104438781738281, -0.012584924697875977, -0.012065410614013672, -0.011545896530151367, -0.011026382446289062, -0.010506868362426758, -0.009987354278564453, -0.009467840194702148, -0.008948326110839844, -0.008428812026977539, -0.007909297943115234, -0.00738978385925293, -0.006870269775390625, -0.00635075569152832, -0.005831241607666016, -0.005311727523803711, -0.004792213439941406, -0.0042726993560791016, -0.003753185272216797, -0.003233671188354492, -0.0027141571044921875, -0.002194643020629883, -0.0016751289367675781, -0.0011556148529052734, -0.0006361007690429688, -0.00011658668518066406, 0.0004029273986816406, 0.0009224414825439453, 0.00144195556640625, 0.0019614696502685547, 0.0024809837341308594, 0.003000497817993164, 0.0035200119018554688, 0.0040395259857177734, 0.004559040069580078, 0.005078554153442383, 0.0055980682373046875, 0.006117582321166992, 0.006637096405029297, 0.0071566104888916016, 0.007676124572753906, 0.008195638656616211, 0.008715152740478516, 0.00923466682434082, 0.009754180908203125, 0.01027369499206543, 0.010793209075927734, 0.011312723159790039, 0.011832237243652344, 0.012351751327514648, 0.012871265411376953, 0.013390779495239258, 0.013910293579101562, 0.014429807662963867, 0.014949321746826172, 0.015468835830688477, 0.01598834991455078, 0.016507863998413086, 0.01702737808227539, 0.017546892166137695, 0.01806640625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 0.0, 8.0, 4.0, 6.0, 7.0, 10.0, 23.0, 32.0, 33.0, 45.0, 72.0, 105.0, 126.0, 184.0, 328.0, 541.0, 866.0, 1414.0, 2353.0, 4595.0, 9504.0, 21076.0, 58059.0, 628716.0, 239931.0, 45726.0, 17461.0, 8073.0, 4024.0, 2032.0, 1185.0, 673.0, 481.0, 277.0, 181.0, 122.0, 63.0, 49.0, 36.0, 44.0, 20.0, 21.0, 10.0, 10.0, 6.0, 7.0, 7.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-25.796875, -24.9619140625, -24.126953125, -23.2919921875, -22.45703125, -21.6220703125, -20.787109375, -19.9521484375, -19.1171875, -18.2822265625, -17.447265625, -16.6123046875, -15.77734375, -14.9423828125, -14.107421875, -13.2724609375, -12.4375, -11.6025390625, -10.767578125, -9.9326171875, -9.09765625, -8.2626953125, -7.427734375, -6.5927734375, -5.7578125, -4.9228515625, -4.087890625, -3.2529296875, -2.41796875, -1.5830078125, -0.748046875, 0.0869140625, 0.921875, 1.7568359375, 2.591796875, 3.4267578125, 4.26171875, 5.0966796875, 5.931640625, 6.7666015625, 7.6015625, 8.4365234375, 9.271484375, 10.1064453125, 10.94140625, 11.7763671875, 12.611328125, 13.4462890625, 14.28125, 15.1162109375, 15.951171875, 16.7861328125, 17.62109375, 18.4560546875, 19.291015625, 20.1259765625, 20.9609375, 21.7958984375, 22.630859375, 23.4658203125, 24.30078125, 25.1357421875, 25.970703125, 26.8056640625, 27.640625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 5.0, 1.0, 3.0, 6.0, 6.0, 4.0, 13.0, 9.0, 5.0, 13.0, 8.0, 20.0, 25.0, 8.0, 36.0, 32.0, 29.0, 65.0, 60.0, 76.0, 75.0, 83.0, 72.0, 55.0, 59.0, 43.0, 27.0, 19.0, 21.0, 22.0, 13.0, 21.0, 4.0, 5.0, 11.0, 4.0, 7.0, 8.0, 2.0, 4.0, 6.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0], "bins": [-53.28125, -51.8720703125, -50.462890625, -49.0537109375, -47.64453125, -46.2353515625, -44.826171875, -43.4169921875, -42.0078125, -40.5986328125, -39.189453125, -37.7802734375, -36.37109375, -34.9619140625, -33.552734375, -32.1435546875, -30.734375, -29.3251953125, -27.916015625, -26.5068359375, -25.09765625, -23.6884765625, -22.279296875, -20.8701171875, -19.4609375, -18.0517578125, -16.642578125, -15.2333984375, -13.82421875, -12.4150390625, -11.005859375, -9.5966796875, -8.1875, -6.7783203125, -5.369140625, -3.9599609375, -2.55078125, -1.1416015625, 0.267578125, 1.6767578125, 3.0859375, 4.4951171875, 5.904296875, 7.3134765625, 8.72265625, 10.1318359375, 11.541015625, 12.9501953125, 14.359375, 15.7685546875, 17.177734375, 18.5869140625, 19.99609375, 21.4052734375, 22.814453125, 24.2236328125, 25.6328125, 27.0419921875, 28.451171875, 29.8603515625, 31.26953125, 32.6787109375, 34.087890625, 35.4970703125, 36.90625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 14.0, 21.0, 64.0, 132.0, 566.0, 121.0, 43.0, 18.0, 8.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3842.87158203125, -3745.427734375, -3647.983642578125, -3550.53955078125, -3453.095703125, -3355.65185546875, -3258.207763671875, -3160.763671875, -3063.31982421875, -2965.8759765625, -2868.431884765625, -2770.98779296875, -2673.5439453125, -2576.10009765625, -2478.656005859375, -2381.2119140625, -2283.76806640625, -2186.32421875, -2088.880126953125, -1991.4361572265625, -1893.9921875, -1796.5482177734375, -1699.104248046875, -1601.6602783203125, -1504.21630859375, -1406.7723388671875, -1309.328369140625, -1211.8843994140625, -1114.4404296875, -1016.9964599609375, -919.552490234375, -822.1085205078125, -724.664794921875, -627.2208251953125, -529.77685546875, -432.3328857421875, -334.888916015625, -237.4449462890625, -140.0009765625, -42.5570068359375, 54.886962890625, 152.3309326171875, 249.77490234375, 347.2188720703125, 444.662841796875, 542.1068115234375, 639.55078125, 736.9947509765625, 834.438720703125, 931.8826904296875, 1029.32666015625, 1126.7706298828125, 1224.214599609375, 1321.6585693359375, 1419.1025390625, 1516.5465087890625, 1613.990478515625, 1711.4344482421875, 1808.87841796875, 1906.3223876953125, 2003.766357421875, 2101.21044921875, 2198.654296875, 2296.09814453125, 2393.542236328125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 6.0, 3.0, 11.0, 6.0, 10.0, 8.0, 14.0, 11.0, 18.0, 25.0, 22.0, 22.0, 22.0, 24.0, 33.0, 42.0, 101.0, 224.0, 131.0, 39.0, 28.0, 28.0, 24.0, 17.0, 16.0, 16.0, 15.0, 8.0, 22.0, 9.0, 4.0, 6.0, 5.0, 13.0, 3.0, 8.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1208.075927734375, -1169.9229736328125, -1131.77001953125, -1093.6170654296875, -1055.464111328125, -1017.3110961914062, -979.1581420898438, -941.005126953125, -902.8521728515625, -864.69921875, -826.5462646484375, -788.393310546875, -750.2402954101562, -712.0873413085938, -673.9343872070312, -635.7813720703125, -597.6284790039062, -559.4755249023438, -521.3225708007812, -483.1695861816406, -445.0166015625, -406.8636474609375, -368.710693359375, -330.5577087402344, -292.4047546386719, -254.2517852783203, -216.09881591796875, -177.94586181640625, -139.7928924560547, -101.63992309570312, -63.486968994140625, -25.333984375, 12.8189697265625, 50.9719352722168, 89.1249008178711, 127.27786254882812, 165.4308319091797, 203.58380126953125, 241.73675537109375, 279.8897399902344, 318.0426940917969, 356.1956481933594, 394.3486328125, 432.5015869140625, 470.654541015625, 508.8075256347656, 546.96044921875, 585.1134643554688, 623.2664184570312, 661.4193725585938, 699.5723266601562, 737.725341796875, 775.8782958984375, 814.03125, 852.1842041015625, 890.337158203125, 928.4901123046875, 966.64306640625, 1004.7960205078125, 1042.948974609375, 1081.1019287109375, 1119.2548828125, 1157.407958984375, 1195.5609130859375, 1233.7138671875]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 11.0, 12.0, 14.0, 11.0, 22.0, 14.0, 20.0, 21.0, 24.0, 28.0, 34.0, 45.0, 62.0, 141.0, 155.0, 65.0, 45.0, 41.0, 25.0, 34.0, 22.0, 21.0, 29.0, 17.0, 22.0, 10.0, 7.0, 9.0, 7.0, 4.0, 5.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-128.0, -124.71875, -121.4375, -118.15625, -114.875, -111.59375, -108.3125, -105.03125, -101.75, -98.46875, -95.1875, -91.90625, -88.625, -85.34375, -82.0625, -78.78125, -75.5, -72.21875, -68.9375, -65.65625, -62.375, -59.09375, -55.8125, -52.53125, -49.25, -45.96875, -42.6875, -39.40625, -36.125, -32.84375, -29.5625, -26.28125, -23.0, -19.71875, -16.4375, -13.15625, -9.875, -6.59375, -3.3125, -0.03125, 3.25, 6.53125, 9.8125, 13.09375, 16.375, 19.65625, 22.9375, 26.21875, 29.5, 32.78125, 36.0625, 39.34375, 42.625, 45.90625, 49.1875, 52.46875, 55.75, 59.03125, 62.3125, 65.59375, 68.875, 72.15625, 75.4375, 78.71875, 82.0]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 2.0, 4.0, 16.0, 18.0, 24.0, 34.0, 46.0, 44.0, 61.0, 163.0, 252.0, 621.0, 1768.0, 7060.0, 399539.0, 7967438.0, 8207.0, 1950.0, 641.0, 266.0, 141.0, 94.0, 40.0, 46.0, 26.0, 17.0, 7.0, 7.0, 15.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-734.0562744140625, -713.1082763671875, -692.1602172851562, -671.212158203125, -650.26416015625, -629.316162109375, -608.3681030273438, -587.4200439453125, -566.4720458984375, -545.5240478515625, -524.5759887695312, -503.6279602050781, -482.679931640625, -461.7319030761719, -440.78387451171875, -419.8358459472656, -398.8878173828125, -377.9397888183594, -356.99176025390625, -336.0437316894531, -315.095703125, -294.1476745605469, -273.19964599609375, -252.25161743164062, -231.3035888671875, -210.35556030273438, -189.40753173828125, -168.45950317382812, -147.511474609375, -126.56344604492188, -105.61541748046875, -84.66738891601562, -63.7193603515625, -42.771331787109375, -21.82330322265625, -0.875274658203125, 20.07275390625, 41.020782470703125, 61.96881103515625, 82.91683959960938, 103.8648681640625, 124.81289672851562, 145.76092529296875, 166.70895385742188, 187.656982421875, 208.60501098632812, 229.55303955078125, 250.50106811523438, 271.4490966796875, 292.3971252441406, 313.34515380859375, 334.2931823730469, 355.2412109375, 376.1892395019531, 397.13726806640625, 418.0852966308594, 439.0333251953125, 459.9813537597656, 480.92938232421875, 501.8774108886719, 522.825439453125, 543.7734375, 564.7214965820312, 585.6695556640625, 606.6175537109375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 6.0, 8.0, 5.0, 4.0, 2.0, 5.0, 3.0, 7.0, 2.0, 6.0, 3.0, 4.0, 4.0, 1.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-653.5410766601562, -628.9877319335938, -604.434326171875, -579.8809814453125, -555.3275756835938, -530.7742309570312, -506.2208557128906, -481.66748046875, -457.1141052246094, -432.56072998046875, -408.0073547363281, -383.4539794921875, -358.900634765625, -334.34722900390625, -309.79388427734375, -285.2405090332031, -260.6871337890625, -236.13375854492188, -211.58038330078125, -187.0270233154297, -162.47364807128906, -137.92027282714844, -113.36691284179688, -88.81353759765625, -64.26016235351562, -39.706790924072266, -15.153419494628906, 9.399948120117188, 33.95332336425781, 58.50669860839844, 83.06005859375, 107.61343383789062, 132.166748046875, 156.72012329101562, 181.27349853515625, 205.8268585205078, 230.38023376464844, 254.93360900878906, 279.4869689941406, 304.04034423828125, 328.5937194824219, 353.1470947265625, 377.7004699707031, 402.25384521484375, 426.80718994140625, 451.360595703125, 475.9139404296875, 500.4673156738281, 525.0206909179688, 549.5740356445312, 574.12744140625, 598.6807861328125, 623.2341918945312, 647.7875366210938, 672.3409423828125, 696.894287109375, 721.4476318359375, 746.0009765625, 770.5543823242188, 795.1077270507812, 819.6611328125, 844.2144775390625, 868.767822265625, 893.3212280273438, 917.8746337890625]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 8.0, 6.0, 10.0, 11.0, 32.0, 25.0, 33.0, 46.0, 56.0, 57.0, 58.0, 60.0, 53.0, 69.0, 61.0, 69.0, 51.0, 65.0, 50.0, 32.0, 36.0, 23.0, 24.0, 17.0, 9.0, 6.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-103.1875, -100.443359375, -97.69921875, -94.955078125, -92.2109375, -89.466796875, -86.72265625, -83.978515625, -81.234375, -78.490234375, -75.74609375, -73.001953125, -70.2578125, -67.513671875, -64.76953125, -62.025390625, -59.28125, -56.537109375, -53.79296875, -51.048828125, -48.3046875, -45.560546875, -42.81640625, -40.072265625, -37.328125, -34.583984375, -31.83984375, -29.095703125, -26.3515625, -23.607421875, -20.86328125, -18.119140625, -15.375, -12.630859375, -9.88671875, -7.142578125, -4.3984375, -1.654296875, 1.08984375, 3.833984375, 6.578125, 9.322265625, 12.06640625, 14.810546875, 17.5546875, 20.298828125, 23.04296875, 25.787109375, 28.53125, 31.275390625, 34.01953125, 36.763671875, 39.5078125, 42.251953125, 44.99609375, 47.740234375, 50.484375, 53.228515625, 55.97265625, 58.716796875, 61.4609375, 64.205078125, 66.94921875, 69.693359375, 72.4375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 13.0, 13.0, 29.0, 36.0, 58.0, 111.0, 197.0, 379.0, 885.0, 1997.0, 5121.0, 14731.0, 46749.0, 157176.0, 199396.0, 65588.0, 19744.0, 7078.0, 2651.0, 1068.0, 579.0, 279.0, 162.0, 82.0, 54.0, 21.0, 17.0, 14.0, 7.0, 9.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-595.0, -574.578125, -554.15625, -533.734375, -513.3125, -492.890625, -472.46875, -452.046875, -431.625, -411.203125, -390.78125, -370.359375, -349.9375, -329.515625, -309.09375, -288.671875, -268.25, -247.828125, -227.40625, -206.984375, -186.5625, -166.140625, -145.71875, -125.296875, -104.875, -84.453125, -64.03125, -43.609375, -23.1875, -2.765625, 17.65625, 38.078125, 58.5, 78.921875, 99.34375, 119.765625, 140.1875, 160.609375, 181.03125, 201.453125, 221.875, 242.296875, 262.71875, 283.140625, 303.5625, 323.984375, 344.40625, 364.828125, 385.25, 405.671875, 426.09375, 446.515625, 466.9375, 487.359375, 507.78125, 528.203125, 548.625, 569.046875, 589.46875, 609.890625, 630.3125, 650.734375, 671.15625, 691.578125, 712.0]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 5.0, 3.0, 6.0, 6.0, 4.0, 10.0, 11.0, 14.0, 11.0, 18.0, 16.0, 23.0, 26.0, 51.0, 46.0, 40.0, 48.0, 49.0, 37.0, 49.0, 53.0, 57.0, 54.0, 47.0, 36.0, 42.0, 42.0, 34.0, 26.0, 25.0, 17.0, 14.0, 17.0, 17.0, 10.0, 6.0, 4.0, 12.0, 6.0, 4.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-83.1875, -80.6728515625, -78.158203125, -75.6435546875, -73.12890625, -70.6142578125, -68.099609375, -65.5849609375, -63.0703125, -60.5556640625, -58.041015625, -55.5263671875, -53.01171875, -50.4970703125, -47.982421875, -45.4677734375, -42.953125, -40.4384765625, -37.923828125, -35.4091796875, -32.89453125, -30.3798828125, -27.865234375, -25.3505859375, -22.8359375, -20.3212890625, -17.806640625, -15.2919921875, -12.77734375, -10.2626953125, -7.748046875, -5.2333984375, -2.71875, -0.2041015625, 2.310546875, 4.8251953125, 7.33984375, 9.8544921875, 12.369140625, 14.8837890625, 17.3984375, 19.9130859375, 22.427734375, 24.9423828125, 27.45703125, 29.9716796875, 32.486328125, 35.0009765625, 37.515625, 40.0302734375, 42.544921875, 45.0595703125, 47.57421875, 50.0888671875, 52.603515625, 55.1181640625, 57.6328125, 60.1474609375, 62.662109375, 65.1767578125, 67.69140625, 70.2060546875, 72.720703125, 75.2353515625, 77.75]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 2.0, 3.0, 6.0, 1.0, 5.0, 9.0, 20.0, 45.0, 53.0, 75.0, 69.0, 70.0, 32.0, 31.0, 13.0, 8.0, 6.0, 4.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-642.891845703125, -625.7798461914062, -608.6679077148438, -591.555908203125, -574.4439086914062, -557.3319091796875, -540.219970703125, -523.1079711914062, -505.9959716796875, -488.8840026855469, -471.7720031738281, -454.6600341796875, -437.54803466796875, -420.4360656738281, -403.3240966796875, -386.21209716796875, -369.1001281738281, -351.9881591796875, -334.87615966796875, -317.7641906738281, -300.6521911621094, -283.54022216796875, -266.42822265625, -249.31625366210938, -232.2042694091797, -215.09228515625, -197.9803009033203, -180.86831665039062, -163.75634765625, -146.64434814453125, -129.53237915039062, -112.42039489746094, -95.30838012695312, -78.19639587402344, -61.084415435791016, -43.972434997558594, -26.860450744628906, -9.748466491699219, 7.3635101318359375, 24.475494384765625, 41.58747863769531, 58.699462890625, 75.81144714355469, 92.92342376708984, 110.03540802001953, 127.14739227294922, 144.25936889648438, 161.37135314941406, 178.48333740234375, 195.59532165527344, 212.70730590820312, 229.81927490234375, 246.9312744140625, 264.0432434082031, 281.15521240234375, 298.2672119140625, 315.37921142578125, 332.4911804199219, 349.6031799316406, 366.71514892578125, 383.8271484375, 400.9391174316406, 418.05108642578125, 435.1630859375, 452.2750549316406]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 4.0, 5.0, 1.0, 8.0, 2.0, 0.0, 5.0, 5.0, 4.0, 4.0, 4.0, 8.0, 10.0, 20.0, 52.0, 59.0, 80.0, 79.0, 37.0, 23.0, 16.0, 16.0, 11.0, 2.0, 3.0, 5.0, 1.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-445.65655517578125, -431.13250732421875, -416.6084289550781, -402.0843811035156, -387.5603332519531, -373.0362548828125, -358.51220703125, -343.9881591796875, -329.464111328125, -314.9400634765625, -300.4159851074219, -285.8919372558594, -271.3678894042969, -256.84381103515625, -242.31976318359375, -227.79571533203125, -213.27163696289062, -198.74757385253906, -184.22352600097656, -169.699462890625, -155.1754150390625, -140.65135192871094, -126.12728881835938, -111.60323333740234, -97.07917785644531, -82.55512237548828, -68.03106689453125, -53.50700378417969, -38.982948303222656, -24.458892822265625, -9.934829711914062, 4.589225769042969, 19.11328125, 33.63733673095703, 48.16139602661133, 62.685455322265625, 77.20951080322266, 91.73356628417969, 106.25762939453125, 120.78168487548828, 135.3057403564453, 149.82980346679688, 164.35385131835938, 178.87791442871094, 193.4019775390625, 207.926025390625, 222.45008850097656, 236.97415161132812, 251.49819946289062, 266.0222473144531, 280.54632568359375, 295.07037353515625, 309.59442138671875, 324.11846923828125, 338.6425476074219, 353.1665954589844, 367.690673828125, 382.2147216796875, 396.7388000488281, 411.2628479003906, 425.7868957519531, 440.31097412109375, 454.83502197265625, 469.35906982421875, 483.88311767578125]}, "eval/loss": 0.717689573764801, "eval/wer": 0.12834192780642603, "eval/runtime": 818.6465, "eval/samples_per_second": 3.227, "eval/steps_per_second": 0.404, "train/train_runtime": 35320.0928, "train/train_samples_per_second": 20.2, "train/train_steps_per_second": 0.631, "train/total_flos": 0.0, "train/train_loss": 0.08645637407097047} \ No newline at end of file +{"train/loss": 0.4226, "train/learning_rate": 1.267605633802817e-08, "train/epoch": 25.0, "train/global_step": 22300, "_runtime": 36452, "_timestamp": 1648177792, "_step": 5804, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 5.0, 6.0, 7.0, 11.0, 11.0, 20.0, 11.0, 14.0, 23.0, 26.0, 38.0, 45.0, 46.0, 65.0, 51.0, 60.0, 89.0, 87.0, 60.0, 64.0, 45.0, 40.0, 34.0, 22.0, 25.0, 14.0, 13.0, 11.0, 11.0, 8.0, 3.0, 5.0, 7.0, 6.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.9212875366211, -70.6487808227539, -68.37626647949219, -66.103759765625, -63.83124542236328, -61.558738708496094, -59.28622817993164, -57.01371765136719, -54.741207122802734, -52.46869659423828, -50.19618606567383, -47.923675537109375, -45.65116882324219, -43.37865447998047, -41.10614776611328, -38.83363723754883, -36.561126708984375, -34.28861618041992, -32.01610565185547, -29.74359703063965, -27.471086502075195, -25.198575973510742, -22.926067352294922, -20.65355682373047, -18.381046295166016, -16.108535766601562, -13.836026191711426, -11.563516616821289, -9.291006088256836, -7.018495559692383, -4.745985984802246, -2.4734764099121094, -0.200958251953125, 2.07155179977417, 4.344061851501465, 6.61657190322876, 8.889081954956055, 11.161592483520508, 13.434102058410645, 15.706611633300781, 17.979122161865234, 20.251632690429688, 22.52414321899414, 24.79665184020996, 27.069162368774414, 29.341672897338867, 31.614181518554688, 33.88669204711914, 36.159202575683594, 38.43171310424805, 40.7042236328125, 42.97673416137695, 45.249244689941406, 47.521751403808594, 49.79426193237305, 52.0667724609375, 54.33928298950195, 56.611793518066406, 58.88430404663086, 61.15681457519531, 63.4293212890625, 65.70183563232422, 67.9743423461914, 70.24685668945312, 72.51936340332031]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 7.0, 5.0, 10.0, 12.0, 19.0, 19.0, 23.0, 12.0, 26.0, 25.0, 37.0, 27.0, 17.0, 37.0, 38.0, 45.0, 38.0, 52.0, 47.0, 29.0, 52.0, 38.0, 43.0, 46.0, 35.0, 37.0, 25.0, 26.0, 29.0, 22.0, 33.0, 14.0, 17.0, 18.0, 12.0, 4.0, 6.0, 6.0, 5.0, 5.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.53594207763672, -54.687095642089844, -52.8382453918457, -50.98939895629883, -49.14055252075195, -47.29170227050781, -45.44285583496094, -43.59400939941406, -41.74516296386719, -39.89631652832031, -38.04746627807617, -36.1986198425293, -34.34977340698242, -32.50092315673828, -30.652076721191406, -28.80323028564453, -26.954381942749023, -25.105533599853516, -23.25668716430664, -21.407838821411133, -19.558992385864258, -17.71014404296875, -15.861296653747559, -14.012449264526367, -12.163601875305176, -10.314754486083984, -8.465907096862793, -6.617059230804443, -4.768211841583252, -2.9193639755249023, -1.070516586303711, 0.7783308029174805, 2.627178192138672, 4.476025581359863, 6.324872970581055, 8.173721313476562, 10.022567749023438, 11.871416091918945, 13.720263481140137, 15.569110870361328, 17.417957305908203, 19.26680564880371, 21.115652084350586, 22.964500427246094, 24.81334686279297, 26.662195205688477, 28.511043548583984, 30.35988998413086, 32.208740234375, 34.057586669921875, 35.906436920166016, 37.75528335571289, 39.604129791259766, 41.452980041503906, 43.30182647705078, 45.150672912597656, 46.99951934814453, 48.848365783691406, 50.69721603393555, 52.54606246948242, 54.3949089050293, 56.24375915527344, 58.09260559082031, 59.94145202636719, 61.79029846191406]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 10.0, 10.0, 21.0, 26.0, 44.0, 83.0, 134.0, 211.0, 327.0, 586.0, 931.0, 1394.0, 2381.0, 3782.0, 6175.0, 10901.0, 18717.0, 34611.0, 67966.0, 161762.0, 685990.0, 2363443.0, 548131.0, 146489.0, 64826.0, 32758.0, 17488.0, 9830.0, 5845.0, 3556.0, 2130.0, 1248.0, 867.0, 542.0, 362.0, 241.0, 149.0, 93.0, 73.0, 40.0, 38.0, 33.0, 15.0, 11.0, 8.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-158.25, -152.685546875, -147.12109375, -141.556640625, -135.9921875, -130.427734375, -124.86328125, -119.298828125, -113.734375, -108.169921875, -102.60546875, -97.041015625, -91.4765625, -85.912109375, -80.34765625, -74.783203125, -69.21875, -63.654296875, -58.08984375, -52.525390625, -46.9609375, -41.396484375, -35.83203125, -30.267578125, -24.703125, -19.138671875, -13.57421875, -8.009765625, -2.4453125, 3.119140625, 8.68359375, 14.248046875, 19.8125, 25.376953125, 30.94140625, 36.505859375, 42.0703125, 47.634765625, 53.19921875, 58.763671875, 64.328125, 69.892578125, 75.45703125, 81.021484375, 86.5859375, 92.150390625, 97.71484375, 103.279296875, 108.84375, 114.408203125, 119.97265625, 125.537109375, 131.1015625, 136.666015625, 142.23046875, 147.794921875, 153.359375, 158.923828125, 164.48828125, 170.052734375, 175.6171875, 181.181640625, 186.74609375, 192.310546875, 197.875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 8.0, 4.0, 10.0, 9.0, 13.0, 15.0, 20.0, 23.0, 15.0, 19.0, 24.0, 29.0, 28.0, 38.0, 39.0, 47.0, 41.0, 45.0, 41.0, 34.0, 49.0, 34.0, 40.0, 46.0, 35.0, 36.0, 35.0, 44.0, 21.0, 18.0, 35.0, 22.0, 16.0, 10.0, 6.0, 7.0, 10.0, 8.0, 6.0, 7.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-63.4375, -61.49560546875, -59.5537109375, -57.61181640625, -55.669921875, -53.72802734375, -51.7861328125, -49.84423828125, -47.90234375, -45.96044921875, -44.0185546875, -42.07666015625, -40.134765625, -38.19287109375, -36.2509765625, -34.30908203125, -32.3671875, -30.42529296875, -28.4833984375, -26.54150390625, -24.599609375, -22.65771484375, -20.7158203125, -18.77392578125, -16.83203125, -14.89013671875, -12.9482421875, -11.00634765625, -9.064453125, -7.12255859375, -5.1806640625, -3.23876953125, -1.296875, 0.64501953125, 2.5869140625, 4.52880859375, 6.470703125, 8.41259765625, 10.3544921875, 12.29638671875, 14.23828125, 16.18017578125, 18.1220703125, 20.06396484375, 22.005859375, 23.94775390625, 25.8896484375, 27.83154296875, 29.7734375, 31.71533203125, 33.6572265625, 35.59912109375, 37.541015625, 39.48291015625, 41.4248046875, 43.36669921875, 45.30859375, 47.25048828125, 49.1923828125, 51.13427734375, 53.076171875, 55.01806640625, 56.9599609375, 58.90185546875, 60.84375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 8.0, 18.0, 12.0, 27.0, 40.0, 59.0, 61.0, 123.0, 172.0, 219.0, 378.0, 518.0, 799.0, 1188.0, 1920.0, 2780.0, 4217.0, 6438.0, 10368.0, 17425.0, 29950.0, 54812.0, 111080.0, 264698.0, 961221.0, 1966680.0, 431117.0, 157512.0, 73304.0, 39152.0, 21986.0, 13041.0, 8045.0, 5078.0, 3254.0, 2147.0, 1441.0, 980.0, 662.0, 416.0, 313.0, 210.0, 133.0, 101.0, 55.0, 43.0, 30.0, 21.0, 10.0, 13.0, 8.0, 5.0, 2.0, 2.0, 2.0], "bins": [-144.5, -140.27734375, -136.0546875, -131.83203125, -127.609375, -123.38671875, -119.1640625, -114.94140625, -110.71875, -106.49609375, -102.2734375, -98.05078125, -93.828125, -89.60546875, -85.3828125, -81.16015625, -76.9375, -72.71484375, -68.4921875, -64.26953125, -60.046875, -55.82421875, -51.6015625, -47.37890625, -43.15625, -38.93359375, -34.7109375, -30.48828125, -26.265625, -22.04296875, -17.8203125, -13.59765625, -9.375, -5.15234375, -0.9296875, 3.29296875, 7.515625, 11.73828125, 15.9609375, 20.18359375, 24.40625, 28.62890625, 32.8515625, 37.07421875, 41.296875, 45.51953125, 49.7421875, 53.96484375, 58.1875, 62.41015625, 66.6328125, 70.85546875, 75.078125, 79.30078125, 83.5234375, 87.74609375, 91.96875, 96.19140625, 100.4140625, 104.63671875, 108.859375, 113.08203125, 117.3046875, 121.52734375, 125.75]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 4.0, 13.0, 10.0, 9.0, 24.0, 25.0, 23.0, 27.0, 39.0, 34.0, 58.0, 85.0, 121.0, 139.0, 177.0, 279.0, 392.0, 639.0, 571.0, 368.0, 270.0, 182.0, 125.0, 92.0, 82.0, 67.0, 38.0, 33.0, 21.0, 28.0, 15.0, 11.0, 12.0, 10.0, 9.0, 9.0, 6.0, 5.0, 2.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-45.4375, -44.05517578125, -42.6728515625, -41.29052734375, -39.908203125, -38.52587890625, -37.1435546875, -35.76123046875, -34.37890625, -32.99658203125, -31.6142578125, -30.23193359375, -28.849609375, -27.46728515625, -26.0849609375, -24.70263671875, -23.3203125, -21.93798828125, -20.5556640625, -19.17333984375, -17.791015625, -16.40869140625, -15.0263671875, -13.64404296875, -12.26171875, -10.87939453125, -9.4970703125, -8.11474609375, -6.732421875, -5.35009765625, -3.9677734375, -2.58544921875, -1.203125, 0.17919921875, 1.5615234375, 2.94384765625, 4.326171875, 5.70849609375, 7.0908203125, 8.47314453125, 9.85546875, 11.23779296875, 12.6201171875, 14.00244140625, 15.384765625, 16.76708984375, 18.1494140625, 19.53173828125, 20.9140625, 22.29638671875, 23.6787109375, 25.06103515625, 26.443359375, 27.82568359375, 29.2080078125, 30.59033203125, 31.97265625, 33.35498046875, 34.7373046875, 36.11962890625, 37.501953125, 38.88427734375, 40.2666015625, 41.64892578125, 43.03125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 10.0, 8.0, 7.0, 16.0, 8.0, 20.0, 26.0, 29.0, 43.0, 62.0, 83.0, 100.0, 122.0, 107.0, 85.0, 76.0, 42.0, 34.0, 32.0, 24.0, 19.0, 6.0, 11.0, 12.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.39942932128906, -132.21673583984375, -128.0340576171875, -123.85136413574219, -119.66867065429688, -115.4859848022461, -111.30329895019531, -107.12060546875, -102.93791961669922, -98.75523376464844, -94.57254028320312, -90.38985443115234, -86.20716857910156, -82.02447509765625, -77.84178924560547, -73.65910339355469, -69.47640991210938, -65.2937240600586, -61.11103057861328, -56.9283447265625, -52.74565505981445, -48.562965393066406, -44.380279541015625, -40.19758987426758, -36.01490020751953, -31.832210540771484, -27.64952278137207, -23.466835021972656, -19.28414535522461, -15.101455688476562, -10.918767929077148, -6.736080169677734, -2.55340576171875, 1.6292829513549805, 5.811971664428711, 9.994660377502441, 14.177349090576172, 18.36003875732422, 22.542726516723633, 26.725414276123047, 30.908103942871094, 35.09079360961914, 39.27348327636719, 43.45616912841797, 47.638858795166016, 51.82154846191406, 56.004234313964844, 60.18692398071289, 64.36961364746094, 68.55229949951172, 72.73499298095703, 76.91767883300781, 81.10037231445312, 85.2830581665039, 89.46574401855469, 93.6484375, 97.83112335205078, 102.01380920410156, 106.19650268554688, 110.37918853759766, 114.56187438964844, 118.74456787109375, 122.92725372314453, 127.10993957519531, 131.29263305664062]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 4.0, 7.0, 7.0, 13.0, 7.0, 15.0, 11.0, 20.0, 22.0, 25.0, 22.0, 38.0, 24.0, 36.0, 46.0, 43.0, 41.0, 46.0, 53.0, 46.0, 52.0, 39.0, 45.0, 42.0, 40.0, 20.0, 33.0, 29.0, 28.0, 20.0, 21.0, 16.0, 15.0, 12.0, 12.0, 8.0, 10.0, 10.0, 9.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-74.71490478515625, -72.24452209472656, -69.7741470336914, -67.30377197265625, -64.83338928222656, -62.36301040649414, -59.89263153076172, -57.4222526550293, -54.951873779296875, -52.48149490356445, -50.01111602783203, -47.54073715209961, -45.07035827636719, -42.599979400634766, -40.129600524902344, -37.65922164916992, -35.1888427734375, -32.71846389770508, -30.248085021972656, -27.777706146240234, -25.307327270507812, -22.83694839477539, -20.36656951904297, -17.896190643310547, -15.425811767578125, -12.955432891845703, -10.485054016113281, -8.01467514038086, -5.5442962646484375, -3.0739173889160156, -0.6035385131835938, 1.8668403625488281, 4.337226867675781, 6.807605743408203, 9.277984619140625, 11.748363494873047, 14.218742370605469, 16.68912124633789, 19.159500122070312, 21.629878997802734, 24.100257873535156, 26.570636749267578, 29.041015625, 31.511394500732422, 33.981773376464844, 36.452152252197266, 38.92253112792969, 41.39291000366211, 43.86328887939453, 46.33366775512695, 48.804046630859375, 51.2744255065918, 53.74480438232422, 56.21518325805664, 58.68556213378906, 61.155941009521484, 63.626319885253906, 66.09669494628906, 68.56707763671875, 71.03746032714844, 73.5078353881836, 75.97821044921875, 78.44859313964844, 80.91897583007812, 83.38935089111328]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 8.0, 8.0, 8.0, 19.0, 26.0, 35.0, 52.0, 72.0, 118.0, 150.0, 238.0, 300.0, 445.0, 676.0, 925.0, 1418.0, 2052.0, 3065.0, 4531.0, 6650.0, 10002.0, 15085.0, 23352.0, 37639.0, 62513.0, 109378.0, 212042.0, 244831.0, 125036.0, 69905.0, 41915.0, 26019.0, 16541.0, 10825.0, 7336.0, 4831.0, 3302.0, 2227.0, 1539.0, 1116.0, 706.0, 496.0, 325.0, 240.0, 180.0, 118.0, 93.0, 54.0, 35.0, 26.0, 21.0, 17.0, 4.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0], "bins": [-36.90625, -35.7568359375, -34.607421875, -33.4580078125, -32.30859375, -31.1591796875, -30.009765625, -28.8603515625, -27.7109375, -26.5615234375, -25.412109375, -24.2626953125, -23.11328125, -21.9638671875, -20.814453125, -19.6650390625, -18.515625, -17.3662109375, -16.216796875, -15.0673828125, -13.91796875, -12.7685546875, -11.619140625, -10.4697265625, -9.3203125, -8.1708984375, -7.021484375, -5.8720703125, -4.72265625, -3.5732421875, -2.423828125, -1.2744140625, -0.125, 1.0244140625, 2.173828125, 3.3232421875, 4.47265625, 5.6220703125, 6.771484375, 7.9208984375, 9.0703125, 10.2197265625, 11.369140625, 12.5185546875, 13.66796875, 14.8173828125, 15.966796875, 17.1162109375, 18.265625, 19.4150390625, 20.564453125, 21.7138671875, 22.86328125, 24.0126953125, 25.162109375, 26.3115234375, 27.4609375, 28.6103515625, 29.759765625, 30.9091796875, 32.05859375, 33.2080078125, 34.357421875, 35.5068359375, 36.65625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 7.0, 10.0, 9.0, 12.0, 11.0, 15.0, 14.0, 22.0, 26.0, 31.0, 27.0, 31.0, 37.0, 43.0, 46.0, 40.0, 60.0, 61.0, 54.0, 51.0, 54.0, 39.0, 34.0, 39.0, 23.0, 29.0, 25.0, 22.0, 11.0, 21.0, 15.0, 15.0, 12.0, 8.0, 10.0, 8.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.875, -79.2421875, -76.609375, -73.9765625, -71.34375, -68.7109375, -66.078125, -63.4453125, -60.8125, -58.1796875, -55.546875, -52.9140625, -50.28125, -47.6484375, -45.015625, -42.3828125, -39.75, -37.1171875, -34.484375, -31.8515625, -29.21875, -26.5859375, -23.953125, -21.3203125, -18.6875, -16.0546875, -13.421875, -10.7890625, -8.15625, -5.5234375, -2.890625, -0.2578125, 2.375, 5.0078125, 7.640625, 10.2734375, 12.90625, 15.5390625, 18.171875, 20.8046875, 23.4375, 26.0703125, 28.703125, 31.3359375, 33.96875, 36.6015625, 39.234375, 41.8671875, 44.5, 47.1328125, 49.765625, 52.3984375, 55.03125, 57.6640625, 60.296875, 62.9296875, 65.5625, 68.1953125, 70.828125, 73.4609375, 76.09375, 78.7265625, 81.359375, 83.9921875, 86.625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 16.0, 12.0, 21.0, 26.0, 45.0, 75.0, 131.0, 225.0, 492.0, 1114.0, 2880.0, 8596.0, 33849.0, 919540.0, 62954.0, 11954.0, 3874.0, 1440.0, 627.0, 265.0, 146.0, 87.0, 48.0, 29.0, 26.0, 13.0, 17.0, 10.0, 6.0, 9.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.75, -107.84765625, -103.9453125, -100.04296875, -96.140625, -92.23828125, -88.3359375, -84.43359375, -80.53125, -76.62890625, -72.7265625, -68.82421875, -64.921875, -61.01953125, -57.1171875, -53.21484375, -49.3125, -45.41015625, -41.5078125, -37.60546875, -33.703125, -29.80078125, -25.8984375, -21.99609375, -18.09375, -14.19140625, -10.2890625, -6.38671875, -2.484375, 1.41796875, 5.3203125, 9.22265625, 13.125, 17.02734375, 20.9296875, 24.83203125, 28.734375, 32.63671875, 36.5390625, 40.44140625, 44.34375, 48.24609375, 52.1484375, 56.05078125, 59.953125, 63.85546875, 67.7578125, 71.66015625, 75.5625, 79.46484375, 83.3671875, 87.26953125, 91.171875, 95.07421875, 98.9765625, 102.87890625, 106.78125, 110.68359375, 114.5859375, 118.48828125, 122.390625, 126.29296875, 130.1953125, 134.09765625, 138.0]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 7.0, 6.0, 11.0, 17.0, 13.0, 15.0, 23.0, 29.0, 22.0, 20.0, 23.0, 17.0, 31.0, 35.0, 43.0, 37.0, 34.0, 36.0, 47.0, 35.0, 40.0, 44.0, 33.0, 30.0, 41.0, 49.0, 24.0, 28.0, 34.0, 27.0, 28.0, 13.0, 15.0, 12.0, 18.0, 12.0, 9.0, 5.0, 8.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.53125, -48.93505859375, -47.3388671875, -45.74267578125, -44.146484375, -42.55029296875, -40.9541015625, -39.35791015625, -37.76171875, -36.16552734375, -34.5693359375, -32.97314453125, -31.376953125, -29.78076171875, -28.1845703125, -26.58837890625, -24.9921875, -23.39599609375, -21.7998046875, -20.20361328125, -18.607421875, -17.01123046875, -15.4150390625, -13.81884765625, -12.22265625, -10.62646484375, -9.0302734375, -7.43408203125, -5.837890625, -4.24169921875, -2.6455078125, -1.04931640625, 0.546875, 2.14306640625, 3.7392578125, 5.33544921875, 6.931640625, 8.52783203125, 10.1240234375, 11.72021484375, 13.31640625, 14.91259765625, 16.5087890625, 18.10498046875, 19.701171875, 21.29736328125, 22.8935546875, 24.48974609375, 26.0859375, 27.68212890625, 29.2783203125, 30.87451171875, 32.470703125, 34.06689453125, 35.6630859375, 37.25927734375, 38.85546875, 40.45166015625, 42.0478515625, 43.64404296875, 45.240234375, 46.83642578125, 48.4326171875, 50.02880859375, 51.625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 12.0, 11.0, 15.0, 21.0, 30.0, 33.0, 43.0, 59.0, 83.0, 126.0, 208.0, 435.0, 794.0, 1796.0, 5140.0, 21582.0, 946542.0, 57893.0, 8498.0, 2769.0, 1117.0, 524.0, 268.0, 146.0, 107.0, 76.0, 49.0, 30.0, 29.0, 30.0, 15.0, 12.0, 10.0, 5.0, 8.0, 2.0, 7.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-26.3125, -25.5078125, -24.703125, -23.8984375, -23.09375, -22.2890625, -21.484375, -20.6796875, -19.875, -19.0703125, -18.265625, -17.4609375, -16.65625, -15.8515625, -15.046875, -14.2421875, -13.4375, -12.6328125, -11.828125, -11.0234375, -10.21875, -9.4140625, -8.609375, -7.8046875, -7.0, -6.1953125, -5.390625, -4.5859375, -3.78125, -2.9765625, -2.171875, -1.3671875, -0.5625, 0.2421875, 1.046875, 1.8515625, 2.65625, 3.4609375, 4.265625, 5.0703125, 5.875, 6.6796875, 7.484375, 8.2890625, 9.09375, 9.8984375, 10.703125, 11.5078125, 12.3125, 13.1171875, 13.921875, 14.7265625, 15.53125, 16.3359375, 17.140625, 17.9453125, 18.75, 19.5546875, 20.359375, 21.1640625, 21.96875, 22.7734375, 23.578125, 24.3828125, 25.1875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 10.0, 7.0, 16.0, 22.0, 27.0, 39.0, 49.0, 70.0, 83.0, 108.0, 101.0, 105.0, 96.0, 77.0, 44.0, 32.0, 31.0, 24.0, 13.0, 13.0, 11.0, 6.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014286041259765625, -0.0013845711946487427, -0.0013405382633209229, -0.001296505331993103, -0.0012524724006652832, -0.0012084394693374634, -0.0011644065380096436, -0.0011203736066818237, -0.001076340675354004, -0.001032307744026184, -0.0009882748126983643, -0.0009442418813705444, -0.0009002089500427246, -0.0008561760187149048, -0.000812143087387085, -0.0007681101560592651, -0.0007240772247314453, -0.0006800442934036255, -0.0006360113620758057, -0.0005919784307479858, -0.000547945499420166, -0.0005039125680923462, -0.00045987963676452637, -0.00041584670543670654, -0.0003718137741088867, -0.0003277808427810669, -0.00028374791145324707, -0.00023971498012542725, -0.00019568204879760742, -0.0001516491174697876, -0.00010761618614196777, -6.358325481414795e-05, -1.9550323486328125e-05, 2.44826078414917e-05, 6.851553916931152e-05, 0.00011254847049713135, 0.00015658140182495117, 0.000200614333152771, 0.0002446472644805908, 0.00028868019580841064, 0.00033271312713623047, 0.0003767460584640503, 0.0004207789897918701, 0.00046481192111968994, 0.0005088448524475098, 0.0005528777837753296, 0.0005969107151031494, 0.0006409436464309692, 0.0006849765777587891, 0.0007290095090866089, 0.0007730424404144287, 0.0008170753717422485, 0.0008611083030700684, 0.0009051412343978882, 0.000949174165725708, 0.0009932070970535278, 0.0010372400283813477, 0.0010812729597091675, 0.0011253058910369873, 0.0011693388223648071, 0.001213371753692627, 0.0012574046850204468, 0.0013014376163482666, 0.0013454705476760864, 0.0013895034790039062]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 11.0, 11.0, 10.0, 20.0, 33.0, 49.0, 44.0, 76.0, 108.0, 146.0, 217.0, 306.0, 352.0, 492.0, 681.0, 911.0, 1266.0, 1732.0, 2524.0, 3726.0, 6371.0, 12084.0, 28814.0, 88302.0, 439730.0, 333502.0, 73171.0, 25142.0, 10758.0, 5804.0, 3628.0, 2362.0, 1669.0, 1200.0, 856.0, 671.0, 457.0, 315.0, 284.0, 207.0, 162.0, 98.0, 58.0, 56.0, 45.0, 37.0, 27.0, 14.0, 5.0, 6.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.171875, -18.589599609375, -18.00732421875, -17.425048828125, -16.8427734375, -16.260498046875, -15.67822265625, -15.095947265625, -14.513671875, -13.931396484375, -13.34912109375, -12.766845703125, -12.1845703125, -11.602294921875, -11.02001953125, -10.437744140625, -9.85546875, -9.273193359375, -8.69091796875, -8.108642578125, -7.5263671875, -6.944091796875, -6.36181640625, -5.779541015625, -5.197265625, -4.614990234375, -4.03271484375, -3.450439453125, -2.8681640625, -2.285888671875, -1.70361328125, -1.121337890625, -0.5390625, 0.043212890625, 0.62548828125, 1.207763671875, 1.7900390625, 2.372314453125, 2.95458984375, 3.536865234375, 4.119140625, 4.701416015625, 5.28369140625, 5.865966796875, 6.4482421875, 7.030517578125, 7.61279296875, 8.195068359375, 8.77734375, 9.359619140625, 9.94189453125, 10.524169921875, 11.1064453125, 11.688720703125, 12.27099609375, 12.853271484375, 13.435546875, 14.017822265625, 14.60009765625, 15.182373046875, 15.7646484375, 16.346923828125, 16.92919921875, 17.511474609375, 18.09375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 3.0, 5.0, 7.0, 6.0, 12.0, 16.0, 18.0, 28.0, 24.0, 32.0, 61.0, 59.0, 70.0, 64.0, 81.0, 69.0, 77.0, 64.0, 57.0, 44.0, 43.0, 32.0, 42.0, 20.0, 9.0, 15.0, 8.0, 6.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.880859375, -2.770904541015625, -2.66094970703125, -2.550994873046875, -2.4410400390625, -2.331085205078125, -2.22113037109375, -2.111175537109375, -2.001220703125, -1.891265869140625, -1.78131103515625, -1.671356201171875, -1.5614013671875, -1.451446533203125, -1.34149169921875, -1.231536865234375, -1.12158203125, -1.011627197265625, -0.90167236328125, -0.791717529296875, -0.6817626953125, -0.571807861328125, -0.46185302734375, -0.351898193359375, -0.241943359375, -0.131988525390625, -0.02203369140625, 0.087921142578125, 0.1978759765625, 0.307830810546875, 0.41778564453125, 0.527740478515625, 0.6376953125, 0.747650146484375, 0.85760498046875, 0.967559814453125, 1.0775146484375, 1.187469482421875, 1.29742431640625, 1.407379150390625, 1.517333984375, 1.627288818359375, 1.73724365234375, 1.847198486328125, 1.9571533203125, 2.067108154296875, 2.17706298828125, 2.287017822265625, 2.39697265625, 2.506927490234375, 2.61688232421875, 2.726837158203125, 2.8367919921875, 2.946746826171875, 3.05670166015625, 3.166656494140625, 3.276611328125, 3.386566162109375, 3.49652099609375, 3.606475830078125, 3.7164306640625, 3.826385498046875, 3.93634033203125, 4.046295166015625, 4.15625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 11.0, 10.0, 13.0, 17.0, 13.0, 31.0, 45.0, 43.0, 69.0, 103.0, 116.0, 124.0, 102.0, 72.0, 56.0, 34.0, 42.0, 23.0, 22.0, 9.0, 13.0, 9.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.05120849609375, -131.8037872314453, -127.55636596679688, -123.30895233154297, -119.06153106689453, -114.8141098022461, -110.56669616699219, -106.31927490234375, -102.07185363769531, -97.82443237304688, -93.57701110839844, -89.32959747314453, -85.0821762084961, -80.83475494384766, -76.58734130859375, -72.33992004394531, -68.09249877929688, -63.84507751464844, -59.597660064697266, -55.350242614746094, -51.102821350097656, -46.85540008544922, -42.60798263549805, -38.360565185546875, -34.11314392089844, -29.865724563598633, -25.618305206298828, -21.370885848999023, -17.12346649169922, -12.876047134399414, -8.62862777709961, -4.381208419799805, -0.1337738037109375, 4.113645553588867, 8.361064910888672, 12.608484268188477, 16.85590362548828, 21.103322982788086, 25.35074234008789, 29.598161697387695, 33.8455810546875, 38.09300231933594, 42.34041976928711, 46.58783721923828, 50.83525848388672, 55.082679748535156, 59.33009719848633, 63.5775146484375, 67.82493591308594, 72.07235717773438, 76.31977844238281, 80.56719207763672, 84.81461334228516, 89.0620346069336, 93.3094482421875, 97.55686950683594, 101.80429077148438, 106.05171203613281, 110.29913330078125, 114.54654693603516, 118.7939682006836, 123.04138946533203, 127.28880310058594, 131.53622436523438, 135.7836456298828]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 7.0, 7.0, 10.0, 10.0, 10.0, 14.0, 15.0, 18.0, 21.0, 34.0, 28.0, 30.0, 25.0, 35.0, 50.0, 41.0, 44.0, 41.0, 57.0, 45.0, 47.0, 43.0, 39.0, 48.0, 24.0, 25.0, 35.0, 29.0, 26.0, 18.0, 20.0, 15.0, 16.0, 11.0, 10.0, 11.0, 10.0, 7.0, 8.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-72.27301788330078, -69.8780288696289, -67.48304748535156, -65.08805847167969, -62.693077087402344, -60.298091888427734, -57.903106689453125, -55.50811767578125, -53.113136291503906, -50.7181510925293, -48.32316589355469, -45.92818069458008, -43.53319549560547, -41.13821029663086, -38.74322509765625, -36.348236083984375, -33.953250885009766, -31.558265686035156, -29.163280487060547, -26.768295288085938, -24.373310089111328, -21.97832489013672, -19.583337783813477, -17.188352584838867, -14.793367385864258, -12.398382186889648, -10.003396987915039, -7.608410835266113, -5.213425636291504, -2.8184404373168945, -0.42345428466796875, 1.9715309143066406, 4.36651611328125, 6.761501312255859, 9.156486511230469, 11.551472663879395, 13.946457862854004, 16.341442108154297, 18.73642921447754, 21.13141441345215, 23.526399612426758, 25.921384811401367, 28.316370010375977, 30.71135711669922, 33.10634231567383, 35.50132751464844, 37.89631271362305, 40.291297912597656, 42.686283111572266, 45.081268310546875, 47.476253509521484, 49.871238708496094, 52.2662239074707, 54.66120910644531, 57.05619812011719, 59.45117950439453, 61.846168518066406, 64.24115753173828, 66.63613891601562, 69.0311279296875, 71.42610931396484, 73.82109832763672, 76.21607971191406, 78.61106872558594, 81.00605010986328]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 0.0, 7.0, 9.0, 9.0, 23.0, 35.0, 40.0, 64.0, 83.0, 136.0, 194.0, 277.0, 430.0, 640.0, 981.0, 1567.0, 2528.0, 3755.0, 6369.0, 11011.0, 19240.0, 36117.0, 71115.0, 146939.0, 287531.0, 228464.0, 110071.0, 54486.0, 27885.0, 15306.0, 8896.0, 5282.0, 3225.0, 1959.0, 1356.0, 830.0, 549.0, 357.0, 283.0, 166.0, 97.0, 80.0, 57.0, 39.0, 17.0, 18.0, 6.0, 6.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-132.625, -128.455078125, -124.28515625, -120.115234375, -115.9453125, -111.775390625, -107.60546875, -103.435546875, -99.265625, -95.095703125, -90.92578125, -86.755859375, -82.5859375, -78.416015625, -74.24609375, -70.076171875, -65.90625, -61.736328125, -57.56640625, -53.396484375, -49.2265625, -45.056640625, -40.88671875, -36.716796875, -32.546875, -28.376953125, -24.20703125, -20.037109375, -15.8671875, -11.697265625, -7.52734375, -3.357421875, 0.8125, 4.982421875, 9.15234375, 13.322265625, 17.4921875, 21.662109375, 25.83203125, 30.001953125, 34.171875, 38.341796875, 42.51171875, 46.681640625, 50.8515625, 55.021484375, 59.19140625, 63.361328125, 67.53125, 71.701171875, 75.87109375, 80.041015625, 84.2109375, 88.380859375, 92.55078125, 96.720703125, 100.890625, 105.060546875, 109.23046875, 113.400390625, 117.5703125, 121.740234375, 125.91015625, 130.080078125, 134.25]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 8.0, 11.0, 9.0, 11.0, 9.0, 22.0, 18.0, 28.0, 20.0, 33.0, 29.0, 41.0, 49.0, 44.0, 50.0, 51.0, 56.0, 51.0, 55.0, 50.0, 38.0, 44.0, 30.0, 29.0, 34.0, 26.0, 18.0, 18.0, 15.0, 17.0, 17.0, 8.0, 12.0, 9.0, 7.0, 9.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-76.0, -73.4814453125, -70.962890625, -68.4443359375, -65.92578125, -63.4072265625, -60.888671875, -58.3701171875, -55.8515625, -53.3330078125, -50.814453125, -48.2958984375, -45.77734375, -43.2587890625, -40.740234375, -38.2216796875, -35.703125, -33.1845703125, -30.666015625, -28.1474609375, -25.62890625, -23.1103515625, -20.591796875, -18.0732421875, -15.5546875, -13.0361328125, -10.517578125, -7.9990234375, -5.48046875, -2.9619140625, -0.443359375, 2.0751953125, 4.59375, 7.1123046875, 9.630859375, 12.1494140625, 14.66796875, 17.1865234375, 19.705078125, 22.2236328125, 24.7421875, 27.2607421875, 29.779296875, 32.2978515625, 34.81640625, 37.3349609375, 39.853515625, 42.3720703125, 44.890625, 47.4091796875, 49.927734375, 52.4462890625, 54.96484375, 57.4833984375, 60.001953125, 62.5205078125, 65.0390625, 67.5576171875, 70.076171875, 72.5947265625, 75.11328125, 77.6318359375, 80.150390625, 82.6689453125, 85.1875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 9.0, 6.0, 3.0, 8.0, 14.0, 17.0, 27.0, 40.0, 58.0, 91.0, 149.0, 217.0, 354.0, 521.0, 878.0, 1416.0, 2378.0, 3933.0, 6984.0, 12526.0, 22547.0, 43374.0, 86977.0, 176099.0, 293109.0, 195071.0, 96162.0, 48461.0, 25005.0, 13551.0, 7573.0, 4424.0, 2537.0, 1547.0, 925.0, 533.0, 357.0, 215.0, 148.0, 102.0, 62.0, 47.0, 40.0, 19.0, 18.0, 6.0, 9.0, 2.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-167.125, -161.83203125, -156.5390625, -151.24609375, -145.953125, -140.66015625, -135.3671875, -130.07421875, -124.78125, -119.48828125, -114.1953125, -108.90234375, -103.609375, -98.31640625, -93.0234375, -87.73046875, -82.4375, -77.14453125, -71.8515625, -66.55859375, -61.265625, -55.97265625, -50.6796875, -45.38671875, -40.09375, -34.80078125, -29.5078125, -24.21484375, -18.921875, -13.62890625, -8.3359375, -3.04296875, 2.25, 7.54296875, 12.8359375, 18.12890625, 23.421875, 28.71484375, 34.0078125, 39.30078125, 44.59375, 49.88671875, 55.1796875, 60.47265625, 65.765625, 71.05859375, 76.3515625, 81.64453125, 86.9375, 92.23046875, 97.5234375, 102.81640625, 108.109375, 113.40234375, 118.6953125, 123.98828125, 129.28125, 134.57421875, 139.8671875, 145.16015625, 150.453125, 155.74609375, 161.0390625, 166.33203125, 171.625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 11.0, 11.0, 13.0, 16.0, 11.0, 17.0, 26.0, 28.0, 34.0, 29.0, 30.0, 34.0, 42.0, 50.0, 39.0, 53.0, 55.0, 47.0, 45.0, 46.0, 37.0, 31.0, 44.0, 40.0, 29.0, 17.0, 13.0, 20.0, 20.0, 16.0, 15.0, 14.0, 16.0, 4.0, 14.0, 6.0, 8.0, 4.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-51.0, -49.294921875, -47.58984375, -45.884765625, -44.1796875, -42.474609375, -40.76953125, -39.064453125, -37.359375, -35.654296875, -33.94921875, -32.244140625, -30.5390625, -28.833984375, -27.12890625, -25.423828125, -23.71875, -22.013671875, -20.30859375, -18.603515625, -16.8984375, -15.193359375, -13.48828125, -11.783203125, -10.078125, -8.373046875, -6.66796875, -4.962890625, -3.2578125, -1.552734375, 0.15234375, 1.857421875, 3.5625, 5.267578125, 6.97265625, 8.677734375, 10.3828125, 12.087890625, 13.79296875, 15.498046875, 17.203125, 18.908203125, 20.61328125, 22.318359375, 24.0234375, 25.728515625, 27.43359375, 29.138671875, 30.84375, 32.548828125, 34.25390625, 35.958984375, 37.6640625, 39.369140625, 41.07421875, 42.779296875, 44.484375, 46.189453125, 47.89453125, 49.599609375, 51.3046875, 53.009765625, 54.71484375, 56.419921875, 58.125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 4.0, 5.0, 7.0, 7.0, 17.0, 19.0, 20.0, 45.0, 53.0, 57.0, 100.0, 137.0, 202.0, 312.0, 404.0, 590.0, 820.0, 1241.0, 2002.0, 3255.0, 5975.0, 11291.0, 23167.0, 55385.0, 187198.0, 545706.0, 126151.0, 42782.0, 19098.0, 9268.0, 4970.0, 2920.0, 1735.0, 1072.0, 742.0, 506.0, 376.0, 240.0, 214.0, 133.0, 109.0, 62.0, 39.0, 46.0, 19.0, 19.0, 10.0, 11.0, 10.0, 3.0, 1.0, 3.0, 3.0, 1.0], "bins": [-69.3125, -67.3525390625, -65.392578125, -63.4326171875, -61.47265625, -59.5126953125, -57.552734375, -55.5927734375, -53.6328125, -51.6728515625, -49.712890625, -47.7529296875, -45.79296875, -43.8330078125, -41.873046875, -39.9130859375, -37.953125, -35.9931640625, -34.033203125, -32.0732421875, -30.11328125, -28.1533203125, -26.193359375, -24.2333984375, -22.2734375, -20.3134765625, -18.353515625, -16.3935546875, -14.43359375, -12.4736328125, -10.513671875, -8.5537109375, -6.59375, -4.6337890625, -2.673828125, -0.7138671875, 1.24609375, 3.2060546875, 5.166015625, 7.1259765625, 9.0859375, 11.0458984375, 13.005859375, 14.9658203125, 16.92578125, 18.8857421875, 20.845703125, 22.8056640625, 24.765625, 26.7255859375, 28.685546875, 30.6455078125, 32.60546875, 34.5654296875, 36.525390625, 38.4853515625, 40.4453125, 42.4052734375, 44.365234375, 46.3251953125, 48.28515625, 50.2451171875, 52.205078125, 54.1650390625, 56.125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 4.0, 9.0, 15.0, 11.0, 15.0, 29.0, 45.0, 84.0, 195.0, 240.0, 131.0, 59.0, 55.0, 26.0, 21.0, 13.0, 10.0, 9.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00860595703125, -0.008380889892578125, -0.00815582275390625, -0.007930755615234375, -0.0077056884765625, -0.007480621337890625, -0.00725555419921875, -0.007030487060546875, -0.006805419921875, -0.006580352783203125, -0.00635528564453125, -0.006130218505859375, -0.0059051513671875, -0.005680084228515625, -0.00545501708984375, -0.005229949951171875, -0.0050048828125, -0.004779815673828125, -0.00455474853515625, -0.004329681396484375, -0.0041046142578125, -0.003879547119140625, -0.00365447998046875, -0.003429412841796875, -0.003204345703125, -0.002979278564453125, -0.00275421142578125, -0.002529144287109375, -0.0023040771484375, -0.002079010009765625, -0.00185394287109375, -0.001628875732421875, -0.00140380859375, -0.001178741455078125, -0.00095367431640625, -0.000728607177734375, -0.0005035400390625, -0.000278472900390625, -5.340576171875e-05, 0.000171661376953125, 0.000396728515625, 0.000621795654296875, 0.00084686279296875, 0.001071929931640625, 0.0012969970703125, 0.001522064208984375, 0.00174713134765625, 0.001972198486328125, 0.002197265625, 0.002422332763671875, 0.00264739990234375, 0.002872467041015625, 0.0030975341796875, 0.003322601318359375, 0.00354766845703125, 0.003772735595703125, 0.003997802734375, 0.004222869873046875, 0.00444793701171875, 0.004673004150390625, 0.0048980712890625, 0.005123138427734375, 0.00534820556640625, 0.005573272705078125, 0.00579833984375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 0.0, 4.0, 2.0, 1.0, 4.0, 10.0, 3.0, 16.0, 10.0, 12.0, 27.0, 23.0, 40.0, 56.0, 50.0, 83.0, 129.0, 176.0, 254.0, 419.0, 660.0, 1048.0, 1755.0, 3284.0, 6307.0, 13183.0, 36162.0, 165814.0, 655669.0, 111946.0, 27938.0, 10890.0, 5448.0, 2752.0, 1637.0, 918.0, 583.0, 396.0, 260.0, 158.0, 112.0, 71.0, 63.0, 47.0, 44.0, 20.0, 19.0, 19.0, 14.0, 8.0, 5.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-79.625, -77.0048828125, -74.384765625, -71.7646484375, -69.14453125, -66.5244140625, -63.904296875, -61.2841796875, -58.6640625, -56.0439453125, -53.423828125, -50.8037109375, -48.18359375, -45.5634765625, -42.943359375, -40.3232421875, -37.703125, -35.0830078125, -32.462890625, -29.8427734375, -27.22265625, -24.6025390625, -21.982421875, -19.3623046875, -16.7421875, -14.1220703125, -11.501953125, -8.8818359375, -6.26171875, -3.6416015625, -1.021484375, 1.5986328125, 4.21875, 6.8388671875, 9.458984375, 12.0791015625, 14.69921875, 17.3193359375, 19.939453125, 22.5595703125, 25.1796875, 27.7998046875, 30.419921875, 33.0400390625, 35.66015625, 38.2802734375, 40.900390625, 43.5205078125, 46.140625, 48.7607421875, 51.380859375, 54.0009765625, 56.62109375, 59.2412109375, 61.861328125, 64.4814453125, 67.1015625, 69.7216796875, 72.341796875, 74.9619140625, 77.58203125, 80.2021484375, 82.822265625, 85.4423828125, 88.0625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 7.0, 5.0, 14.0, 8.0, 13.0, 20.0, 33.0, 48.0, 59.0, 104.0, 169.0, 164.0, 126.0, 67.0, 49.0, 24.0, 17.0, 16.0, 13.0, 7.0, 13.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-27.734375, -27.02783203125, -26.3212890625, -25.61474609375, -24.908203125, -24.20166015625, -23.4951171875, -22.78857421875, -22.08203125, -21.37548828125, -20.6689453125, -19.96240234375, -19.255859375, -18.54931640625, -17.8427734375, -17.13623046875, -16.4296875, -15.72314453125, -15.0166015625, -14.31005859375, -13.603515625, -12.89697265625, -12.1904296875, -11.48388671875, -10.77734375, -10.07080078125, -9.3642578125, -8.65771484375, -7.951171875, -7.24462890625, -6.5380859375, -5.83154296875, -5.125, -4.41845703125, -3.7119140625, -3.00537109375, -2.298828125, -1.59228515625, -0.8857421875, -0.17919921875, 0.52734375, 1.23388671875, 1.9404296875, 2.64697265625, 3.353515625, 4.06005859375, 4.7666015625, 5.47314453125, 6.1796875, 6.88623046875, 7.5927734375, 8.29931640625, 9.005859375, 9.71240234375, 10.4189453125, 11.12548828125, 11.83203125, 12.53857421875, 13.2451171875, 13.95166015625, 14.658203125, 15.36474609375, 16.0712890625, 16.77783203125, 17.484375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 9.0, 4.0, 4.0, 2.0, 16.0, 13.0, 18.0, 21.0, 33.0, 44.0, 58.0, 86.0, 88.0, 124.0, 107.0, 96.0, 73.0, 51.0, 55.0, 30.0, 17.0, 16.0, 9.0, 12.0, 3.0, 11.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.9215850830078, -139.4133758544922, -134.90516662597656, -130.39697265625, -125.88876342773438, -121.38055419921875, -116.87234497070312, -112.36414337158203, -107.85594177246094, -103.34773254394531, -98.83953094482422, -94.3313217163086, -89.8231201171875, -85.31491088867188, -80.80670166015625, -76.29850006103516, -71.79029083251953, -67.2820816040039, -62.77388000488281, -58.26567077636719, -53.757469177246094, -49.24925994873047, -44.74105453491211, -40.23284912109375, -35.72464370727539, -31.21643829345703, -26.708232879638672, -22.20002555847168, -17.69182014465332, -13.183614730834961, -8.675407409667969, -4.167201995849609, 0.34100341796875, 4.849209308624268, 9.357415199279785, 13.865621566772461, 18.37382698059082, 22.88203239440918, 27.390239715576172, 31.89844512939453, 36.40665054321289, 40.91485595703125, 45.42306137084961, 49.93126678466797, 54.439476013183594, 58.94767761230469, 63.45588684082031, 67.96409606933594, 72.47229766845703, 76.98050689697266, 81.48870849609375, 85.99691772460938, 90.50511932373047, 95.0133285522461, 99.52153015136719, 104.02973937988281, 108.53794860839844, 113.04615783691406, 117.55435943603516, 122.06256866455078, 126.57077026367188, 131.0789794921875, 135.58718872070312, 140.09539794921875, 144.6035919189453]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 7.0, 4.0, 7.0, 6.0, 8.0, 19.0, 16.0, 12.0, 18.0, 13.0, 18.0, 39.0, 35.0, 39.0, 37.0, 58.0, 38.0, 45.0, 41.0, 45.0, 37.0, 52.0, 42.0, 39.0, 41.0, 39.0, 35.0, 31.0, 32.0, 24.0, 21.0, 18.0, 18.0, 13.0, 13.0, 9.0, 9.0, 9.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-82.38619995117188, -79.71418762207031, -77.04216766357422, -74.37014770507812, -71.69813537597656, -69.026123046875, -66.3541030883789, -63.68208694458008, -61.01007080078125, -58.33805465698242, -55.666038513183594, -52.994022369384766, -50.32200622558594, -47.64999008178711, -44.97797393798828, -42.30595779418945, -39.633941650390625, -36.9619255065918, -34.28990936279297, -31.61789321899414, -28.945877075195312, -26.273860931396484, -23.601844787597656, -20.929828643798828, -18.2578125, -15.585796356201172, -12.913780212402344, -10.241764068603516, -7.5697479248046875, -4.897731781005859, -2.2257156372070312, 0.4463005065917969, 3.1183090209960938, 5.790325164794922, 8.46234130859375, 11.134357452392578, 13.806373596191406, 16.478389739990234, 19.150405883789062, 21.82242202758789, 24.49443817138672, 27.166454315185547, 29.838470458984375, 32.5104866027832, 35.18250274658203, 37.85451889038086, 40.52653503417969, 43.198551177978516, 45.870567321777344, 48.54258346557617, 51.214599609375, 53.88661575317383, 56.558631896972656, 59.230648040771484, 61.90266418457031, 64.57467651367188, 67.24669647216797, 69.91871643066406, 72.59072875976562, 75.26274108886719, 77.93476104736328, 80.60678100585938, 83.27879333496094, 85.9508056640625, 88.6228256225586]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 8.0, 13.0, 23.0, 24.0, 36.0, 59.0, 76.0, 117.0, 171.0, 235.0, 328.0, 456.0, 715.0, 1101.0, 1630.0, 2577.0, 4263.0, 7237.0, 14243.0, 32081.0, 103856.0, 642103.0, 2644515.0, 576792.0, 96305.0, 31504.0, 14129.0, 7367.0, 4394.0, 2699.0, 1740.0, 1144.0, 770.0, 510.0, 368.0, 216.0, 147.0, 109.0, 65.0, 45.0, 31.0, 25.0, 12.0, 14.0, 8.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-181.0, -175.59375, -170.1875, -164.78125, -159.375, -153.96875, -148.5625, -143.15625, -137.75, -132.34375, -126.9375, -121.53125, -116.125, -110.71875, -105.3125, -99.90625, -94.5, -89.09375, -83.6875, -78.28125, -72.875, -67.46875, -62.0625, -56.65625, -51.25, -45.84375, -40.4375, -35.03125, -29.625, -24.21875, -18.8125, -13.40625, -8.0, -2.59375, 2.8125, 8.21875, 13.625, 19.03125, 24.4375, 29.84375, 35.25, 40.65625, 46.0625, 51.46875, 56.875, 62.28125, 67.6875, 73.09375, 78.5, 83.90625, 89.3125, 94.71875, 100.125, 105.53125, 110.9375, 116.34375, 121.75, 127.15625, 132.5625, 137.96875, 143.375, 148.78125, 154.1875, 159.59375, 165.0]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 3.0, 6.0, 14.0, 10.0, 14.0, 13.0, 13.0, 22.0, 19.0, 37.0, 37.0, 38.0, 46.0, 54.0, 47.0, 49.0, 43.0, 59.0, 50.0, 47.0, 38.0, 47.0, 44.0, 38.0, 38.0, 28.0, 17.0, 22.0, 14.0, 22.0, 11.0, 15.0, 10.0, 10.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-81.4375, -78.85546875, -76.2734375, -73.69140625, -71.109375, -68.52734375, -65.9453125, -63.36328125, -60.78125, -58.19921875, -55.6171875, -53.03515625, -50.453125, -47.87109375, -45.2890625, -42.70703125, -40.125, -37.54296875, -34.9609375, -32.37890625, -29.796875, -27.21484375, -24.6328125, -22.05078125, -19.46875, -16.88671875, -14.3046875, -11.72265625, -9.140625, -6.55859375, -3.9765625, -1.39453125, 1.1875, 3.76953125, 6.3515625, 8.93359375, 11.515625, 14.09765625, 16.6796875, 19.26171875, 21.84375, 24.42578125, 27.0078125, 29.58984375, 32.171875, 34.75390625, 37.3359375, 39.91796875, 42.5, 45.08203125, 47.6640625, 50.24609375, 52.828125, 55.41015625, 57.9921875, 60.57421875, 63.15625, 65.73828125, 68.3203125, 70.90234375, 73.484375, 76.06640625, 78.6484375, 81.23046875, 83.8125]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 9.0, 8.0, 15.0, 13.0, 19.0, 47.0, 49.0, 71.0, 82.0, 136.0, 206.0, 279.0, 389.0, 604.0, 880.0, 1234.0, 1931.0, 2954.0, 4645.0, 7504.0, 13340.0, 25530.0, 57206.0, 167293.0, 958999.0, 2459002.0, 323767.0, 88667.0, 35786.0, 17611.0, 9619.0, 5692.0, 3546.0, 2339.0, 1509.0, 1038.0, 655.0, 500.0, 333.0, 237.0, 166.0, 114.0, 72.0, 63.0, 42.0, 26.0, 17.0, 14.0, 14.0, 6.0, 9.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-163.875, -158.453125, -153.03125, -147.609375, -142.1875, -136.765625, -131.34375, -125.921875, -120.5, -115.078125, -109.65625, -104.234375, -98.8125, -93.390625, -87.96875, -82.546875, -77.125, -71.703125, -66.28125, -60.859375, -55.4375, -50.015625, -44.59375, -39.171875, -33.75, -28.328125, -22.90625, -17.484375, -12.0625, -6.640625, -1.21875, 4.203125, 9.625, 15.046875, 20.46875, 25.890625, 31.3125, 36.734375, 42.15625, 47.578125, 53.0, 58.421875, 63.84375, 69.265625, 74.6875, 80.109375, 85.53125, 90.953125, 96.375, 101.796875, 107.21875, 112.640625, 118.0625, 123.484375, 128.90625, 134.328125, 139.75, 145.171875, 150.59375, 156.015625, 161.4375, 166.859375, 172.28125, 177.703125, 183.125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 7.0, 8.0, 9.0, 7.0, 23.0, 19.0, 25.0, 38.0, 54.0, 77.0, 113.0, 194.0, 265.0, 528.0, 889.0, 689.0, 407.0, 236.0, 145.0, 97.0, 54.0, 40.0, 25.0, 23.0, 18.0, 12.0, 14.0, 7.0, 2.0, 13.0, 4.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.5, -45.8486328125, -44.197265625, -42.5458984375, -40.89453125, -39.2431640625, -37.591796875, -35.9404296875, -34.2890625, -32.6376953125, -30.986328125, -29.3349609375, -27.68359375, -26.0322265625, -24.380859375, -22.7294921875, -21.078125, -19.4267578125, -17.775390625, -16.1240234375, -14.47265625, -12.8212890625, -11.169921875, -9.5185546875, -7.8671875, -6.2158203125, -4.564453125, -2.9130859375, -1.26171875, 0.3896484375, 2.041015625, 3.6923828125, 5.34375, 6.9951171875, 8.646484375, 10.2978515625, 11.94921875, 13.6005859375, 15.251953125, 16.9033203125, 18.5546875, 20.2060546875, 21.857421875, 23.5087890625, 25.16015625, 26.8115234375, 28.462890625, 30.1142578125, 31.765625, 33.4169921875, 35.068359375, 36.7197265625, 38.37109375, 40.0224609375, 41.673828125, 43.3251953125, 44.9765625, 46.6279296875, 48.279296875, 49.9306640625, 51.58203125, 53.2333984375, 54.884765625, 56.5361328125, 58.1875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 6.0, 4.0, 3.0, 5.0, 6.0, 8.0, 11.0, 14.0, 15.0, 18.0, 26.0, 31.0, 34.0, 54.0, 46.0, 76.0, 105.0, 98.0, 117.0, 69.0, 54.0, 49.0, 38.0, 30.0, 23.0, 20.0, 8.0, 3.0, 8.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-119.2146987915039, -115.4179916381836, -111.62127685546875, -107.82456970214844, -104.02786254882812, -100.23114776611328, -96.43444061279297, -92.63772583007812, -88.84101867675781, -85.0443115234375, -81.24759674072266, -77.45088958740234, -73.6541748046875, -69.85746765136719, -66.06076049804688, -62.2640495300293, -58.46733856201172, -54.67062759399414, -50.87391662597656, -47.07720947265625, -43.28049850463867, -39.483787536621094, -35.68708038330078, -31.890369415283203, -28.093658447265625, -24.296947479248047, -20.5002384185791, -16.703529357910156, -12.906818389892578, -9.110107421875, -5.313398361206055, -1.5166893005371094, 2.2800140380859375, 6.076724052429199, 9.873434066772461, 13.670144081115723, 17.466854095458984, 21.263565063476562, 25.060274124145508, 28.856983184814453, 32.65369415283203, 36.45040512084961, 40.24711608886719, 44.0438232421875, 47.84053421020508, 51.637245178222656, 55.43395233154297, 59.23066329956055, 63.027374267578125, 66.82408142089844, 70.62079620361328, 74.4175033569336, 78.21421813964844, 82.01092529296875, 85.80763244628906, 89.60433959960938, 93.40105438232422, 97.19776153564453, 100.99447631835938, 104.79118347167969, 108.587890625, 112.38460540771484, 116.18131256103516, 119.97802734375, 123.77473449707031]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 10.0, 11.0, 7.0, 9.0, 7.0, 16.0, 24.0, 21.0, 30.0, 34.0, 25.0, 25.0, 28.0, 35.0, 47.0, 44.0, 39.0, 38.0, 40.0, 46.0, 50.0, 35.0, 43.0, 34.0, 33.0, 33.0, 28.0, 39.0, 24.0, 21.0, 20.0, 20.0, 21.0, 12.0, 7.0, 4.0, 5.0, 4.0, 8.0, 5.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.59225463867188, -78.9365234375, -76.2807846069336, -73.62505340576172, -70.96931457519531, -68.31358337402344, -65.65784454345703, -63.002113342285156, -60.346378326416016, -57.690643310546875, -55.034908294677734, -52.379173278808594, -49.72344207763672, -47.06770324707031, -44.41197204589844, -41.7562370300293, -39.100502014160156, -36.444766998291016, -33.789031982421875, -31.133298873901367, -28.477563858032227, -25.821828842163086, -23.166095733642578, -20.510360717773438, -17.854625701904297, -15.198890686035156, -12.543156623840332, -9.887422561645508, -7.231687545776367, -4.575952529907227, -1.9202184677124023, 0.7355155944824219, 3.3912429809570312, 6.046977519989014, 8.702712059020996, 11.35844612121582, 14.014181137084961, 16.6699161529541, 19.32564926147461, 21.98138427734375, 24.63711929321289, 27.29285430908203, 29.948589324951172, 32.60432434082031, 35.26005554199219, 37.915794372558594, 40.57152557373047, 43.22726058959961, 45.88299560546875, 48.53873062133789, 51.19446563720703, 53.85020065307617, 56.50593566894531, 59.16166687011719, 61.81740188598633, 64.47313690185547, 67.12887573242188, 69.78460693359375, 72.44034576416016, 75.09607696533203, 77.75181579589844, 80.40754699707031, 83.06328582763672, 85.7190170288086, 88.37474822998047]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 9.0, 15.0, 20.0, 34.0, 49.0, 74.0, 92.0, 130.0, 206.0, 277.0, 380.0, 596.0, 814.0, 1203.0, 1755.0, 2631.0, 3865.0, 5701.0, 8843.0, 13345.0, 21413.0, 34253.0, 56061.0, 91811.0, 151941.0, 210332.0, 169125.0, 103901.0, 63122.0, 38450.0, 23787.0, 15039.0, 9606.0, 6315.0, 4204.0, 2931.0, 1892.0, 1385.0, 918.0, 636.0, 431.0, 278.0, 216.0, 153.0, 80.0, 78.0, 51.0, 36.0, 26.0, 19.0, 11.0, 4.0, 7.0, 5.0, 0.0, 1.0, 2.0, 2.0], "bins": [-46.75, -45.271484375, -43.79296875, -42.314453125, -40.8359375, -39.357421875, -37.87890625, -36.400390625, -34.921875, -33.443359375, -31.96484375, -30.486328125, -29.0078125, -27.529296875, -26.05078125, -24.572265625, -23.09375, -21.615234375, -20.13671875, -18.658203125, -17.1796875, -15.701171875, -14.22265625, -12.744140625, -11.265625, -9.787109375, -8.30859375, -6.830078125, -5.3515625, -3.873046875, -2.39453125, -0.916015625, 0.5625, 2.041015625, 3.51953125, 4.998046875, 6.4765625, 7.955078125, 9.43359375, 10.912109375, 12.390625, 13.869140625, 15.34765625, 16.826171875, 18.3046875, 19.783203125, 21.26171875, 22.740234375, 24.21875, 25.697265625, 27.17578125, 28.654296875, 30.1328125, 31.611328125, 33.08984375, 34.568359375, 36.046875, 37.525390625, 39.00390625, 40.482421875, 41.9609375, 43.439453125, 44.91796875, 46.396484375, 47.875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 7.0, 10.0, 9.0, 4.0, 6.0, 10.0, 23.0, 16.0, 22.0, 30.0, 31.0, 18.0, 31.0, 37.0, 38.0, 45.0, 51.0, 39.0, 49.0, 52.0, 49.0, 53.0, 43.0, 29.0, 39.0, 42.0, 31.0, 28.0, 32.0, 16.0, 17.0, 23.0, 16.0, 11.0, 8.0, 7.0, 4.0, 3.0, 2.0, 8.0, 3.0, 0.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-76.3125, -73.8701171875, -71.427734375, -68.9853515625, -66.54296875, -64.1005859375, -61.658203125, -59.2158203125, -56.7734375, -54.3310546875, -51.888671875, -49.4462890625, -47.00390625, -44.5615234375, -42.119140625, -39.6767578125, -37.234375, -34.7919921875, -32.349609375, -29.9072265625, -27.46484375, -25.0224609375, -22.580078125, -20.1376953125, -17.6953125, -15.2529296875, -12.810546875, -10.3681640625, -7.92578125, -5.4833984375, -3.041015625, -0.5986328125, 1.84375, 4.2861328125, 6.728515625, 9.1708984375, 11.61328125, 14.0556640625, 16.498046875, 18.9404296875, 21.3828125, 23.8251953125, 26.267578125, 28.7099609375, 31.15234375, 33.5947265625, 36.037109375, 38.4794921875, 40.921875, 43.3642578125, 45.806640625, 48.2490234375, 50.69140625, 53.1337890625, 55.576171875, 58.0185546875, 60.4609375, 62.9033203125, 65.345703125, 67.7880859375, 70.23046875, 72.6728515625, 75.115234375, 77.5576171875, 80.0]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 6.0, 3.0, 10.0, 6.0, 15.0, 23.0, 36.0, 46.0, 76.0, 102.0, 159.0, 237.0, 315.0, 526.0, 838.0, 1217.0, 2032.0, 3343.0, 5691.0, 10545.0, 24046.0, 159398.0, 761680.0, 44644.0, 14880.0, 7445.0, 4291.0, 2548.0, 1576.0, 982.0, 642.0, 400.0, 265.0, 183.0, 116.0, 73.0, 65.0, 31.0, 28.0, 11.0, 10.0, 7.0, 8.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.3125, -110.2646484375, -106.216796875, -102.1689453125, -98.12109375, -94.0732421875, -90.025390625, -85.9775390625, -81.9296875, -77.8818359375, -73.833984375, -69.7861328125, -65.73828125, -61.6904296875, -57.642578125, -53.5947265625, -49.546875, -45.4990234375, -41.451171875, -37.4033203125, -33.35546875, -29.3076171875, -25.259765625, -21.2119140625, -17.1640625, -13.1162109375, -9.068359375, -5.0205078125, -0.97265625, 3.0751953125, 7.123046875, 11.1708984375, 15.21875, 19.2666015625, 23.314453125, 27.3623046875, 31.41015625, 35.4580078125, 39.505859375, 43.5537109375, 47.6015625, 51.6494140625, 55.697265625, 59.7451171875, 63.79296875, 67.8408203125, 71.888671875, 75.9365234375, 79.984375, 84.0322265625, 88.080078125, 92.1279296875, 96.17578125, 100.2236328125, 104.271484375, 108.3193359375, 112.3671875, 116.4150390625, 120.462890625, 124.5107421875, 128.55859375, 132.6064453125, 136.654296875, 140.7021484375, 144.75]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 9.0, 5.0, 5.0, 9.0, 25.0, 14.0, 18.0, 19.0, 25.0, 22.0, 37.0, 25.0, 40.0, 43.0, 46.0, 46.0, 46.0, 46.0, 58.0, 42.0, 54.0, 57.0, 49.0, 35.0, 34.0, 31.0, 23.0, 20.0, 17.0, 16.0, 19.0, 17.0, 8.0, 11.0, 8.0, 6.0, 4.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-96.375, -93.3330078125, -90.291015625, -87.2490234375, -84.20703125, -81.1650390625, -78.123046875, -75.0810546875, -72.0390625, -68.9970703125, -65.955078125, -62.9130859375, -59.87109375, -56.8291015625, -53.787109375, -50.7451171875, -47.703125, -44.6611328125, -41.619140625, -38.5771484375, -35.53515625, -32.4931640625, -29.451171875, -26.4091796875, -23.3671875, -20.3251953125, -17.283203125, -14.2412109375, -11.19921875, -8.1572265625, -5.115234375, -2.0732421875, 0.96875, 4.0107421875, 7.052734375, 10.0947265625, 13.13671875, 16.1787109375, 19.220703125, 22.2626953125, 25.3046875, 28.3466796875, 31.388671875, 34.4306640625, 37.47265625, 40.5146484375, 43.556640625, 46.5986328125, 49.640625, 52.6826171875, 55.724609375, 58.7666015625, 61.80859375, 64.8505859375, 67.892578125, 70.9345703125, 73.9765625, 77.0185546875, 80.060546875, 83.1025390625, 86.14453125, 89.1865234375, 92.228515625, 95.2705078125, 98.3125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 8.0, 2.0, 5.0, 5.0, 12.0, 6.0, 15.0, 14.0, 24.0, 26.0, 35.0, 50.0, 75.0, 96.0, 138.0, 205.0, 310.0, 523.0, 1063.0, 3121.0, 23556.0, 985493.0, 27788.0, 3314.0, 1097.0, 566.0, 306.0, 197.0, 148.0, 97.0, 78.0, 47.0, 26.0, 23.0, 27.0, 14.0, 10.0, 11.0, 8.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.84375, -49.3271484375, -47.810546875, -46.2939453125, -44.77734375, -43.2607421875, -41.744140625, -40.2275390625, -38.7109375, -37.1943359375, -35.677734375, -34.1611328125, -32.64453125, -31.1279296875, -29.611328125, -28.0947265625, -26.578125, -25.0615234375, -23.544921875, -22.0283203125, -20.51171875, -18.9951171875, -17.478515625, -15.9619140625, -14.4453125, -12.9287109375, -11.412109375, -9.8955078125, -8.37890625, -6.8623046875, -5.345703125, -3.8291015625, -2.3125, -0.7958984375, 0.720703125, 2.2373046875, 3.75390625, 5.2705078125, 6.787109375, 8.3037109375, 9.8203125, 11.3369140625, 12.853515625, 14.3701171875, 15.88671875, 17.4033203125, 18.919921875, 20.4365234375, 21.953125, 23.4697265625, 24.986328125, 26.5029296875, 28.01953125, 29.5361328125, 31.052734375, 32.5693359375, 34.0859375, 35.6025390625, 37.119140625, 38.6357421875, 40.15234375, 41.6689453125, 43.185546875, 44.7021484375, 46.21875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 2.0, 3.0, 4.0, 9.0, 12.0, 23.0, 41.0, 47.0, 75.0, 124.0, 257.0, 150.0, 74.0, 51.0, 32.0, 23.0, 14.0, 13.0, 13.0, 7.0, 6.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008209228515625, -0.007932066917419434, -0.007654905319213867, -0.007377743721008301, -0.007100582122802734, -0.006823420524597168, -0.0065462589263916016, -0.006269097328186035, -0.005991935729980469, -0.005714774131774902, -0.005437612533569336, -0.0051604509353637695, -0.004883289337158203, -0.004606127738952637, -0.00432896614074707, -0.004051804542541504, -0.0037746429443359375, -0.003497481346130371, -0.0032203197479248047, -0.0029431581497192383, -0.002665996551513672, -0.0023888349533081055, -0.002111673355102539, -0.0018345117568969727, -0.0015573501586914062, -0.0012801885604858398, -0.0010030269622802734, -0.000725865364074707, -0.0004487037658691406, -0.00017154216766357422, 0.00010561943054199219, 0.0003827810287475586, 0.000659942626953125, 0.0009371042251586914, 0.0012142658233642578, 0.0014914274215698242, 0.0017685890197753906, 0.002045750617980957, 0.0023229122161865234, 0.00260007381439209, 0.0028772354125976562, 0.0031543970108032227, 0.003431558609008789, 0.0037087202072143555, 0.003985881805419922, 0.004263043403625488, 0.004540205001831055, 0.004817366600036621, 0.0050945281982421875, 0.005371689796447754, 0.00564885139465332, 0.005926012992858887, 0.006203174591064453, 0.0064803361892700195, 0.006757497787475586, 0.007034659385681152, 0.007311820983886719, 0.007588982582092285, 0.007866144180297852, 0.008143305778503418, 0.008420467376708984, 0.00869762897491455, 0.008974790573120117, 0.009251952171325684, 0.00952911376953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 9.0, 7.0, 11.0, 11.0, 7.0, 14.0, 17.0, 34.0, 34.0, 69.0, 79.0, 106.0, 145.0, 207.0, 330.0, 403.0, 586.0, 855.0, 1199.0, 1746.0, 2423.0, 3593.0, 6543.0, 34229.0, 857977.0, 114131.0, 10087.0, 4229.0, 2767.0, 1996.0, 1345.0, 982.0, 706.0, 461.0, 323.0, 250.0, 170.0, 124.0, 89.0, 60.0, 54.0, 32.0, 33.0, 24.0, 17.0, 14.0, 10.0, 6.0, 6.0, 3.0, 1.0, 3.0, 4.0], "bins": [-41.28125, -40.12451171875, -38.9677734375, -37.81103515625, -36.654296875, -35.49755859375, -34.3408203125, -33.18408203125, -32.02734375, -30.87060546875, -29.7138671875, -28.55712890625, -27.400390625, -26.24365234375, -25.0869140625, -23.93017578125, -22.7734375, -21.61669921875, -20.4599609375, -19.30322265625, -18.146484375, -16.98974609375, -15.8330078125, -14.67626953125, -13.51953125, -12.36279296875, -11.2060546875, -10.04931640625, -8.892578125, -7.73583984375, -6.5791015625, -5.42236328125, -4.265625, -3.10888671875, -1.9521484375, -0.79541015625, 0.361328125, 1.51806640625, 2.6748046875, 3.83154296875, 4.98828125, 6.14501953125, 7.3017578125, 8.45849609375, 9.615234375, 10.77197265625, 11.9287109375, 13.08544921875, 14.2421875, 15.39892578125, 16.5556640625, 17.71240234375, 18.869140625, 20.02587890625, 21.1826171875, 22.33935546875, 23.49609375, 24.65283203125, 25.8095703125, 26.96630859375, 28.123046875, 29.27978515625, 30.4365234375, 31.59326171875, 32.75]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 4.0, 5.0, 18.0, 44.0, 167.0, 367.0, 242.0, 85.0, 29.0, 7.0, 6.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.78125, -11.45166015625, -11.1220703125, -10.79248046875, -10.462890625, -10.13330078125, -9.8037109375, -9.47412109375, -9.14453125, -8.81494140625, -8.4853515625, -8.15576171875, -7.826171875, -7.49658203125, -7.1669921875, -6.83740234375, -6.5078125, -6.17822265625, -5.8486328125, -5.51904296875, -5.189453125, -4.85986328125, -4.5302734375, -4.20068359375, -3.87109375, -3.54150390625, -3.2119140625, -2.88232421875, -2.552734375, -2.22314453125, -1.8935546875, -1.56396484375, -1.234375, -0.90478515625, -0.5751953125, -0.24560546875, 0.083984375, 0.41357421875, 0.7431640625, 1.07275390625, 1.40234375, 1.73193359375, 2.0615234375, 2.39111328125, 2.720703125, 3.05029296875, 3.3798828125, 3.70947265625, 4.0390625, 4.36865234375, 4.6982421875, 5.02783203125, 5.357421875, 5.68701171875, 6.0166015625, 6.34619140625, 6.67578125, 7.00537109375, 7.3349609375, 7.66455078125, 7.994140625, 8.32373046875, 8.6533203125, 8.98291015625, 9.3125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 10.0, 5.0, 7.0, 15.0, 15.0, 20.0, 25.0, 22.0, 49.0, 37.0, 72.0, 83.0, 110.0, 112.0, 93.0, 65.0, 67.0, 37.0, 35.0, 27.0, 19.0, 14.0, 8.0, 11.0, 7.0, 4.0, 7.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-91.28695678710938, -88.04277801513672, -84.79859924316406, -81.5544204711914, -78.31024169921875, -75.06607055664062, -71.82189178466797, -68.57771301269531, -65.33353424072266, -62.08935546875, -58.845176696777344, -55.60100173950195, -52.3568229675293, -49.11264419555664, -45.86846923828125, -42.624290466308594, -39.38011169433594, -36.13593292236328, -32.891754150390625, -29.647579193115234, -26.403400421142578, -23.159221649169922, -19.9150447845459, -16.670867919921875, -13.426689147949219, -10.182511329650879, -6.938333511352539, -3.694155693054199, -0.4499778747558594, 2.794200897216797, 6.03837776184082, 9.282554626464844, 12.526741027832031, 15.770918846130371, 19.01509666442871, 22.259273529052734, 25.50345230102539, 28.747631072998047, 31.99180793762207, 35.235984802246094, 38.48016357421875, 41.724342346191406, 44.96852111816406, 48.21269607543945, 51.45687484741211, 54.701053619384766, 57.945228576660156, 61.18940734863281, 64.43358612060547, 67.67776489257812, 70.92194366455078, 74.16612243652344, 77.41029357910156, 80.65447998046875, 83.89865112304688, 87.14282989501953, 90.38700866699219, 93.63118743896484, 96.8753662109375, 100.11954498291016, 103.36372375488281, 106.60789489746094, 109.8520736694336, 113.09625244140625, 116.3404312133789]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 8.0, 5.0, 5.0, 8.0, 10.0, 13.0, 13.0, 13.0, 24.0, 27.0, 31.0, 29.0, 27.0, 31.0, 37.0, 37.0, 45.0, 49.0, 43.0, 44.0, 36.0, 43.0, 48.0, 30.0, 50.0, 39.0, 32.0, 22.0, 31.0, 30.0, 31.0, 19.0, 22.0, 15.0, 12.0, 6.0, 6.0, 5.0, 4.0, 5.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-72.8456039428711, -70.57373809814453, -68.30186462402344, -66.02999877929688, -63.75812530517578, -61.48625946044922, -59.21438980102539, -56.94252014160156, -54.670650482177734, -52.398780822753906, -50.12691116333008, -47.85504150390625, -45.58317565917969, -43.311302185058594, -41.03943634033203, -38.7675666809082, -36.495697021484375, -34.22382736206055, -31.95195770263672, -29.680089950561523, -27.408220291137695, -25.136350631713867, -22.864482879638672, -20.592613220214844, -18.320743560791016, -16.048873901367188, -13.777005195617676, -11.505136489868164, -9.233266830444336, -6.961397171020508, -4.689528465270996, -2.4176597595214844, -0.1457977294921875, 2.1260714530944824, 4.397940635681152, 6.669809818267822, 8.941679000854492, 11.21354866027832, 13.485417366027832, 15.757286071777344, 18.029155731201172, 20.301025390625, 22.572895050048828, 24.844762802124023, 27.11663246154785, 29.38850212097168, 31.660369873046875, 33.9322395324707, 36.20410919189453, 38.47597885131836, 40.74784851074219, 43.019718170166016, 45.291587829589844, 47.563453674316406, 49.835323333740234, 52.10719299316406, 54.37906265258789, 56.65093231201172, 58.92280197143555, 61.194671630859375, 63.46653747558594, 65.73841094970703, 68.0102767944336, 70.28215026855469, 72.55401611328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 12.0, 17.0, 12.0, 16.0, 45.0, 57.0, 60.0, 74.0, 107.0, 174.0, 220.0, 307.0, 387.0, 561.0, 720.0, 1052.0, 1650.0, 2321.0, 3428.0, 5235.0, 8205.0, 13795.0, 24568.0, 46528.0, 94904.0, 197038.0, 299615.0, 168472.0, 81753.0, 40703.0, 21725.0, 12154.0, 7455.0, 4795.0, 3154.0, 2101.0, 1442.0, 1046.0, 760.0, 520.0, 364.0, 255.0, 218.0, 144.0, 113.0, 81.0, 60.0, 39.0, 26.0, 27.0, 19.0, 5.0, 8.0, 4.0, 6.0, 4.0, 0.0, 2.0], "bins": [-102.5625, -99.396484375, -96.23046875, -93.064453125, -89.8984375, -86.732421875, -83.56640625, -80.400390625, -77.234375, -74.068359375, -70.90234375, -67.736328125, -64.5703125, -61.404296875, -58.23828125, -55.072265625, -51.90625, -48.740234375, -45.57421875, -42.408203125, -39.2421875, -36.076171875, -32.91015625, -29.744140625, -26.578125, -23.412109375, -20.24609375, -17.080078125, -13.9140625, -10.748046875, -7.58203125, -4.416015625, -1.25, 1.916015625, 5.08203125, 8.248046875, 11.4140625, 14.580078125, 17.74609375, 20.912109375, 24.078125, 27.244140625, 30.41015625, 33.576171875, 36.7421875, 39.908203125, 43.07421875, 46.240234375, 49.40625, 52.572265625, 55.73828125, 58.904296875, 62.0703125, 65.236328125, 68.40234375, 71.568359375, 74.734375, 77.900390625, 81.06640625, 84.232421875, 87.3984375, 90.564453125, 93.73046875, 96.896484375, 100.0625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 1.0, 12.0, 9.0, 5.0, 14.0, 11.0, 20.0, 16.0, 25.0, 23.0, 32.0, 35.0, 27.0, 40.0, 47.0, 40.0, 65.0, 46.0, 45.0, 49.0, 40.0, 46.0, 46.0, 45.0, 41.0, 30.0, 20.0, 33.0, 31.0, 15.0, 19.0, 11.0, 12.0, 9.0, 6.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-75.375, -73.0029296875, -70.630859375, -68.2587890625, -65.88671875, -63.5146484375, -61.142578125, -58.7705078125, -56.3984375, -54.0263671875, -51.654296875, -49.2822265625, -46.91015625, -44.5380859375, -42.166015625, -39.7939453125, -37.421875, -35.0498046875, -32.677734375, -30.3056640625, -27.93359375, -25.5615234375, -23.189453125, -20.8173828125, -18.4453125, -16.0732421875, -13.701171875, -11.3291015625, -8.95703125, -6.5849609375, -4.212890625, -1.8408203125, 0.53125, 2.9033203125, 5.275390625, 7.6474609375, 10.01953125, 12.3916015625, 14.763671875, 17.1357421875, 19.5078125, 21.8798828125, 24.251953125, 26.6240234375, 28.99609375, 31.3681640625, 33.740234375, 36.1123046875, 38.484375, 40.8564453125, 43.228515625, 45.6005859375, 47.97265625, 50.3447265625, 52.716796875, 55.0888671875, 57.4609375, 59.8330078125, 62.205078125, 64.5771484375, 66.94921875, 69.3212890625, 71.693359375, 74.0654296875, 76.4375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 7.0, 3.0, 7.0, 16.0, 15.0, 23.0, 34.0, 41.0, 67.0, 101.0, 136.0, 199.0, 271.0, 390.0, 559.0, 877.0, 1241.0, 1888.0, 2949.0, 4544.0, 7184.0, 11756.0, 19451.0, 33787.0, 60047.0, 113745.0, 211251.0, 249728.0, 146605.0, 76940.0, 42174.0, 23823.0, 14193.0, 8636.0, 5484.0, 3411.0, 2258.0, 1544.0, 971.0, 670.0, 484.0, 323.0, 231.0, 154.0, 105.0, 68.0, 48.0, 49.0, 25.0, 25.0, 8.0, 8.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-109.125, -105.626953125, -102.12890625, -98.630859375, -95.1328125, -91.634765625, -88.13671875, -84.638671875, -81.140625, -77.642578125, -74.14453125, -70.646484375, -67.1484375, -63.650390625, -60.15234375, -56.654296875, -53.15625, -49.658203125, -46.16015625, -42.662109375, -39.1640625, -35.666015625, -32.16796875, -28.669921875, -25.171875, -21.673828125, -18.17578125, -14.677734375, -11.1796875, -7.681640625, -4.18359375, -0.685546875, 2.8125, 6.310546875, 9.80859375, 13.306640625, 16.8046875, 20.302734375, 23.80078125, 27.298828125, 30.796875, 34.294921875, 37.79296875, 41.291015625, 44.7890625, 48.287109375, 51.78515625, 55.283203125, 58.78125, 62.279296875, 65.77734375, 69.275390625, 72.7734375, 76.271484375, 79.76953125, 83.267578125, 86.765625, 90.263671875, 93.76171875, 97.259765625, 100.7578125, 104.255859375, 107.75390625, 111.251953125, 114.75]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 13.0, 6.0, 11.0, 11.0, 15.0, 11.0, 22.0, 27.0, 29.0, 29.0, 20.0, 36.0, 32.0, 39.0, 34.0, 51.0, 40.0, 44.0, 52.0, 31.0, 45.0, 49.0, 47.0, 42.0, 31.0, 27.0, 26.0, 23.0, 20.0, 21.0, 18.0, 13.0, 14.0, 7.0, 6.0, 11.0, 8.0, 7.0, 4.0, 6.0, 6.0, 1.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0], "bins": [-47.875, -46.46728515625, -45.0595703125, -43.65185546875, -42.244140625, -40.83642578125, -39.4287109375, -38.02099609375, -36.61328125, -35.20556640625, -33.7978515625, -32.39013671875, -30.982421875, -29.57470703125, -28.1669921875, -26.75927734375, -25.3515625, -23.94384765625, -22.5361328125, -21.12841796875, -19.720703125, -18.31298828125, -16.9052734375, -15.49755859375, -14.08984375, -12.68212890625, -11.2744140625, -9.86669921875, -8.458984375, -7.05126953125, -5.6435546875, -4.23583984375, -2.828125, -1.42041015625, -0.0126953125, 1.39501953125, 2.802734375, 4.21044921875, 5.6181640625, 7.02587890625, 8.43359375, 9.84130859375, 11.2490234375, 12.65673828125, 14.064453125, 15.47216796875, 16.8798828125, 18.28759765625, 19.6953125, 21.10302734375, 22.5107421875, 23.91845703125, 25.326171875, 26.73388671875, 28.1416015625, 29.54931640625, 30.95703125, 32.36474609375, 33.7724609375, 35.18017578125, 36.587890625, 37.99560546875, 39.4033203125, 40.81103515625, 42.21875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 3.0, 9.0, 7.0, 10.0, 9.0, 20.0, 18.0, 40.0, 41.0, 77.0, 79.0, 129.0, 178.0, 243.0, 324.0, 547.0, 855.0, 1118.0, 1674.0, 2496.0, 3813.0, 5671.0, 8954.0, 14596.0, 25014.0, 46461.0, 99405.0, 271165.0, 324018.0, 116227.0, 52997.0, 27832.0, 15975.0, 9834.0, 6291.0, 3961.0, 2738.0, 1715.0, 1267.0, 843.0, 567.0, 391.0, 294.0, 178.0, 132.0, 100.0, 74.0, 51.0, 31.0, 24.0, 11.0, 14.0, 10.0, 9.0, 4.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0], "bins": [-27.28125, -26.40380859375, -25.5263671875, -24.64892578125, -23.771484375, -22.89404296875, -22.0166015625, -21.13916015625, -20.26171875, -19.38427734375, -18.5068359375, -17.62939453125, -16.751953125, -15.87451171875, -14.9970703125, -14.11962890625, -13.2421875, -12.36474609375, -11.4873046875, -10.60986328125, -9.732421875, -8.85498046875, -7.9775390625, -7.10009765625, -6.22265625, -5.34521484375, -4.4677734375, -3.59033203125, -2.712890625, -1.83544921875, -0.9580078125, -0.08056640625, 0.796875, 1.67431640625, 2.5517578125, 3.42919921875, 4.306640625, 5.18408203125, 6.0615234375, 6.93896484375, 7.81640625, 8.69384765625, 9.5712890625, 10.44873046875, 11.326171875, 12.20361328125, 13.0810546875, 13.95849609375, 14.8359375, 15.71337890625, 16.5908203125, 17.46826171875, 18.345703125, 19.22314453125, 20.1005859375, 20.97802734375, 21.85546875, 22.73291015625, 23.6103515625, 24.48779296875, 25.365234375, 26.24267578125, 27.1201171875, 27.99755859375, 28.875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 5.0, 8.0, 8.0, 10.0, 15.0, 24.0, 23.0, 35.0, 38.0, 47.0, 98.0, 123.0, 143.0, 110.0, 82.0, 52.0, 29.0, 25.0, 21.0, 20.0, 21.0, 9.0, 8.0, 4.0, 10.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003299713134765625, -0.0031915903091430664, -0.003083467483520508, -0.0029753446578979492, -0.0028672218322753906, -0.002759099006652832, -0.0026509761810302734, -0.002542853355407715, -0.0024347305297851562, -0.0023266077041625977, -0.002218484878540039, -0.0021103620529174805, -0.002002239227294922, -0.0018941164016723633, -0.0017859935760498047, -0.001677870750427246, -0.0015697479248046875, -0.001461625099182129, -0.0013535022735595703, -0.0012453794479370117, -0.0011372566223144531, -0.0010291337966918945, -0.0009210109710693359, -0.0008128881454467773, -0.0007047653198242188, -0.0005966424942016602, -0.0004885196685791016, -0.00038039684295654297, -0.0002722740173339844, -0.00016415119171142578, -5.602836608886719e-05, 5.2094459533691406e-05, 0.00016021728515625, 0.0002683401107788086, 0.0003764629364013672, 0.0004845857620239258, 0.0005927085876464844, 0.000700831413269043, 0.0008089542388916016, 0.0009170770645141602, 0.0010251998901367188, 0.0011333227157592773, 0.001241445541381836, 0.0013495683670043945, 0.0014576911926269531, 0.0015658140182495117, 0.0016739368438720703, 0.001782059669494629, 0.0018901824951171875, 0.001998305320739746, 0.0021064281463623047, 0.0022145509719848633, 0.002322673797607422, 0.0024307966232299805, 0.002538919448852539, 0.0026470422744750977, 0.0027551651000976562, 0.002863287925720215, 0.0029714107513427734, 0.003079533576965332, 0.0031876564025878906, 0.0032957792282104492, 0.003403902053833008, 0.0035120248794555664, 0.003620147705078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 3.0, 9.0, 7.0, 14.0, 24.0, 36.0, 44.0, 70.0, 94.0, 131.0, 180.0, 272.0, 357.0, 562.0, 782.0, 1032.0, 1514.0, 2173.0, 3234.0, 4971.0, 7552.0, 12484.0, 21635.0, 41535.0, 90180.0, 236375.0, 350754.0, 139604.0, 58968.0, 29456.0, 16032.0, 9657.0, 5995.0, 4087.0, 2716.0, 1796.0, 1276.0, 872.0, 619.0, 424.0, 315.0, 206.0, 154.0, 107.0, 68.0, 62.0, 38.0, 28.0, 19.0, 9.0, 14.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-28.890625, -28.021484375, -27.15234375, -26.283203125, -25.4140625, -24.544921875, -23.67578125, -22.806640625, -21.9375, -21.068359375, -20.19921875, -19.330078125, -18.4609375, -17.591796875, -16.72265625, -15.853515625, -14.984375, -14.115234375, -13.24609375, -12.376953125, -11.5078125, -10.638671875, -9.76953125, -8.900390625, -8.03125, -7.162109375, -6.29296875, -5.423828125, -4.5546875, -3.685546875, -2.81640625, -1.947265625, -1.078125, -0.208984375, 0.66015625, 1.529296875, 2.3984375, 3.267578125, 4.13671875, 5.005859375, 5.875, 6.744140625, 7.61328125, 8.482421875, 9.3515625, 10.220703125, 11.08984375, 11.958984375, 12.828125, 13.697265625, 14.56640625, 15.435546875, 16.3046875, 17.173828125, 18.04296875, 18.912109375, 19.78125, 20.650390625, 21.51953125, 22.388671875, 23.2578125, 24.126953125, 24.99609375, 25.865234375, 26.734375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 6.0, 2.0, 3.0, 4.0, 5.0, 11.0, 11.0, 5.0, 12.0, 16.0, 18.0, 17.0, 27.0, 45.0, 38.0, 46.0, 69.0, 87.0, 90.0, 84.0, 74.0, 58.0, 52.0, 49.0, 45.0, 18.0, 18.0, 17.0, 14.0, 10.0, 11.0, 6.0, 3.0, 4.0, 2.0, 5.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.4375, -9.15966796875, -8.8818359375, -8.60400390625, -8.326171875, -8.04833984375, -7.7705078125, -7.49267578125, -7.21484375, -6.93701171875, -6.6591796875, -6.38134765625, -6.103515625, -5.82568359375, -5.5478515625, -5.27001953125, -4.9921875, -4.71435546875, -4.4365234375, -4.15869140625, -3.880859375, -3.60302734375, -3.3251953125, -3.04736328125, -2.76953125, -2.49169921875, -2.2138671875, -1.93603515625, -1.658203125, -1.38037109375, -1.1025390625, -0.82470703125, -0.546875, -0.26904296875, 0.0087890625, 0.28662109375, 0.564453125, 0.84228515625, 1.1201171875, 1.39794921875, 1.67578125, 1.95361328125, 2.2314453125, 2.50927734375, 2.787109375, 3.06494140625, 3.3427734375, 3.62060546875, 3.8984375, 4.17626953125, 4.4541015625, 4.73193359375, 5.009765625, 5.28759765625, 5.5654296875, 5.84326171875, 6.12109375, 6.39892578125, 6.6767578125, 6.95458984375, 7.232421875, 7.51025390625, 7.7880859375, 8.06591796875, 8.34375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 10.0, 7.0, 13.0, 11.0, 14.0, 21.0, 27.0, 35.0, 54.0, 72.0, 92.0, 104.0, 114.0, 97.0, 70.0, 63.0, 40.0, 33.0, 32.0, 20.0, 9.0, 14.0, 10.0, 8.0, 4.0, 7.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.12782287597656, -90.66825103759766, -87.20867919921875, -83.74910736083984, -80.28953552246094, -76.82996368408203, -73.37039184570312, -69.91082000732422, -66.45124816894531, -62.991676330566406, -59.5321044921875, -56.072532653808594, -52.61296081542969, -49.15338897705078, -45.693817138671875, -42.23424530029297, -38.7746696472168, -35.31509780883789, -31.855525970458984, -28.395954132080078, -24.936382293701172, -21.476808547973633, -18.017236709594727, -14.55766487121582, -11.098093032836914, -7.638521194458008, -4.178948879241943, -0.7193765640258789, 2.7401952743530273, 6.19976806640625, 9.659339904785156, 13.118911743164062, 16.57848358154297, 20.038055419921875, 23.49762725830078, 26.957199096679688, 30.416770935058594, 33.8763427734375, 37.335914611816406, 40.79548645019531, 44.25505828857422, 47.714630126953125, 51.17420196533203, 54.63377380371094, 58.093345642089844, 61.55291748046875, 65.01248931884766, 68.47206115722656, 71.931640625, 75.3912124633789, 78.85078430175781, 82.31035614013672, 85.76992797851562, 89.22949981689453, 92.68907165527344, 96.14864349365234, 99.60821533203125, 103.06778717041016, 106.52735900878906, 109.98693084716797, 113.44650268554688, 116.90607452392578, 120.36564636230469, 123.8252182006836, 127.2847900390625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 11.0, 8.0, 9.0, 11.0, 6.0, 12.0, 9.0, 11.0, 19.0, 24.0, 21.0, 27.0, 36.0, 39.0, 40.0, 26.0, 37.0, 45.0, 42.0, 35.0, 38.0, 39.0, 48.0, 33.0, 40.0, 29.0, 34.0, 29.0, 34.0, 27.0, 23.0, 19.0, 24.0, 15.0, 19.0, 14.0, 11.0, 5.0, 13.0, 6.0, 8.0, 6.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-65.30443572998047, -63.186561584472656, -61.068687438964844, -58.9508171081543, -56.832942962646484, -54.71506881713867, -52.597198486328125, -50.47932434082031, -48.3614501953125, -46.24357604980469, -44.125701904296875, -42.00783157348633, -39.889957427978516, -37.7720832824707, -35.654212951660156, -33.536338806152344, -31.41846466064453, -29.30059051513672, -27.18271827697754, -25.06484603881836, -22.946971893310547, -20.829097747802734, -18.711225509643555, -16.593353271484375, -14.475479125976562, -12.357605934143066, -10.23973274230957, -8.121859550476074, -6.003986358642578, -3.886113166809082, -1.768239974975586, 0.34963321685791016, 2.4675140380859375, 4.585387229919434, 6.70326042175293, 8.821133613586426, 10.939006805419922, 13.056879997253418, 15.174753189086914, 17.292625427246094, 19.410499572753906, 21.52837371826172, 23.6462459564209, 25.764118194580078, 27.88199234008789, 29.999866485595703, 32.11773681640625, 34.23561096191406, 36.353485107421875, 38.47135925292969, 40.5892333984375, 42.70710372924805, 44.82497787475586, 46.94285202026367, 49.06072235107422, 51.17859649658203, 53.296470642089844, 55.414344787597656, 57.53221893310547, 59.650089263916016, 61.76796340942383, 63.88583755493164, 66.00370788574219, 68.12158203125, 70.23945617675781]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 7.0, 3.0, 17.0, 21.0, 12.0, 36.0, 43.0, 63.0, 73.0, 113.0, 164.0, 233.0, 357.0, 489.0, 767.0, 1070.0, 1631.0, 2544.0, 3880.0, 6081.0, 10112.0, 18614.0, 45417.0, 161411.0, 749467.0, 2216903.0, 734247.0, 153075.0, 41293.0, 18124.0, 10063.0, 6150.0, 3793.0, 2489.0, 1710.0, 1181.0, 771.0, 549.0, 351.0, 295.0, 201.0, 142.0, 88.0, 71.0, 49.0, 37.0, 23.0, 18.0, 12.0, 11.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0], "bins": [-120.0625, -116.4775390625, -112.892578125, -109.3076171875, -105.72265625, -102.1376953125, -98.552734375, -94.9677734375, -91.3828125, -87.7978515625, -84.212890625, -80.6279296875, -77.04296875, -73.4580078125, -69.873046875, -66.2880859375, -62.703125, -59.1181640625, -55.533203125, -51.9482421875, -48.36328125, -44.7783203125, -41.193359375, -37.6083984375, -34.0234375, -30.4384765625, -26.853515625, -23.2685546875, -19.68359375, -16.0986328125, -12.513671875, -8.9287109375, -5.34375, -1.7587890625, 1.826171875, 5.4111328125, 8.99609375, 12.5810546875, 16.166015625, 19.7509765625, 23.3359375, 26.9208984375, 30.505859375, 34.0908203125, 37.67578125, 41.2607421875, 44.845703125, 48.4306640625, 52.015625, 55.6005859375, 59.185546875, 62.7705078125, 66.35546875, 69.9404296875, 73.525390625, 77.1103515625, 80.6953125, 84.2802734375, 87.865234375, 91.4501953125, 95.03515625, 98.6201171875, 102.205078125, 105.7900390625, 109.375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 7.0, 12.0, 9.0, 9.0, 9.0, 9.0, 11.0, 15.0, 20.0, 27.0, 21.0, 40.0, 36.0, 28.0, 41.0, 37.0, 55.0, 46.0, 57.0, 43.0, 54.0, 42.0, 32.0, 35.0, 39.0, 24.0, 35.0, 35.0, 31.0, 20.0, 17.0, 18.0, 11.0, 14.0, 13.0, 10.0, 6.0, 9.0, 5.0, 2.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.4375, -59.421875, -57.40625, -55.390625, -53.375, -51.359375, -49.34375, -47.328125, -45.3125, -43.296875, -41.28125, -39.265625, -37.25, -35.234375, -33.21875, -31.203125, -29.1875, -27.171875, -25.15625, -23.140625, -21.125, -19.109375, -17.09375, -15.078125, -13.0625, -11.046875, -9.03125, -7.015625, -5.0, -2.984375, -0.96875, 1.046875, 3.0625, 5.078125, 7.09375, 9.109375, 11.125, 13.140625, 15.15625, 17.171875, 19.1875, 21.203125, 23.21875, 25.234375, 27.25, 29.265625, 31.28125, 33.296875, 35.3125, 37.328125, 39.34375, 41.359375, 43.375, 45.390625, 47.40625, 49.421875, 51.4375, 53.453125, 55.46875, 57.484375, 59.5, 61.515625, 63.53125, 65.546875, 67.5625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 6.0, 6.0, 11.0, 12.0, 15.0, 26.0, 35.0, 53.0, 86.0, 84.0, 153.0, 167.0, 296.0, 392.0, 575.0, 796.0, 1136.0, 1634.0, 2451.0, 3782.0, 5765.0, 9065.0, 15447.0, 27695.0, 55778.0, 144545.0, 592342.0, 2443917.0, 613597.0, 147094.0, 56999.0, 27776.0, 15623.0, 9236.0, 5954.0, 3765.0, 2586.0, 1632.0, 1130.0, 787.0, 527.0, 390.0, 258.0, 172.0, 139.0, 106.0, 60.0, 56.0, 37.0, 36.0, 11.0, 21.0, 14.0, 6.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-118.6875, -114.5244140625, -110.361328125, -106.1982421875, -102.03515625, -97.8720703125, -93.708984375, -89.5458984375, -85.3828125, -81.2197265625, -77.056640625, -72.8935546875, -68.73046875, -64.5673828125, -60.404296875, -56.2412109375, -52.078125, -47.9150390625, -43.751953125, -39.5888671875, -35.42578125, -31.2626953125, -27.099609375, -22.9365234375, -18.7734375, -14.6103515625, -10.447265625, -6.2841796875, -2.12109375, 2.0419921875, 6.205078125, 10.3681640625, 14.53125, 18.6943359375, 22.857421875, 27.0205078125, 31.18359375, 35.3466796875, 39.509765625, 43.6728515625, 47.8359375, 51.9990234375, 56.162109375, 60.3251953125, 64.48828125, 68.6513671875, 72.814453125, 76.9775390625, 81.140625, 85.3037109375, 89.466796875, 93.6298828125, 97.79296875, 101.9560546875, 106.119140625, 110.2822265625, 114.4453125, 118.6083984375, 122.771484375, 126.9345703125, 131.09765625, 135.2607421875, 139.423828125, 143.5869140625, 147.75]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 5.0, 9.0, 8.0, 13.0, 11.0, 21.0, 27.0, 23.0, 27.0, 38.0, 56.0, 74.0, 92.0, 154.0, 241.0, 329.0, 524.0, 692.0, 564.0, 355.0, 253.0, 145.0, 96.0, 64.0, 49.0, 35.0, 39.0, 28.0, 13.0, 7.0, 12.0, 11.0, 14.0, 6.0, 6.0, 8.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-36.40625, -35.17578125, -33.9453125, -32.71484375, -31.484375, -30.25390625, -29.0234375, -27.79296875, -26.5625, -25.33203125, -24.1015625, -22.87109375, -21.640625, -20.41015625, -19.1796875, -17.94921875, -16.71875, -15.48828125, -14.2578125, -13.02734375, -11.796875, -10.56640625, -9.3359375, -8.10546875, -6.875, -5.64453125, -4.4140625, -3.18359375, -1.953125, -0.72265625, 0.5078125, 1.73828125, 2.96875, 4.19921875, 5.4296875, 6.66015625, 7.890625, 9.12109375, 10.3515625, 11.58203125, 12.8125, 14.04296875, 15.2734375, 16.50390625, 17.734375, 18.96484375, 20.1953125, 21.42578125, 22.65625, 23.88671875, 25.1171875, 26.34765625, 27.578125, 28.80859375, 30.0390625, 31.26953125, 32.5, 33.73046875, 34.9609375, 36.19140625, 37.421875, 38.65234375, 39.8828125, 41.11328125, 42.34375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 3.0, 6.0, 7.0, 7.0, 10.0, 8.0, 8.0, 12.0, 22.0, 19.0, 29.0, 29.0, 36.0, 61.0, 70.0, 82.0, 103.0, 102.0, 77.0, 63.0, 53.0, 35.0, 27.0, 36.0, 20.0, 10.0, 10.0, 12.0, 12.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-92.34141540527344, -89.34625244140625, -86.35108947753906, -83.35592651367188, -80.36076354980469, -77.36560821533203, -74.37044525146484, -71.37528228759766, -68.38011932373047, -65.38495635986328, -62.389793395996094, -59.39463424682617, -56.399471282958984, -53.4043083190918, -50.409149169921875, -47.41398620605469, -44.4188232421875, -41.42366027832031, -38.428497314453125, -35.4333381652832, -32.438175201416016, -29.443012237548828, -26.447851181030273, -23.45269012451172, -20.45752716064453, -17.462364196777344, -14.467203140258789, -11.472041130065918, -8.476879119873047, -5.481717109680176, -2.4865550994873047, 0.50860595703125, 3.5037689208984375, 6.498930931091309, 9.49409294128418, 12.48925495147705, 15.484416961669922, 18.47957992553711, 21.474740982055664, 24.46990203857422, 27.465065002441406, 30.460227966308594, 33.45539093017578, 36.4505500793457, 39.44571304321289, 42.44087600708008, 45.43603515625, 48.43119812011719, 51.426361083984375, 54.42152404785156, 57.41668701171875, 60.41184616088867, 63.40700912475586, 66.40216827392578, 69.39733123779297, 72.39249420166016, 75.38765716552734, 78.38282012939453, 81.37798309326172, 84.3731460571289, 87.36830139160156, 90.36346435546875, 93.35862731933594, 96.35379028320312, 99.34895324707031]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 3.0, 7.0, 14.0, 13.0, 7.0, 11.0, 11.0, 13.0, 10.0, 25.0, 23.0, 35.0, 29.0, 22.0, 41.0, 45.0, 42.0, 39.0, 55.0, 40.0, 37.0, 40.0, 35.0, 44.0, 34.0, 38.0, 30.0, 38.0, 33.0, 28.0, 19.0, 19.0, 19.0, 18.0, 13.0, 11.0, 8.0, 12.0, 7.0, 7.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-76.96728515625, -74.66474914550781, -72.36222076416016, -70.05968475341797, -67.75715637207031, -65.45462036132812, -63.15208435058594, -60.849552154541016, -58.547019958496094, -56.24448776245117, -53.94195556640625, -51.63941955566406, -49.33688735961914, -47.03435516357422, -44.73181915283203, -42.42928695678711, -40.12675476074219, -37.824222564697266, -35.521690368652344, -33.219154357910156, -30.916622161865234, -28.614089965820312, -26.311555862426758, -24.009021759033203, -21.70648956298828, -19.40395736694336, -17.101423263549805, -14.798890113830566, -12.496356964111328, -10.19382381439209, -7.891290664672852, -5.588756561279297, -3.2862319946289062, -0.983698844909668, 1.3188343048095703, 3.6213674545288086, 5.923900604248047, 8.226433753967285, 10.528966903686523, 12.831501007080078, 15.134033203125, 17.436565399169922, 19.739099502563477, 22.04163360595703, 24.344165802001953, 26.646697998046875, 28.94923210144043, 31.251766204833984, 33.554298400878906, 35.85683059692383, 38.15936279296875, 40.46189880371094, 42.76443099975586, 45.06696319580078, 47.36949920654297, 49.67203140258789, 51.97456359863281, 54.277095794677734, 56.579627990722656, 58.882164001464844, 61.184696197509766, 63.48722839355469, 65.78976440429688, 68.09230041503906, 70.39482879638672]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 3.0, 8.0, 11.0, 13.0, 24.0, 21.0, 43.0, 40.0, 83.0, 136.0, 185.0, 232.0, 332.0, 467.0, 690.0, 1081.0, 1592.0, 2219.0, 3195.0, 4603.0, 6663.0, 9962.0, 15354.0, 24012.0, 38506.0, 67407.0, 121743.0, 207951.0, 219141.0, 132586.0, 73632.0, 41731.0, 24984.0, 16176.0, 10742.0, 7151.0, 4883.0, 3388.0, 2266.0, 1664.0, 1102.0, 753.0, 535.0, 387.0, 275.0, 197.0, 110.0, 96.0, 54.0, 53.0, 31.0, 20.0, 12.0, 9.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-42.9375, -41.5556640625, -40.173828125, -38.7919921875, -37.41015625, -36.0283203125, -34.646484375, -33.2646484375, -31.8828125, -30.5009765625, -29.119140625, -27.7373046875, -26.35546875, -24.9736328125, -23.591796875, -22.2099609375, -20.828125, -19.4462890625, -18.064453125, -16.6826171875, -15.30078125, -13.9189453125, -12.537109375, -11.1552734375, -9.7734375, -8.3916015625, -7.009765625, -5.6279296875, -4.24609375, -2.8642578125, -1.482421875, -0.1005859375, 1.28125, 2.6630859375, 4.044921875, 5.4267578125, 6.80859375, 8.1904296875, 9.572265625, 10.9541015625, 12.3359375, 13.7177734375, 15.099609375, 16.4814453125, 17.86328125, 19.2451171875, 20.626953125, 22.0087890625, 23.390625, 24.7724609375, 26.154296875, 27.5361328125, 28.91796875, 30.2998046875, 31.681640625, 33.0634765625, 34.4453125, 35.8271484375, 37.208984375, 38.5908203125, 39.97265625, 41.3544921875, 42.736328125, 44.1181640625, 45.5]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 5.0, 5.0, 13.0, 8.0, 8.0, 6.0, 9.0, 11.0, 15.0, 6.0, 17.0, 26.0, 25.0, 24.0, 30.0, 31.0, 34.0, 39.0, 43.0, 46.0, 40.0, 48.0, 44.0, 44.0, 47.0, 38.0, 34.0, 39.0, 25.0, 33.0, 28.0, 24.0, 22.0, 14.0, 17.0, 14.0, 17.0, 11.0, 9.0, 7.0, 13.0, 8.0, 4.0, 5.0, 4.0, 4.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-62.96875, -61.078125, -59.1875, -57.296875, -55.40625, -53.515625, -51.625, -49.734375, -47.84375, -45.953125, -44.0625, -42.171875, -40.28125, -38.390625, -36.5, -34.609375, -32.71875, -30.828125, -28.9375, -27.046875, -25.15625, -23.265625, -21.375, -19.484375, -17.59375, -15.703125, -13.8125, -11.921875, -10.03125, -8.140625, -6.25, -4.359375, -2.46875, -0.578125, 1.3125, 3.203125, 5.09375, 6.984375, 8.875, 10.765625, 12.65625, 14.546875, 16.4375, 18.328125, 20.21875, 22.109375, 24.0, 25.890625, 27.78125, 29.671875, 31.5625, 33.453125, 35.34375, 37.234375, 39.125, 41.015625, 42.90625, 44.796875, 46.6875, 48.578125, 50.46875, 52.359375, 54.25, 56.140625, 58.03125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 4.0, 10.0, 6.0, 9.0, 20.0, 17.0, 35.0, 33.0, 49.0, 90.0, 97.0, 157.0, 225.0, 334.0, 458.0, 646.0, 959.0, 1376.0, 2119.0, 3473.0, 5545.0, 9245.0, 18258.0, 62497.0, 778120.0, 113903.0, 22633.0, 10939.0, 6113.0, 3891.0, 2457.0, 1563.0, 1044.0, 679.0, 439.0, 336.0, 228.0, 156.0, 94.0, 84.0, 60.0, 44.0, 27.0, 22.0, 20.0, 10.0, 9.0, 6.0, 8.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-120.375, -116.169921875, -111.96484375, -107.759765625, -103.5546875, -99.349609375, -95.14453125, -90.939453125, -86.734375, -82.529296875, -78.32421875, -74.119140625, -69.9140625, -65.708984375, -61.50390625, -57.298828125, -53.09375, -48.888671875, -44.68359375, -40.478515625, -36.2734375, -32.068359375, -27.86328125, -23.658203125, -19.453125, -15.248046875, -11.04296875, -6.837890625, -2.6328125, 1.572265625, 5.77734375, 9.982421875, 14.1875, 18.392578125, 22.59765625, 26.802734375, 31.0078125, 35.212890625, 39.41796875, 43.623046875, 47.828125, 52.033203125, 56.23828125, 60.443359375, 64.6484375, 68.853515625, 73.05859375, 77.263671875, 81.46875, 85.673828125, 89.87890625, 94.083984375, 98.2890625, 102.494140625, 106.69921875, 110.904296875, 115.109375, 119.314453125, 123.51953125, 127.724609375, 131.9296875, 136.134765625, 140.33984375, 144.544921875, 148.75]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 3.0, 3.0, 7.0, 7.0, 16.0, 10.0, 13.0, 22.0, 22.0, 15.0, 35.0, 31.0, 29.0, 38.0, 35.0, 41.0, 36.0, 36.0, 51.0, 45.0, 42.0, 41.0, 43.0, 35.0, 45.0, 28.0, 38.0, 43.0, 36.0, 23.0, 21.0, 19.0, 22.0, 18.0, 10.0, 13.0, 8.0, 8.0, 9.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-121.375, -118.064453125, -114.75390625, -111.443359375, -108.1328125, -104.822265625, -101.51171875, -98.201171875, -94.890625, -91.580078125, -88.26953125, -84.958984375, -81.6484375, -78.337890625, -75.02734375, -71.716796875, -68.40625, -65.095703125, -61.78515625, -58.474609375, -55.1640625, -51.853515625, -48.54296875, -45.232421875, -41.921875, -38.611328125, -35.30078125, -31.990234375, -28.6796875, -25.369140625, -22.05859375, -18.748046875, -15.4375, -12.126953125, -8.81640625, -5.505859375, -2.1953125, 1.115234375, 4.42578125, 7.736328125, 11.046875, 14.357421875, 17.66796875, 20.978515625, 24.2890625, 27.599609375, 30.91015625, 34.220703125, 37.53125, 40.841796875, 44.15234375, 47.462890625, 50.7734375, 54.083984375, 57.39453125, 60.705078125, 64.015625, 67.326171875, 70.63671875, 73.947265625, 77.2578125, 80.568359375, 83.87890625, 87.189453125, 90.5]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 4.0, 5.0, 6.0, 14.0, 15.0, 14.0, 23.0, 32.0, 52.0, 75.0, 106.0, 145.0, 194.0, 344.0, 521.0, 829.0, 1396.0, 2421.0, 4610.0, 9688.0, 29265.0, 394399.0, 550328.0, 32458.0, 10268.0, 4793.0, 2495.0, 1491.0, 909.0, 555.0, 313.0, 228.0, 182.0, 114.0, 89.0, 50.0, 37.0, 25.0, 12.0, 10.0, 15.0, 5.0, 8.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.375, -16.776611328125, -16.17822265625, -15.579833984375, -14.9814453125, -14.383056640625, -13.78466796875, -13.186279296875, -12.587890625, -11.989501953125, -11.39111328125, -10.792724609375, -10.1943359375, -9.595947265625, -8.99755859375, -8.399169921875, -7.80078125, -7.202392578125, -6.60400390625, -6.005615234375, -5.4072265625, -4.808837890625, -4.21044921875, -3.612060546875, -3.013671875, -2.415283203125, -1.81689453125, -1.218505859375, -0.6201171875, -0.021728515625, 0.57666015625, 1.175048828125, 1.7734375, 2.371826171875, 2.97021484375, 3.568603515625, 4.1669921875, 4.765380859375, 5.36376953125, 5.962158203125, 6.560546875, 7.158935546875, 7.75732421875, 8.355712890625, 8.9541015625, 9.552490234375, 10.15087890625, 10.749267578125, 11.34765625, 11.946044921875, 12.54443359375, 13.142822265625, 13.7412109375, 14.339599609375, 14.93798828125, 15.536376953125, 16.134765625, 16.733154296875, 17.33154296875, 17.929931640625, 18.5283203125, 19.126708984375, 19.72509765625, 20.323486328125, 20.921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 10.0, 11.0, 19.0, 21.0, 43.0, 51.0, 106.0, 167.0, 193.0, 138.0, 80.0, 49.0, 25.0, 20.0, 22.0, 9.0, 11.0, 5.0, 2.0, 6.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0109100341796875, -0.010509371757507324, -0.010108709335327148, -0.009708046913146973, -0.009307384490966797, -0.008906722068786621, -0.008506059646606445, -0.00810539722442627, -0.007704734802246094, -0.007304072380065918, -0.006903409957885742, -0.006502747535705566, -0.006102085113525391, -0.005701422691345215, -0.005300760269165039, -0.004900097846984863, -0.0044994354248046875, -0.004098773002624512, -0.003698110580444336, -0.00329744815826416, -0.0028967857360839844, -0.0024961233139038086, -0.002095460891723633, -0.001694798469543457, -0.0012941360473632812, -0.0008934736251831055, -0.0004928112030029297, -9.21487808227539e-05, 0.0003085136413574219, 0.0007091760635375977, 0.0011098384857177734, 0.0015105009078979492, 0.001911163330078125, 0.0023118257522583008, 0.0027124881744384766, 0.0031131505966186523, 0.003513813018798828, 0.003914475440979004, 0.00431513786315918, 0.0047158002853393555, 0.005116462707519531, 0.005517125129699707, 0.005917787551879883, 0.006318449974060059, 0.006719112396240234, 0.00711977481842041, 0.007520437240600586, 0.007921099662780762, 0.008321762084960938, 0.008722424507141113, 0.009123086929321289, 0.009523749351501465, 0.00992441177368164, 0.010325074195861816, 0.010725736618041992, 0.011126399040222168, 0.011527061462402344, 0.01192772388458252, 0.012328386306762695, 0.012729048728942871, 0.013129711151123047, 0.013530373573303223, 0.013931035995483398, 0.014331698417663574, 0.01473236083984375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 7.0, 2.0, 8.0, 6.0, 14.0, 23.0, 32.0, 47.0, 57.0, 99.0, 126.0, 139.0, 214.0, 294.0, 447.0, 635.0, 961.0, 1454.0, 2228.0, 3488.0, 5456.0, 8998.0, 15452.0, 28021.0, 53898.0, 122910.0, 323168.0, 270496.0, 101860.0, 47224.0, 24509.0, 13869.0, 8089.0, 4999.0, 3096.0, 2011.0, 1334.0, 862.0, 609.0, 445.0, 300.0, 192.0, 129.0, 98.0, 69.0, 61.0, 29.0, 26.0, 26.0, 11.0, 7.0, 14.0, 5.0, 7.0, 3.0, 3.0, 2.0], "bins": [-7.60546875, -7.381103515625, -7.15673828125, -6.932373046875, -6.7080078125, -6.483642578125, -6.25927734375, -6.034912109375, -5.810546875, -5.586181640625, -5.36181640625, -5.137451171875, -4.9130859375, -4.688720703125, -4.46435546875, -4.239990234375, -4.015625, -3.791259765625, -3.56689453125, -3.342529296875, -3.1181640625, -2.893798828125, -2.66943359375, -2.445068359375, -2.220703125, -1.996337890625, -1.77197265625, -1.547607421875, -1.3232421875, -1.098876953125, -0.87451171875, -0.650146484375, -0.42578125, -0.201416015625, 0.02294921875, 0.247314453125, 0.4716796875, 0.696044921875, 0.92041015625, 1.144775390625, 1.369140625, 1.593505859375, 1.81787109375, 2.042236328125, 2.2666015625, 2.490966796875, 2.71533203125, 2.939697265625, 3.1640625, 3.388427734375, 3.61279296875, 3.837158203125, 4.0615234375, 4.285888671875, 4.51025390625, 4.734619140625, 4.958984375, 5.183349609375, 5.40771484375, 5.632080078125, 5.8564453125, 6.080810546875, 6.30517578125, 6.529541015625, 6.75390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 4.0, 5.0, 7.0, 5.0, 12.0, 13.0, 12.0, 22.0, 20.0, 24.0, 34.0, 47.0, 46.0, 48.0, 57.0, 60.0, 82.0, 62.0, 60.0, 62.0, 64.0, 42.0, 29.0, 27.0, 39.0, 15.0, 19.0, 17.0, 15.0, 11.0, 10.0, 8.0, 2.0, 4.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.33984375, -2.274261474609375, -2.20867919921875, -2.143096923828125, -2.0775146484375, -2.011932373046875, -1.94635009765625, -1.880767822265625, -1.815185546875, -1.749603271484375, -1.68402099609375, -1.618438720703125, -1.5528564453125, -1.487274169921875, -1.42169189453125, -1.356109619140625, -1.29052734375, -1.224945068359375, -1.15936279296875, -1.093780517578125, -1.0281982421875, -0.962615966796875, -0.89703369140625, -0.831451416015625, -0.765869140625, -0.700286865234375, -0.63470458984375, -0.569122314453125, -0.5035400390625, -0.437957763671875, -0.37237548828125, -0.306793212890625, -0.2412109375, -0.175628662109375, -0.11004638671875, -0.044464111328125, 0.0211181640625, 0.086700439453125, 0.15228271484375, 0.217864990234375, 0.283447265625, 0.349029541015625, 0.41461181640625, 0.480194091796875, 0.5457763671875, 0.611358642578125, 0.67694091796875, 0.742523193359375, 0.80810546875, 0.873687744140625, 0.93927001953125, 1.004852294921875, 1.0704345703125, 1.136016845703125, 1.20159912109375, 1.267181396484375, 1.332763671875, 1.398345947265625, 1.46392822265625, 1.529510498046875, 1.5950927734375, 1.660675048828125, 1.72625732421875, 1.791839599609375, 1.857421875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 10.0, 8.0, 11.0, 12.0, 11.0, 18.0, 22.0, 24.0, 36.0, 52.0, 74.0, 85.0, 104.0, 107.0, 110.0, 76.0, 63.0, 42.0, 39.0, 28.0, 11.0, 8.0, 15.0, 11.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-90.31333923339844, -87.32707214355469, -84.3407974243164, -81.35453033447266, -78.36825561523438, -75.38198852539062, -72.39572143554688, -69.40945434570312, -66.42317962646484, -63.43690872192383, -60.45063781738281, -57.46437072753906, -54.47809982299805, -51.49182891845703, -48.50556182861328, -45.519290924072266, -42.53302001953125, -39.546749114990234, -36.56047821044922, -33.57421112060547, -30.587940216064453, -27.601669311523438, -24.615400314331055, -21.629131317138672, -18.642860412597656, -15.656590461730957, -12.670320510864258, -9.684050559997559, -6.697780609130859, -3.71151065826416, -0.7252407073974609, 2.261028289794922, 5.247291564941406, 8.233561515808105, 11.219831466674805, 14.206101417541504, 17.192371368408203, 20.17864227294922, 23.1649112701416, 26.151180267333984, 29.137451171875, 32.123722076416016, 35.10999298095703, 38.09626007080078, 41.0825309753418, 44.06880187988281, 47.05506896972656, 50.04133987426758, 53.027610778808594, 56.01388168334961, 59.000152587890625, 61.986419677734375, 64.97268676757812, 67.9589614868164, 70.94522857666016, 73.93150329589844, 76.91777038574219, 79.90403747558594, 82.89031219482422, 85.87657928466797, 88.86285400390625, 91.84912109375, 94.83538818359375, 97.8216552734375, 100.80792999267578]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 6.0, 8.0, 14.0, 9.0, 3.0, 11.0, 13.0, 14.0, 13.0, 21.0, 22.0, 23.0, 34.0, 35.0, 34.0, 30.0, 44.0, 42.0, 43.0, 43.0, 39.0, 39.0, 41.0, 42.0, 46.0, 30.0, 28.0, 42.0, 24.0, 34.0, 22.0, 21.0, 19.0, 17.0, 16.0, 18.0, 11.0, 8.0, 8.0, 8.0, 10.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-61.97907257080078, -60.09901809692383, -58.21896743774414, -56.33891296386719, -54.4588623046875, -52.57880783081055, -50.698753356933594, -48.818702697753906, -46.93865203857422, -45.058597564697266, -43.17854690551758, -41.298492431640625, -39.41844177246094, -37.538387298583984, -35.65833282470703, -33.778282165527344, -31.89822769165039, -30.01817512512207, -28.13812255859375, -26.258068084716797, -24.37801742553711, -22.497962951660156, -20.617910385131836, -18.737857818603516, -16.857805252075195, -14.977752685546875, -13.097700119018555, -11.217646598815918, -9.337594032287598, -7.457541465759277, -5.577487945556641, -3.6974353790283203, -1.8173866271972656, 0.06266617774963379, 1.9427189826965332, 3.8227720260620117, 5.702824592590332, 7.582877159118652, 9.462930679321289, 11.34298324584961, 13.22303581237793, 15.10308837890625, 16.98314094543457, 18.86319351196289, 20.743247985839844, 22.62329864501953, 24.503353118896484, 26.383405685424805, 28.263458251953125, 30.143510818481445, 32.023563385009766, 33.90361785888672, 35.783668518066406, 37.66372299194336, 39.54377746582031, 41.423828125, 43.30387878417969, 45.18393325805664, 47.06398391723633, 48.94403839111328, 50.82408905029297, 52.70414352416992, 54.584197998046875, 56.46424865722656, 58.344303131103516]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 11.0, 7.0, 8.0, 13.0, 17.0, 23.0, 29.0, 35.0, 67.0, 88.0, 115.0, 171.0, 192.0, 332.0, 449.0, 619.0, 839.0, 1197.0, 1637.0, 2352.0, 3245.0, 4653.0, 6610.0, 9804.0, 14832.0, 23296.0, 36802.0, 62077.0, 107403.0, 189793.0, 230199.0, 140221.0, 79113.0, 46716.0, 28566.0, 18159.0, 11967.0, 8089.0, 5464.0, 3868.0, 2590.0, 1944.0, 1401.0, 1018.0, 728.0, 521.0, 373.0, 258.0, 184.0, 134.0, 104.0, 74.0, 51.0, 35.0, 37.0, 18.0, 8.0, 4.0, 7.0, 1.0, 2.0, 2.0], "bins": [-56.125, -54.3837890625, -52.642578125, -50.9013671875, -49.16015625, -47.4189453125, -45.677734375, -43.9365234375, -42.1953125, -40.4541015625, -38.712890625, -36.9716796875, -35.23046875, -33.4892578125, -31.748046875, -30.0068359375, -28.265625, -26.5244140625, -24.783203125, -23.0419921875, -21.30078125, -19.5595703125, -17.818359375, -16.0771484375, -14.3359375, -12.5947265625, -10.853515625, -9.1123046875, -7.37109375, -5.6298828125, -3.888671875, -2.1474609375, -0.40625, 1.3349609375, 3.076171875, 4.8173828125, 6.55859375, 8.2998046875, 10.041015625, 11.7822265625, 13.5234375, 15.2646484375, 17.005859375, 18.7470703125, 20.48828125, 22.2294921875, 23.970703125, 25.7119140625, 27.453125, 29.1943359375, 30.935546875, 32.6767578125, 34.41796875, 36.1591796875, 37.900390625, 39.6416015625, 41.3828125, 43.1240234375, 44.865234375, 46.6064453125, 48.34765625, 50.0888671875, 51.830078125, 53.5712890625, 55.3125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 0.0, 9.0, 14.0, 10.0, 4.0, 8.0, 11.0, 13.0, 17.0, 11.0, 23.0, 22.0, 29.0, 28.0, 30.0, 33.0, 45.0, 45.0, 44.0, 52.0, 39.0, 60.0, 46.0, 46.0, 47.0, 37.0, 31.0, 36.0, 28.0, 20.0, 24.0, 22.0, 18.0, 14.0, 20.0, 13.0, 11.0, 6.0, 10.0, 7.0, 6.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-64.625, -62.67578125, -60.7265625, -58.77734375, -56.828125, -54.87890625, -52.9296875, -50.98046875, -49.03125, -47.08203125, -45.1328125, -43.18359375, -41.234375, -39.28515625, -37.3359375, -35.38671875, -33.4375, -31.48828125, -29.5390625, -27.58984375, -25.640625, -23.69140625, -21.7421875, -19.79296875, -17.84375, -15.89453125, -13.9453125, -11.99609375, -10.046875, -8.09765625, -6.1484375, -4.19921875, -2.25, -0.30078125, 1.6484375, 3.59765625, 5.546875, 7.49609375, 9.4453125, 11.39453125, 13.34375, 15.29296875, 17.2421875, 19.19140625, 21.140625, 23.08984375, 25.0390625, 26.98828125, 28.9375, 30.88671875, 32.8359375, 34.78515625, 36.734375, 38.68359375, 40.6328125, 42.58203125, 44.53125, 46.48046875, 48.4296875, 50.37890625, 52.328125, 54.27734375, 56.2265625, 58.17578125, 60.125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 10.0, 8.0, 21.0, 36.0, 30.0, 70.0, 95.0, 129.0, 188.0, 293.0, 378.0, 613.0, 964.0, 1368.0, 2149.0, 3299.0, 4962.0, 7663.0, 12243.0, 19353.0, 31074.0, 52935.0, 93617.0, 176373.0, 259329.0, 164268.0, 87096.0, 49309.0, 29634.0, 18439.0, 11450.0, 7314.0, 4662.0, 3155.0, 1983.0, 1338.0, 866.0, 581.0, 422.0, 269.0, 184.0, 128.0, 83.0, 51.0, 47.0, 33.0, 12.0, 13.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-73.875, -71.525390625, -69.17578125, -66.826171875, -64.4765625, -62.126953125, -59.77734375, -57.427734375, -55.078125, -52.728515625, -50.37890625, -48.029296875, -45.6796875, -43.330078125, -40.98046875, -38.630859375, -36.28125, -33.931640625, -31.58203125, -29.232421875, -26.8828125, -24.533203125, -22.18359375, -19.833984375, -17.484375, -15.134765625, -12.78515625, -10.435546875, -8.0859375, -5.736328125, -3.38671875, -1.037109375, 1.3125, 3.662109375, 6.01171875, 8.361328125, 10.7109375, 13.060546875, 15.41015625, 17.759765625, 20.109375, 22.458984375, 24.80859375, 27.158203125, 29.5078125, 31.857421875, 34.20703125, 36.556640625, 38.90625, 41.255859375, 43.60546875, 45.955078125, 48.3046875, 50.654296875, 53.00390625, 55.353515625, 57.703125, 60.052734375, 62.40234375, 64.751953125, 67.1015625, 69.451171875, 71.80078125, 74.150390625, 76.5]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 7.0, 7.0, 10.0, 16.0, 20.0, 11.0, 17.0, 20.0, 17.0, 29.0, 16.0, 28.0, 49.0, 36.0, 41.0, 40.0, 39.0, 41.0, 32.0, 33.0, 53.0, 43.0, 42.0, 49.0, 44.0, 28.0, 25.0, 27.0, 36.0, 20.0, 18.0, 18.0, 16.0, 13.0, 17.0, 9.0, 9.0, 4.0, 3.0, 3.0, 6.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.6875, -39.47216796875, -38.2568359375, -37.04150390625, -35.826171875, -34.61083984375, -33.3955078125, -32.18017578125, -30.96484375, -29.74951171875, -28.5341796875, -27.31884765625, -26.103515625, -24.88818359375, -23.6728515625, -22.45751953125, -21.2421875, -20.02685546875, -18.8115234375, -17.59619140625, -16.380859375, -15.16552734375, -13.9501953125, -12.73486328125, -11.51953125, -10.30419921875, -9.0888671875, -7.87353515625, -6.658203125, -5.44287109375, -4.2275390625, -3.01220703125, -1.796875, -0.58154296875, 0.6337890625, 1.84912109375, 3.064453125, 4.27978515625, 5.4951171875, 6.71044921875, 7.92578125, 9.14111328125, 10.3564453125, 11.57177734375, 12.787109375, 14.00244140625, 15.2177734375, 16.43310546875, 17.6484375, 18.86376953125, 20.0791015625, 21.29443359375, 22.509765625, 23.72509765625, 24.9404296875, 26.15576171875, 27.37109375, 28.58642578125, 29.8017578125, 31.01708984375, 32.232421875, 33.44775390625, 34.6630859375, 35.87841796875, 37.09375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 11.0, 13.0, 28.0, 31.0, 50.0, 62.0, 115.0, 169.0, 230.0, 337.0, 494.0, 853.0, 1206.0, 1815.0, 2819.0, 4538.0, 7407.0, 12567.0, 22327.0, 41592.0, 85897.0, 204944.0, 349283.0, 159600.0, 69540.0, 35007.0, 18955.0, 10650.0, 6570.0, 3948.0, 2575.0, 1621.0, 1074.0, 723.0, 486.0, 350.0, 212.0, 142.0, 102.0, 68.0, 42.0, 34.0, 22.0, 10.0, 12.0, 7.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.109375, -24.308837890625, -23.50830078125, -22.707763671875, -21.9072265625, -21.106689453125, -20.30615234375, -19.505615234375, -18.705078125, -17.904541015625, -17.10400390625, -16.303466796875, -15.5029296875, -14.702392578125, -13.90185546875, -13.101318359375, -12.30078125, -11.500244140625, -10.69970703125, -9.899169921875, -9.0986328125, -8.298095703125, -7.49755859375, -6.697021484375, -5.896484375, -5.095947265625, -4.29541015625, -3.494873046875, -2.6943359375, -1.893798828125, -1.09326171875, -0.292724609375, 0.5078125, 1.308349609375, 2.10888671875, 2.909423828125, 3.7099609375, 4.510498046875, 5.31103515625, 6.111572265625, 6.912109375, 7.712646484375, 8.51318359375, 9.313720703125, 10.1142578125, 10.914794921875, 11.71533203125, 12.515869140625, 13.31640625, 14.116943359375, 14.91748046875, 15.718017578125, 16.5185546875, 17.319091796875, 18.11962890625, 18.920166015625, 19.720703125, 20.521240234375, 21.32177734375, 22.122314453125, 22.9228515625, 23.723388671875, 24.52392578125, 25.324462890625, 26.125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 8.0, 7.0, 4.0, 6.0, 9.0, 10.0, 14.0, 20.0, 18.0, 19.0, 27.0, 47.0, 56.0, 84.0, 121.0, 127.0, 107.0, 68.0, 60.0, 46.0, 30.0, 18.0, 20.0, 14.0, 11.0, 9.0, 13.0, 4.0, 4.0, 9.0, 4.0, 0.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00307464599609375, -0.0029824376106262207, -0.0028902292251586914, -0.002798020839691162, -0.002705812454223633, -0.0026136040687561035, -0.0025213956832885742, -0.002429187297821045, -0.0023369789123535156, -0.0022447705268859863, -0.002152562141418457, -0.0020603537559509277, -0.0019681453704833984, -0.0018759369850158691, -0.0017837285995483398, -0.0016915202140808105, -0.0015993118286132812, -0.001507103443145752, -0.0014148950576782227, -0.0013226866722106934, -0.001230478286743164, -0.0011382699012756348, -0.0010460615158081055, -0.0009538531303405762, -0.0008616447448730469, -0.0007694363594055176, -0.0006772279739379883, -0.000585019588470459, -0.0004928112030029297, -0.0004006028175354004, -0.0003083944320678711, -0.0002161860466003418, -0.0001239776611328125, -3.17692756652832e-05, 6.0439109802246094e-05, 0.0001526474952697754, 0.0002448558807373047, 0.000337064266204834, 0.0004292726516723633, 0.0005214810371398926, 0.0006136894226074219, 0.0007058978080749512, 0.0007981061935424805, 0.0008903145790100098, 0.000982522964477539, 0.0010747313499450684, 0.0011669397354125977, 0.001259148120880127, 0.0013513565063476562, 0.0014435648918151855, 0.0015357732772827148, 0.0016279816627502441, 0.0017201900482177734, 0.0018123984336853027, 0.001904606819152832, 0.0019968152046203613, 0.0020890235900878906, 0.00218123197555542, 0.0022734403610229492, 0.0023656487464904785, 0.002457857131958008, 0.002550065517425537, 0.0026422739028930664, 0.0027344822883605957, 0.002826690673828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 1.0, 2.0, 4.0, 14.0, 14.0, 24.0, 35.0, 29.0, 55.0, 75.0, 110.0, 156.0, 261.0, 346.0, 460.0, 736.0, 1108.0, 1740.0, 2711.0, 4487.0, 7552.0, 13167.0, 23971.0, 47476.0, 102829.0, 249473.0, 321777.0, 138656.0, 61541.0, 30030.0, 15892.0, 9004.0, 5419.0, 3294.0, 2072.0, 1373.0, 824.0, 566.0, 361.0, 276.0, 158.0, 149.0, 85.0, 75.0, 36.0, 40.0, 35.0, 25.0, 12.0, 5.0, 2.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-24.421875, -23.662841796875, -22.90380859375, -22.144775390625, -21.3857421875, -20.626708984375, -19.86767578125, -19.108642578125, -18.349609375, -17.590576171875, -16.83154296875, -16.072509765625, -15.3134765625, -14.554443359375, -13.79541015625, -13.036376953125, -12.27734375, -11.518310546875, -10.75927734375, -10.000244140625, -9.2412109375, -8.482177734375, -7.72314453125, -6.964111328125, -6.205078125, -5.446044921875, -4.68701171875, -3.927978515625, -3.1689453125, -2.409912109375, -1.65087890625, -0.891845703125, -0.1328125, 0.626220703125, 1.38525390625, 2.144287109375, 2.9033203125, 3.662353515625, 4.42138671875, 5.180419921875, 5.939453125, 6.698486328125, 7.45751953125, 8.216552734375, 8.9755859375, 9.734619140625, 10.49365234375, 11.252685546875, 12.01171875, 12.770751953125, 13.52978515625, 14.288818359375, 15.0478515625, 15.806884765625, 16.56591796875, 17.324951171875, 18.083984375, 18.843017578125, 19.60205078125, 20.361083984375, 21.1201171875, 21.879150390625, 22.63818359375, 23.397216796875, 24.15625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 10.0, 10.0, 9.0, 10.0, 8.0, 20.0, 20.0, 15.0, 28.0, 40.0, 41.0, 40.0, 46.0, 61.0, 62.0, 58.0, 64.0, 71.0, 59.0, 48.0, 46.0, 42.0, 33.0, 24.0, 37.0, 25.0, 18.0, 11.0, 9.0, 10.0, 6.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1484375, -7.9169921875, -7.685546875, -7.4541015625, -7.22265625, -6.9912109375, -6.759765625, -6.5283203125, -6.296875, -6.0654296875, -5.833984375, -5.6025390625, -5.37109375, -5.1396484375, -4.908203125, -4.6767578125, -4.4453125, -4.2138671875, -3.982421875, -3.7509765625, -3.51953125, -3.2880859375, -3.056640625, -2.8251953125, -2.59375, -2.3623046875, -2.130859375, -1.8994140625, -1.66796875, -1.4365234375, -1.205078125, -0.9736328125, -0.7421875, -0.5107421875, -0.279296875, -0.0478515625, 0.18359375, 0.4150390625, 0.646484375, 0.8779296875, 1.109375, 1.3408203125, 1.572265625, 1.8037109375, 2.03515625, 2.2666015625, 2.498046875, 2.7294921875, 2.9609375, 3.1923828125, 3.423828125, 3.6552734375, 3.88671875, 4.1181640625, 4.349609375, 4.5810546875, 4.8125, 5.0439453125, 5.275390625, 5.5068359375, 5.73828125, 5.9697265625, 6.201171875, 6.4326171875, 6.6640625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 7.0, 11.0, 14.0, 13.0, 14.0, 21.0, 38.0, 39.0, 48.0, 62.0, 94.0, 112.0, 109.0, 101.0, 77.0, 56.0, 47.0, 29.0, 23.0, 17.0, 17.0, 11.0, 8.0, 5.0, 11.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.94277954101562, -82.0176773071289, -79.09258270263672, -76.16748046875, -73.24238586425781, -70.3172836303711, -67.39218139648438, -64.46708679199219, -61.541988372802734, -58.61688995361328, -55.69179153442383, -52.766693115234375, -49.841590881347656, -46.91649627685547, -43.99139404296875, -41.0662956237793, -38.141197204589844, -35.21609878540039, -32.29100036621094, -29.36590003967285, -26.4408016204834, -23.515703201293945, -20.59060287475586, -17.665504455566406, -14.740406036376953, -11.8153076171875, -8.89020824432373, -5.965108871459961, -3.040010452270508, -0.11491203308105469, 2.8101882934570312, 5.735286712646484, 8.660385131835938, 11.58548355102539, 14.51058292388916, 17.43568229675293, 20.360780715942383, 23.285879135131836, 26.210979461669922, 29.136077880859375, 32.06117630004883, 34.98627471923828, 37.911373138427734, 40.83647155761719, 43.761573791503906, 46.686668395996094, 49.61177062988281, 52.536869049072266, 55.46196746826172, 58.38706588745117, 61.312164306640625, 64.23726654052734, 67.16236114501953, 70.08746337890625, 73.01255798339844, 75.93766021728516, 78.86276245117188, 81.7878646850586, 84.71295928955078, 87.6380615234375, 90.56315612792969, 93.4882583618164, 96.41336059570312, 99.33845520019531, 102.2635498046875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 6.0, 9.0, 4.0, 9.0, 4.0, 9.0, 11.0, 18.0, 22.0, 13.0, 21.0, 20.0, 30.0, 41.0, 40.0, 36.0, 43.0, 34.0, 39.0, 46.0, 35.0, 26.0, 42.0, 31.0, 41.0, 37.0, 32.0, 29.0, 39.0, 27.0, 23.0, 24.0, 22.0, 23.0, 13.0, 24.0, 12.0, 13.0, 11.0, 11.0, 9.0, 3.0, 3.0, 1.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-62.063899993896484, -60.25804138183594, -58.452186584472656, -56.646331787109375, -54.84047317504883, -53.03461456298828, -51.228759765625, -49.42290496826172, -47.61704635620117, -45.811187744140625, -44.005332946777344, -42.19947814941406, -40.393619537353516, -38.58776092529297, -36.78190612792969, -34.976051330566406, -33.17019271850586, -31.364336013793945, -29.55847930908203, -27.752622604370117, -25.946765899658203, -24.14090919494629, -22.335052490234375, -20.52919578552246, -18.723339080810547, -16.917482376098633, -15.111625671386719, -13.305768966674805, -11.49991226196289, -9.694055557250977, -7.8881988525390625, -6.082342147827148, -4.276485443115234, -2.4706287384033203, -0.6647720336914062, 1.1410846710205078, 2.946941375732422, 4.752798080444336, 6.55865478515625, 8.364511489868164, 10.170368194580078, 11.976224899291992, 13.782081604003906, 15.58793830871582, 17.393795013427734, 19.19965171813965, 21.005508422851562, 22.811365127563477, 24.61722183227539, 26.423078536987305, 28.22893524169922, 30.034791946411133, 31.840648651123047, 33.646507263183594, 35.452362060546875, 37.258216857910156, 39.0640754699707, 40.86993408203125, 42.67578887939453, 44.48164367675781, 46.28750228881836, 48.093360900878906, 49.89921569824219, 51.70507049560547, 53.510929107666016]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 7.0, 21.0, 12.0, 18.0, 21.0, 40.0, 50.0, 84.0, 84.0, 136.0, 185.0, 268.0, 399.0, 595.0, 862.0, 1369.0, 2142.0, 3378.0, 5803.0, 10013.0, 20067.0, 56019.0, 285590.0, 1523091.0, 1841127.0, 328792.0, 66079.0, 21586.0, 10408.0, 5894.0, 3518.0, 2325.0, 1398.0, 951.0, 618.0, 392.0, 290.0, 206.0, 119.0, 73.0, 68.0, 45.0, 40.0, 34.0, 15.0, 5.0, 8.0, 9.0, 6.0, 4.0, 6.0, 5.0, 1.0], "bins": [-120.875, -117.4267578125, -113.978515625, -110.5302734375, -107.08203125, -103.6337890625, -100.185546875, -96.7373046875, -93.2890625, -89.8408203125, -86.392578125, -82.9443359375, -79.49609375, -76.0478515625, -72.599609375, -69.1513671875, -65.703125, -62.2548828125, -58.806640625, -55.3583984375, -51.91015625, -48.4619140625, -45.013671875, -41.5654296875, -38.1171875, -34.6689453125, -31.220703125, -27.7724609375, -24.32421875, -20.8759765625, -17.427734375, -13.9794921875, -10.53125, -7.0830078125, -3.634765625, -0.1865234375, 3.26171875, 6.7099609375, 10.158203125, 13.6064453125, 17.0546875, 20.5029296875, 23.951171875, 27.3994140625, 30.84765625, 34.2958984375, 37.744140625, 41.1923828125, 44.640625, 48.0888671875, 51.537109375, 54.9853515625, 58.43359375, 61.8818359375, 65.330078125, 68.7783203125, 72.2265625, 75.6748046875, 79.123046875, 82.5712890625, 86.01953125, 89.4677734375, 92.916015625, 96.3642578125, 99.8125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 5.0, 6.0, 7.0, 5.0, 7.0, 14.0, 15.0, 10.0, 23.0, 16.0, 18.0, 19.0, 30.0, 39.0, 29.0, 42.0, 56.0, 40.0, 46.0, 47.0, 32.0, 40.0, 36.0, 42.0, 44.0, 31.0, 35.0, 38.0, 28.0, 31.0, 28.0, 13.0, 17.0, 17.0, 20.0, 9.0, 17.0, 5.0, 12.0, 13.0, 6.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-57.3125, -55.6328125, -53.953125, -52.2734375, -50.59375, -48.9140625, -47.234375, -45.5546875, -43.875, -42.1953125, -40.515625, -38.8359375, -37.15625, -35.4765625, -33.796875, -32.1171875, -30.4375, -28.7578125, -27.078125, -25.3984375, -23.71875, -22.0390625, -20.359375, -18.6796875, -17.0, -15.3203125, -13.640625, -11.9609375, -10.28125, -8.6015625, -6.921875, -5.2421875, -3.5625, -1.8828125, -0.203125, 1.4765625, 3.15625, 4.8359375, 6.515625, 8.1953125, 9.875, 11.5546875, 13.234375, 14.9140625, 16.59375, 18.2734375, 19.953125, 21.6328125, 23.3125, 24.9921875, 26.671875, 28.3515625, 30.03125, 31.7109375, 33.390625, 35.0703125, 36.75, 38.4296875, 40.109375, 41.7890625, 43.46875, 45.1484375, 46.828125, 48.5078125, 50.1875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 11.0, 9.0, 17.0, 34.0, 36.0, 48.0, 51.0, 93.0, 108.0, 205.0, 275.0, 430.0, 596.0, 1048.0, 1497.0, 2428.0, 3990.0, 6548.0, 11268.0, 20502.0, 40339.0, 93729.0, 315349.0, 2183670.0, 1163809.0, 203724.0, 70404.0, 32446.0, 17036.0, 9339.0, 5665.0, 3438.0, 2184.0, 1436.0, 849.0, 542.0, 358.0, 235.0, 159.0, 114.0, 82.0, 49.0, 42.0, 16.0, 25.0, 16.0, 14.0, 8.0, 3.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0], "bins": [-123.8125, -120.04296875, -116.2734375, -112.50390625, -108.734375, -104.96484375, -101.1953125, -97.42578125, -93.65625, -89.88671875, -86.1171875, -82.34765625, -78.578125, -74.80859375, -71.0390625, -67.26953125, -63.5, -59.73046875, -55.9609375, -52.19140625, -48.421875, -44.65234375, -40.8828125, -37.11328125, -33.34375, -29.57421875, -25.8046875, -22.03515625, -18.265625, -14.49609375, -10.7265625, -6.95703125, -3.1875, 0.58203125, 4.3515625, 8.12109375, 11.890625, 15.66015625, 19.4296875, 23.19921875, 26.96875, 30.73828125, 34.5078125, 38.27734375, 42.046875, 45.81640625, 49.5859375, 53.35546875, 57.125, 60.89453125, 64.6640625, 68.43359375, 72.203125, 75.97265625, 79.7421875, 83.51171875, 87.28125, 91.05078125, 94.8203125, 98.58984375, 102.359375, 106.12890625, 109.8984375, 113.66796875, 117.4375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 10.0, 14.0, 13.0, 12.0, 18.0, 24.0, 17.0, 28.0, 45.0, 69.0, 87.0, 96.0, 163.0, 294.0, 423.0, 656.0, 717.0, 471.0, 298.0, 187.0, 100.0, 73.0, 58.0, 54.0, 26.0, 37.0, 16.0, 11.0, 17.0, 10.0, 6.0, 9.0, 7.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.125, -37.97802734375, -36.8310546875, -35.68408203125, -34.537109375, -33.39013671875, -32.2431640625, -31.09619140625, -29.94921875, -28.80224609375, -27.6552734375, -26.50830078125, -25.361328125, -24.21435546875, -23.0673828125, -21.92041015625, -20.7734375, -19.62646484375, -18.4794921875, -17.33251953125, -16.185546875, -15.03857421875, -13.8916015625, -12.74462890625, -11.59765625, -10.45068359375, -9.3037109375, -8.15673828125, -7.009765625, -5.86279296875, -4.7158203125, -3.56884765625, -2.421875, -1.27490234375, -0.1279296875, 1.01904296875, 2.166015625, 3.31298828125, 4.4599609375, 5.60693359375, 6.75390625, 7.90087890625, 9.0478515625, 10.19482421875, 11.341796875, 12.48876953125, 13.6357421875, 14.78271484375, 15.9296875, 17.07666015625, 18.2236328125, 19.37060546875, 20.517578125, 21.66455078125, 22.8115234375, 23.95849609375, 25.10546875, 26.25244140625, 27.3994140625, 28.54638671875, 29.693359375, 30.84033203125, 31.9873046875, 33.13427734375, 34.28125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 7.0, 7.0, 6.0, 4.0, 8.0, 14.0, 23.0, 22.0, 32.0, 31.0, 51.0, 70.0, 82.0, 112.0, 96.0, 100.0, 74.0, 61.0, 37.0, 41.0, 28.0, 21.0, 12.0, 14.0, 13.0, 9.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.39539337158203, -62.81571960449219, -60.236045837402344, -57.656368255615234, -55.07669448852539, -52.49702072143555, -49.91734313964844, -47.337669372558594, -44.75799560546875, -42.178321838378906, -39.59864807128906, -37.01897048950195, -34.43929672241211, -31.859622955322266, -29.27994728088379, -26.700271606445312, -24.12059783935547, -21.540924072265625, -18.96124839782715, -16.381572723388672, -13.801898956298828, -11.222224235534668, -8.642549514770508, -6.062873840332031, -3.4832000732421875, -0.9035253524780273, 1.6761493682861328, 4.255824089050293, 6.835498809814453, 9.415173530578613, 11.994848251342773, 14.57452392578125, 17.154205322265625, 19.73387908935547, 22.313554763793945, 24.893230438232422, 27.472904205322266, 30.05257797241211, 32.63225555419922, 35.21192932128906, 37.791603088378906, 40.37127685546875, 42.950950622558594, 45.5306282043457, 48.11030197143555, 50.68997573852539, 53.2696533203125, 55.849327087402344, 58.42900085449219, 61.00867462158203, 63.588348388671875, 66.16802215576172, 68.74769592285156, 71.32737731933594, 73.90705108642578, 76.48672485351562, 79.06639862060547, 81.64607238769531, 84.22574615478516, 86.805419921875, 89.38510131835938, 91.96477508544922, 94.54444885253906, 97.1241226196289, 99.70379638671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 6.0, 7.0, 11.0, 14.0, 17.0, 14.0, 16.0, 14.0, 21.0, 30.0, 41.0, 37.0, 40.0, 44.0, 43.0, 37.0, 52.0, 37.0, 41.0, 36.0, 42.0, 52.0, 36.0, 37.0, 27.0, 26.0, 29.0, 20.0, 23.0, 17.0, 20.0, 17.0, 21.0, 15.0, 8.0, 8.0, 9.0, 7.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.66313934326172, -53.819252014160156, -51.97536087036133, -50.131473541259766, -48.28758239746094, -46.443695068359375, -44.59980773925781, -42.755916595458984, -40.91202926635742, -39.06814193725586, -37.22425079345703, -35.38036346435547, -33.53647232055664, -31.692584991455078, -29.848695755004883, -28.004806518554688, -26.160917282104492, -24.317028045654297, -22.4731388092041, -20.629249572753906, -18.785362243652344, -16.94147300720215, -15.097583770751953, -13.253695487976074, -11.409806251525879, -9.565917015075684, -7.722028732299805, -5.878139495849609, -4.034250736236572, -2.190361976623535, -0.34647274017333984, 1.497415542602539, 3.3413047790527344, 5.1851935386657715, 7.029082298278809, 8.872971534729004, 10.716859817504883, 12.560749053955078, 14.404638290405273, 16.24852752685547, 18.09241485595703, 19.936304092407227, 21.780193328857422, 23.624080657958984, 25.46796989440918, 27.311859130859375, 29.15574836730957, 30.999637603759766, 32.843528747558594, 34.687416076660156, 36.531307220458984, 38.37519454956055, 40.219085693359375, 42.06297302246094, 43.9068603515625, 45.75075149536133, 47.59463882446289, 49.43852615356445, 51.28241729736328, 53.126304626464844, 54.97019577026367, 56.814083099365234, 58.65797424316406, 60.501861572265625, 62.34574890136719]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 10.0, 15.0, 18.0, 28.0, 29.0, 50.0, 69.0, 93.0, 149.0, 191.0, 268.0, 387.0, 624.0, 931.0, 1403.0, 2199.0, 3430.0, 5581.0, 9211.0, 15981.0, 27662.0, 51669.0, 105641.0, 226523.0, 287755.0, 150110.0, 70745.0, 36370.0, 20332.0, 11906.0, 7000.0, 4414.0, 2655.0, 1765.0, 1104.0, 722.0, 481.0, 320.0, 204.0, 159.0, 97.0, 74.0, 54.0, 41.0, 27.0, 13.0, 18.0, 7.0, 12.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.5, -39.16015625, -37.8203125, -36.48046875, -35.140625, -33.80078125, -32.4609375, -31.12109375, -29.78125, -28.44140625, -27.1015625, -25.76171875, -24.421875, -23.08203125, -21.7421875, -20.40234375, -19.0625, -17.72265625, -16.3828125, -15.04296875, -13.703125, -12.36328125, -11.0234375, -9.68359375, -8.34375, -7.00390625, -5.6640625, -4.32421875, -2.984375, -1.64453125, -0.3046875, 1.03515625, 2.375, 3.71484375, 5.0546875, 6.39453125, 7.734375, 9.07421875, 10.4140625, 11.75390625, 13.09375, 14.43359375, 15.7734375, 17.11328125, 18.453125, 19.79296875, 21.1328125, 22.47265625, 23.8125, 25.15234375, 26.4921875, 27.83203125, 29.171875, 30.51171875, 31.8515625, 33.19140625, 34.53125, 35.87109375, 37.2109375, 38.55078125, 39.890625, 41.23046875, 42.5703125, 43.91015625, 45.25]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 0.0, 4.0, 4.0, 6.0, 3.0, 3.0, 5.0, 13.0, 15.0, 10.0, 10.0, 11.0, 17.0, 24.0, 27.0, 39.0, 37.0, 37.0, 42.0, 38.0, 58.0, 35.0, 43.0, 45.0, 50.0, 56.0, 52.0, 42.0, 37.0, 34.0, 23.0, 21.0, 20.0, 18.0, 21.0, 17.0, 17.0, 15.0, 11.0, 12.0, 3.0, 6.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.21875, -55.3896484375, -53.560546875, -51.7314453125, -49.90234375, -48.0732421875, -46.244140625, -44.4150390625, -42.5859375, -40.7568359375, -38.927734375, -37.0986328125, -35.26953125, -33.4404296875, -31.611328125, -29.7822265625, -27.953125, -26.1240234375, -24.294921875, -22.4658203125, -20.63671875, -18.8076171875, -16.978515625, -15.1494140625, -13.3203125, -11.4912109375, -9.662109375, -7.8330078125, -6.00390625, -4.1748046875, -2.345703125, -0.5166015625, 1.3125, 3.1416015625, 4.970703125, 6.7998046875, 8.62890625, 10.4580078125, 12.287109375, 14.1162109375, 15.9453125, 17.7744140625, 19.603515625, 21.4326171875, 23.26171875, 25.0908203125, 26.919921875, 28.7490234375, 30.578125, 32.4072265625, 34.236328125, 36.0654296875, 37.89453125, 39.7236328125, 41.552734375, 43.3818359375, 45.2109375, 47.0400390625, 48.869140625, 50.6982421875, 52.52734375, 54.3564453125, 56.185546875, 58.0146484375, 59.84375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 9.0, 8.0, 20.0, 26.0, 20.0, 37.0, 52.0, 62.0, 90.0, 121.0, 194.0, 287.0, 409.0, 585.0, 888.0, 1365.0, 2045.0, 3108.0, 5291.0, 9013.0, 17725.0, 57607.0, 772324.0, 125551.0, 23524.0, 10947.0, 6253.0, 3898.0, 2355.0, 1559.0, 962.0, 674.0, 442.0, 317.0, 216.0, 159.0, 122.0, 81.0, 57.0, 39.0, 27.0, 18.0, 16.0, 17.0, 9.0, 9.0, 5.0, 1.0, 4.0, 1.0, 0.0, 3.0], "bins": [-80.9375, -78.6025390625, -76.267578125, -73.9326171875, -71.59765625, -69.2626953125, -66.927734375, -64.5927734375, -62.2578125, -59.9228515625, -57.587890625, -55.2529296875, -52.91796875, -50.5830078125, -48.248046875, -45.9130859375, -43.578125, -41.2431640625, -38.908203125, -36.5732421875, -34.23828125, -31.9033203125, -29.568359375, -27.2333984375, -24.8984375, -22.5634765625, -20.228515625, -17.8935546875, -15.55859375, -13.2236328125, -10.888671875, -8.5537109375, -6.21875, -3.8837890625, -1.548828125, 0.7861328125, 3.12109375, 5.4560546875, 7.791015625, 10.1259765625, 12.4609375, 14.7958984375, 17.130859375, 19.4658203125, 21.80078125, 24.1357421875, 26.470703125, 28.8056640625, 31.140625, 33.4755859375, 35.810546875, 38.1455078125, 40.48046875, 42.8154296875, 45.150390625, 47.4853515625, 49.8203125, 52.1552734375, 54.490234375, 56.8251953125, 59.16015625, 61.4951171875, 63.830078125, 66.1650390625, 68.5]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 9.0, 3.0, 11.0, 7.0, 7.0, 11.0, 14.0, 14.0, 25.0, 18.0, 21.0, 34.0, 37.0, 49.0, 32.0, 39.0, 51.0, 35.0, 42.0, 45.0, 58.0, 35.0, 23.0, 39.0, 39.0, 39.0, 31.0, 39.0, 25.0, 26.0, 27.0, 18.0, 23.0, 11.0, 16.0, 16.0, 6.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-51.46875, -49.71044921875, -47.9521484375, -46.19384765625, -44.435546875, -42.67724609375, -40.9189453125, -39.16064453125, -37.40234375, -35.64404296875, -33.8857421875, -32.12744140625, -30.369140625, -28.61083984375, -26.8525390625, -25.09423828125, -23.3359375, -21.57763671875, -19.8193359375, -18.06103515625, -16.302734375, -14.54443359375, -12.7861328125, -11.02783203125, -9.26953125, -7.51123046875, -5.7529296875, -3.99462890625, -2.236328125, -0.47802734375, 1.2802734375, 3.03857421875, 4.796875, 6.55517578125, 8.3134765625, 10.07177734375, 11.830078125, 13.58837890625, 15.3466796875, 17.10498046875, 18.86328125, 20.62158203125, 22.3798828125, 24.13818359375, 25.896484375, 27.65478515625, 29.4130859375, 31.17138671875, 32.9296875, 34.68798828125, 36.4462890625, 38.20458984375, 39.962890625, 41.72119140625, 43.4794921875, 45.23779296875, 46.99609375, 48.75439453125, 50.5126953125, 52.27099609375, 54.029296875, 55.78759765625, 57.5458984375, 59.30419921875, 61.0625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 10.0, 7.0, 8.0, 13.0, 14.0, 22.0, 35.0, 40.0, 65.0, 83.0, 122.0, 161.0, 224.0, 358.0, 544.0, 891.0, 1513.0, 2936.0, 6597.0, 18550.0, 106298.0, 834851.0, 51279.0, 12980.0, 5021.0, 2317.0, 1290.0, 790.0, 489.0, 314.0, 203.0, 147.0, 106.0, 68.0, 44.0, 47.0, 28.0, 22.0, 15.0, 15.0, 10.0, 10.0, 8.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.20703125, -5.988037109375, -5.76904296875, -5.550048828125, -5.3310546875, -5.112060546875, -4.89306640625, -4.674072265625, -4.455078125, -4.236083984375, -4.01708984375, -3.798095703125, -3.5791015625, -3.360107421875, -3.14111328125, -2.922119140625, -2.703125, -2.484130859375, -2.26513671875, -2.046142578125, -1.8271484375, -1.608154296875, -1.38916015625, -1.170166015625, -0.951171875, -0.732177734375, -0.51318359375, -0.294189453125, -0.0751953125, 0.143798828125, 0.36279296875, 0.581787109375, 0.80078125, 1.019775390625, 1.23876953125, 1.457763671875, 1.6767578125, 1.895751953125, 2.11474609375, 2.333740234375, 2.552734375, 2.771728515625, 2.99072265625, 3.209716796875, 3.4287109375, 3.647705078125, 3.86669921875, 4.085693359375, 4.3046875, 4.523681640625, 4.74267578125, 4.961669921875, 5.1806640625, 5.399658203125, 5.61865234375, 5.837646484375, 6.056640625, 6.275634765625, 6.49462890625, 6.713623046875, 6.9326171875, 7.151611328125, 7.37060546875, 7.589599609375, 7.80859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 1.0, 5.0, 8.0, 4.0, 8.0, 12.0, 12.0, 14.0, 29.0, 35.0, 48.0, 68.0, 82.0, 99.0, 135.0, 112.0, 79.0, 52.0, 45.0, 30.0, 28.0, 12.0, 22.0, 14.0, 8.0, 8.0, 6.0, 8.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0030670166015625, -0.0029805004596710205, -0.002893984317779541, -0.0028074681758880615, -0.002720952033996582, -0.0026344358921051025, -0.002547919750213623, -0.0024614036083221436, -0.002374887466430664, -0.0022883713245391846, -0.002201855182647705, -0.0021153390407562256, -0.002028822898864746, -0.0019423067569732666, -0.0018557906150817871, -0.0017692744731903076, -0.0016827583312988281, -0.0015962421894073486, -0.0015097260475158691, -0.0014232099056243896, -0.0013366937637329102, -0.0012501776218414307, -0.0011636614799499512, -0.0010771453380584717, -0.0009906291961669922, -0.0009041130542755127, -0.0008175969123840332, -0.0007310807704925537, -0.0006445646286010742, -0.0005580484867095947, -0.00047153234481811523, -0.00038501620292663574, -0.00029850006103515625, -0.00021198391914367676, -0.00012546777725219727, -3.8951635360717773e-05, 4.756450653076172e-05, 0.0001340806484222412, 0.0002205967903137207, 0.0003071129322052002, 0.0003936290740966797, 0.0004801452159881592, 0.0005666613578796387, 0.0006531774997711182, 0.0007396936416625977, 0.0008262097835540771, 0.0009127259254455566, 0.0009992420673370361, 0.0010857582092285156, 0.0011722743511199951, 0.0012587904930114746, 0.001345306634902954, 0.0014318227767944336, 0.001518338918685913, 0.0016048550605773926, 0.001691371202468872, 0.0017778873443603516, 0.001864403486251831, 0.0019509196281433105, 0.00203743577003479, 0.0021239519119262695, 0.002210468053817749, 0.0022969841957092285, 0.002383500337600708, 0.0024700164794921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 6.0, 5.0, 8.0, 13.0, 22.0, 32.0, 38.0, 56.0, 85.0, 120.0, 175.0, 231.0, 337.0, 538.0, 709.0, 1204.0, 1912.0, 3128.0, 5291.0, 9407.0, 18284.0, 37906.0, 92937.0, 284961.0, 368469.0, 125288.0, 47848.0, 22115.0, 11466.0, 6249.0, 3480.0, 2174.0, 1318.0, 882.0, 548.0, 377.0, 296.0, 196.0, 123.0, 96.0, 60.0, 47.0, 34.0, 28.0, 19.0, 14.0, 6.0, 10.0, 3.0, 5.0, 1.0, 1.0, 1.0], "bins": [-3.146484375, -3.05694580078125, -2.9674072265625, -2.87786865234375, -2.788330078125, -2.69879150390625, -2.6092529296875, -2.51971435546875, -2.43017578125, -2.34063720703125, -2.2510986328125, -2.16156005859375, -2.072021484375, -1.98248291015625, -1.8929443359375, -1.80340576171875, -1.7138671875, -1.62432861328125, -1.5347900390625, -1.44525146484375, -1.355712890625, -1.26617431640625, -1.1766357421875, -1.08709716796875, -0.99755859375, -0.90802001953125, -0.8184814453125, -0.72894287109375, -0.639404296875, -0.54986572265625, -0.4603271484375, -0.37078857421875, -0.28125, -0.19171142578125, -0.1021728515625, -0.01263427734375, 0.076904296875, 0.16644287109375, 0.2559814453125, 0.34552001953125, 0.43505859375, 0.52459716796875, 0.6141357421875, 0.70367431640625, 0.793212890625, 0.88275146484375, 0.9722900390625, 1.06182861328125, 1.1513671875, 1.24090576171875, 1.3304443359375, 1.41998291015625, 1.509521484375, 1.59906005859375, 1.6885986328125, 1.77813720703125, 1.86767578125, 1.95721435546875, 2.0467529296875, 2.13629150390625, 2.225830078125, 2.31536865234375, 2.4049072265625, 2.49444580078125, 2.583984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 4.0, 4.0, 3.0, 4.0, 9.0, 15.0, 17.0, 18.0, 12.0, 28.0, 33.0, 30.0, 60.0, 69.0, 101.0, 90.0, 85.0, 79.0, 81.0, 49.0, 40.0, 35.0, 22.0, 14.0, 13.0, 18.0, 22.0, 11.0, 8.0, 5.0, 4.0, 2.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9072265625, -0.8797149658203125, -0.852203369140625, -0.8246917724609375, -0.79718017578125, -0.7696685791015625, -0.742156982421875, -0.7146453857421875, -0.6871337890625, -0.6596221923828125, -0.632110595703125, -0.6045989990234375, -0.57708740234375, -0.5495758056640625, -0.522064208984375, -0.4945526123046875, -0.467041015625, -0.4395294189453125, -0.412017822265625, -0.3845062255859375, -0.35699462890625, -0.3294830322265625, -0.301971435546875, -0.2744598388671875, -0.2469482421875, -0.2194366455078125, -0.191925048828125, -0.1644134521484375, -0.13690185546875, -0.1093902587890625, -0.081878662109375, -0.0543670654296875, -0.02685546875, 0.0006561279296875, 0.028167724609375, 0.0556793212890625, 0.08319091796875, 0.1107025146484375, 0.138214111328125, 0.1657257080078125, 0.1932373046875, 0.2207489013671875, 0.248260498046875, 0.2757720947265625, 0.30328369140625, 0.3307952880859375, 0.358306884765625, 0.3858184814453125, 0.413330078125, 0.4408416748046875, 0.468353271484375, 0.4958648681640625, 0.52337646484375, 0.5508880615234375, 0.578399658203125, 0.6059112548828125, 0.6334228515625, 0.6609344482421875, 0.688446044921875, 0.7159576416015625, 0.74346923828125, 0.7709808349609375, 0.798492431640625, 0.8260040283203125, 0.853515625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 8.0, 3.0, 4.0, 14.0, 14.0, 24.0, 20.0, 36.0, 34.0, 55.0, 78.0, 97.0, 98.0, 113.0, 105.0, 68.0, 55.0, 37.0, 37.0, 19.0, 19.0, 15.0, 14.0, 6.0, 7.0, 5.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.0177001953125, -71.4654769897461, -68.91324615478516, -66.36102294921875, -63.80879592895508, -61.256568908691406, -58.704341888427734, -56.15211486816406, -53.599891662597656, -51.047664642333984, -48.49543762207031, -45.943214416503906, -43.390987396240234, -40.83876037597656, -38.28653335571289, -35.73430633544922, -33.18207931518555, -30.629852294921875, -28.077627182006836, -25.525400161743164, -22.973175048828125, -20.420948028564453, -17.86872100830078, -15.316495895385742, -12.76426887512207, -10.212042808532715, -7.659816265106201, -5.1075897216796875, -2.555363655090332, -0.0031375885009765625, 2.5490894317626953, 5.101314544677734, 7.653541564941406, 10.205767631530762, 12.757993698120117, 15.310220718383789, 17.862445831298828, 20.4146728515625, 22.966899871826172, 25.51912498474121, 28.071352005004883, 30.623579025268555, 33.175804138183594, 35.728031158447266, 38.28025817871094, 40.832481384277344, 43.38471221923828, 45.93693542480469, 48.48916244506836, 51.04138946533203, 53.5936164855957, 56.145843505859375, 58.69806671142578, 61.25029373168945, 63.802520751953125, 66.35474395751953, 68.90697479248047, 71.45919799804688, 74.01142883300781, 76.56365203857422, 79.11588287353516, 81.66810607910156, 84.2203369140625, 86.7725601196289, 89.32478332519531]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 0.0, 6.0, 2.0, 6.0, 5.0, 5.0, 7.0, 11.0, 14.0, 19.0, 15.0, 17.0, 14.0, 18.0, 33.0, 42.0, 37.0, 45.0, 33.0, 51.0, 39.0, 46.0, 42.0, 36.0, 39.0, 52.0, 43.0, 37.0, 33.0, 28.0, 27.0, 24.0, 22.0, 23.0, 22.0, 17.0, 16.0, 21.0, 15.0, 6.0, 8.0, 5.0, 11.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.7095947265625, -49.992801666259766, -48.27600860595703, -46.5592155456543, -44.84242248535156, -43.12562942504883, -41.408836364746094, -39.69204330444336, -37.975250244140625, -36.25845718383789, -34.541664123535156, -32.82487106323242, -31.108078002929688, -29.391284942626953, -27.67449188232422, -25.957698822021484, -24.24090576171875, -22.524112701416016, -20.80731964111328, -19.090526580810547, -17.373733520507812, -15.656940460205078, -13.940147399902344, -12.22335433959961, -10.506561279296875, -8.78976821899414, -7.072975158691406, -5.356182098388672, -3.6393890380859375, -1.9225959777832031, -0.20580291748046875, 1.5109901428222656, 3.2277870178222656, 4.944580078125, 6.661373138427734, 8.378166198730469, 10.094959259033203, 11.811752319335938, 13.528545379638672, 15.245338439941406, 16.96213150024414, 18.678924560546875, 20.39571762084961, 22.112510681152344, 23.829303741455078, 25.546096801757812, 27.262889862060547, 28.97968292236328, 30.696475982666016, 32.41326904296875, 34.130062103271484, 35.84685516357422, 37.56364822387695, 39.28044128417969, 40.99723434448242, 42.714027404785156, 44.43082046508789, 46.147613525390625, 47.86440658569336, 49.581199645996094, 51.29799270629883, 53.01478576660156, 54.7315788269043, 56.44837188720703, 58.165164947509766]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 10.0, 9.0, 7.0, 14.0, 24.0, 41.0, 40.0, 72.0, 110.0, 146.0, 197.0, 302.0, 519.0, 841.0, 1245.0, 2151.0, 3449.0, 6096.0, 10942.0, 20134.0, 40966.0, 90703.0, 230498.0, 350087.0, 156873.0, 65342.0, 30976.0, 15804.0, 8525.0, 4897.0, 2757.0, 1731.0, 1065.0, 630.0, 435.0, 307.0, 190.0, 122.0, 86.0, 69.0, 39.0, 30.0, 27.0, 12.0, 18.0, 7.0, 2.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-89.875, -87.2548828125, -84.634765625, -82.0146484375, -79.39453125, -76.7744140625, -74.154296875, -71.5341796875, -68.9140625, -66.2939453125, -63.673828125, -61.0537109375, -58.43359375, -55.8134765625, -53.193359375, -50.5732421875, -47.953125, -45.3330078125, -42.712890625, -40.0927734375, -37.47265625, -34.8525390625, -32.232421875, -29.6123046875, -26.9921875, -24.3720703125, -21.751953125, -19.1318359375, -16.51171875, -13.8916015625, -11.271484375, -8.6513671875, -6.03125, -3.4111328125, -0.791015625, 1.8291015625, 4.44921875, 7.0693359375, 9.689453125, 12.3095703125, 14.9296875, 17.5498046875, 20.169921875, 22.7900390625, 25.41015625, 28.0302734375, 30.650390625, 33.2705078125, 35.890625, 38.5107421875, 41.130859375, 43.7509765625, 46.37109375, 48.9912109375, 51.611328125, 54.2314453125, 56.8515625, 59.4716796875, 62.091796875, 64.7119140625, 67.33203125, 69.9521484375, 72.572265625, 75.1923828125, 77.8125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 5.0, 5.0, 3.0, 3.0, 7.0, 7.0, 10.0, 10.0, 12.0, 15.0, 17.0, 15.0, 22.0, 24.0, 40.0, 33.0, 28.0, 43.0, 46.0, 45.0, 51.0, 44.0, 42.0, 40.0, 50.0, 47.0, 42.0, 33.0, 40.0, 24.0, 24.0, 17.0, 24.0, 14.0, 26.0, 16.0, 18.0, 16.0, 7.0, 7.0, 10.0, 5.0, 6.0, 4.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-54.90625, -53.15966796875, -51.4130859375, -49.66650390625, -47.919921875, -46.17333984375, -44.4267578125, -42.68017578125, -40.93359375, -39.18701171875, -37.4404296875, -35.69384765625, -33.947265625, -32.20068359375, -30.4541015625, -28.70751953125, -26.9609375, -25.21435546875, -23.4677734375, -21.72119140625, -19.974609375, -18.22802734375, -16.4814453125, -14.73486328125, -12.98828125, -11.24169921875, -9.4951171875, -7.74853515625, -6.001953125, -4.25537109375, -2.5087890625, -0.76220703125, 0.984375, 2.73095703125, 4.4775390625, 6.22412109375, 7.970703125, 9.71728515625, 11.4638671875, 13.21044921875, 14.95703125, 16.70361328125, 18.4501953125, 20.19677734375, 21.943359375, 23.68994140625, 25.4365234375, 27.18310546875, 28.9296875, 30.67626953125, 32.4228515625, 34.16943359375, 35.916015625, 37.66259765625, 39.4091796875, 41.15576171875, 42.90234375, 44.64892578125, 46.3955078125, 48.14208984375, 49.888671875, 51.63525390625, 53.3818359375, 55.12841796875, 56.875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 16.0, 18.0, 24.0, 43.0, 54.0, 67.0, 101.0, 153.0, 213.0, 313.0, 429.0, 582.0, 797.0, 1205.0, 1765.0, 2599.0, 3822.0, 6030.0, 9499.0, 14855.0, 24829.0, 42357.0, 75776.0, 148133.0, 270766.0, 204209.0, 101660.0, 54464.0, 31501.0, 18802.0, 11559.0, 7316.0, 4664.0, 3089.0, 2060.0, 1444.0, 992.0, 687.0, 482.0, 335.0, 259.0, 171.0, 121.0, 95.0, 62.0, 41.0, 40.0, 22.0, 13.0, 7.0, 7.0, 4.0, 3.0, 1.0, 4.0, 2.0], "bins": [-69.0, -66.8916015625, -64.783203125, -62.6748046875, -60.56640625, -58.4580078125, -56.349609375, -54.2412109375, -52.1328125, -50.0244140625, -47.916015625, -45.8076171875, -43.69921875, -41.5908203125, -39.482421875, -37.3740234375, -35.265625, -33.1572265625, -31.048828125, -28.9404296875, -26.83203125, -24.7236328125, -22.615234375, -20.5068359375, -18.3984375, -16.2900390625, -14.181640625, -12.0732421875, -9.96484375, -7.8564453125, -5.748046875, -3.6396484375, -1.53125, 0.5771484375, 2.685546875, 4.7939453125, 6.90234375, 9.0107421875, 11.119140625, 13.2275390625, 15.3359375, 17.4443359375, 19.552734375, 21.6611328125, 23.76953125, 25.8779296875, 27.986328125, 30.0947265625, 32.203125, 34.3115234375, 36.419921875, 38.5283203125, 40.63671875, 42.7451171875, 44.853515625, 46.9619140625, 49.0703125, 51.1787109375, 53.287109375, 55.3955078125, 57.50390625, 59.6123046875, 61.720703125, 63.8291015625, 65.9375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 1.0, 9.0, 3.0, 11.0, 17.0, 13.0, 15.0, 30.0, 21.0, 24.0, 20.0, 37.0, 34.0, 43.0, 38.0, 46.0, 32.0, 43.0, 51.0, 45.0, 42.0, 43.0, 39.0, 39.0, 35.0, 31.0, 27.0, 24.0, 26.0, 29.0, 23.0, 19.0, 13.0, 14.0, 7.0, 8.0, 8.0, 4.0, 5.0, 3.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-31.296875, -30.258056640625, -29.21923828125, -28.180419921875, -27.1416015625, -26.102783203125, -25.06396484375, -24.025146484375, -22.986328125, -21.947509765625, -20.90869140625, -19.869873046875, -18.8310546875, -17.792236328125, -16.75341796875, -15.714599609375, -14.67578125, -13.636962890625, -12.59814453125, -11.559326171875, -10.5205078125, -9.481689453125, -8.44287109375, -7.404052734375, -6.365234375, -5.326416015625, -4.28759765625, -3.248779296875, -2.2099609375, -1.171142578125, -0.13232421875, 0.906494140625, 1.9453125, 2.984130859375, 4.02294921875, 5.061767578125, 6.1005859375, 7.139404296875, 8.17822265625, 9.217041015625, 10.255859375, 11.294677734375, 12.33349609375, 13.372314453125, 14.4111328125, 15.449951171875, 16.48876953125, 17.527587890625, 18.56640625, 19.605224609375, 20.64404296875, 21.682861328125, 22.7216796875, 23.760498046875, 24.79931640625, 25.838134765625, 26.876953125, 27.915771484375, 28.95458984375, 29.993408203125, 31.0322265625, 32.071044921875, 33.10986328125, 34.148681640625, 35.1875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 6.0, 8.0, 13.0, 18.0, 27.0, 39.0, 75.0, 110.0, 142.0, 186.0, 289.0, 472.0, 644.0, 1091.0, 1557.0, 2546.0, 4299.0, 7424.0, 13200.0, 24625.0, 48574.0, 103069.0, 231129.0, 311932.0, 151716.0, 69418.0, 33698.0, 17848.0, 9842.0, 5394.0, 3314.0, 2096.0, 1295.0, 818.0, 551.0, 346.0, 242.0, 166.0, 111.0, 71.0, 49.0, 34.0, 24.0, 16.0, 12.0, 6.0, 7.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.953125, -22.2412109375, -21.529296875, -20.8173828125, -20.10546875, -19.3935546875, -18.681640625, -17.9697265625, -17.2578125, -16.5458984375, -15.833984375, -15.1220703125, -14.41015625, -13.6982421875, -12.986328125, -12.2744140625, -11.5625, -10.8505859375, -10.138671875, -9.4267578125, -8.71484375, -8.0029296875, -7.291015625, -6.5791015625, -5.8671875, -5.1552734375, -4.443359375, -3.7314453125, -3.01953125, -2.3076171875, -1.595703125, -0.8837890625, -0.171875, 0.5400390625, 1.251953125, 1.9638671875, 2.67578125, 3.3876953125, 4.099609375, 4.8115234375, 5.5234375, 6.2353515625, 6.947265625, 7.6591796875, 8.37109375, 9.0830078125, 9.794921875, 10.5068359375, 11.21875, 11.9306640625, 12.642578125, 13.3544921875, 14.06640625, 14.7783203125, 15.490234375, 16.2021484375, 16.9140625, 17.6259765625, 18.337890625, 19.0498046875, 19.76171875, 20.4736328125, 21.185546875, 21.8974609375, 22.609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 6.0, 2.0, 5.0, 7.0, 8.0, 13.0, 13.0, 17.0, 19.0, 23.0, 36.0, 66.0, 58.0, 92.0, 90.0, 126.0, 76.0, 61.0, 66.0, 52.0, 31.0, 19.0, 27.0, 19.0, 15.0, 11.0, 6.0, 9.0, 3.0, 4.0, 5.0, 1.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002597808837890625, -0.0025197267532348633, -0.0024416446685791016, -0.00236356258392334, -0.002285480499267578, -0.0022073984146118164, -0.0021293163299560547, -0.002051234245300293, -0.0019731521606445312, -0.0018950700759887695, -0.0018169879913330078, -0.001738905906677246, -0.0016608238220214844, -0.0015827417373657227, -0.001504659652709961, -0.0014265775680541992, -0.0013484954833984375, -0.0012704133987426758, -0.001192331314086914, -0.0011142492294311523, -0.0010361671447753906, -0.0009580850601196289, -0.0008800029754638672, -0.0008019208908081055, -0.0007238388061523438, -0.000645756721496582, -0.0005676746368408203, -0.0004895925521850586, -0.0004115104675292969, -0.00033342838287353516, -0.00025534629821777344, -0.00017726421356201172, -9.918212890625e-05, -2.110004425048828e-05, 5.698204040527344e-05, 0.00013506412506103516, 0.00021314620971679688, 0.0002912282943725586, 0.0003693103790283203, 0.00044739246368408203, 0.0005254745483398438, 0.0006035566329956055, 0.0006816387176513672, 0.0007597208023071289, 0.0008378028869628906, 0.0009158849716186523, 0.000993967056274414, 0.0010720491409301758, 0.0011501312255859375, 0.0012282133102416992, 0.001306295394897461, 0.0013843774795532227, 0.0014624595642089844, 0.001540541648864746, 0.0016186237335205078, 0.0016967058181762695, 0.0017747879028320312, 0.001852869987487793, 0.0019309520721435547, 0.0020090341567993164, 0.002087116241455078, 0.00216519832611084, 0.0022432804107666016, 0.0023213624954223633, 0.002399444580078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 1.0, 5.0, 6.0, 6.0, 4.0, 14.0, 15.0, 32.0, 32.0, 40.0, 48.0, 95.0, 90.0, 152.0, 222.0, 295.0, 413.0, 589.0, 933.0, 1524.0, 2370.0, 3967.0, 6747.0, 12311.0, 22781.0, 44619.0, 91834.0, 197118.0, 307393.0, 180473.0, 84442.0, 40751.0, 21095.0, 11157.0, 6588.0, 3805.0, 2301.0, 1464.0, 859.0, 584.0, 404.0, 272.0, 180.0, 153.0, 100.0, 67.0, 59.0, 48.0, 29.0, 25.0, 14.0, 10.0, 10.0, 5.0, 9.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-19.53125, -18.92919921875, -18.3271484375, -17.72509765625, -17.123046875, -16.52099609375, -15.9189453125, -15.31689453125, -14.71484375, -14.11279296875, -13.5107421875, -12.90869140625, -12.306640625, -11.70458984375, -11.1025390625, -10.50048828125, -9.8984375, -9.29638671875, -8.6943359375, -8.09228515625, -7.490234375, -6.88818359375, -6.2861328125, -5.68408203125, -5.08203125, -4.47998046875, -3.8779296875, -3.27587890625, -2.673828125, -2.07177734375, -1.4697265625, -0.86767578125, -0.265625, 0.33642578125, 0.9384765625, 1.54052734375, 2.142578125, 2.74462890625, 3.3466796875, 3.94873046875, 4.55078125, 5.15283203125, 5.7548828125, 6.35693359375, 6.958984375, 7.56103515625, 8.1630859375, 8.76513671875, 9.3671875, 9.96923828125, 10.5712890625, 11.17333984375, 11.775390625, 12.37744140625, 12.9794921875, 13.58154296875, 14.18359375, 14.78564453125, 15.3876953125, 15.98974609375, 16.591796875, 17.19384765625, 17.7958984375, 18.39794921875, 19.0]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 7.0, 11.0, 9.0, 11.0, 16.0, 20.0, 30.0, 29.0, 34.0, 43.0, 47.0, 70.0, 76.0, 84.0, 70.0, 73.0, 82.0, 59.0, 58.0, 37.0, 27.0, 23.0, 16.0, 14.0, 19.0, 12.0, 8.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.6640625, -6.45135498046875, -6.2386474609375, -6.02593994140625, -5.813232421875, -5.60052490234375, -5.3878173828125, -5.17510986328125, -4.96240234375, -4.74969482421875, -4.5369873046875, -4.32427978515625, -4.111572265625, -3.89886474609375, -3.6861572265625, -3.47344970703125, -3.2607421875, -3.04803466796875, -2.8353271484375, -2.62261962890625, -2.409912109375, -2.19720458984375, -1.9844970703125, -1.77178955078125, -1.55908203125, -1.34637451171875, -1.1336669921875, -0.92095947265625, -0.708251953125, -0.49554443359375, -0.2828369140625, -0.07012939453125, 0.142578125, 0.35528564453125, 0.5679931640625, 0.78070068359375, 0.993408203125, 1.20611572265625, 1.4188232421875, 1.63153076171875, 1.84423828125, 2.05694580078125, 2.2696533203125, 2.48236083984375, 2.695068359375, 2.90777587890625, 3.1204833984375, 3.33319091796875, 3.5458984375, 3.75860595703125, 3.9713134765625, 4.18402099609375, 4.396728515625, 4.60943603515625, 4.8221435546875, 5.03485107421875, 5.24755859375, 5.46026611328125, 5.6729736328125, 5.88568115234375, 6.098388671875, 6.31109619140625, 6.5238037109375, 6.73651123046875, 6.94921875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 0.0, 2.0, 5.0, 8.0, 9.0, 13.0, 13.0, 18.0, 24.0, 50.0, 40.0, 78.0, 103.0, 115.0, 109.0, 104.0, 85.0, 58.0, 40.0, 26.0, 31.0, 24.0, 14.0, 12.0, 11.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.49870300292969, -74.7408676147461, -71.9830322265625, -69.2251968383789, -66.46736145019531, -63.70952224731445, -60.951683044433594, -58.19384765625, -55.436012268066406, -52.67817687988281, -49.92034149169922, -47.16250228881836, -44.404666900634766, -41.64683151245117, -38.88899230957031, -36.13115692138672, -33.373321533203125, -30.61548614501953, -27.857648849487305, -25.099811553955078, -22.341976165771484, -19.58414077758789, -16.826303482055664, -14.068466186523438, -11.310630798339844, -8.552794456481934, -5.794958114624023, -3.0371217727661133, -0.2792854309082031, 2.478550910949707, 5.236387252807617, 7.994224548339844, 10.752067565917969, 13.509903907775879, 16.26774024963379, 19.025577545166016, 21.78341293334961, 24.541248321533203, 27.29908561706543, 30.056922912597656, 32.81475830078125, 35.572593688964844, 38.33042907714844, 41.0882682800293, 43.84610366821289, 46.603939056396484, 49.361778259277344, 52.11961364746094, 54.87744903564453, 57.635284423828125, 60.39311981201172, 63.15095901489258, 65.90879821777344, 68.66663360595703, 71.42446899414062, 74.18230438232422, 76.94013977050781, 79.6979751586914, 82.455810546875, 85.2136459350586, 87.97148132324219, 90.72932434082031, 93.4871597290039, 96.2449951171875, 99.0028305053711]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 5.0, 8.0, 6.0, 6.0, 6.0, 11.0, 10.0, 18.0, 14.0, 13.0, 15.0, 16.0, 25.0, 23.0, 34.0, 44.0, 42.0, 30.0, 42.0, 45.0, 42.0, 45.0, 45.0, 36.0, 43.0, 39.0, 35.0, 34.0, 28.0, 32.0, 24.0, 27.0, 17.0, 22.0, 21.0, 20.0, 15.0, 11.0, 11.0, 6.0, 3.0, 9.0, 7.0, 3.0, 2.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-53.536766052246094, -51.87102127075195, -50.20528030395508, -48.53953552246094, -46.87379455566406, -45.20804977416992, -43.54230499267578, -41.876564025878906, -40.21082305908203, -38.54507827758789, -36.879337310791016, -35.213592529296875, -33.5478515625, -31.88210678100586, -30.21636390686035, -28.550621032714844, -26.884876251220703, -25.219133377075195, -23.553390502929688, -21.887645721435547, -20.221904754638672, -18.55615997314453, -16.890417098999023, -15.224674224853516, -13.558931350708008, -11.8931884765625, -10.227445602416992, -8.561701774597168, -6.89595890045166, -5.230216026306152, -3.564472198486328, -1.8987293243408203, -0.23298263549804688, 1.43276047706604, 3.098503589630127, 4.764246940612793, 6.429989814758301, 8.095732688903809, 9.761476516723633, 11.42721939086914, 13.092962265014648, 14.758705139160156, 16.424448013305664, 18.090190887451172, 19.755935668945312, 21.421676635742188, 23.087421417236328, 24.753164291381836, 26.418907165527344, 28.08465003967285, 29.75039291381836, 31.4161376953125, 33.081878662109375, 34.747623443603516, 36.413368225097656, 38.07910919189453, 39.744850158691406, 41.41059494018555, 43.07633590698242, 44.74208068847656, 46.40782165527344, 48.07356643676758, 49.73931121826172, 51.405052185058594, 53.070796966552734]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 5.0, 11.0, 5.0, 15.0, 29.0, 23.0, 35.0, 70.0, 87.0, 119.0, 151.0, 236.0, 289.0, 440.0, 629.0, 904.0, 1241.0, 1882.0, 2686.0, 3940.0, 6084.0, 9984.0, 17171.0, 38349.0, 119400.0, 459895.0, 1670667.0, 1357458.0, 343094.0, 85731.0, 30357.0, 15307.0, 8928.0, 5921.0, 3915.0, 2643.0, 1902.0, 1328.0, 987.0, 663.0, 474.0, 342.0, 251.0, 183.0, 127.0, 98.0, 65.0, 47.0, 41.0, 24.0, 16.0, 12.0, 7.0, 6.0, 4.0, 6.0, 4.0], "bins": [-79.9375, -77.5791015625, -75.220703125, -72.8623046875, -70.50390625, -68.1455078125, -65.787109375, -63.4287109375, -61.0703125, -58.7119140625, -56.353515625, -53.9951171875, -51.63671875, -49.2783203125, -46.919921875, -44.5615234375, -42.203125, -39.8447265625, -37.486328125, -35.1279296875, -32.76953125, -30.4111328125, -28.052734375, -25.6943359375, -23.3359375, -20.9775390625, -18.619140625, -16.2607421875, -13.90234375, -11.5439453125, -9.185546875, -6.8271484375, -4.46875, -2.1103515625, 0.248046875, 2.6064453125, 4.96484375, 7.3232421875, 9.681640625, 12.0400390625, 14.3984375, 16.7568359375, 19.115234375, 21.4736328125, 23.83203125, 26.1904296875, 28.548828125, 30.9072265625, 33.265625, 35.6240234375, 37.982421875, 40.3408203125, 42.69921875, 45.0576171875, 47.416015625, 49.7744140625, 52.1328125, 54.4912109375, 56.849609375, 59.2080078125, 61.56640625, 63.9248046875, 66.283203125, 68.6416015625, 71.0]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 9.0, 8.0, 8.0, 5.0, 8.0, 7.0, 15.0, 13.0, 12.0, 17.0, 15.0, 27.0, 22.0, 23.0, 51.0, 34.0, 46.0, 33.0, 47.0, 38.0, 49.0, 52.0, 44.0, 39.0, 48.0, 41.0, 30.0, 33.0, 39.0, 25.0, 21.0, 17.0, 19.0, 18.0, 16.0, 15.0, 12.0, 10.0, 7.0, 6.0, 5.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-48.25, -46.75732421875, -45.2646484375, -43.77197265625, -42.279296875, -40.78662109375, -39.2939453125, -37.80126953125, -36.30859375, -34.81591796875, -33.3232421875, -31.83056640625, -30.337890625, -28.84521484375, -27.3525390625, -25.85986328125, -24.3671875, -22.87451171875, -21.3818359375, -19.88916015625, -18.396484375, -16.90380859375, -15.4111328125, -13.91845703125, -12.42578125, -10.93310546875, -9.4404296875, -7.94775390625, -6.455078125, -4.96240234375, -3.4697265625, -1.97705078125, -0.484375, 1.00830078125, 2.5009765625, 3.99365234375, 5.486328125, 6.97900390625, 8.4716796875, 9.96435546875, 11.45703125, 12.94970703125, 14.4423828125, 15.93505859375, 17.427734375, 18.92041015625, 20.4130859375, 21.90576171875, 23.3984375, 24.89111328125, 26.3837890625, 27.87646484375, 29.369140625, 30.86181640625, 32.3544921875, 33.84716796875, 35.33984375, 36.83251953125, 38.3251953125, 39.81787109375, 41.310546875, 42.80322265625, 44.2958984375, 45.78857421875, 47.28125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 8.0, 17.0, 22.0, 31.0, 26.0, 35.0, 81.0, 99.0, 158.0, 254.0, 341.0, 547.0, 834.0, 1227.0, 2133.0, 3408.0, 5598.0, 9726.0, 18011.0, 36415.0, 86317.0, 293724.0, 2051764.0, 1328752.0, 215736.0, 70236.0, 30996.0, 15668.0, 8924.0, 4976.0, 2950.0, 1865.0, 1169.0, 737.0, 471.0, 341.0, 208.0, 144.0, 114.0, 92.0, 38.0, 36.0, 21.0, 10.0, 8.0, 7.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.4375, -100.1943359375, -96.951171875, -93.7080078125, -90.46484375, -87.2216796875, -83.978515625, -80.7353515625, -77.4921875, -74.2490234375, -71.005859375, -67.7626953125, -64.51953125, -61.2763671875, -58.033203125, -54.7900390625, -51.546875, -48.3037109375, -45.060546875, -41.8173828125, -38.57421875, -35.3310546875, -32.087890625, -28.8447265625, -25.6015625, -22.3583984375, -19.115234375, -15.8720703125, -12.62890625, -9.3857421875, -6.142578125, -2.8994140625, 0.34375, 3.5869140625, 6.830078125, 10.0732421875, 13.31640625, 16.5595703125, 19.802734375, 23.0458984375, 26.2890625, 29.5322265625, 32.775390625, 36.0185546875, 39.26171875, 42.5048828125, 45.748046875, 48.9912109375, 52.234375, 55.4775390625, 58.720703125, 61.9638671875, 65.20703125, 68.4501953125, 71.693359375, 74.9365234375, 78.1796875, 81.4228515625, 84.666015625, 87.9091796875, 91.15234375, 94.3955078125, 97.638671875, 100.8818359375, 104.125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 9.0, 5.0, 14.0, 10.0, 15.0, 23.0, 19.0, 29.0, 45.0, 48.0, 65.0, 97.0, 118.0, 200.0, 311.0, 477.0, 681.0, 593.0, 437.0, 251.0, 176.0, 83.0, 84.0, 56.0, 56.0, 32.0, 36.0, 27.0, 12.0, 10.0, 8.0, 12.0, 7.0, 8.0, 2.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.9375, -25.037353515625, -24.13720703125, -23.237060546875, -22.3369140625, -21.436767578125, -20.53662109375, -19.636474609375, -18.736328125, -17.836181640625, -16.93603515625, -16.035888671875, -15.1357421875, -14.235595703125, -13.33544921875, -12.435302734375, -11.53515625, -10.635009765625, -9.73486328125, -8.834716796875, -7.9345703125, -7.034423828125, -6.13427734375, -5.234130859375, -4.333984375, -3.433837890625, -2.53369140625, -1.633544921875, -0.7333984375, 0.166748046875, 1.06689453125, 1.967041015625, 2.8671875, 3.767333984375, 4.66748046875, 5.567626953125, 6.4677734375, 7.367919921875, 8.26806640625, 9.168212890625, 10.068359375, 10.968505859375, 11.86865234375, 12.768798828125, 13.6689453125, 14.569091796875, 15.46923828125, 16.369384765625, 17.26953125, 18.169677734375, 19.06982421875, 19.969970703125, 20.8701171875, 21.770263671875, 22.67041015625, 23.570556640625, 24.470703125, 25.370849609375, 26.27099609375, 27.171142578125, 28.0712890625, 28.971435546875, 29.87158203125, 30.771728515625, 31.671875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 6.0, 7.0, 6.0, 7.0, 11.0, 16.0, 21.0, 29.0, 38.0, 58.0, 47.0, 78.0, 72.0, 105.0, 88.0, 106.0, 63.0, 47.0, 46.0, 36.0, 22.0, 18.0, 15.0, 7.0, 9.0, 7.0, 6.0, 11.0, 4.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.113773345947266, -49.06436538696289, -47.014957427978516, -44.96554946899414, -42.9161376953125, -40.866729736328125, -38.81732177734375, -36.767913818359375, -34.718505859375, -32.669097900390625, -30.61968994140625, -28.570280075073242, -26.520872116088867, -24.471464157104492, -22.422054290771484, -20.37264633178711, -18.323238372802734, -16.27383041381836, -14.224421501159668, -12.175012588500977, -10.125604629516602, -8.076196670532227, -6.026787757873535, -3.9773788452148438, -1.9279708862304688, 0.12143754959106445, 2.1708459854125977, 4.220254421234131, 6.269662857055664, 8.319070816040039, 10.36847972869873, 12.417888641357422, 14.467292785644531, 16.516700744628906, 18.56610870361328, 20.61551856994629, 22.664926528930664, 24.71433448791504, 26.763744354248047, 28.813152313232422, 30.862560272216797, 32.91196823120117, 34.96137619018555, 37.01078414916992, 39.06019592285156, 41.10960388183594, 43.15901184082031, 45.20841979980469, 47.25782775878906, 49.30723571777344, 51.35664367675781, 53.40605163574219, 55.45545959472656, 57.50486755371094, 59.55427932739258, 61.60368728637695, 63.65309524536133, 65.70250701904297, 67.75191497802734, 69.80132293701172, 71.8507308959961, 73.90013885498047, 75.94954681396484, 77.99895477294922, 80.0483627319336]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 5.0, 4.0, 7.0, 7.0, 10.0, 12.0, 11.0, 14.0, 13.0, 15.0, 18.0, 25.0, 32.0, 22.0, 25.0, 30.0, 41.0, 39.0, 48.0, 28.0, 41.0, 37.0, 38.0, 35.0, 41.0, 48.0, 46.0, 36.0, 23.0, 28.0, 22.0, 28.0, 25.0, 25.0, 15.0, 21.0, 9.0, 13.0, 12.0, 11.0, 4.0, 4.0, 8.0, 5.0, 5.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-46.545711517333984, -45.09880447387695, -43.65189743041992, -42.204986572265625, -40.758079528808594, -39.31117248535156, -37.86426544189453, -36.4173583984375, -34.97045135498047, -33.52354431152344, -32.076637268066406, -30.629728317260742, -29.18282127380371, -27.735912322998047, -26.289005279541016, -24.842098236083984, -23.39518928527832, -21.94828224182129, -20.501373291015625, -19.054466247558594, -17.607559204101562, -16.16065216064453, -14.713743209838867, -13.266836166381836, -11.819928169250488, -10.37302017211914, -8.92611312866211, -7.479205131530762, -6.032297611236572, -4.585390090942383, -3.138482093811035, -1.691575050354004, -0.24466705322265625, 1.2022405862808228, 2.6491482257843018, 4.09605598449707, 5.54296350479126, 6.989871025085449, 8.436779022216797, 9.883686065673828, 11.330594062805176, 12.777502059936523, 14.224409103393555, 15.671317100524902, 17.11822509765625, 18.56513214111328, 20.012039184570312, 21.458946228027344, 22.905855178833008, 24.35276222229004, 25.799671173095703, 27.246578216552734, 28.693485260009766, 30.140392303466797, 31.58730125427246, 33.034210205078125, 34.481117248535156, 35.92802429199219, 37.37493133544922, 38.82183837890625, 40.26874923706055, 41.71565628051758, 43.16256332397461, 44.60947036743164, 46.05637741088867]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 8.0, 21.0, 25.0, 38.0, 64.0, 103.0, 146.0, 224.0, 267.0, 438.0, 598.0, 873.0, 1366.0, 1955.0, 3010.0, 4458.0, 6704.0, 10614.0, 16668.0, 27408.0, 48098.0, 89532.0, 181472.0, 286326.0, 167579.0, 83517.0, 45485.0, 26361.0, 15884.0, 9951.0, 6469.0, 4164.0, 2863.0, 1889.0, 1273.0, 882.0, 566.0, 427.0, 258.0, 159.0, 137.0, 95.0, 63.0, 42.0, 22.0, 21.0, 10.0, 12.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.34375, -29.34716796875, -28.3505859375, -27.35400390625, -26.357421875, -25.36083984375, -24.3642578125, -23.36767578125, -22.37109375, -21.37451171875, -20.3779296875, -19.38134765625, -18.384765625, -17.38818359375, -16.3916015625, -15.39501953125, -14.3984375, -13.40185546875, -12.4052734375, -11.40869140625, -10.412109375, -9.41552734375, -8.4189453125, -7.42236328125, -6.42578125, -5.42919921875, -4.4326171875, -3.43603515625, -2.439453125, -1.44287109375, -0.4462890625, 0.55029296875, 1.546875, 2.54345703125, 3.5400390625, 4.53662109375, 5.533203125, 6.52978515625, 7.5263671875, 8.52294921875, 9.51953125, 10.51611328125, 11.5126953125, 12.50927734375, 13.505859375, 14.50244140625, 15.4990234375, 16.49560546875, 17.4921875, 18.48876953125, 19.4853515625, 20.48193359375, 21.478515625, 22.47509765625, 23.4716796875, 24.46826171875, 25.46484375, 26.46142578125, 27.4580078125, 28.45458984375, 29.451171875, 30.44775390625, 31.4443359375, 32.44091796875, 33.4375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 7.0, 3.0, 7.0, 8.0, 10.0, 14.0, 14.0, 16.0, 14.0, 26.0, 20.0, 22.0, 31.0, 22.0, 34.0, 33.0, 41.0, 48.0, 39.0, 42.0, 41.0, 51.0, 51.0, 52.0, 45.0, 28.0, 38.0, 20.0, 32.0, 19.0, 24.0, 23.0, 15.0, 21.0, 19.0, 4.0, 9.0, 11.0, 12.0, 0.0, 7.0, 5.0, 7.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-50.15625, -48.62353515625, -47.0908203125, -45.55810546875, -44.025390625, -42.49267578125, -40.9599609375, -39.42724609375, -37.89453125, -36.36181640625, -34.8291015625, -33.29638671875, -31.763671875, -30.23095703125, -28.6982421875, -27.16552734375, -25.6328125, -24.10009765625, -22.5673828125, -21.03466796875, -19.501953125, -17.96923828125, -16.4365234375, -14.90380859375, -13.37109375, -11.83837890625, -10.3056640625, -8.77294921875, -7.240234375, -5.70751953125, -4.1748046875, -2.64208984375, -1.109375, 0.42333984375, 1.9560546875, 3.48876953125, 5.021484375, 6.55419921875, 8.0869140625, 9.61962890625, 11.15234375, 12.68505859375, 14.2177734375, 15.75048828125, 17.283203125, 18.81591796875, 20.3486328125, 21.88134765625, 23.4140625, 24.94677734375, 26.4794921875, 28.01220703125, 29.544921875, 31.07763671875, 32.6103515625, 34.14306640625, 35.67578125, 37.20849609375, 38.7412109375, 40.27392578125, 41.806640625, 43.33935546875, 44.8720703125, 46.40478515625, 47.9375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 12.0, 6.0, 8.0, 12.0, 26.0, 36.0, 47.0, 47.0, 75.0, 92.0, 156.0, 224.0, 310.0, 439.0, 660.0, 979.0, 1412.0, 2182.0, 3259.0, 5399.0, 8749.0, 15760.0, 40602.0, 598207.0, 302423.0, 31726.0, 13823.0, 7839.0, 4822.0, 3073.0, 2022.0, 1310.0, 914.0, 596.0, 385.0, 276.0, 188.0, 152.0, 93.0, 60.0, 53.0, 32.0, 17.0, 9.0, 20.0, 11.0, 7.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.8125, -47.23291015625, -45.6533203125, -44.07373046875, -42.494140625, -40.91455078125, -39.3349609375, -37.75537109375, -36.17578125, -34.59619140625, -33.0166015625, -31.43701171875, -29.857421875, -28.27783203125, -26.6982421875, -25.11865234375, -23.5390625, -21.95947265625, -20.3798828125, -18.80029296875, -17.220703125, -15.64111328125, -14.0615234375, -12.48193359375, -10.90234375, -9.32275390625, -7.7431640625, -6.16357421875, -4.583984375, -3.00439453125, -1.4248046875, 0.15478515625, 1.734375, 3.31396484375, 4.8935546875, 6.47314453125, 8.052734375, 9.63232421875, 11.2119140625, 12.79150390625, 14.37109375, 15.95068359375, 17.5302734375, 19.10986328125, 20.689453125, 22.26904296875, 23.8486328125, 25.42822265625, 27.0078125, 28.58740234375, 30.1669921875, 31.74658203125, 33.326171875, 34.90576171875, 36.4853515625, 38.06494140625, 39.64453125, 41.22412109375, 42.8037109375, 44.38330078125, 45.962890625, 47.54248046875, 49.1220703125, 50.70166015625, 52.28125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 4.0, 5.0, 0.0, 6.0, 8.0, 9.0, 14.0, 7.0, 24.0, 17.0, 17.0, 13.0, 20.0, 24.0, 29.0, 29.0, 27.0, 37.0, 36.0, 24.0, 36.0, 39.0, 43.0, 41.0, 46.0, 43.0, 39.0, 37.0, 33.0, 29.0, 37.0, 30.0, 18.0, 24.0, 19.0, 18.0, 18.0, 11.0, 21.0, 14.0, 8.0, 11.0, 5.0, 7.0, 7.0, 6.0, 2.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-36.34375, -35.21142578125, -34.0791015625, -32.94677734375, -31.814453125, -30.68212890625, -29.5498046875, -28.41748046875, -27.28515625, -26.15283203125, -25.0205078125, -23.88818359375, -22.755859375, -21.62353515625, -20.4912109375, -19.35888671875, -18.2265625, -17.09423828125, -15.9619140625, -14.82958984375, -13.697265625, -12.56494140625, -11.4326171875, -10.30029296875, -9.16796875, -8.03564453125, -6.9033203125, -5.77099609375, -4.638671875, -3.50634765625, -2.3740234375, -1.24169921875, -0.109375, 1.02294921875, 2.1552734375, 3.28759765625, 4.419921875, 5.55224609375, 6.6845703125, 7.81689453125, 8.94921875, 10.08154296875, 11.2138671875, 12.34619140625, 13.478515625, 14.61083984375, 15.7431640625, 16.87548828125, 18.0078125, 19.14013671875, 20.2724609375, 21.40478515625, 22.537109375, 23.66943359375, 24.8017578125, 25.93408203125, 27.06640625, 28.19873046875, 29.3310546875, 30.46337890625, 31.595703125, 32.72802734375, 33.8603515625, 34.99267578125, 36.125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 5.0, 10.0, 10.0, 13.0, 19.0, 45.0, 59.0, 76.0, 139.0, 207.0, 344.0, 510.0, 883.0, 1723.0, 3089.0, 6628.0, 17092.0, 90258.0, 847303.0, 54581.0, 13704.0, 5571.0, 2687.0, 1476.0, 801.0, 480.0, 291.0, 170.0, 114.0, 91.0, 52.0, 41.0, 24.0, 15.0, 15.0, 8.0, 5.0, 3.0, 9.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.9453125, -3.830596923828125, -3.71588134765625, -3.601165771484375, -3.4864501953125, -3.371734619140625, -3.25701904296875, -3.142303466796875, -3.027587890625, -2.912872314453125, -2.79815673828125, -2.683441162109375, -2.5687255859375, -2.454010009765625, -2.33929443359375, -2.224578857421875, -2.10986328125, -1.995147705078125, -1.88043212890625, -1.765716552734375, -1.6510009765625, -1.536285400390625, -1.42156982421875, -1.306854248046875, -1.192138671875, -1.077423095703125, -0.96270751953125, -0.847991943359375, -0.7332763671875, -0.618560791015625, -0.50384521484375, -0.389129638671875, -0.2744140625, -0.159698486328125, -0.04498291015625, 0.069732666015625, 0.1844482421875, 0.299163818359375, 0.41387939453125, 0.528594970703125, 0.643310546875, 0.758026123046875, 0.87274169921875, 0.987457275390625, 1.1021728515625, 1.216888427734375, 1.33160400390625, 1.446319580078125, 1.56103515625, 1.675750732421875, 1.79046630859375, 1.905181884765625, 2.0198974609375, 2.134613037109375, 2.24932861328125, 2.364044189453125, 2.478759765625, 2.593475341796875, 2.70819091796875, 2.822906494140625, 2.9376220703125, 3.052337646484375, 3.16705322265625, 3.281768798828125, 3.396484375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 6.0, 4.0, 7.0, 6.0, 12.0, 4.0, 15.0, 22.0, 23.0, 44.0, 47.0, 83.0, 135.0, 184.0, 119.0, 72.0, 52.0, 32.0, 41.0, 26.0, 3.0, 11.0, 10.0, 15.0, 4.0, 1.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001567840576171875, -0.001516297459602356, -0.001464754343032837, -0.0014132112264633179, -0.0013616681098937988, -0.0013101249933242798, -0.0012585818767547607, -0.0012070387601852417, -0.0011554956436157227, -0.0011039525270462036, -0.0010524094104766846, -0.0010008662939071655, -0.0009493231773376465, -0.0008977800607681274, -0.0008462369441986084, -0.0007946938276290894, -0.0007431507110595703, -0.0006916075944900513, -0.0006400644779205322, -0.0005885213613510132, -0.0005369782447814941, -0.0004854351282119751, -0.00043389201164245605, -0.000382348895072937, -0.00033080577850341797, -0.0002792626619338989, -0.00022771954536437988, -0.00017617642879486084, -0.0001246333122253418, -7.309019565582275e-05, -2.154707908630371e-05, 2.9996037483215332e-05, 8.153915405273438e-05, 0.00013308227062225342, 0.00018462538719177246, 0.0002361685037612915, 0.00028771162033081055, 0.0003392547369003296, 0.00039079785346984863, 0.0004423409700393677, 0.0004938840866088867, 0.0005454272031784058, 0.0005969703197479248, 0.0006485134363174438, 0.0007000565528869629, 0.0007515996694564819, 0.000803142786026001, 0.00085468590259552, 0.0009062290191650391, 0.0009577721357345581, 0.0010093152523040771, 0.0010608583688735962, 0.0011124014854431152, 0.0011639446020126343, 0.0012154877185821533, 0.0012670308351516724, 0.0013185739517211914, 0.0013701170682907104, 0.0014216601848602295, 0.0014732033014297485, 0.0015247464179992676, 0.0015762895345687866, 0.0016278326511383057, 0.0016793757677078247, 0.0017309188842773438]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 9.0, 11.0, 13.0, 24.0, 33.0, 62.0, 90.0, 147.0, 217.0, 324.0, 485.0, 737.0, 1085.0, 1663.0, 2684.0, 4147.0, 7056.0, 12425.0, 22024.0, 43134.0, 94126.0, 241105.0, 342000.0, 143488.0, 61374.0, 30199.0, 16103.0, 9192.0, 5347.0, 3325.0, 2090.0, 1294.0, 844.0, 553.0, 393.0, 268.0, 178.0, 122.0, 79.0, 46.0, 23.0, 11.0, 18.0, 10.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.951171875, -1.8957977294921875, -1.840423583984375, -1.7850494384765625, -1.72967529296875, -1.6743011474609375, -1.618927001953125, -1.5635528564453125, -1.5081787109375, -1.4528045654296875, -1.397430419921875, -1.3420562744140625, -1.28668212890625, -1.2313079833984375, -1.175933837890625, -1.1205596923828125, -1.065185546875, -1.0098114013671875, -0.954437255859375, -0.8990631103515625, -0.84368896484375, -0.7883148193359375, -0.732940673828125, -0.6775665283203125, -0.6221923828125, -0.5668182373046875, -0.511444091796875, -0.4560699462890625, -0.40069580078125, -0.3453216552734375, -0.289947509765625, -0.2345733642578125, -0.17919921875, -0.1238250732421875, -0.068450927734375, -0.0130767822265625, 0.04229736328125, 0.0976715087890625, 0.153045654296875, 0.2084197998046875, 0.2637939453125, 0.3191680908203125, 0.374542236328125, 0.4299163818359375, 0.48529052734375, 0.5406646728515625, 0.596038818359375, 0.6514129638671875, 0.706787109375, 0.7621612548828125, 0.817535400390625, 0.8729095458984375, 0.92828369140625, 0.9836578369140625, 1.039031982421875, 1.0944061279296875, 1.1497802734375, 1.2051544189453125, 1.260528564453125, 1.3159027099609375, 1.37127685546875, 1.4266510009765625, 1.482025146484375, 1.5373992919921875, 1.5927734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 9.0, 9.0, 11.0, 14.0, 17.0, 25.0, 29.0, 21.0, 32.0, 26.0, 55.0, 69.0, 64.0, 77.0, 67.0, 76.0, 62.0, 60.0, 41.0, 55.0, 28.0, 28.0, 17.0, 14.0, 11.0, 11.0, 7.0, 8.0, 7.0, 5.0, 2.0, 7.0, 3.0, 3.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.470703125, -0.4547576904296875, -0.438812255859375, -0.4228668212890625, -0.40692138671875, -0.3909759521484375, -0.375030517578125, -0.3590850830078125, -0.3431396484375, -0.3271942138671875, -0.311248779296875, -0.2953033447265625, -0.27935791015625, -0.2634124755859375, -0.247467041015625, -0.2315216064453125, -0.215576171875, -0.1996307373046875, -0.183685302734375, -0.1677398681640625, -0.15179443359375, -0.1358489990234375, -0.119903564453125, -0.1039581298828125, -0.0880126953125, -0.0720672607421875, -0.056121826171875, -0.0401763916015625, -0.02423095703125, -0.0082855224609375, 0.007659912109375, 0.0236053466796875, 0.03955078125, 0.0554962158203125, 0.071441650390625, 0.0873870849609375, 0.10333251953125, 0.1192779541015625, 0.135223388671875, 0.1511688232421875, 0.1671142578125, 0.1830596923828125, 0.199005126953125, 0.2149505615234375, 0.23089599609375, 0.2468414306640625, 0.262786865234375, 0.2787322998046875, 0.294677734375, 0.3106231689453125, 0.326568603515625, 0.3425140380859375, 0.35845947265625, 0.3744049072265625, 0.390350341796875, 0.4062957763671875, 0.4222412109375, 0.4381866455078125, 0.454132080078125, 0.4700775146484375, 0.48602294921875, 0.5019683837890625, 0.517913818359375, 0.5338592529296875, 0.5498046875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 4.0, 6.0, 16.0, 13.0, 17.0, 25.0, 41.0, 43.0, 53.0, 49.0, 71.0, 85.0, 101.0, 85.0, 85.0, 77.0, 47.0, 41.0, 19.0, 20.0, 21.0, 12.0, 11.0, 7.0, 7.0, 8.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.05890655517578, -47.134620666503906, -45.21033477783203, -43.286048889160156, -41.361759185791016, -39.43747329711914, -37.513187408447266, -35.58890151977539, -33.66461181640625, -31.740325927734375, -29.816038131713867, -27.891752243041992, -25.967464447021484, -24.04317855834961, -22.118892669677734, -20.19460678100586, -18.270320892333984, -16.34603500366211, -14.421747207641602, -12.497461318969727, -10.573174476623535, -8.648887634277344, -6.724601745605469, -4.800314903259277, -2.876028060913086, -0.9517414569854736, 0.9725451469421387, 2.896831512451172, 4.821118354797363, 6.745405197143555, 8.66969108581543, 10.593977928161621, 12.518264770507812, 14.442551612854004, 16.366838455200195, 18.29112434387207, 20.215412139892578, 22.139698028564453, 24.063983917236328, 25.988269805908203, 27.91255760192871, 29.836843490600586, 31.761131286621094, 33.68541717529297, 35.609703063964844, 37.53398895263672, 39.458274841308594, 41.382564544677734, 43.30685043334961, 45.231136322021484, 47.15542221069336, 49.0797119140625, 51.003997802734375, 52.92828369140625, 54.852569580078125, 56.77685546875, 58.701141357421875, 60.62542724609375, 62.549713134765625, 64.4739990234375, 66.39828491210938, 68.32257080078125, 70.24685668945312, 72.17115020751953, 74.0954360961914]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 5.0, 4.0, 6.0, 9.0, 9.0, 11.0, 14.0, 15.0, 9.0, 16.0, 19.0, 25.0, 32.0, 24.0, 22.0, 32.0, 45.0, 35.0, 50.0, 27.0, 38.0, 35.0, 49.0, 33.0, 39.0, 50.0, 42.0, 32.0, 25.0, 31.0, 21.0, 31.0, 23.0, 22.0, 17.0, 18.0, 10.0, 14.0, 10.0, 13.0, 2.0, 7.0, 5.0, 6.0, 4.0, 4.0, 6.0, 3.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0], "bins": [-45.38300323486328, -43.97460174560547, -42.56620407104492, -41.15780258178711, -39.74940490722656, -38.34100341796875, -36.93260192871094, -35.52420425415039, -34.115806579589844, -32.70740509033203, -31.299007415771484, -29.890605926513672, -28.482208251953125, -27.073806762695312, -25.665407180786133, -24.257007598876953, -22.84860610961914, -21.44020652770996, -20.03180694580078, -18.62340545654297, -17.215007781982422, -15.806607246398926, -14.39820671081543, -12.98980712890625, -11.58140754699707, -10.17300796508789, -8.764608383178711, -7.356207847595215, -5.947808265686035, -4.5394086837768555, -3.1310081481933594, -1.7226085662841797, -0.314208984375, 1.0941908359527588, 2.5025906562805176, 3.9109907150268555, 5.319390296936035, 6.727789878845215, 8.136190414428711, 9.54458999633789, 10.95298957824707, 12.36138916015625, 13.76978874206543, 15.178189277648926, 16.586589813232422, 17.99498748779297, 19.40338897705078, 20.81178855895996, 22.22018814086914, 23.62858772277832, 25.0369873046875, 26.445388793945312, 27.85378646850586, 29.262187957763672, 30.67058753967285, 32.07898712158203, 33.487388610839844, 34.895790100097656, 36.3041877746582, 37.712589263916016, 39.12098693847656, 40.529388427734375, 41.93778991699219, 43.346187591552734, 44.75458526611328]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 13.0, 14.0, 22.0, 23.0, 29.0, 49.0, 73.0, 121.0, 161.0, 257.0, 369.0, 520.0, 763.0, 1171.0, 1785.0, 2876.0, 4437.0, 7131.0, 11923.0, 20813.0, 38368.0, 76848.0, 169996.0, 314269.0, 202439.0, 90743.0, 44412.0, 23646.0, 13419.0, 7987.0, 4952.0, 3019.0, 1987.0, 1273.0, 868.0, 551.0, 408.0, 240.0, 172.0, 128.0, 87.0, 61.0, 43.0, 30.0, 18.0, 20.0, 9.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.6875, -63.609375, -61.53125, -59.453125, -57.375, -55.296875, -53.21875, -51.140625, -49.0625, -46.984375, -44.90625, -42.828125, -40.75, -38.671875, -36.59375, -34.515625, -32.4375, -30.359375, -28.28125, -26.203125, -24.125, -22.046875, -19.96875, -17.890625, -15.8125, -13.734375, -11.65625, -9.578125, -7.5, -5.421875, -3.34375, -1.265625, 0.8125, 2.890625, 4.96875, 7.046875, 9.125, 11.203125, 13.28125, 15.359375, 17.4375, 19.515625, 21.59375, 23.671875, 25.75, 27.828125, 29.90625, 31.984375, 34.0625, 36.140625, 38.21875, 40.296875, 42.375, 44.453125, 46.53125, 48.609375, 50.6875, 52.765625, 54.84375, 56.921875, 59.0, 61.078125, 63.15625, 65.234375, 67.3125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 5.0, 6.0, 8.0, 9.0, 14.0, 14.0, 12.0, 15.0, 13.0, 30.0, 29.0, 19.0, 25.0, 40.0, 40.0, 41.0, 48.0, 38.0, 34.0, 50.0, 43.0, 45.0, 39.0, 60.0, 37.0, 40.0, 22.0, 27.0, 26.0, 21.0, 20.0, 19.0, 16.0, 17.0, 15.0, 7.0, 7.0, 7.0, 3.0, 5.0, 4.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-47.90625, -46.44677734375, -44.9873046875, -43.52783203125, -42.068359375, -40.60888671875, -39.1494140625, -37.68994140625, -36.23046875, -34.77099609375, -33.3115234375, -31.85205078125, -30.392578125, -28.93310546875, -27.4736328125, -26.01416015625, -24.5546875, -23.09521484375, -21.6357421875, -20.17626953125, -18.716796875, -17.25732421875, -15.7978515625, -14.33837890625, -12.87890625, -11.41943359375, -9.9599609375, -8.50048828125, -7.041015625, -5.58154296875, -4.1220703125, -2.66259765625, -1.203125, 0.25634765625, 1.7158203125, 3.17529296875, 4.634765625, 6.09423828125, 7.5537109375, 9.01318359375, 10.47265625, 11.93212890625, 13.3916015625, 14.85107421875, 16.310546875, 17.77001953125, 19.2294921875, 20.68896484375, 22.1484375, 23.60791015625, 25.0673828125, 26.52685546875, 27.986328125, 29.44580078125, 30.9052734375, 32.36474609375, 33.82421875, 35.28369140625, 36.7431640625, 38.20263671875, 39.662109375, 41.12158203125, 42.5810546875, 44.04052734375, 45.5]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 8.0, 5.0, 19.0, 31.0, 38.0, 60.0, 82.0, 144.0, 215.0, 302.0, 436.0, 628.0, 1019.0, 1491.0, 2362.0, 3954.0, 6219.0, 10073.0, 17239.0, 29389.0, 53034.0, 98802.0, 194391.0, 270292.0, 163985.0, 84473.0, 45533.0, 25556.0, 14862.0, 8885.0, 5315.0, 3459.0, 2128.0, 1378.0, 931.0, 629.0, 405.0, 264.0, 190.0, 101.0, 83.0, 44.0, 25.0, 29.0, 19.0, 12.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-64.0625, -62.0205078125, -59.978515625, -57.9365234375, -55.89453125, -53.8525390625, -51.810546875, -49.7685546875, -47.7265625, -45.6845703125, -43.642578125, -41.6005859375, -39.55859375, -37.5166015625, -35.474609375, -33.4326171875, -31.390625, -29.3486328125, -27.306640625, -25.2646484375, -23.22265625, -21.1806640625, -19.138671875, -17.0966796875, -15.0546875, -13.0126953125, -10.970703125, -8.9287109375, -6.88671875, -4.8447265625, -2.802734375, -0.7607421875, 1.28125, 3.3232421875, 5.365234375, 7.4072265625, 9.44921875, 11.4912109375, 13.533203125, 15.5751953125, 17.6171875, 19.6591796875, 21.701171875, 23.7431640625, 25.78515625, 27.8271484375, 29.869140625, 31.9111328125, 33.953125, 35.9951171875, 38.037109375, 40.0791015625, 42.12109375, 44.1630859375, 46.205078125, 48.2470703125, 50.2890625, 52.3310546875, 54.373046875, 56.4150390625, 58.45703125, 60.4990234375, 62.541015625, 64.5830078125, 66.625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 4.0, 9.0, 9.0, 10.0, 10.0, 19.0, 16.0, 25.0, 21.0, 38.0, 32.0, 36.0, 34.0, 28.0, 47.0, 41.0, 47.0, 34.0, 44.0, 52.0, 45.0, 29.0, 40.0, 40.0, 33.0, 37.0, 35.0, 24.0, 26.0, 27.0, 16.0, 17.0, 12.0, 9.0, 8.0, 7.0, 6.0, 5.0, 2.0, 3.0, 4.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.90625, -29.94970703125, -28.9931640625, -28.03662109375, -27.080078125, -26.12353515625, -25.1669921875, -24.21044921875, -23.25390625, -22.29736328125, -21.3408203125, -20.38427734375, -19.427734375, -18.47119140625, -17.5146484375, -16.55810546875, -15.6015625, -14.64501953125, -13.6884765625, -12.73193359375, -11.775390625, -10.81884765625, -9.8623046875, -8.90576171875, -7.94921875, -6.99267578125, -6.0361328125, -5.07958984375, -4.123046875, -3.16650390625, -2.2099609375, -1.25341796875, -0.296875, 0.65966796875, 1.6162109375, 2.57275390625, 3.529296875, 4.48583984375, 5.4423828125, 6.39892578125, 7.35546875, 8.31201171875, 9.2685546875, 10.22509765625, 11.181640625, 12.13818359375, 13.0947265625, 14.05126953125, 15.0078125, 15.96435546875, 16.9208984375, 17.87744140625, 18.833984375, 19.79052734375, 20.7470703125, 21.70361328125, 22.66015625, 23.61669921875, 24.5732421875, 25.52978515625, 26.486328125, 27.44287109375, 28.3994140625, 29.35595703125, 30.3125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 6.0, 5.0, 6.0, 18.0, 26.0, 25.0, 57.0, 94.0, 122.0, 183.0, 276.0, 541.0, 851.0, 1485.0, 2746.0, 5031.0, 9630.0, 19718.0, 45165.0, 116411.0, 338007.0, 318268.0, 108346.0, 42627.0, 18830.0, 9125.0, 4763.0, 2507.0, 1455.0, 843.0, 542.0, 311.0, 207.0, 106.0, 81.0, 50.0, 36.0, 24.0, 15.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-29.546875, -28.62255859375, -27.6982421875, -26.77392578125, -25.849609375, -24.92529296875, -24.0009765625, -23.07666015625, -22.15234375, -21.22802734375, -20.3037109375, -19.37939453125, -18.455078125, -17.53076171875, -16.6064453125, -15.68212890625, -14.7578125, -13.83349609375, -12.9091796875, -11.98486328125, -11.060546875, -10.13623046875, -9.2119140625, -8.28759765625, -7.36328125, -6.43896484375, -5.5146484375, -4.59033203125, -3.666015625, -2.74169921875, -1.8173828125, -0.89306640625, 0.03125, 0.95556640625, 1.8798828125, 2.80419921875, 3.728515625, 4.65283203125, 5.5771484375, 6.50146484375, 7.42578125, 8.35009765625, 9.2744140625, 10.19873046875, 11.123046875, 12.04736328125, 12.9716796875, 13.89599609375, 14.8203125, 15.74462890625, 16.6689453125, 17.59326171875, 18.517578125, 19.44189453125, 20.3662109375, 21.29052734375, 22.21484375, 23.13916015625, 24.0634765625, 24.98779296875, 25.912109375, 26.83642578125, 27.7607421875, 28.68505859375, 29.609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 9.0, 1.0, 10.0, 12.0, 7.0, 12.0, 15.0, 19.0, 22.0, 33.0, 53.0, 60.0, 106.0, 125.0, 114.0, 105.0, 81.0, 52.0, 52.0, 37.0, 16.0, 14.0, 5.0, 10.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028018951416015625, -0.0027174949645996094, -0.0026330947875976562, -0.002548694610595703, -0.00246429443359375, -0.002379894256591797, -0.0022954940795898438, -0.0022110939025878906, -0.0021266937255859375, -0.0020422935485839844, -0.0019578933715820312, -0.0018734931945800781, -0.001789093017578125, -0.0017046928405761719, -0.0016202926635742188, -0.0015358924865722656, -0.0014514923095703125, -0.0013670921325683594, -0.0012826919555664062, -0.0011982917785644531, -0.0011138916015625, -0.0010294914245605469, -0.0009450912475585938, -0.0008606910705566406, -0.0007762908935546875, -0.0006918907165527344, -0.0006074905395507812, -0.0005230903625488281, -0.000438690185546875, -0.0003542900085449219, -0.00026988983154296875, -0.00018548965454101562, -0.0001010894775390625, -1.6689300537109375e-05, 6.771087646484375e-05, 0.00015211105346679688, 0.00023651123046875, 0.0003209114074707031, 0.00040531158447265625, 0.0004897117614746094, 0.0005741119384765625, 0.0006585121154785156, 0.0007429122924804688, 0.0008273124694824219, 0.000911712646484375, 0.0009961128234863281, 0.0010805130004882812, 0.0011649131774902344, 0.0012493133544921875, 0.0013337135314941406, 0.0014181137084960938, 0.0015025138854980469, 0.0015869140625, 0.0016713142395019531, 0.0017557144165039062, 0.0018401145935058594, 0.0019245147705078125, 0.0020089149475097656, 0.0020933151245117188, 0.002177715301513672, 0.002262115478515625, 0.002346515655517578, 0.0024309158325195312, 0.0025153160095214844, 0.0025997161865234375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 10.0, 20.0, 25.0, 22.0, 32.0, 54.0, 73.0, 110.0, 180.0, 255.0, 391.0, 585.0, 909.0, 1467.0, 2336.0, 3798.0, 6491.0, 11101.0, 19807.0, 37407.0, 74294.0, 157066.0, 287984.0, 223804.0, 105806.0, 51425.0, 26989.0, 14645.0, 8559.0, 4814.0, 2953.0, 1865.0, 1163.0, 701.0, 463.0, 285.0, 219.0, 145.0, 101.0, 65.0, 41.0, 36.0, 18.0, 13.0, 7.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 3.0], "bins": [-21.28125, -20.668701171875, -20.05615234375, -19.443603515625, -18.8310546875, -18.218505859375, -17.60595703125, -16.993408203125, -16.380859375, -15.768310546875, -15.15576171875, -14.543212890625, -13.9306640625, -13.318115234375, -12.70556640625, -12.093017578125, -11.48046875, -10.867919921875, -10.25537109375, -9.642822265625, -9.0302734375, -8.417724609375, -7.80517578125, -7.192626953125, -6.580078125, -5.967529296875, -5.35498046875, -4.742431640625, -4.1298828125, -3.517333984375, -2.90478515625, -2.292236328125, -1.6796875, -1.067138671875, -0.45458984375, 0.157958984375, 0.7705078125, 1.383056640625, 1.99560546875, 2.608154296875, 3.220703125, 3.833251953125, 4.44580078125, 5.058349609375, 5.6708984375, 6.283447265625, 6.89599609375, 7.508544921875, 8.12109375, 8.733642578125, 9.34619140625, 9.958740234375, 10.5712890625, 11.183837890625, 11.79638671875, 12.408935546875, 13.021484375, 13.634033203125, 14.24658203125, 14.859130859375, 15.4716796875, 16.084228515625, 16.69677734375, 17.309326171875, 17.921875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 6.0, 7.0, 9.0, 12.0, 19.0, 19.0, 41.0, 23.0, 37.0, 49.0, 39.0, 50.0, 56.0, 69.0, 74.0, 62.0, 60.0, 58.0, 47.0, 51.0, 35.0, 26.0, 35.0, 23.0, 21.0, 18.0, 9.0, 14.0, 10.0, 5.0, 4.0, 5.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.22265625, -6.0164794921875, -5.810302734375, -5.6041259765625, -5.39794921875, -5.1917724609375, -4.985595703125, -4.7794189453125, -4.5732421875, -4.3670654296875, -4.160888671875, -3.9547119140625, -3.74853515625, -3.5423583984375, -3.336181640625, -3.1300048828125, -2.923828125, -2.7176513671875, -2.511474609375, -2.3052978515625, -2.09912109375, -1.8929443359375, -1.686767578125, -1.4805908203125, -1.2744140625, -1.0682373046875, -0.862060546875, -0.6558837890625, -0.44970703125, -0.2435302734375, -0.037353515625, 0.1688232421875, 0.375, 0.5811767578125, 0.787353515625, 0.9935302734375, 1.19970703125, 1.4058837890625, 1.612060546875, 1.8182373046875, 2.0244140625, 2.2305908203125, 2.436767578125, 2.6429443359375, 2.84912109375, 3.0552978515625, 3.261474609375, 3.4676513671875, 3.673828125, 3.8800048828125, 4.086181640625, 4.2923583984375, 4.49853515625, 4.7047119140625, 4.910888671875, 5.1170654296875, 5.3232421875, 5.5294189453125, 5.735595703125, 5.9417724609375, 6.14794921875, 6.3541259765625, 6.560302734375, 6.7664794921875, 6.97265625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 7.0, 13.0, 14.0, 19.0, 23.0, 31.0, 30.0, 43.0, 47.0, 70.0, 61.0, 76.0, 80.0, 80.0, 78.0, 66.0, 48.0, 46.0, 34.0, 20.0, 18.0, 22.0, 12.0, 10.0, 9.0, 2.0, 5.0, 6.0, 7.0, 6.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-46.28619384765625, -44.47490310668945, -42.663612365722656, -40.85232162475586, -39.04103088378906, -37.229740142822266, -35.41844940185547, -33.60715866088867, -31.795867919921875, -29.984577178955078, -28.17328643798828, -26.361995697021484, -24.550704956054688, -22.73941421508789, -20.928123474121094, -19.116832733154297, -17.305543899536133, -15.494253158569336, -13.682962417602539, -11.871671676635742, -10.060380935668945, -8.249091148376465, -6.437800407409668, -4.626509666442871, -2.815218925476074, -1.003928303718567, 0.8073623180389404, 2.618652820587158, 4.429943561553955, 6.241233825683594, 8.05252456665039, 9.863815307617188, 11.675106048583984, 13.486396789550781, 15.297687530517578, 17.108978271484375, 18.920269012451172, 20.73155975341797, 22.542850494384766, 24.354141235351562, 26.16543197631836, 27.976722717285156, 29.788013458251953, 31.59930419921875, 33.41059494018555, 35.221885681152344, 37.03317642211914, 38.84446716308594, 40.65575408935547, 42.467044830322266, 44.27833557128906, 46.08962631225586, 47.900917053222656, 49.71220779418945, 51.52349853515625, 53.33478927612305, 55.146080017089844, 56.95737075805664, 58.76866149902344, 60.579952239990234, 62.39124298095703, 64.20252990722656, 66.01382446289062, 67.82511138916016, 69.63640594482422]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 4.0, 10.0, 11.0, 12.0, 14.0, 22.0, 16.0, 21.0, 24.0, 23.0, 22.0, 26.0, 31.0, 38.0, 41.0, 37.0, 31.0, 33.0, 47.0, 30.0, 50.0, 28.0, 41.0, 50.0, 36.0, 38.0, 32.0, 31.0, 21.0, 20.0, 25.0, 17.0, 19.0, 11.0, 7.0, 18.0, 9.0, 6.0, 11.0, 6.0, 9.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-45.57964324951172, -44.09043502807617, -42.601226806640625, -41.11201858520508, -39.62281036376953, -38.133602142333984, -36.64439392089844, -35.15518569946289, -33.665977478027344, -32.1767692565918, -30.68756103515625, -29.198352813720703, -27.709144592285156, -26.21993637084961, -24.730728149414062, -23.241519927978516, -21.75231170654297, -20.263103485107422, -18.773895263671875, -17.284687042236328, -15.795478820800781, -14.306270599365234, -12.817062377929688, -11.32785415649414, -9.838645935058594, -8.349437713623047, -6.8602294921875, -5.371021270751953, -3.8818130493164062, -2.3926048278808594, -0.9033966064453125, 0.5858116149902344, 2.0750198364257812, 3.564228057861328, 5.053436279296875, 6.542644500732422, 8.031852722167969, 9.521060943603516, 11.010269165039062, 12.49947738647461, 13.988685607910156, 15.477893829345703, 16.96710205078125, 18.456310272216797, 19.945518493652344, 21.43472671508789, 22.923934936523438, 24.413143157958984, 25.90235137939453, 27.391559600830078, 28.880767822265625, 30.369976043701172, 31.85918426513672, 33.348392486572266, 34.83760070800781, 36.32680892944336, 37.816017150878906, 39.30522537231445, 40.79443359375, 42.28364181518555, 43.772850036621094, 45.26205825805664, 46.75126647949219, 48.240474700927734, 49.72968292236328]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 3.0, 9.0, 16.0, 22.0, 29.0, 45.0, 53.0, 84.0, 96.0, 172.0, 284.0, 414.0, 585.0, 897.0, 1299.0, 2154.0, 3219.0, 5348.0, 9672.0, 19459.0, 54626.0, 259882.0, 1364810.0, 1924529.0, 418698.0, 76868.0, 23226.0, 10986.0, 6048.0, 3631.0, 2318.0, 1558.0, 1061.0, 670.0, 467.0, 300.0, 232.0, 172.0, 103.0, 70.0, 46.0, 34.0, 27.0, 24.0, 11.0, 4.0, 13.0, 7.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-82.875, -80.3740234375, -77.873046875, -75.3720703125, -72.87109375, -70.3701171875, -67.869140625, -65.3681640625, -62.8671875, -60.3662109375, -57.865234375, -55.3642578125, -52.86328125, -50.3623046875, -47.861328125, -45.3603515625, -42.859375, -40.3583984375, -37.857421875, -35.3564453125, -32.85546875, -30.3544921875, -27.853515625, -25.3525390625, -22.8515625, -20.3505859375, -17.849609375, -15.3486328125, -12.84765625, -10.3466796875, -7.845703125, -5.3447265625, -2.84375, -0.3427734375, 2.158203125, 4.6591796875, 7.16015625, 9.6611328125, 12.162109375, 14.6630859375, 17.1640625, 19.6650390625, 22.166015625, 24.6669921875, 27.16796875, 29.6689453125, 32.169921875, 34.6708984375, 37.171875, 39.6728515625, 42.173828125, 44.6748046875, 47.17578125, 49.6767578125, 52.177734375, 54.6787109375, 57.1796875, 59.6806640625, 62.181640625, 64.6826171875, 67.18359375, 69.6845703125, 72.185546875, 74.6865234375, 77.1875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 5.0, 7.0, 5.0, 10.0, 13.0, 20.0, 14.0, 9.0, 23.0, 23.0, 18.0, 19.0, 18.0, 28.0, 46.0, 29.0, 32.0, 43.0, 31.0, 50.0, 46.0, 28.0, 41.0, 51.0, 40.0, 49.0, 32.0, 37.0, 29.0, 35.0, 26.0, 19.0, 20.0, 14.0, 14.0, 12.0, 7.0, 14.0, 7.0, 9.0, 7.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.71875, -36.4296875, -35.140625, -33.8515625, -32.5625, -31.2734375, -29.984375, -28.6953125, -27.40625, -26.1171875, -24.828125, -23.5390625, -22.25, -20.9609375, -19.671875, -18.3828125, -17.09375, -15.8046875, -14.515625, -13.2265625, -11.9375, -10.6484375, -9.359375, -8.0703125, -6.78125, -5.4921875, -4.203125, -2.9140625, -1.625, -0.3359375, 0.953125, 2.2421875, 3.53125, 4.8203125, 6.109375, 7.3984375, 8.6875, 9.9765625, 11.265625, 12.5546875, 13.84375, 15.1328125, 16.421875, 17.7109375, 19.0, 20.2890625, 21.578125, 22.8671875, 24.15625, 25.4453125, 26.734375, 28.0234375, 29.3125, 30.6015625, 31.890625, 33.1796875, 34.46875, 35.7578125, 37.046875, 38.3359375, 39.625, 40.9140625, 42.203125, 43.4921875, 44.78125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 10.0, 13.0, 13.0, 20.0, 32.0, 29.0, 53.0, 80.0, 109.0, 139.0, 247.0, 319.0, 528.0, 723.0, 1200.0, 1995.0, 3363.0, 5920.0, 11272.0, 23008.0, 53835.0, 158527.0, 787917.0, 2525035.0, 431163.0, 108627.0, 40480.0, 18090.0, 9063.0, 4876.0, 2872.0, 1669.0, 1021.0, 655.0, 425.0, 303.0, 197.0, 123.0, 104.0, 76.0, 31.0, 39.0, 21.0, 16.0, 9.0, 13.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-92.0, -88.9677734375, -85.935546875, -82.9033203125, -79.87109375, -76.8388671875, -73.806640625, -70.7744140625, -67.7421875, -64.7099609375, -61.677734375, -58.6455078125, -55.61328125, -52.5810546875, -49.548828125, -46.5166015625, -43.484375, -40.4521484375, -37.419921875, -34.3876953125, -31.35546875, -28.3232421875, -25.291015625, -22.2587890625, -19.2265625, -16.1943359375, -13.162109375, -10.1298828125, -7.09765625, -4.0654296875, -1.033203125, 1.9990234375, 5.03125, 8.0634765625, 11.095703125, 14.1279296875, 17.16015625, 20.1923828125, 23.224609375, 26.2568359375, 29.2890625, 32.3212890625, 35.353515625, 38.3857421875, 41.41796875, 44.4501953125, 47.482421875, 50.5146484375, 53.546875, 56.5791015625, 59.611328125, 62.6435546875, 65.67578125, 68.7080078125, 71.740234375, 74.7724609375, 77.8046875, 80.8369140625, 83.869140625, 86.9013671875, 89.93359375, 92.9658203125, 95.998046875, 99.0302734375, 102.0625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 6.0, 8.0, 13.0, 11.0, 13.0, 21.0, 32.0, 58.0, 50.0, 89.0, 111.0, 185.0, 293.0, 470.0, 688.0, 672.0, 457.0, 269.0, 161.0, 139.0, 81.0, 66.0, 48.0, 34.0, 19.0, 20.0, 10.0, 14.0, 7.0, 9.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.28125, -20.3935546875, -19.505859375, -18.6181640625, -17.73046875, -16.8427734375, -15.955078125, -15.0673828125, -14.1796875, -13.2919921875, -12.404296875, -11.5166015625, -10.62890625, -9.7412109375, -8.853515625, -7.9658203125, -7.078125, -6.1904296875, -5.302734375, -4.4150390625, -3.52734375, -2.6396484375, -1.751953125, -0.8642578125, 0.0234375, 0.9111328125, 1.798828125, 2.6865234375, 3.57421875, 4.4619140625, 5.349609375, 6.2373046875, 7.125, 8.0126953125, 8.900390625, 9.7880859375, 10.67578125, 11.5634765625, 12.451171875, 13.3388671875, 14.2265625, 15.1142578125, 16.001953125, 16.8896484375, 17.77734375, 18.6650390625, 19.552734375, 20.4404296875, 21.328125, 22.2158203125, 23.103515625, 23.9912109375, 24.87890625, 25.7666015625, 26.654296875, 27.5419921875, 28.4296875, 29.3173828125, 30.205078125, 31.0927734375, 31.98046875, 32.8681640625, 33.755859375, 34.6435546875, 35.53125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 6.0, 6.0, 4.0, 7.0, 4.0, 14.0, 12.0, 16.0, 24.0, 25.0, 35.0, 41.0, 49.0, 69.0, 82.0, 94.0, 82.0, 80.0, 70.0, 70.0, 34.0, 34.0, 44.0, 16.0, 11.0, 21.0, 12.0, 8.0, 9.0, 6.0, 8.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-54.37342071533203, -52.585872650146484, -50.7983283996582, -49.010780334472656, -47.223236083984375, -45.43568801879883, -43.64813995361328, -41.860595703125, -40.07304763793945, -38.285499572753906, -36.497955322265625, -34.71040725708008, -32.9228630065918, -31.13531494140625, -29.347768783569336, -27.560222625732422, -25.772676467895508, -23.985130310058594, -22.19758415222168, -20.410037994384766, -18.62248992919922, -16.834943771362305, -15.04739761352539, -13.25985050201416, -11.472304344177246, -9.684758186340332, -7.897211074829102, -6.1096649169921875, -4.322118282318115, -2.534571647644043, -0.7470254898071289, 1.0405216217041016, 2.8280677795410156, 4.615614414215088, 6.40316104888916, 8.190707206726074, 9.978254318237305, 11.765800476074219, 13.553346633911133, 15.340893745422363, 17.128440856933594, 18.915987014770508, 20.703533172607422, 22.49108123779297, 24.278627395629883, 26.066173553466797, 27.85371971130371, 29.641265869140625, 31.42881202697754, 33.21635818481445, 35.00390625, 36.79145050048828, 38.57899856567383, 40.366546630859375, 42.154090881347656, 43.9416389465332, 45.729183197021484, 47.51673126220703, 49.30427551269531, 51.09182357788086, 52.87936782836914, 54.66691589355469, 56.45446014404297, 58.242008209228516, 60.02955627441406]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 8.0, 3.0, 2.0, 5.0, 12.0, 16.0, 8.0, 12.0, 18.0, 14.0, 37.0, 30.0, 26.0, 28.0, 29.0, 38.0, 40.0, 39.0, 43.0, 44.0, 48.0, 53.0, 37.0, 50.0, 50.0, 32.0, 34.0, 29.0, 32.0, 23.0, 29.0, 26.0, 16.0, 20.0, 15.0, 11.0, 10.0, 13.0, 8.0, 6.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.65070724487305, -41.14067459106445, -39.630645751953125, -38.12061309814453, -36.6105842590332, -35.10055160522461, -33.59052276611328, -32.08049011230469, -30.570457458496094, -29.060426712036133, -27.550395965576172, -26.040363311767578, -24.530332565307617, -23.020301818847656, -21.510271072387695, -20.000240325927734, -18.490209579467773, -16.980178833007812, -15.470147132873535, -13.960116386413574, -12.450084686279297, -10.940053939819336, -9.430023193359375, -7.919991493225098, -6.409960746765137, -4.899929523468018, -3.3898985385894775, -1.8798675537109375, -0.36983633041381836, 1.1401948928833008, 2.6502256393432617, 4.160257339477539, 5.6702880859375, 7.180319309234619, 8.690350532531738, 10.2003812789917, 11.710412979125977, 13.220443725585938, 14.730474472045898, 16.24050521850586, 17.750537872314453, 19.260568618774414, 20.770599365234375, 22.28063201904297, 23.79066276550293, 25.30069351196289, 26.81072425842285, 28.320755004882812, 29.830785751342773, 31.340816497802734, 32.85084915161133, 34.360877990722656, 35.87091064453125, 37.380943298339844, 38.89097213745117, 40.401004791259766, 41.911033630371094, 43.42106628417969, 44.931095123291016, 46.44112777709961, 47.95115661621094, 49.46118927001953, 50.971221923828125, 52.48125076293945, 53.99128341674805]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 7.0, 9.0, 7.0, 27.0, 28.0, 54.0, 66.0, 72.0, 134.0, 194.0, 286.0, 390.0, 541.0, 725.0, 1064.0, 1450.0, 2105.0, 3069.0, 4193.0, 5958.0, 8662.0, 12837.0, 19312.0, 29646.0, 46993.0, 77466.0, 132686.0, 215853.0, 187610.0, 111730.0, 65657.0, 40066.0, 25483.0, 16950.0, 11420.0, 7660.0, 5381.0, 3735.0, 2707.0, 1896.0, 1288.0, 893.0, 708.0, 459.0, 340.0, 217.0, 163.0, 124.0, 83.0, 54.0, 41.0, 28.0, 11.0, 11.0, 7.0, 5.0, 3.0, 3.0, 0.0, 2.0], "bins": [-18.25, -17.6767578125, -17.103515625, -16.5302734375, -15.95703125, -15.3837890625, -14.810546875, -14.2373046875, -13.6640625, -13.0908203125, -12.517578125, -11.9443359375, -11.37109375, -10.7978515625, -10.224609375, -9.6513671875, -9.078125, -8.5048828125, -7.931640625, -7.3583984375, -6.78515625, -6.2119140625, -5.638671875, -5.0654296875, -4.4921875, -3.9189453125, -3.345703125, -2.7724609375, -2.19921875, -1.6259765625, -1.052734375, -0.4794921875, 0.09375, 0.6669921875, 1.240234375, 1.8134765625, 2.38671875, 2.9599609375, 3.533203125, 4.1064453125, 4.6796875, 5.2529296875, 5.826171875, 6.3994140625, 6.97265625, 7.5458984375, 8.119140625, 8.6923828125, 9.265625, 9.8388671875, 10.412109375, 10.9853515625, 11.55859375, 12.1318359375, 12.705078125, 13.2783203125, 13.8515625, 14.4248046875, 14.998046875, 15.5712890625, 16.14453125, 16.7177734375, 17.291015625, 17.8642578125, 18.4375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 4.0, 4.0, 4.0, 9.0, 4.0, 14.0, 18.0, 13.0, 10.0, 21.0, 25.0, 29.0, 26.0, 23.0, 28.0, 43.0, 36.0, 46.0, 52.0, 39.0, 46.0, 44.0, 42.0, 48.0, 45.0, 34.0, 30.0, 31.0, 29.0, 23.0, 29.0, 28.0, 21.0, 19.0, 9.0, 22.0, 7.0, 10.0, 7.0, 10.0, 2.0, 7.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.8125, -40.3369140625, -38.861328125, -37.3857421875, -35.91015625, -34.4345703125, -32.958984375, -31.4833984375, -30.0078125, -28.5322265625, -27.056640625, -25.5810546875, -24.10546875, -22.6298828125, -21.154296875, -19.6787109375, -18.203125, -16.7275390625, -15.251953125, -13.7763671875, -12.30078125, -10.8251953125, -9.349609375, -7.8740234375, -6.3984375, -4.9228515625, -3.447265625, -1.9716796875, -0.49609375, 0.9794921875, 2.455078125, 3.9306640625, 5.40625, 6.8818359375, 8.357421875, 9.8330078125, 11.30859375, 12.7841796875, 14.259765625, 15.7353515625, 17.2109375, 18.6865234375, 20.162109375, 21.6376953125, 23.11328125, 24.5888671875, 26.064453125, 27.5400390625, 29.015625, 30.4912109375, 31.966796875, 33.4423828125, 34.91796875, 36.3935546875, 37.869140625, 39.3447265625, 40.8203125, 42.2958984375, 43.771484375, 45.2470703125, 46.72265625, 48.1982421875, 49.673828125, 51.1494140625, 52.625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 7.0, 8.0, 13.0, 18.0, 34.0, 25.0, 44.0, 60.0, 82.0, 112.0, 154.0, 222.0, 313.0, 436.0, 663.0, 952.0, 1460.0, 2140.0, 3464.0, 5492.0, 9665.0, 19171.0, 60702.0, 760320.0, 127792.0, 25056.0, 11909.0, 6716.0, 4035.0, 2507.0, 1568.0, 1069.0, 688.0, 492.0, 343.0, 234.0, 161.0, 121.0, 101.0, 51.0, 52.0, 30.0, 22.0, 15.0, 11.0, 5.0, 14.0, 3.0, 3.0, 0.0, 2.0, 2.0], "bins": [-42.5, -41.30810546875, -40.1162109375, -38.92431640625, -37.732421875, -36.54052734375, -35.3486328125, -34.15673828125, -32.96484375, -31.77294921875, -30.5810546875, -29.38916015625, -28.197265625, -27.00537109375, -25.8134765625, -24.62158203125, -23.4296875, -22.23779296875, -21.0458984375, -19.85400390625, -18.662109375, -17.47021484375, -16.2783203125, -15.08642578125, -13.89453125, -12.70263671875, -11.5107421875, -10.31884765625, -9.126953125, -7.93505859375, -6.7431640625, -5.55126953125, -4.359375, -3.16748046875, -1.9755859375, -0.78369140625, 0.408203125, 1.60009765625, 2.7919921875, 3.98388671875, 5.17578125, 6.36767578125, 7.5595703125, 8.75146484375, 9.943359375, 11.13525390625, 12.3271484375, 13.51904296875, 14.7109375, 15.90283203125, 17.0947265625, 18.28662109375, 19.478515625, 20.67041015625, 21.8623046875, 23.05419921875, 24.24609375, 25.43798828125, 26.6298828125, 27.82177734375, 29.013671875, 30.20556640625, 31.3974609375, 32.58935546875, 33.78125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 11.0, 11.0, 10.0, 10.0, 13.0, 13.0, 20.0, 23.0, 23.0, 23.0, 24.0, 25.0, 33.0, 27.0, 47.0, 38.0, 45.0, 42.0, 34.0, 38.0, 46.0, 39.0, 36.0, 41.0, 46.0, 27.0, 46.0, 26.0, 35.0, 20.0, 15.0, 18.0, 15.0, 10.0, 13.0, 3.0, 5.0, 9.0, 10.0, 8.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-30.484375, -29.447021484375, -28.40966796875, -27.372314453125, -26.3349609375, -25.297607421875, -24.26025390625, -23.222900390625, -22.185546875, -21.148193359375, -20.11083984375, -19.073486328125, -18.0361328125, -16.998779296875, -15.96142578125, -14.924072265625, -13.88671875, -12.849365234375, -11.81201171875, -10.774658203125, -9.7373046875, -8.699951171875, -7.66259765625, -6.625244140625, -5.587890625, -4.550537109375, -3.51318359375, -2.475830078125, -1.4384765625, -0.401123046875, 0.63623046875, 1.673583984375, 2.7109375, 3.748291015625, 4.78564453125, 5.822998046875, 6.8603515625, 7.897705078125, 8.93505859375, 9.972412109375, 11.009765625, 12.047119140625, 13.08447265625, 14.121826171875, 15.1591796875, 16.196533203125, 17.23388671875, 18.271240234375, 19.30859375, 20.345947265625, 21.38330078125, 22.420654296875, 23.4580078125, 24.495361328125, 25.53271484375, 26.570068359375, 27.607421875, 28.644775390625, 29.68212890625, 30.719482421875, 31.7568359375, 32.794189453125, 33.83154296875, 34.868896484375, 35.90625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 8.0, 9.0, 21.0, 34.0, 45.0, 88.0, 178.0, 330.0, 596.0, 1518.0, 4573.0, 21986.0, 929529.0, 76471.0, 8848.0, 2417.0, 1007.0, 403.0, 204.0, 98.0, 59.0, 48.0, 27.0, 13.0, 8.0, 8.0, 7.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1796875, -6.9208984375, -6.662109375, -6.4033203125, -6.14453125, -5.8857421875, -5.626953125, -5.3681640625, -5.109375, -4.8505859375, -4.591796875, -4.3330078125, -4.07421875, -3.8154296875, -3.556640625, -3.2978515625, -3.0390625, -2.7802734375, -2.521484375, -2.2626953125, -2.00390625, -1.7451171875, -1.486328125, -1.2275390625, -0.96875, -0.7099609375, -0.451171875, -0.1923828125, 0.06640625, 0.3251953125, 0.583984375, 0.8427734375, 1.1015625, 1.3603515625, 1.619140625, 1.8779296875, 2.13671875, 2.3955078125, 2.654296875, 2.9130859375, 3.171875, 3.4306640625, 3.689453125, 3.9482421875, 4.20703125, 4.4658203125, 4.724609375, 4.9833984375, 5.2421875, 5.5009765625, 5.759765625, 6.0185546875, 6.27734375, 6.5361328125, 6.794921875, 7.0537109375, 7.3125, 7.5712890625, 7.830078125, 8.0888671875, 8.34765625, 8.6064453125, 8.865234375, 9.1240234375, 9.3828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 10.0, 11.0, 25.0, 27.0, 36.0, 59.0, 77.0, 140.0, 147.0, 148.0, 89.0, 62.0, 44.0, 34.0, 17.0, 13.0, 11.0, 7.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000743865966796875, -0.0007168799638748169, -0.0006898939609527588, -0.0006629079580307007, -0.0006359219551086426, -0.0006089359521865845, -0.0005819499492645264, -0.0005549639463424683, -0.0005279779434204102, -0.000500991940498352, -0.00047400593757629395, -0.00044701993465423584, -0.00042003393173217773, -0.00039304792881011963, -0.0003660619258880615, -0.0003390759229660034, -0.0003120899200439453, -0.0002851039171218872, -0.0002581179141998291, -0.000231131911277771, -0.0002041459083557129, -0.00017715990543365479, -0.00015017390251159668, -0.00012318789958953857, -9.620189666748047e-05, -6.921589374542236e-05, -4.222989082336426e-05, -1.5243887901306152e-05, 1.1742115020751953e-05, 3.872811794281006e-05, 6.571412086486816e-05, 9.270012378692627e-05, 0.00011968612670898438, 0.00014667212963104248, 0.00017365813255310059, 0.0002006441354751587, 0.0002276301383972168, 0.0002546161413192749, 0.000281602144241333, 0.0003085881471633911, 0.0003355741500854492, 0.0003625601530075073, 0.00038954615592956543, 0.00041653215885162354, 0.00044351816177368164, 0.00047050416469573975, 0.0004974901676177979, 0.000524476170539856, 0.0005514621734619141, 0.0005784481763839722, 0.0006054341793060303, 0.0006324201822280884, 0.0006594061851501465, 0.0006863921880722046, 0.0007133781909942627, 0.0007403641939163208, 0.0007673501968383789, 0.000794336199760437, 0.0008213222026824951, 0.0008483082056045532, 0.0008752942085266113, 0.0009022802114486694, 0.0009292662143707275, 0.0009562522172927856, 0.0009832382202148438]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 9.0, 8.0, 11.0, 8.0, 22.0, 18.0, 36.0, 50.0, 55.0, 99.0, 144.0, 166.0, 258.0, 386.0, 587.0, 912.0, 1456.0, 2508.0, 4546.0, 9346.0, 22490.0, 69919.0, 330441.0, 457919.0, 95073.0, 28121.0, 11159.0, 5315.0, 2871.0, 1615.0, 1047.0, 636.0, 410.0, 275.0, 167.0, 136.0, 97.0, 69.0, 51.0, 27.0, 24.0, 18.0, 11.0, 15.0, 12.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.15625, -5.9583740234375, -5.760498046875, -5.5626220703125, -5.36474609375, -5.1668701171875, -4.968994140625, -4.7711181640625, -4.5732421875, -4.3753662109375, -4.177490234375, -3.9796142578125, -3.78173828125, -3.5838623046875, -3.385986328125, -3.1881103515625, -2.990234375, -2.7923583984375, -2.594482421875, -2.3966064453125, -2.19873046875, -2.0008544921875, -1.802978515625, -1.6051025390625, -1.4072265625, -1.2093505859375, -1.011474609375, -0.8135986328125, -0.61572265625, -0.4178466796875, -0.219970703125, -0.0220947265625, 0.17578125, 0.3736572265625, 0.571533203125, 0.7694091796875, 0.96728515625, 1.1651611328125, 1.363037109375, 1.5609130859375, 1.7587890625, 1.9566650390625, 2.154541015625, 2.3524169921875, 2.55029296875, 2.7481689453125, 2.946044921875, 3.1439208984375, 3.341796875, 3.5396728515625, 3.737548828125, 3.9354248046875, 4.13330078125, 4.3311767578125, 4.529052734375, 4.7269287109375, 4.9248046875, 5.1226806640625, 5.320556640625, 5.5184326171875, 5.71630859375, 5.9141845703125, 6.112060546875, 6.3099365234375, 6.5078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 2.0, 9.0, 5.0, 11.0, 17.0, 25.0, 36.0, 53.0, 95.0, 116.0, 174.0, 144.0, 114.0, 52.0, 38.0, 20.0, 20.0, 19.0, 7.0, 9.0, 6.0, 6.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6865234375, -1.629425048828125, -1.57232666015625, -1.515228271484375, -1.4581298828125, -1.401031494140625, -1.34393310546875, -1.286834716796875, -1.229736328125, -1.172637939453125, -1.11553955078125, -1.058441162109375, -1.0013427734375, -0.944244384765625, -0.88714599609375, -0.830047607421875, -0.77294921875, -0.715850830078125, -0.65875244140625, -0.601654052734375, -0.5445556640625, -0.487457275390625, -0.43035888671875, -0.373260498046875, -0.316162109375, -0.259063720703125, -0.20196533203125, -0.144866943359375, -0.0877685546875, -0.030670166015625, 0.02642822265625, 0.083526611328125, 0.140625, 0.197723388671875, 0.25482177734375, 0.311920166015625, 0.3690185546875, 0.426116943359375, 0.48321533203125, 0.540313720703125, 0.597412109375, 0.654510498046875, 0.71160888671875, 0.768707275390625, 0.8258056640625, 0.882904052734375, 0.94000244140625, 0.997100830078125, 1.05419921875, 1.111297607421875, 1.16839599609375, 1.225494384765625, 1.2825927734375, 1.339691162109375, 1.39678955078125, 1.453887939453125, 1.510986328125, 1.568084716796875, 1.62518310546875, 1.682281494140625, 1.7393798828125, 1.796478271484375, 1.85357666015625, 1.910675048828125, 1.9677734375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 1.0, 7.0, 3.0, 8.0, 11.0, 10.0, 7.0, 21.0, 19.0, 23.0, 43.0, 41.0, 61.0, 58.0, 84.0, 90.0, 85.0, 77.0, 77.0, 58.0, 40.0, 41.0, 33.0, 21.0, 17.0, 10.0, 11.0, 10.0, 10.0, 8.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.22563552856445, -45.49348449707031, -43.76133346557617, -42.02918243408203, -40.297035217285156, -38.564884185791016, -36.832733154296875, -35.100582122802734, -33.368431091308594, -31.636280059814453, -29.904130935668945, -28.171979904174805, -26.439828872680664, -24.707679748535156, -22.975528717041016, -21.243377685546875, -19.511228561401367, -17.779077529907227, -16.04692840576172, -14.314777374267578, -12.582626342773438, -10.850476264953613, -9.118326187133789, -7.386175155639648, -5.654025077819824, -3.921874523162842, -2.1897242069244385, -0.45757389068603516, 1.2745766639709473, 3.0067272186279297, 4.738877296447754, 6.4710283279418945, 8.203178405761719, 9.935328483581543, 11.667479515075684, 13.399629592895508, 15.131780624389648, 16.863929748535156, 18.596080780029297, 20.328231811523438, 22.060382843017578, 23.79253387451172, 25.524682998657227, 27.256834030151367, 28.988985061645508, 30.721134185791016, 32.453285217285156, 34.1854362487793, 35.91758728027344, 37.64973831176758, 39.38188934326172, 41.114036560058594, 42.846187591552734, 44.578338623046875, 46.310489654541016, 48.042640686035156, 49.77478790283203, 51.50693893432617, 53.23908996582031, 54.97123718261719, 56.70338821411133, 58.43553924560547, 60.16769027709961, 61.89984130859375, 63.63199234008789]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 7.0, 5.0, 2.0, 4.0, 10.0, 17.0, 8.0, 12.0, 16.0, 13.0, 39.0, 28.0, 32.0, 25.0, 28.0, 36.0, 41.0, 42.0, 42.0, 46.0, 47.0, 50.0, 39.0, 51.0, 47.0, 33.0, 36.0, 29.0, 33.0, 24.0, 26.0, 26.0, 21.0, 19.0, 14.0, 9.0, 12.0, 11.0, 8.0, 6.0, 7.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.657379150390625, -40.182823181152344, -38.70826721191406, -37.23371505737305, -35.759159088134766, -34.284603118896484, -32.81005096435547, -31.335494995117188, -29.860939025878906, -28.386383056640625, -26.911828994750977, -25.437274932861328, -23.962718963623047, -22.488162994384766, -21.013608932495117, -19.53905487060547, -18.064498901367188, -16.589942932128906, -15.115388870239258, -13.640833854675293, -12.166278839111328, -10.691723823547363, -9.217168807983398, -7.742613792419434, -6.268058776855469, -4.793503761291504, -3.318948745727539, -1.8443937301635742, -0.3698387145996094, 1.1047163009643555, 2.5792713165283203, 4.053826332092285, 5.528385162353516, 7.0029401779174805, 8.477495193481445, 9.95205020904541, 11.426605224609375, 12.90116024017334, 14.375715255737305, 15.85027027130127, 17.324825286865234, 18.799381256103516, 20.273935317993164, 21.748489379882812, 23.223045349121094, 24.697601318359375, 26.172155380249023, 27.646709442138672, 29.121265411376953, 30.595821380615234, 32.07037353515625, 33.54492950439453, 35.01948547363281, 36.494041442871094, 37.968597412109375, 39.44314956665039, 40.91770553588867, 42.39226150512695, 43.86681365966797, 45.34136962890625, 46.81592559814453, 48.29048156738281, 49.765037536621094, 51.23958969116211, 52.71414566040039]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 12.0, 16.0, 34.0, 19.0, 38.0, 64.0, 96.0, 150.0, 211.0, 330.0, 438.0, 719.0, 1004.0, 1617.0, 2487.0, 3842.0, 5950.0, 9954.0, 16658.0, 28735.0, 53169.0, 105241.0, 218391.0, 282525.0, 149215.0, 73524.0, 38526.0, 21692.0, 12624.0, 7650.0, 4796.0, 3107.0, 1872.0, 1276.0, 822.0, 568.0, 368.0, 263.0, 175.0, 113.0, 88.0, 54.0, 35.0, 28.0, 21.0, 16.0, 3.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-56.0, -54.20751953125, -52.4150390625, -50.62255859375, -48.830078125, -47.03759765625, -45.2451171875, -43.45263671875, -41.66015625, -39.86767578125, -38.0751953125, -36.28271484375, -34.490234375, -32.69775390625, -30.9052734375, -29.11279296875, -27.3203125, -25.52783203125, -23.7353515625, -21.94287109375, -20.150390625, -18.35791015625, -16.5654296875, -14.77294921875, -12.98046875, -11.18798828125, -9.3955078125, -7.60302734375, -5.810546875, -4.01806640625, -2.2255859375, -0.43310546875, 1.359375, 3.15185546875, 4.9443359375, 6.73681640625, 8.529296875, 10.32177734375, 12.1142578125, 13.90673828125, 15.69921875, 17.49169921875, 19.2841796875, 21.07666015625, 22.869140625, 24.66162109375, 26.4541015625, 28.24658203125, 30.0390625, 31.83154296875, 33.6240234375, 35.41650390625, 37.208984375, 39.00146484375, 40.7939453125, 42.58642578125, 44.37890625, 46.17138671875, 47.9638671875, 49.75634765625, 51.548828125, 53.34130859375, 55.1337890625, 56.92626953125, 58.71875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 3.0, 7.0, 13.0, 7.0, 10.0, 14.0, 18.0, 27.0, 30.0, 24.0, 24.0, 32.0, 36.0, 40.0, 49.0, 45.0, 54.0, 53.0, 48.0, 55.0, 61.0, 50.0, 38.0, 31.0, 33.0, 26.0, 29.0, 25.0, 23.0, 19.0, 16.0, 11.0, 8.0, 10.0, 8.0, 7.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.03125, -42.470703125, -40.91015625, -39.349609375, -37.7890625, -36.228515625, -34.66796875, -33.107421875, -31.546875, -29.986328125, -28.42578125, -26.865234375, -25.3046875, -23.744140625, -22.18359375, -20.623046875, -19.0625, -17.501953125, -15.94140625, -14.380859375, -12.8203125, -11.259765625, -9.69921875, -8.138671875, -6.578125, -5.017578125, -3.45703125, -1.896484375, -0.3359375, 1.224609375, 2.78515625, 4.345703125, 5.90625, 7.466796875, 9.02734375, 10.587890625, 12.1484375, 13.708984375, 15.26953125, 16.830078125, 18.390625, 19.951171875, 21.51171875, 23.072265625, 24.6328125, 26.193359375, 27.75390625, 29.314453125, 30.875, 32.435546875, 33.99609375, 35.556640625, 37.1171875, 38.677734375, 40.23828125, 41.798828125, 43.359375, 44.919921875, 46.48046875, 48.041015625, 49.6015625, 51.162109375, 52.72265625, 54.283203125, 55.84375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 5.0, 5.0, 9.0, 15.0, 20.0, 23.0, 36.0, 70.0, 87.0, 149.0, 235.0, 352.0, 532.0, 740.0, 1168.0, 1754.0, 2792.0, 4189.0, 6369.0, 10309.0, 16229.0, 26510.0, 44146.0, 77424.0, 140489.0, 235193.0, 204504.0, 114224.0, 63065.0, 37174.0, 22100.0, 13894.0, 8586.0, 5684.0, 3523.0, 2368.0, 1614.0, 966.0, 673.0, 476.0, 291.0, 207.0, 115.0, 94.0, 59.0, 34.0, 23.0, 23.0, 5.0, 8.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-58.90625, -57.21484375, -55.5234375, -53.83203125, -52.140625, -50.44921875, -48.7578125, -47.06640625, -45.375, -43.68359375, -41.9921875, -40.30078125, -38.609375, -36.91796875, -35.2265625, -33.53515625, -31.84375, -30.15234375, -28.4609375, -26.76953125, -25.078125, -23.38671875, -21.6953125, -20.00390625, -18.3125, -16.62109375, -14.9296875, -13.23828125, -11.546875, -9.85546875, -8.1640625, -6.47265625, -4.78125, -3.08984375, -1.3984375, 0.29296875, 1.984375, 3.67578125, 5.3671875, 7.05859375, 8.75, 10.44140625, 12.1328125, 13.82421875, 15.515625, 17.20703125, 18.8984375, 20.58984375, 22.28125, 23.97265625, 25.6640625, 27.35546875, 29.046875, 30.73828125, 32.4296875, 34.12109375, 35.8125, 37.50390625, 39.1953125, 40.88671875, 42.578125, 44.26953125, 45.9609375, 47.65234375, 49.34375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 13.0, 11.0, 12.0, 10.0, 13.0, 18.0, 19.0, 29.0, 25.0, 22.0, 27.0, 30.0, 40.0, 30.0, 39.0, 23.0, 36.0, 45.0, 39.0, 53.0, 41.0, 38.0, 43.0, 37.0, 35.0, 32.0, 28.0, 26.0, 16.0, 24.0, 19.0, 20.0, 16.0, 10.0, 13.0, 4.0, 11.0, 8.0, 8.0, 7.0, 5.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-28.484375, -27.630126953125, -26.77587890625, -25.921630859375, -25.0673828125, -24.213134765625, -23.35888671875, -22.504638671875, -21.650390625, -20.796142578125, -19.94189453125, -19.087646484375, -18.2333984375, -17.379150390625, -16.52490234375, -15.670654296875, -14.81640625, -13.962158203125, -13.10791015625, -12.253662109375, -11.3994140625, -10.545166015625, -9.69091796875, -8.836669921875, -7.982421875, -7.128173828125, -6.27392578125, -5.419677734375, -4.5654296875, -3.711181640625, -2.85693359375, -2.002685546875, -1.1484375, -0.294189453125, 0.56005859375, 1.414306640625, 2.2685546875, 3.122802734375, 3.97705078125, 4.831298828125, 5.685546875, 6.539794921875, 7.39404296875, 8.248291015625, 9.1025390625, 9.956787109375, 10.81103515625, 11.665283203125, 12.51953125, 13.373779296875, 14.22802734375, 15.082275390625, 15.9365234375, 16.790771484375, 17.64501953125, 18.499267578125, 19.353515625, 20.207763671875, 21.06201171875, 21.916259765625, 22.7705078125, 23.624755859375, 24.47900390625, 25.333251953125, 26.1875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 1.0, 6.0, 12.0, 20.0, 23.0, 28.0, 48.0, 70.0, 100.0, 165.0, 248.0, 440.0, 731.0, 1199.0, 2183.0, 4312.0, 9951.0, 25476.0, 80189.0, 315661.0, 434965.0, 113867.0, 34590.0, 12793.0, 5330.0, 2576.0, 1432.0, 817.0, 493.0, 287.0, 185.0, 124.0, 59.0, 49.0, 51.0, 17.0, 18.0, 14.0, 12.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.0625, -38.77587890625, -37.4892578125, -36.20263671875, -34.916015625, -33.62939453125, -32.3427734375, -31.05615234375, -29.76953125, -28.48291015625, -27.1962890625, -25.90966796875, -24.623046875, -23.33642578125, -22.0498046875, -20.76318359375, -19.4765625, -18.18994140625, -16.9033203125, -15.61669921875, -14.330078125, -13.04345703125, -11.7568359375, -10.47021484375, -9.18359375, -7.89697265625, -6.6103515625, -5.32373046875, -4.037109375, -2.75048828125, -1.4638671875, -0.17724609375, 1.109375, 2.39599609375, 3.6826171875, 4.96923828125, 6.255859375, 7.54248046875, 8.8291015625, 10.11572265625, 11.40234375, 12.68896484375, 13.9755859375, 15.26220703125, 16.548828125, 17.83544921875, 19.1220703125, 20.40869140625, 21.6953125, 22.98193359375, 24.2685546875, 25.55517578125, 26.841796875, 28.12841796875, 29.4150390625, 30.70166015625, 31.98828125, 33.27490234375, 34.5615234375, 35.84814453125, 37.134765625, 38.42138671875, 39.7080078125, 40.99462890625, 42.28125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 2.0, 9.0, 7.0, 17.0, 18.0, 29.0, 37.0, 79.0, 141.0, 179.0, 169.0, 107.0, 76.0, 43.0, 27.0, 24.0, 16.0, 6.0, 5.0, 2.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028438568115234375, -0.0027130544185638428, -0.002582252025604248, -0.0024514496326446533, -0.0023206472396850586, -0.002189844846725464, -0.002059042453765869, -0.0019282400608062744, -0.0017974376678466797, -0.001666635274887085, -0.0015358328819274902, -0.0014050304889678955, -0.0012742280960083008, -0.001143425703048706, -0.0010126233100891113, -0.0008818209171295166, -0.0007510185241699219, -0.0006202161312103271, -0.0004894137382507324, -0.0003586113452911377, -0.00022780895233154297, -9.700655937194824e-05, 3.3795833587646484e-05, 0.0001645982265472412, 0.00029540061950683594, 0.00042620301246643066, 0.0005570054054260254, 0.0006878077983856201, 0.0008186101913452148, 0.0009494125843048096, 0.0010802149772644043, 0.001211017370223999, 0.0013418197631835938, 0.0014726221561431885, 0.0016034245491027832, 0.001734226942062378, 0.0018650293350219727, 0.0019958317279815674, 0.002126634120941162, 0.002257436513900757, 0.0023882389068603516, 0.0025190412998199463, 0.002649843692779541, 0.0027806460857391357, 0.0029114484786987305, 0.003042250871658325, 0.00317305326461792, 0.0033038556575775146, 0.0034346580505371094, 0.003565460443496704, 0.003696262836456299, 0.0038270652294158936, 0.003957867622375488, 0.004088670015335083, 0.004219472408294678, 0.0043502748012542725, 0.004481077194213867, 0.004611879587173462, 0.004742681980133057, 0.004873484373092651, 0.005004286766052246, 0.005135089159011841, 0.0052658915519714355, 0.00539669394493103, 0.005527496337890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 6.0, 4.0, 16.0, 11.0, 25.0, 21.0, 26.0, 45.0, 77.0, 93.0, 142.0, 217.0, 308.0, 467.0, 776.0, 1194.0, 2061.0, 3830.0, 7562.0, 16503.0, 40236.0, 112003.0, 328009.0, 341590.0, 116624.0, 42287.0, 17161.0, 7786.0, 3994.0, 2010.0, 1251.0, 735.0, 502.0, 285.0, 188.0, 151.0, 95.0, 81.0, 41.0, 43.0, 25.0, 23.0, 13.0, 15.0, 9.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.328125, -27.384521484375, -26.44091796875, -25.497314453125, -24.5537109375, -23.610107421875, -22.66650390625, -21.722900390625, -20.779296875, -19.835693359375, -18.89208984375, -17.948486328125, -17.0048828125, -16.061279296875, -15.11767578125, -14.174072265625, -13.23046875, -12.286865234375, -11.34326171875, -10.399658203125, -9.4560546875, -8.512451171875, -7.56884765625, -6.625244140625, -5.681640625, -4.738037109375, -3.79443359375, -2.850830078125, -1.9072265625, -0.963623046875, -0.02001953125, 0.923583984375, 1.8671875, 2.810791015625, 3.75439453125, 4.697998046875, 5.6416015625, 6.585205078125, 7.52880859375, 8.472412109375, 9.416015625, 10.359619140625, 11.30322265625, 12.246826171875, 13.1904296875, 14.134033203125, 15.07763671875, 16.021240234375, 16.96484375, 17.908447265625, 18.85205078125, 19.795654296875, 20.7392578125, 21.682861328125, 22.62646484375, 23.570068359375, 24.513671875, 25.457275390625, 26.40087890625, 27.344482421875, 28.2880859375, 29.231689453125, 30.17529296875, 31.118896484375, 32.0625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 6.0, 4.0, 8.0, 13.0, 9.0, 11.0, 22.0, 23.0, 30.0, 50.0, 50.0, 69.0, 62.0, 74.0, 83.0, 85.0, 73.0, 62.0, 51.0, 40.0, 38.0, 33.0, 25.0, 15.0, 19.0, 12.0, 4.0, 14.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.890625, -7.650634765625, -7.41064453125, -7.170654296875, -6.9306640625, -6.690673828125, -6.45068359375, -6.210693359375, -5.970703125, -5.730712890625, -5.49072265625, -5.250732421875, -5.0107421875, -4.770751953125, -4.53076171875, -4.290771484375, -4.05078125, -3.810791015625, -3.57080078125, -3.330810546875, -3.0908203125, -2.850830078125, -2.61083984375, -2.370849609375, -2.130859375, -1.890869140625, -1.65087890625, -1.410888671875, -1.1708984375, -0.930908203125, -0.69091796875, -0.450927734375, -0.2109375, 0.029052734375, 0.26904296875, 0.509033203125, 0.7490234375, 0.989013671875, 1.22900390625, 1.468994140625, 1.708984375, 1.948974609375, 2.18896484375, 2.428955078125, 2.6689453125, 2.908935546875, 3.14892578125, 3.388916015625, 3.62890625, 3.868896484375, 4.10888671875, 4.348876953125, 4.5888671875, 4.828857421875, 5.06884765625, 5.308837890625, 5.548828125, 5.788818359375, 6.02880859375, 6.268798828125, 6.5087890625, 6.748779296875, 6.98876953125, 7.228759765625, 7.46875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 7.0, 3.0, 7.0, 14.0, 15.0, 23.0, 23.0, 21.0, 36.0, 52.0, 49.0, 77.0, 66.0, 86.0, 96.0, 74.0, 77.0, 45.0, 48.0, 37.0, 38.0, 27.0, 21.0, 8.0, 11.0, 7.0, 8.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-48.10462951660156, -46.39650344848633, -44.688377380371094, -42.98025131225586, -41.272125244140625, -39.56399917602539, -37.855873107910156, -36.14774703979492, -34.43962097167969, -32.73149490356445, -31.02336883544922, -29.315242767333984, -27.60711669921875, -25.898990631103516, -24.19086456298828, -22.482738494873047, -20.774612426757812, -19.066486358642578, -17.358360290527344, -15.65023422241211, -13.942108154296875, -12.23398208618164, -10.525856018066406, -8.817729949951172, -7.1096038818359375, -5.401477813720703, -3.6933517456054688, -1.9852256774902344, -0.277099609375, 1.4310264587402344, 3.1391525268554688, 4.847278594970703, 6.555408477783203, 8.263534545898438, 9.971660614013672, 11.679786682128906, 13.38791275024414, 15.096038818359375, 16.80416488647461, 18.512290954589844, 20.220417022705078, 21.928543090820312, 23.636669158935547, 25.34479522705078, 27.052921295166016, 28.76104736328125, 30.469173431396484, 32.17729949951172, 33.88542556762695, 35.59355163574219, 37.30167770385742, 39.009803771972656, 40.71792984008789, 42.426055908203125, 44.13418197631836, 45.842308044433594, 47.55043411254883, 49.25856018066406, 50.9666862487793, 52.67481231689453, 54.382938385009766, 56.091064453125, 57.799190521240234, 59.50731658935547, 61.2154426574707]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 8.0, 7.0, 11.0, 11.0, 12.0, 10.0, 22.0, 21.0, 23.0, 39.0, 38.0, 41.0, 42.0, 42.0, 56.0, 44.0, 47.0, 48.0, 36.0, 52.0, 41.0, 43.0, 40.0, 40.0, 39.0, 24.0, 34.0, 19.0, 20.0, 24.0, 14.0, 11.0, 13.0, 11.0, 4.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.30747604370117, -44.63785934448242, -42.968238830566406, -41.298622131347656, -39.629005432128906, -37.959388732910156, -36.289772033691406, -34.62015151977539, -32.95053482055664, -31.28091812133789, -29.611299514770508, -27.941680908203125, -26.272064208984375, -24.602447509765625, -22.932828903198242, -21.26321029663086, -19.59359359741211, -17.92397689819336, -16.254358291625977, -14.58474063873291, -12.915122985839844, -11.245505332946777, -9.575887680053711, -7.9062700271606445, -6.236652374267578, -4.567034721374512, -2.8974170684814453, -1.227799415588379, 0.4418182373046875, 2.111435890197754, 3.7810535430908203, 5.450671195983887, 7.120288848876953, 8.78990650177002, 10.459524154663086, 12.129141807556152, 13.798759460449219, 15.468377113342285, 17.13799476623535, 18.807613372802734, 20.477230072021484, 22.146846771240234, 23.816465377807617, 25.486083984375, 27.15570068359375, 28.8253173828125, 30.494935989379883, 32.164554595947266, 33.834171295166016, 35.503787994384766, 37.17340850830078, 38.84302520751953, 40.51264190673828, 42.18225860595703, 43.85187530517578, 45.5214958190918, 47.19111251831055, 48.8607292175293, 50.53034973144531, 52.19996643066406, 53.86958312988281, 55.53919982910156, 57.20881652832031, 58.87843704223633, 60.54805374145508]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [3.0, 4.0, 8.0, 9.0, 16.0, 18.0, 22.0, 42.0, 49.0, 78.0, 105.0, 190.0, 232.0, 303.0, 488.0, 733.0, 1007.0, 1568.0, 2430.0, 3651.0, 6001.0, 10176.0, 19867.0, 46041.0, 143957.0, 517808.0, 1595474.0, 1303254.0, 365226.0, 97405.0, 35240.0, 16718.0, 9416.0, 5473.0, 3545.0, 2304.0, 1531.0, 1090.0, 828.0, 526.0, 422.0, 278.0, 220.0, 142.0, 117.0, 91.0, 48.0, 37.0, 33.0, 27.0, 14.0, 19.0, 9.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.71875, -47.86865234375, -46.0185546875, -44.16845703125, -42.318359375, -40.46826171875, -38.6181640625, -36.76806640625, -34.91796875, -33.06787109375, -31.2177734375, -29.36767578125, -27.517578125, -25.66748046875, -23.8173828125, -21.96728515625, -20.1171875, -18.26708984375, -16.4169921875, -14.56689453125, -12.716796875, -10.86669921875, -9.0166015625, -7.16650390625, -5.31640625, -3.46630859375, -1.6162109375, 0.23388671875, 2.083984375, 3.93408203125, 5.7841796875, 7.63427734375, 9.484375, 11.33447265625, 13.1845703125, 15.03466796875, 16.884765625, 18.73486328125, 20.5849609375, 22.43505859375, 24.28515625, 26.13525390625, 27.9853515625, 29.83544921875, 31.685546875, 33.53564453125, 35.3857421875, 37.23583984375, 39.0859375, 40.93603515625, 42.7861328125, 44.63623046875, 46.486328125, 48.33642578125, 50.1865234375, 52.03662109375, 53.88671875, 55.73681640625, 57.5869140625, 59.43701171875, 61.287109375, 63.13720703125, 64.9873046875, 66.83740234375, 68.6875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 10.0, 8.0, 10.0, 8.0, 7.0, 19.0, 17.0, 25.0, 24.0, 32.0, 31.0, 49.0, 45.0, 47.0, 57.0, 53.0, 60.0, 40.0, 51.0, 48.0, 53.0, 46.0, 36.0, 41.0, 28.0, 31.0, 29.0, 23.0, 21.0, 11.0, 9.0, 10.0, 11.0, 8.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.40625, -39.896484375, -38.38671875, -36.876953125, -35.3671875, -33.857421875, -32.34765625, -30.837890625, -29.328125, -27.818359375, -26.30859375, -24.798828125, -23.2890625, -21.779296875, -20.26953125, -18.759765625, -17.25, -15.740234375, -14.23046875, -12.720703125, -11.2109375, -9.701171875, -8.19140625, -6.681640625, -5.171875, -3.662109375, -2.15234375, -0.642578125, 0.8671875, 2.376953125, 3.88671875, 5.396484375, 6.90625, 8.416015625, 9.92578125, 11.435546875, 12.9453125, 14.455078125, 15.96484375, 17.474609375, 18.984375, 20.494140625, 22.00390625, 23.513671875, 25.0234375, 26.533203125, 28.04296875, 29.552734375, 31.0625, 32.572265625, 34.08203125, 35.591796875, 37.1015625, 38.611328125, 40.12109375, 41.630859375, 43.140625, 44.650390625, 46.16015625, 47.669921875, 49.1796875, 50.689453125, 52.19921875, 53.708984375, 55.21875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 14.0, 13.0, 13.0, 21.0, 26.0, 52.0, 90.0, 121.0, 193.0, 240.0, 385.0, 586.0, 928.0, 1359.0, 2169.0, 3688.0, 6189.0, 11245.0, 22359.0, 50400.0, 137311.0, 507643.0, 2188399.0, 912934.0, 213288.0, 71314.0, 29546.0, 14459.0, 7693.0, 4341.0, 2609.0, 1607.0, 1031.0, 648.0, 438.0, 298.0, 205.0, 143.0, 109.0, 62.0, 34.0, 30.0, 16.0, 11.0, 13.0, 2.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-75.0, -72.5556640625, -70.111328125, -67.6669921875, -65.22265625, -62.7783203125, -60.333984375, -57.8896484375, -55.4453125, -53.0009765625, -50.556640625, -48.1123046875, -45.66796875, -43.2236328125, -40.779296875, -38.3349609375, -35.890625, -33.4462890625, -31.001953125, -28.5576171875, -26.11328125, -23.6689453125, -21.224609375, -18.7802734375, -16.3359375, -13.8916015625, -11.447265625, -9.0029296875, -6.55859375, -4.1142578125, -1.669921875, 0.7744140625, 3.21875, 5.6630859375, 8.107421875, 10.5517578125, 12.99609375, 15.4404296875, 17.884765625, 20.3291015625, 22.7734375, 25.2177734375, 27.662109375, 30.1064453125, 32.55078125, 34.9951171875, 37.439453125, 39.8837890625, 42.328125, 44.7724609375, 47.216796875, 49.6611328125, 52.10546875, 54.5498046875, 56.994140625, 59.4384765625, 61.8828125, 64.3271484375, 66.771484375, 69.2158203125, 71.66015625, 74.1044921875, 76.548828125, 78.9931640625, 81.4375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 7.0, 2.0, 9.0, 5.0, 10.0, 16.0, 18.0, 20.0, 27.0, 35.0, 60.0, 87.0, 108.0, 150.0, 202.0, 274.0, 373.0, 516.0, 603.0, 421.0, 286.0, 246.0, 164.0, 116.0, 74.0, 64.0, 34.0, 34.0, 25.0, 23.0, 9.0, 8.0, 7.0, 10.0, 15.0, 6.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.921875, -22.20849609375, -21.4951171875, -20.78173828125, -20.068359375, -19.35498046875, -18.6416015625, -17.92822265625, -17.21484375, -16.50146484375, -15.7880859375, -15.07470703125, -14.361328125, -13.64794921875, -12.9345703125, -12.22119140625, -11.5078125, -10.79443359375, -10.0810546875, -9.36767578125, -8.654296875, -7.94091796875, -7.2275390625, -6.51416015625, -5.80078125, -5.08740234375, -4.3740234375, -3.66064453125, -2.947265625, -2.23388671875, -1.5205078125, -0.80712890625, -0.09375, 0.61962890625, 1.3330078125, 2.04638671875, 2.759765625, 3.47314453125, 4.1865234375, 4.89990234375, 5.61328125, 6.32666015625, 7.0400390625, 7.75341796875, 8.466796875, 9.18017578125, 9.8935546875, 10.60693359375, 11.3203125, 12.03369140625, 12.7470703125, 13.46044921875, 14.173828125, 14.88720703125, 15.6005859375, 16.31396484375, 17.02734375, 17.74072265625, 18.4541015625, 19.16748046875, 19.880859375, 20.59423828125, 21.3076171875, 22.02099609375, 22.734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 0.0, 6.0, 5.0, 8.0, 11.0, 6.0, 9.0, 16.0, 16.0, 16.0, 15.0, 23.0, 40.0, 54.0, 59.0, 55.0, 74.0, 89.0, 69.0, 72.0, 62.0, 49.0, 50.0, 40.0, 39.0, 23.0, 17.0, 22.0, 15.0, 14.0, 3.0, 7.0, 4.0, 2.0, 1.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-44.840267181396484, -43.35997772216797, -41.87968826293945, -40.39939880371094, -38.91911315917969, -37.43882369995117, -35.958534240722656, -34.47824478149414, -32.997955322265625, -31.51766586303711, -30.037378311157227, -28.55708885192871, -27.076801300048828, -25.596511840820312, -24.116222381591797, -22.63593292236328, -21.15564727783203, -19.675357818603516, -18.195070266723633, -16.714780807495117, -15.234492301940918, -13.754203796386719, -12.273914337158203, -10.793625831604004, -9.313337326049805, -7.8330488204956055, -6.352759838104248, -4.872470855712891, -3.3921823501586914, -1.9118938446044922, -0.43160438537597656, 1.0486841201782227, 2.5289764404296875, 4.009264945983887, 5.489553928375244, 6.969842910766602, 8.4501314163208, 9.930419921875, 11.410709381103516, 12.890997886657715, 14.371286392211914, 15.851574897766113, 17.331863403320312, 18.812152862548828, 20.292442321777344, 21.772729873657227, 23.253019332885742, 24.733306884765625, 26.21359634399414, 27.693885803222656, 29.17417335510254, 30.654462814331055, 32.13475036621094, 33.61503982543945, 35.09532928466797, 36.575618743896484, 38.055908203125, 39.536197662353516, 41.01648712158203, 42.49677276611328, 43.9770622253418, 45.45735168457031, 46.93764114379883, 48.417930603027344, 49.898216247558594]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 10.0, 12.0, 10.0, 15.0, 15.0, 18.0, 12.0, 26.0, 27.0, 26.0, 39.0, 34.0, 36.0, 49.0, 41.0, 41.0, 44.0, 37.0, 47.0, 45.0, 41.0, 41.0, 38.0, 32.0, 43.0, 24.0, 33.0, 25.0, 28.0, 14.0, 20.0, 12.0, 11.0, 17.0, 8.0, 5.0, 2.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.163185119628906, -39.7889404296875, -38.41469192504883, -37.04044723510742, -35.66619873046875, -34.291954040527344, -32.91770935058594, -31.543460845947266, -30.16921615600586, -28.79496955871582, -27.42072296142578, -26.046478271484375, -24.672231674194336, -23.297985076904297, -21.923738479614258, -20.54949188232422, -19.17524528503418, -17.80099868774414, -16.4267520904541, -15.052506446838379, -13.678260803222656, -12.304014205932617, -10.929767608642578, -9.555521965026855, -8.181275367736816, -6.8070292472839355, -5.432783126831055, -4.058536529541016, -2.6842904090881348, -1.310044288635254, 0.06420230865478516, 1.4384479522705078, 2.812694549560547, 4.186940670013428, 5.561186790466309, 6.935433387756348, 8.30967903137207, 9.68392562866211, 11.058172225952148, 12.432417869567871, 13.80666446685791, 15.18091106414795, 16.555156707763672, 17.92940330505371, 19.30364990234375, 20.677894592285156, 22.052143096923828, 23.426387786865234, 24.800634384155273, 26.174880981445312, 27.54912757873535, 28.92337417602539, 30.297618865966797, 31.671865463256836, 33.046112060546875, 34.42035675048828, 35.79460525512695, 37.16884994506836, 38.54309844970703, 39.91734313964844, 41.29159164428711, 42.665836334228516, 44.04008483886719, 45.414329528808594, 46.78857421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 13.0, 11.0, 21.0, 22.0, 42.0, 56.0, 60.0, 126.0, 150.0, 209.0, 306.0, 470.0, 677.0, 931.0, 1393.0, 2202.0, 3149.0, 4741.0, 6992.0, 11121.0, 17308.0, 27710.0, 47300.0, 82841.0, 151644.0, 249589.0, 188215.0, 102670.0, 56757.0, 33219.0, 20518.0, 13123.0, 8265.0, 5372.0, 3574.0, 2459.0, 1690.0, 1132.0, 787.0, 523.0, 324.0, 267.0, 172.0, 139.0, 81.0, 59.0, 48.0, 30.0, 22.0, 15.0, 2.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0], "bins": [-18.46875, -17.903564453125, -17.33837890625, -16.773193359375, -16.2080078125, -15.642822265625, -15.07763671875, -14.512451171875, -13.947265625, -13.382080078125, -12.81689453125, -12.251708984375, -11.6865234375, -11.121337890625, -10.55615234375, -9.990966796875, -9.42578125, -8.860595703125, -8.29541015625, -7.730224609375, -7.1650390625, -6.599853515625, -6.03466796875, -5.469482421875, -4.904296875, -4.339111328125, -3.77392578125, -3.208740234375, -2.6435546875, -2.078369140625, -1.51318359375, -0.947998046875, -0.3828125, 0.182373046875, 0.74755859375, 1.312744140625, 1.8779296875, 2.443115234375, 3.00830078125, 3.573486328125, 4.138671875, 4.703857421875, 5.26904296875, 5.834228515625, 6.3994140625, 6.964599609375, 7.52978515625, 8.094970703125, 8.66015625, 9.225341796875, 9.79052734375, 10.355712890625, 10.9208984375, 11.486083984375, 12.05126953125, 12.616455078125, 13.181640625, 13.746826171875, 14.31201171875, 14.877197265625, 15.4423828125, 16.007568359375, 16.57275390625, 17.137939453125, 17.703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 8.0, 7.0, 11.0, 14.0, 13.0, 10.0, 10.0, 25.0, 23.0, 24.0, 31.0, 35.0, 29.0, 38.0, 50.0, 43.0, 45.0, 39.0, 36.0, 37.0, 41.0, 47.0, 58.0, 33.0, 36.0, 37.0, 32.0, 25.0, 28.0, 21.0, 15.0, 14.0, 17.0, 10.0, 6.0, 13.0, 9.0, 5.0, 2.0, 3.0, 3.0, 5.0, 0.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.84375, -39.48291015625, -38.1220703125, -36.76123046875, -35.400390625, -34.03955078125, -32.6787109375, -31.31787109375, -29.95703125, -28.59619140625, -27.2353515625, -25.87451171875, -24.513671875, -23.15283203125, -21.7919921875, -20.43115234375, -19.0703125, -17.70947265625, -16.3486328125, -14.98779296875, -13.626953125, -12.26611328125, -10.9052734375, -9.54443359375, -8.18359375, -6.82275390625, -5.4619140625, -4.10107421875, -2.740234375, -1.37939453125, -0.0185546875, 1.34228515625, 2.703125, 4.06396484375, 5.4248046875, 6.78564453125, 8.146484375, 9.50732421875, 10.8681640625, 12.22900390625, 13.58984375, 14.95068359375, 16.3115234375, 17.67236328125, 19.033203125, 20.39404296875, 21.7548828125, 23.11572265625, 24.4765625, 25.83740234375, 27.1982421875, 28.55908203125, 29.919921875, 31.28076171875, 32.6416015625, 34.00244140625, 35.36328125, 36.72412109375, 38.0849609375, 39.44580078125, 40.806640625, 42.16748046875, 43.5283203125, 44.88916015625, 46.25]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 3.0, 14.0, 13.0, 21.0, 33.0, 46.0, 59.0, 85.0, 148.0, 214.0, 341.0, 571.0, 899.0, 1348.0, 2400.0, 3880.0, 6731.0, 12190.0, 26185.0, 158199.0, 742604.0, 52341.0, 17785.0, 9336.0, 5135.0, 2995.0, 1806.0, 1166.0, 733.0, 442.0, 303.0, 167.0, 132.0, 59.0, 50.0, 46.0, 26.0, 13.0, 10.0, 5.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.28125, -35.22265625, -34.1640625, -33.10546875, -32.046875, -30.98828125, -29.9296875, -28.87109375, -27.8125, -26.75390625, -25.6953125, -24.63671875, -23.578125, -22.51953125, -21.4609375, -20.40234375, -19.34375, -18.28515625, -17.2265625, -16.16796875, -15.109375, -14.05078125, -12.9921875, -11.93359375, -10.875, -9.81640625, -8.7578125, -7.69921875, -6.640625, -5.58203125, -4.5234375, -3.46484375, -2.40625, -1.34765625, -0.2890625, 0.76953125, 1.828125, 2.88671875, 3.9453125, 5.00390625, 6.0625, 7.12109375, 8.1796875, 9.23828125, 10.296875, 11.35546875, 12.4140625, 13.47265625, 14.53125, 15.58984375, 16.6484375, 17.70703125, 18.765625, 19.82421875, 20.8828125, 21.94140625, 23.0, 24.05859375, 25.1171875, 26.17578125, 27.234375, 28.29296875, 29.3515625, 30.41015625, 31.46875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 1.0, 6.0, 4.0, 10.0, 17.0, 10.0, 15.0, 21.0, 15.0, 22.0, 20.0, 34.0, 37.0, 26.0, 40.0, 47.0, 37.0, 36.0, 45.0, 50.0, 46.0, 38.0, 43.0, 46.0, 35.0, 28.0, 40.0, 27.0, 34.0, 31.0, 14.0, 19.0, 18.0, 19.0, 17.0, 15.0, 13.0, 6.0, 4.0, 6.0, 3.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.84375, -28.8251953125, -27.806640625, -26.7880859375, -25.76953125, -24.7509765625, -23.732421875, -22.7138671875, -21.6953125, -20.6767578125, -19.658203125, -18.6396484375, -17.62109375, -16.6025390625, -15.583984375, -14.5654296875, -13.546875, -12.5283203125, -11.509765625, -10.4912109375, -9.47265625, -8.4541015625, -7.435546875, -6.4169921875, -5.3984375, -4.3798828125, -3.361328125, -2.3427734375, -1.32421875, -0.3056640625, 0.712890625, 1.7314453125, 2.75, 3.7685546875, 4.787109375, 5.8056640625, 6.82421875, 7.8427734375, 8.861328125, 9.8798828125, 10.8984375, 11.9169921875, 12.935546875, 13.9541015625, 14.97265625, 15.9912109375, 17.009765625, 18.0283203125, 19.046875, 20.0654296875, 21.083984375, 22.1025390625, 23.12109375, 24.1396484375, 25.158203125, 26.1767578125, 27.1953125, 28.2138671875, 29.232421875, 30.2509765625, 31.26953125, 32.2880859375, 33.306640625, 34.3251953125, 35.34375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 18.0, 20.0, 37.0, 52.0, 60.0, 86.0, 125.0, 174.0, 282.0, 431.0, 728.0, 1230.0, 2253.0, 4399.0, 9206.0, 22871.0, 128126.0, 804883.0, 44743.0, 14834.0, 6411.0, 3205.0, 1740.0, 971.0, 562.0, 377.0, 198.0, 151.0, 106.0, 65.0, 63.0, 35.0, 30.0, 15.0, 15.0, 9.0, 10.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3359375, -3.232574462890625, -3.12921142578125, -3.025848388671875, -2.9224853515625, -2.819122314453125, -2.71575927734375, -2.612396240234375, -2.509033203125, -2.405670166015625, -2.30230712890625, -2.198944091796875, -2.0955810546875, -1.992218017578125, -1.88885498046875, -1.785491943359375, -1.68212890625, -1.578765869140625, -1.47540283203125, -1.372039794921875, -1.2686767578125, -1.165313720703125, -1.06195068359375, -0.958587646484375, -0.855224609375, -0.751861572265625, -0.64849853515625, -0.545135498046875, -0.4417724609375, -0.338409423828125, -0.23504638671875, -0.131683349609375, -0.0283203125, 0.075042724609375, 0.17840576171875, 0.281768798828125, 0.3851318359375, 0.488494873046875, 0.59185791015625, 0.695220947265625, 0.798583984375, 0.901947021484375, 1.00531005859375, 1.108673095703125, 1.2120361328125, 1.315399169921875, 1.41876220703125, 1.522125244140625, 1.62548828125, 1.728851318359375, 1.83221435546875, 1.935577392578125, 2.0389404296875, 2.142303466796875, 2.24566650390625, 2.349029541015625, 2.452392578125, 2.555755615234375, 2.65911865234375, 2.762481689453125, 2.8658447265625, 2.969207763671875, 3.07257080078125, 3.175933837890625, 3.279296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 9.0, 16.0, 23.0, 52.0, 70.0, 108.0, 145.0, 176.0, 124.0, 106.0, 75.0, 40.0, 18.0, 13.0, 9.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006508827209472656, -0.0006280690431594849, -0.0006052553653717041, -0.0005824416875839233, -0.0005596280097961426, -0.0005368143320083618, -0.0005140006542205811, -0.0004911869764328003, -0.00046837329864501953, -0.00044555962085723877, -0.000422745943069458, -0.00039993226528167725, -0.0003771185874938965, -0.0003543049097061157, -0.00033149123191833496, -0.0003086775541305542, -0.00028586387634277344, -0.0002630501985549927, -0.00024023652076721191, -0.00021742284297943115, -0.0001946091651916504, -0.00017179548740386963, -0.00014898180961608887, -0.0001261681318283081, -0.00010335445404052734, -8.054077625274658e-05, -5.772709846496582e-05, -3.491342067718506e-05, -1.2099742889404297e-05, 1.0713934898376465e-05, 3.3527612686157227e-05, 5.634129047393799e-05, 7.915496826171875e-05, 0.00010196864604949951, 0.00012478232383728027, 0.00014759600162506104, 0.0001704096794128418, 0.00019322335720062256, 0.00021603703498840332, 0.00023885071277618408, 0.00026166439056396484, 0.0002844780683517456, 0.00030729174613952637, 0.00033010542392730713, 0.0003529191017150879, 0.00037573277950286865, 0.0003985464572906494, 0.0004213601350784302, 0.00044417381286621094, 0.0004669874906539917, 0.0004898011684417725, 0.0005126148462295532, 0.000535428524017334, 0.0005582422018051147, 0.0005810558795928955, 0.0006038695573806763, 0.000626683235168457, 0.0006494969129562378, 0.0006723105907440186, 0.0006951242685317993, 0.0007179379463195801, 0.0007407516241073608, 0.0007635653018951416, 0.0007863789796829224, 0.0008091926574707031]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 9.0, 9.0, 9.0, 12.0, 15.0, 25.0, 40.0, 52.0, 77.0, 138.0, 151.0, 240.0, 351.0, 468.0, 696.0, 982.0, 1435.0, 2188.0, 3121.0, 4755.0, 7134.0, 10908.0, 16831.0, 27006.0, 44433.0, 75589.0, 133211.0, 211581.0, 202320.0, 121976.0, 70137.0, 40940.0, 24780.0, 15852.0, 10240.0, 6722.0, 4461.0, 3083.0, 2052.0, 1392.0, 1013.0, 659.0, 424.0, 318.0, 245.0, 121.0, 101.0, 82.0, 60.0, 37.0, 30.0, 22.0, 10.0, 9.0, 7.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.13671875, -2.067626953125, -1.99853515625, -1.929443359375, -1.8603515625, -1.791259765625, -1.72216796875, -1.653076171875, -1.583984375, -1.514892578125, -1.44580078125, -1.376708984375, -1.3076171875, -1.238525390625, -1.16943359375, -1.100341796875, -1.03125, -0.962158203125, -0.89306640625, -0.823974609375, -0.7548828125, -0.685791015625, -0.61669921875, -0.547607421875, -0.478515625, -0.409423828125, -0.34033203125, -0.271240234375, -0.2021484375, -0.133056640625, -0.06396484375, 0.005126953125, 0.07421875, 0.143310546875, 0.21240234375, 0.281494140625, 0.3505859375, 0.419677734375, 0.48876953125, 0.557861328125, 0.626953125, 0.696044921875, 0.76513671875, 0.834228515625, 0.9033203125, 0.972412109375, 1.04150390625, 1.110595703125, 1.1796875, 1.248779296875, 1.31787109375, 1.386962890625, 1.4560546875, 1.525146484375, 1.59423828125, 1.663330078125, 1.732421875, 1.801513671875, 1.87060546875, 1.939697265625, 2.0087890625, 2.077880859375, 2.14697265625, 2.216064453125, 2.28515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 2.0, 6.0, 8.0, 5.0, 10.0, 10.0, 11.0, 12.0, 12.0, 21.0, 18.0, 23.0, 28.0, 25.0, 38.0, 37.0, 44.0, 42.0, 70.0, 72.0, 72.0, 68.0, 57.0, 44.0, 41.0, 32.0, 25.0, 23.0, 24.0, 31.0, 10.0, 13.0, 12.0, 11.0, 14.0, 4.0, 2.0, 5.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74658203125, -0.72076416015625, -0.6949462890625, -0.66912841796875, -0.643310546875, -0.61749267578125, -0.5916748046875, -0.56585693359375, -0.5400390625, -0.51422119140625, -0.4884033203125, -0.46258544921875, -0.436767578125, -0.41094970703125, -0.3851318359375, -0.35931396484375, -0.33349609375, -0.30767822265625, -0.2818603515625, -0.25604248046875, -0.230224609375, -0.20440673828125, -0.1785888671875, -0.15277099609375, -0.126953125, -0.10113525390625, -0.0753173828125, -0.04949951171875, -0.023681640625, 0.00213623046875, 0.0279541015625, 0.05377197265625, 0.07958984375, 0.10540771484375, 0.1312255859375, 0.15704345703125, 0.182861328125, 0.20867919921875, 0.2344970703125, 0.26031494140625, 0.2861328125, 0.31195068359375, 0.3377685546875, 0.36358642578125, 0.389404296875, 0.41522216796875, 0.4410400390625, 0.46685791015625, 0.49267578125, 0.51849365234375, 0.5443115234375, 0.57012939453125, 0.595947265625, 0.62176513671875, 0.6475830078125, 0.67340087890625, 0.69921875, 0.72503662109375, 0.7508544921875, 0.77667236328125, 0.802490234375, 0.82830810546875, 0.8541259765625, 0.87994384765625, 0.90576171875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 0.0, 3.0, 7.0, 5.0, 8.0, 9.0, 15.0, 10.0, 11.0, 22.0, 23.0, 37.0, 52.0, 62.0, 61.0, 85.0, 95.0, 92.0, 65.0, 70.0, 54.0, 45.0, 40.0, 39.0, 14.0, 23.0, 15.0, 11.0, 5.0, 3.0, 5.0, 6.0, 1.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.892513275146484, -47.27054977416992, -45.648590087890625, -44.02662658691406, -42.4046630859375, -40.7827033996582, -39.16073989868164, -37.538780212402344, -35.91681671142578, -34.29485321044922, -32.67289352416992, -31.05093002319336, -29.42896842956543, -27.8070068359375, -26.185043334960938, -24.563081741333008, -22.941118240356445, -21.319156646728516, -19.697193145751953, -18.075231552124023, -16.453269958496094, -14.831307411193848, -13.209344863891602, -11.587383270263672, -9.965420722961426, -8.34345817565918, -6.72149658203125, -5.099534034729004, -3.477571964263916, -1.8556098937988281, -0.23364734649658203, 1.3883142471313477, 3.0102767944335938, 4.632238864898682, 6.2542009353637695, 7.876163482666016, 9.498125076293945, 11.120087623596191, 12.742050170898438, 14.364011764526367, 15.985974311828613, 17.60793685913086, 19.22989845275879, 20.85186004638672, 22.47382354736328, 24.09578514099121, 25.71774673461914, 27.339710235595703, 28.961671829223633, 30.583633422851562, 32.205596923828125, 33.82756042480469, 35.449520111083984, 37.07148361206055, 38.693443298339844, 40.315406799316406, 41.93737030029297, 43.55933380126953, 45.18129348754883, 46.80325698852539, 48.42522048950195, 50.04718017578125, 51.66914367675781, 53.291107177734375, 54.91306686401367]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 10.0, 8.0, 12.0, 11.0, 19.0, 16.0, 16.0, 23.0, 25.0, 29.0, 32.0, 34.0, 37.0, 44.0, 52.0, 45.0, 42.0, 32.0, 44.0, 47.0, 47.0, 42.0, 38.0, 37.0, 38.0, 31.0, 29.0, 27.0, 27.0, 13.0, 18.0, 13.0, 11.0, 18.0, 9.0, 3.0, 2.0, 4.0, 3.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.21173858642578, -39.8424186706543, -38.47309494018555, -37.10377502441406, -35.73445510864258, -34.365135192871094, -32.995811462402344, -31.62649154663086, -30.257169723510742, -28.887847900390625, -27.51852798461914, -26.149206161499023, -24.779884338378906, -23.410564422607422, -22.041242599487305, -20.671920776367188, -19.302600860595703, -17.933279037475586, -16.5639591217041, -15.194637298583984, -13.825316429138184, -12.455995559692383, -11.086673736572266, -9.717352867126465, -8.348031997680664, -6.978711128234863, -5.609389781951904, -4.240068435668945, -2.8707475662231445, -1.5014266967773438, -0.13210487365722656, 1.2372159957885742, 2.6065330505371094, 3.9758541584014893, 5.345175266265869, 6.714496612548828, 8.083817481994629, 9.45313835144043, 10.822460174560547, 12.191781044006348, 13.561101913452148, 14.93042278289795, 16.29974365234375, 17.669065475463867, 19.038387298583984, 20.40770721435547, 21.777029037475586, 23.146350860595703, 24.515670776367188, 25.884992599487305, 27.25431251525879, 28.623634338378906, 29.99295425415039, 31.362276077270508, 32.731597900390625, 34.10091781616211, 35.470237731933594, 36.83955764770508, 38.20888137817383, 39.57820129394531, 40.9475212097168, 42.31684112548828, 43.68616485595703, 45.055484771728516, 46.424808502197266]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 13.0, 11.0, 18.0, 34.0, 47.0, 70.0, 87.0, 172.0, 252.0, 365.0, 554.0, 787.0, 1213.0, 1881.0, 2633.0, 4179.0, 6529.0, 10543.0, 16626.0, 26977.0, 44716.0, 77811.0, 143249.0, 238386.0, 202275.0, 111432.0, 61406.0, 36234.0, 22017.0, 13596.0, 8568.0, 5426.0, 3545.0, 2252.0, 1589.0, 1012.0, 726.0, 430.0, 315.0, 208.0, 124.0, 94.0, 50.0, 32.0, 32.0, 15.0, 8.0, 5.0, 7.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.875, -44.38525390625, -42.8955078125, -41.40576171875, -39.916015625, -38.42626953125, -36.9365234375, -35.44677734375, -33.95703125, -32.46728515625, -30.9775390625, -29.48779296875, -27.998046875, -26.50830078125, -25.0185546875, -23.52880859375, -22.0390625, -20.54931640625, -19.0595703125, -17.56982421875, -16.080078125, -14.59033203125, -13.1005859375, -11.61083984375, -10.12109375, -8.63134765625, -7.1416015625, -5.65185546875, -4.162109375, -2.67236328125, -1.1826171875, 0.30712890625, 1.796875, 3.28662109375, 4.7763671875, 6.26611328125, 7.755859375, 9.24560546875, 10.7353515625, 12.22509765625, 13.71484375, 15.20458984375, 16.6943359375, 18.18408203125, 19.673828125, 21.16357421875, 22.6533203125, 24.14306640625, 25.6328125, 27.12255859375, 28.6123046875, 30.10205078125, 31.591796875, 33.08154296875, 34.5712890625, 36.06103515625, 37.55078125, 39.04052734375, 40.5302734375, 42.02001953125, 43.509765625, 44.99951171875, 46.4892578125, 47.97900390625, 49.46875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 13.0, 8.0, 12.0, 17.0, 17.0, 12.0, 21.0, 21.0, 28.0, 22.0, 32.0, 39.0, 48.0, 47.0, 50.0, 39.0, 41.0, 40.0, 40.0, 43.0, 60.0, 29.0, 36.0, 26.0, 42.0, 30.0, 26.0, 20.0, 24.0, 20.0, 20.0, 13.0, 9.0, 6.0, 9.0, 8.0, 3.0, 3.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.5, -38.203125, -36.90625, -35.609375, -34.3125, -33.015625, -31.71875, -30.421875, -29.125, -27.828125, -26.53125, -25.234375, -23.9375, -22.640625, -21.34375, -20.046875, -18.75, -17.453125, -16.15625, -14.859375, -13.5625, -12.265625, -10.96875, -9.671875, -8.375, -7.078125, -5.78125, -4.484375, -3.1875, -1.890625, -0.59375, 0.703125, 2.0, 3.296875, 4.59375, 5.890625, 7.1875, 8.484375, 9.78125, 11.078125, 12.375, 13.671875, 14.96875, 16.265625, 17.5625, 18.859375, 20.15625, 21.453125, 22.75, 24.046875, 25.34375, 26.640625, 27.9375, 29.234375, 30.53125, 31.828125, 33.125, 34.421875, 35.71875, 37.015625, 38.3125, 39.609375, 40.90625, 42.203125, 43.5]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 9.0, 15.0, 20.0, 22.0, 33.0, 51.0, 89.0, 106.0, 152.0, 213.0, 355.0, 446.0, 745.0, 1098.0, 1681.0, 2496.0, 3876.0, 6036.0, 9300.0, 14857.0, 23634.0, 39460.0, 66401.0, 113235.0, 188531.0, 216807.0, 144651.0, 84477.0, 49242.0, 29672.0, 18212.0, 11595.0, 7309.0, 4582.0, 3015.0, 2002.0, 1304.0, 933.0, 577.0, 415.0, 284.0, 181.0, 148.0, 96.0, 68.0, 38.0, 36.0, 22.0, 12.0, 9.0, 5.0, 3.0, 0.0, 1.0, 3.0], "bins": [-53.375, -51.8154296875, -50.255859375, -48.6962890625, -47.13671875, -45.5771484375, -44.017578125, -42.4580078125, -40.8984375, -39.3388671875, -37.779296875, -36.2197265625, -34.66015625, -33.1005859375, -31.541015625, -29.9814453125, -28.421875, -26.8623046875, -25.302734375, -23.7431640625, -22.18359375, -20.6240234375, -19.064453125, -17.5048828125, -15.9453125, -14.3857421875, -12.826171875, -11.2666015625, -9.70703125, -8.1474609375, -6.587890625, -5.0283203125, -3.46875, -1.9091796875, -0.349609375, 1.2099609375, 2.76953125, 4.3291015625, 5.888671875, 7.4482421875, 9.0078125, 10.5673828125, 12.126953125, 13.6865234375, 15.24609375, 16.8056640625, 18.365234375, 19.9248046875, 21.484375, 23.0439453125, 24.603515625, 26.1630859375, 27.72265625, 29.2822265625, 30.841796875, 32.4013671875, 33.9609375, 35.5205078125, 37.080078125, 38.6396484375, 40.19921875, 41.7587890625, 43.318359375, 44.8779296875, 46.4375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 2.0, 9.0, 5.0, 10.0, 11.0, 10.0, 10.0, 7.0, 13.0, 13.0, 8.0, 22.0, 16.0, 32.0, 40.0, 30.0, 27.0, 32.0, 46.0, 41.0, 48.0, 47.0, 34.0, 31.0, 40.0, 38.0, 27.0, 43.0, 39.0, 28.0, 28.0, 30.0, 16.0, 21.0, 23.0, 18.0, 16.0, 13.0, 19.0, 16.0, 8.0, 10.0, 6.0, 4.0, 4.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-25.875, -25.0791015625, -24.283203125, -23.4873046875, -22.69140625, -21.8955078125, -21.099609375, -20.3037109375, -19.5078125, -18.7119140625, -17.916015625, -17.1201171875, -16.32421875, -15.5283203125, -14.732421875, -13.9365234375, -13.140625, -12.3447265625, -11.548828125, -10.7529296875, -9.95703125, -9.1611328125, -8.365234375, -7.5693359375, -6.7734375, -5.9775390625, -5.181640625, -4.3857421875, -3.58984375, -2.7939453125, -1.998046875, -1.2021484375, -0.40625, 0.3896484375, 1.185546875, 1.9814453125, 2.77734375, 3.5732421875, 4.369140625, 5.1650390625, 5.9609375, 6.7568359375, 7.552734375, 8.3486328125, 9.14453125, 9.9404296875, 10.736328125, 11.5322265625, 12.328125, 13.1240234375, 13.919921875, 14.7158203125, 15.51171875, 16.3076171875, 17.103515625, 17.8994140625, 18.6953125, 19.4912109375, 20.287109375, 21.0830078125, 21.87890625, 22.6748046875, 23.470703125, 24.2666015625, 25.0625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 8.0, 9.0, 15.0, 21.0, 26.0, 47.0, 76.0, 61.0, 98.0, 153.0, 227.0, 346.0, 472.0, 773.0, 1094.0, 1693.0, 2703.0, 4318.0, 6887.0, 11244.0, 18874.0, 33375.0, 61340.0, 117326.0, 227908.0, 256274.0, 138319.0, 70837.0, 38361.0, 21979.0, 12616.0, 7686.0, 4654.0, 2930.0, 1881.0, 1235.0, 897.0, 581.0, 414.0, 264.0, 187.0, 104.0, 75.0, 50.0, 33.0, 32.0, 17.0, 13.0, 11.0, 5.0, 9.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-23.828125, -23.108642578125, -22.38916015625, -21.669677734375, -20.9501953125, -20.230712890625, -19.51123046875, -18.791748046875, -18.072265625, -17.352783203125, -16.63330078125, -15.913818359375, -15.1943359375, -14.474853515625, -13.75537109375, -13.035888671875, -12.31640625, -11.596923828125, -10.87744140625, -10.157958984375, -9.4384765625, -8.718994140625, -7.99951171875, -7.280029296875, -6.560546875, -5.841064453125, -5.12158203125, -4.402099609375, -3.6826171875, -2.963134765625, -2.24365234375, -1.524169921875, -0.8046875, -0.085205078125, 0.63427734375, 1.353759765625, 2.0732421875, 2.792724609375, 3.51220703125, 4.231689453125, 4.951171875, 5.670654296875, 6.39013671875, 7.109619140625, 7.8291015625, 8.548583984375, 9.26806640625, 9.987548828125, 10.70703125, 11.426513671875, 12.14599609375, 12.865478515625, 13.5849609375, 14.304443359375, 15.02392578125, 15.743408203125, 16.462890625, 17.182373046875, 17.90185546875, 18.621337890625, 19.3408203125, 20.060302734375, 20.77978515625, 21.499267578125, 22.21875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 5.0, 5.0, 4.0, 8.0, 8.0, 20.0, 18.0, 29.0, 35.0, 32.0, 54.0, 67.0, 85.0, 97.0, 98.0, 89.0, 80.0, 49.0, 54.0, 40.0, 32.0, 22.0, 19.0, 15.0, 6.0, 5.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0025501251220703125, -0.002465665340423584, -0.0023812055587768555, -0.002296745777130127, -0.0022122859954833984, -0.00212782621383667, -0.0020433664321899414, -0.001958906650543213, -0.0018744468688964844, -0.0017899870872497559, -0.0017055273056030273, -0.0016210675239562988, -0.0015366077423095703, -0.0014521479606628418, -0.0013676881790161133, -0.0012832283973693848, -0.0011987686157226562, -0.0011143088340759277, -0.0010298490524291992, -0.0009453892707824707, -0.0008609294891357422, -0.0007764697074890137, -0.0006920099258422852, -0.0006075501441955566, -0.0005230903625488281, -0.0004386305809020996, -0.0003541707992553711, -0.0002697110176086426, -0.00018525123596191406, -0.00010079145431518555, -1.633167266845703e-05, 6.812810897827148e-05, 0.000152587890625, 0.00023704767227172852, 0.00032150745391845703, 0.00040596723556518555, 0.0004904270172119141, 0.0005748867988586426, 0.0006593465805053711, 0.0007438063621520996, 0.0008282661437988281, 0.0009127259254455566, 0.0009971857070922852, 0.0010816454887390137, 0.0011661052703857422, 0.0012505650520324707, 0.0013350248336791992, 0.0014194846153259277, 0.0015039443969726562, 0.0015884041786193848, 0.0016728639602661133, 0.0017573237419128418, 0.0018417835235595703, 0.0019262433052062988, 0.0020107030868530273, 0.002095162868499756, 0.0021796226501464844, 0.002264082431793213, 0.0023485422134399414, 0.00243300199508667, 0.0025174617767333984, 0.002601921558380127, 0.0026863813400268555, 0.002770841121673584, 0.0028553009033203125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 14.0, 8.0, 13.0, 24.0, 34.0, 43.0, 77.0, 133.0, 191.0, 261.0, 430.0, 687.0, 1087.0, 1795.0, 2998.0, 5204.0, 9346.0, 17753.0, 36381.0, 79783.0, 183510.0, 326727.0, 206603.0, 90118.0, 40961.0, 20126.0, 10304.0, 5719.0, 3336.0, 1841.0, 1133.0, 670.0, 428.0, 272.0, 168.0, 113.0, 78.0, 46.0, 32.0, 31.0, 18.0, 13.0, 8.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-24.3125, -23.517333984375, -22.72216796875, -21.927001953125, -21.1318359375, -20.336669921875, -19.54150390625, -18.746337890625, -17.951171875, -17.156005859375, -16.36083984375, -15.565673828125, -14.7705078125, -13.975341796875, -13.18017578125, -12.385009765625, -11.58984375, -10.794677734375, -9.99951171875, -9.204345703125, -8.4091796875, -7.614013671875, -6.81884765625, -6.023681640625, -5.228515625, -4.433349609375, -3.63818359375, -2.843017578125, -2.0478515625, -1.252685546875, -0.45751953125, 0.337646484375, 1.1328125, 1.927978515625, 2.72314453125, 3.518310546875, 4.3134765625, 5.108642578125, 5.90380859375, 6.698974609375, 7.494140625, 8.289306640625, 9.08447265625, 9.879638671875, 10.6748046875, 11.469970703125, 12.26513671875, 13.060302734375, 13.85546875, 14.650634765625, 15.44580078125, 16.240966796875, 17.0361328125, 17.831298828125, 18.62646484375, 19.421630859375, 20.216796875, 21.011962890625, 21.80712890625, 22.602294921875, 23.3974609375, 24.192626953125, 24.98779296875, 25.782958984375, 26.578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 7.0, 10.0, 12.0, 12.0, 21.0, 22.0, 25.0, 37.0, 36.0, 49.0, 43.0, 41.0, 52.0, 60.0, 72.0, 62.0, 63.0, 61.0, 53.0, 30.0, 45.0, 33.0, 29.0, 24.0, 19.0, 18.0, 11.0, 13.0, 6.0, 4.0, 5.0, 2.0, 1.0, 4.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.5703125, -5.372802734375, -5.17529296875, -4.977783203125, -4.7802734375, -4.582763671875, -4.38525390625, -4.187744140625, -3.990234375, -3.792724609375, -3.59521484375, -3.397705078125, -3.2001953125, -3.002685546875, -2.80517578125, -2.607666015625, -2.41015625, -2.212646484375, -2.01513671875, -1.817626953125, -1.6201171875, -1.422607421875, -1.22509765625, -1.027587890625, -0.830078125, -0.632568359375, -0.43505859375, -0.237548828125, -0.0400390625, 0.157470703125, 0.35498046875, 0.552490234375, 0.75, 0.947509765625, 1.14501953125, 1.342529296875, 1.5400390625, 1.737548828125, 1.93505859375, 2.132568359375, 2.330078125, 2.527587890625, 2.72509765625, 2.922607421875, 3.1201171875, 3.317626953125, 3.51513671875, 3.712646484375, 3.91015625, 4.107666015625, 4.30517578125, 4.502685546875, 4.7001953125, 4.897705078125, 5.09521484375, 5.292724609375, 5.490234375, 5.687744140625, 5.88525390625, 6.082763671875, 6.2802734375, 6.477783203125, 6.67529296875, 6.872802734375, 7.0703125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 3.0, 8.0, 13.0, 9.0, 16.0, 17.0, 16.0, 16.0, 29.0, 40.0, 60.0, 55.0, 63.0, 71.0, 80.0, 77.0, 59.0, 65.0, 58.0, 40.0, 34.0, 27.0, 20.0, 30.0, 22.0, 9.0, 16.0, 6.0, 7.0, 5.0, 6.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-40.81684875488281, -39.41847229003906, -38.02009582519531, -36.62171936035156, -35.22334289550781, -33.82497024536133, -32.42659378051758, -31.028217315673828, -29.629840850830078, -28.231464385986328, -26.833087921142578, -25.43471336364746, -24.03633689880371, -22.63796043395996, -21.239585876464844, -19.841209411621094, -18.442832946777344, -17.044456481933594, -15.64608097076416, -14.247705459594727, -12.849328994750977, -11.450952529907227, -10.052577018737793, -8.65420150756836, -7.255825042724609, -5.857449054718018, -4.459073066711426, -3.060697078704834, -1.6623210906982422, -0.2639451026916504, 1.1344308853149414, 2.532806396484375, 3.931182861328125, 5.329558849334717, 6.727934837341309, 8.126310348510742, 9.524686813354492, 10.923063278198242, 12.321438789367676, 13.71981430053711, 15.11819076538086, 16.51656723022461, 17.91494369506836, 19.313318252563477, 20.711694717407227, 22.110071182250977, 23.508445739746094, 24.906822204589844, 26.305198669433594, 27.703575134277344, 29.101951599121094, 30.50032615661621, 31.89870262145996, 33.29707717895508, 34.69545364379883, 36.09383010864258, 37.49220657348633, 38.89058303833008, 40.28895950317383, 41.68733596801758, 43.08570861816406, 44.48408508300781, 45.88246154785156, 47.28083801269531, 48.67921447753906]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 13.0, 15.0, 14.0, 14.0, 20.0, 22.0, 29.0, 15.0, 31.0, 44.0, 28.0, 34.0, 38.0, 52.0, 53.0, 43.0, 37.0, 56.0, 38.0, 46.0, 42.0, 32.0, 33.0, 26.0, 25.0, 31.0, 27.0, 19.0, 16.0, 12.0, 17.0, 13.0, 13.0, 6.0, 6.0, 4.0, 7.0, 6.0, 2.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.6596565246582, -39.28377151489258, -37.90788650512695, -36.53200149536133, -35.1561164855957, -33.78023147583008, -32.40434646606445, -31.028461456298828, -29.652576446533203, -28.276691436767578, -26.900806427001953, -25.524921417236328, -24.149036407470703, -22.773151397705078, -21.397266387939453, -20.021381378173828, -18.64549446105957, -17.269609451293945, -15.89372444152832, -14.517839431762695, -13.14195442199707, -11.766069412231445, -10.390183448791504, -9.014298439025879, -7.638413429260254, -6.262528419494629, -4.886643409729004, -3.5107579231262207, -2.1348729133605957, -0.7589879035949707, 0.6168975830078125, 1.9927825927734375, 3.3686676025390625, 4.7445526123046875, 6.1204376220703125, 7.496323108673096, 8.872207641601562, 10.248092651367188, 11.623978614807129, 12.999863624572754, 14.375748634338379, 15.751633644104004, 17.127519607543945, 18.50340461730957, 19.879289627075195, 21.25517463684082, 22.631059646606445, 24.00694465637207, 25.382829666137695, 26.75871467590332, 28.134599685668945, 29.51048469543457, 30.886369705200195, 32.26225662231445, 33.63814163208008, 35.0140266418457, 36.38991165161133, 37.76579666137695, 39.14168167114258, 40.5175666809082, 41.89345169067383, 43.26933670043945, 44.64522171020508, 46.0211067199707, 47.39699172973633]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 3.0, 2.0, 6.0, 12.0, 15.0, 13.0, 29.0, 42.0, 61.0, 67.0, 110.0, 150.0, 204.0, 344.0, 438.0, 617.0, 947.0, 1337.0, 2026.0, 3041.0, 4918.0, 7871.0, 13667.0, 25896.0, 58326.0, 183117.0, 746151.0, 1911021.0, 885868.0, 214148.0, 65864.0, 28619.0, 15027.0, 8524.0, 5234.0, 3274.0, 2254.0, 1468.0, 1078.0, 696.0, 502.0, 378.0, 255.0, 197.0, 134.0, 93.0, 79.0, 59.0, 31.0, 24.0, 19.0, 8.0, 14.0, 8.0, 5.0, 0.0, 1.0, 3.0, 2.0, 1.0], "bins": [-58.65625, -56.7978515625, -54.939453125, -53.0810546875, -51.22265625, -49.3642578125, -47.505859375, -45.6474609375, -43.7890625, -41.9306640625, -40.072265625, -38.2138671875, -36.35546875, -34.4970703125, -32.638671875, -30.7802734375, -28.921875, -27.0634765625, -25.205078125, -23.3466796875, -21.48828125, -19.6298828125, -17.771484375, -15.9130859375, -14.0546875, -12.1962890625, -10.337890625, -8.4794921875, -6.62109375, -4.7626953125, -2.904296875, -1.0458984375, 0.8125, 2.6708984375, 4.529296875, 6.3876953125, 8.24609375, 10.1044921875, 11.962890625, 13.8212890625, 15.6796875, 17.5380859375, 19.396484375, 21.2548828125, 23.11328125, 24.9716796875, 26.830078125, 28.6884765625, 30.546875, 32.4052734375, 34.263671875, 36.1220703125, 37.98046875, 39.8388671875, 41.697265625, 43.5556640625, 45.4140625, 47.2724609375, 49.130859375, 50.9892578125, 52.84765625, 54.7060546875, 56.564453125, 58.4228515625, 60.28125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 1.0, 0.0, 8.0, 12.0, 4.0, 12.0, 14.0, 14.0, 20.0, 24.0, 21.0, 18.0, 20.0, 31.0, 36.0, 25.0, 37.0, 34.0, 43.0, 47.0, 40.0, 45.0, 46.0, 46.0, 46.0, 36.0, 32.0, 25.0, 35.0, 32.0, 24.0, 25.0, 29.0, 15.0, 20.0, 8.0, 14.0, 12.0, 13.0, 11.0, 8.0, 3.0, 3.0, 1.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-33.625, -32.53173828125, -31.4384765625, -30.34521484375, -29.251953125, -28.15869140625, -27.0654296875, -25.97216796875, -24.87890625, -23.78564453125, -22.6923828125, -21.59912109375, -20.505859375, -19.41259765625, -18.3193359375, -17.22607421875, -16.1328125, -15.03955078125, -13.9462890625, -12.85302734375, -11.759765625, -10.66650390625, -9.5732421875, -8.47998046875, -7.38671875, -6.29345703125, -5.2001953125, -4.10693359375, -3.013671875, -1.92041015625, -0.8271484375, 0.26611328125, 1.359375, 2.45263671875, 3.5458984375, 4.63916015625, 5.732421875, 6.82568359375, 7.9189453125, 9.01220703125, 10.10546875, 11.19873046875, 12.2919921875, 13.38525390625, 14.478515625, 15.57177734375, 16.6650390625, 17.75830078125, 18.8515625, 19.94482421875, 21.0380859375, 22.13134765625, 23.224609375, 24.31787109375, 25.4111328125, 26.50439453125, 27.59765625, 28.69091796875, 29.7841796875, 30.87744140625, 31.970703125, 33.06396484375, 34.1572265625, 35.25048828125, 36.34375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 14.0, 20.0, 13.0, 35.0, 53.0, 69.0, 105.0, 141.0, 203.0, 337.0, 442.0, 672.0, 1058.0, 1753.0, 2682.0, 4142.0, 7292.0, 13045.0, 24272.0, 49422.0, 111165.0, 291219.0, 1005586.0, 1829166.0, 523866.0, 177593.0, 72967.0, 34410.0, 17682.0, 9750.0, 5711.0, 3335.0, 2086.0, 1331.0, 886.0, 590.0, 372.0, 269.0, 172.0, 96.0, 77.0, 64.0, 38.0, 31.0, 13.0, 12.0, 9.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-60.40625, -58.40966796875, -56.4130859375, -54.41650390625, -52.419921875, -50.42333984375, -48.4267578125, -46.43017578125, -44.43359375, -42.43701171875, -40.4404296875, -38.44384765625, -36.447265625, -34.45068359375, -32.4541015625, -30.45751953125, -28.4609375, -26.46435546875, -24.4677734375, -22.47119140625, -20.474609375, -18.47802734375, -16.4814453125, -14.48486328125, -12.48828125, -10.49169921875, -8.4951171875, -6.49853515625, -4.501953125, -2.50537109375, -0.5087890625, 1.48779296875, 3.484375, 5.48095703125, 7.4775390625, 9.47412109375, 11.470703125, 13.46728515625, 15.4638671875, 17.46044921875, 19.45703125, 21.45361328125, 23.4501953125, 25.44677734375, 27.443359375, 29.43994140625, 31.4365234375, 33.43310546875, 35.4296875, 37.42626953125, 39.4228515625, 41.41943359375, 43.416015625, 45.41259765625, 47.4091796875, 49.40576171875, 51.40234375, 53.39892578125, 55.3955078125, 57.39208984375, 59.388671875, 61.38525390625, 63.3818359375, 65.37841796875, 67.375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 0.0, 2.0, 7.0, 6.0, 3.0, 7.0, 7.0, 10.0, 10.0, 18.0, 15.0, 10.0, 26.0, 33.0, 30.0, 50.0, 54.0, 65.0, 79.0, 108.0, 125.0, 154.0, 196.0, 241.0, 326.0, 361.0, 373.0, 346.0, 274.0, 238.0, 164.0, 142.0, 129.0, 88.0, 72.0, 69.0, 46.0, 37.0, 32.0, 16.0, 19.0, 14.0, 15.0, 7.0, 9.0, 4.0, 14.0, 8.0, 4.0, 9.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-15.3203125, -14.8148193359375, -14.309326171875, -13.8038330078125, -13.29833984375, -12.7928466796875, -12.287353515625, -11.7818603515625, -11.2763671875, -10.7708740234375, -10.265380859375, -9.7598876953125, -9.25439453125, -8.7489013671875, -8.243408203125, -7.7379150390625, -7.232421875, -6.7269287109375, -6.221435546875, -5.7159423828125, -5.21044921875, -4.7049560546875, -4.199462890625, -3.6939697265625, -3.1884765625, -2.6829833984375, -2.177490234375, -1.6719970703125, -1.16650390625, -0.6610107421875, -0.155517578125, 0.3499755859375, 0.85546875, 1.3609619140625, 1.866455078125, 2.3719482421875, 2.87744140625, 3.3829345703125, 3.888427734375, 4.3939208984375, 4.8994140625, 5.4049072265625, 5.910400390625, 6.4158935546875, 6.92138671875, 7.4268798828125, 7.932373046875, 8.4378662109375, 8.943359375, 9.4488525390625, 9.954345703125, 10.4598388671875, 10.96533203125, 11.4708251953125, 11.976318359375, 12.4818115234375, 12.9873046875, 13.4927978515625, 13.998291015625, 14.5037841796875, 15.00927734375, 15.5147705078125, 16.020263671875, 16.5257568359375, 17.03125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 6.0, 4.0, 3.0, 3.0, 7.0, 7.0, 12.0, 20.0, 19.0, 33.0, 29.0, 57.0, 59.0, 46.0, 84.0, 95.0, 81.0, 69.0, 74.0, 66.0, 43.0, 44.0, 33.0, 25.0, 17.0, 12.0, 17.0, 10.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.31568908691406, -45.760162353515625, -44.20463562011719, -42.64910888671875, -41.09358596801758, -39.53805923461914, -37.9825325012207, -36.427005767822266, -34.87147903442383, -33.31595230102539, -31.760427474975586, -30.20490074157715, -28.64937400817871, -27.093849182128906, -25.53832244873047, -23.98279571533203, -22.427270889282227, -20.87174415588379, -19.316219329833984, -17.760692596435547, -16.20516586303711, -14.649640083312988, -13.094114303588867, -11.53858757019043, -9.983061790466309, -8.427536010742188, -6.87200927734375, -5.316483497619629, -3.7609572410583496, -2.2054309844970703, -0.6499052047729492, 0.9056215286254883, 2.4611473083496094, 4.016673564910889, 5.572199821472168, 7.127725601196289, 8.683252334594727, 10.238778114318848, 11.794303894042969, 13.349830627441406, 14.905356407165527, 16.46088218688965, 18.016408920288086, 19.57193374633789, 21.127460479736328, 22.682987213134766, 24.238513946533203, 25.79404067993164, 27.349565505981445, 28.905092239379883, 30.460617065429688, 32.016143798828125, 33.57167053222656, 35.127197265625, 36.68272399902344, 38.238250732421875, 39.79377365112305, 41.349300384521484, 42.90482711791992, 44.460350036621094, 46.01587677001953, 47.57140350341797, 49.126930236816406, 50.682456970214844, 52.23798370361328]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 2.0, 6.0, 6.0, 6.0, 13.0, 9.0, 18.0, 22.0, 23.0, 22.0, 35.0, 25.0, 22.0, 31.0, 30.0, 35.0, 39.0, 59.0, 30.0, 48.0, 46.0, 49.0, 43.0, 47.0, 45.0, 36.0, 35.0, 21.0, 24.0, 25.0, 16.0, 23.0, 18.0, 21.0, 16.0, 8.0, 12.0, 7.0, 4.0, 5.0, 7.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.902496337890625, -31.659561157226562, -30.416627883911133, -29.173694610595703, -27.93075942993164, -26.687824249267578, -25.44489097595215, -24.20195770263672, -22.959022521972656, -21.716087341308594, -20.473154067993164, -19.230220794677734, -17.987285614013672, -16.74435043334961, -15.50141716003418, -14.258482933044434, -13.015548706054688, -11.772614479064941, -10.529680252075195, -9.28674602508545, -8.043811798095703, -6.800877571105957, -5.557943344116211, -4.315009117126465, -3.0720748901367188, -1.8291406631469727, -0.5862064361572266, 0.6567277908325195, 1.8996620178222656, 3.1425962448120117, 4.385530471801758, 5.628464698791504, 6.871402740478516, 8.114336967468262, 9.357271194458008, 10.600205421447754, 11.8431396484375, 13.086073875427246, 14.329008102416992, 15.571942329406738, 16.814876556396484, 18.057811737060547, 19.300745010375977, 20.543678283691406, 21.78661346435547, 23.02954864501953, 24.27248191833496, 25.51541519165039, 26.758350372314453, 28.001285552978516, 29.244218826293945, 30.487152099609375, 31.730087280273438, 32.9730224609375, 34.21595764160156, 35.45888900756836, 36.70182418823242, 37.944759368896484, 39.18769073486328, 40.430625915527344, 41.673561096191406, 42.91649627685547, 44.15943145751953, 45.40236282348633, 46.64529800415039]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 6.0, 5.0, 13.0, 16.0, 24.0, 27.0, 42.0, 60.0, 89.0, 130.0, 229.0, 317.0, 518.0, 811.0, 1314.0, 2123.0, 3712.0, 6487.0, 11176.0, 20446.0, 38820.0, 78824.0, 173637.0, 315775.0, 204345.0, 92062.0, 44404.0, 23110.0, 12541.0, 6948.0, 4132.0, 2362.0, 1452.0, 898.0, 595.0, 381.0, 249.0, 139.0, 105.0, 65.0, 42.0, 27.0, 25.0, 13.0, 14.0, 14.0, 6.0, 10.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-18.25, -17.690185546875, -17.13037109375, -16.570556640625, -16.0107421875, -15.450927734375, -14.89111328125, -14.331298828125, -13.771484375, -13.211669921875, -12.65185546875, -12.092041015625, -11.5322265625, -10.972412109375, -10.41259765625, -9.852783203125, -9.29296875, -8.733154296875, -8.17333984375, -7.613525390625, -7.0537109375, -6.493896484375, -5.93408203125, -5.374267578125, -4.814453125, -4.254638671875, -3.69482421875, -3.135009765625, -2.5751953125, -2.015380859375, -1.45556640625, -0.895751953125, -0.3359375, 0.223876953125, 0.78369140625, 1.343505859375, 1.9033203125, 2.463134765625, 3.02294921875, 3.582763671875, 4.142578125, 4.702392578125, 5.26220703125, 5.822021484375, 6.3818359375, 6.941650390625, 7.50146484375, 8.061279296875, 8.62109375, 9.180908203125, 9.74072265625, 10.300537109375, 10.8603515625, 11.420166015625, 11.97998046875, 12.539794921875, 13.099609375, 13.659423828125, 14.21923828125, 14.779052734375, 15.3388671875, 15.898681640625, 16.45849609375, 17.018310546875, 17.578125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 5.0, 5.0, 4.0, 2.0, 6.0, 9.0, 11.0, 20.0, 13.0, 19.0, 18.0, 15.0, 34.0, 20.0, 18.0, 34.0, 28.0, 31.0, 36.0, 42.0, 39.0, 44.0, 38.0, 41.0, 48.0, 40.0, 38.0, 45.0, 32.0, 34.0, 31.0, 19.0, 23.0, 24.0, 24.0, 16.0, 13.0, 17.0, 19.0, 6.0, 8.0, 5.0, 5.0, 5.0, 1.0, 9.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-35.875, -34.69775390625, -33.5205078125, -32.34326171875, -31.166015625, -29.98876953125, -28.8115234375, -27.63427734375, -26.45703125, -25.27978515625, -24.1025390625, -22.92529296875, -21.748046875, -20.57080078125, -19.3935546875, -18.21630859375, -17.0390625, -15.86181640625, -14.6845703125, -13.50732421875, -12.330078125, -11.15283203125, -9.9755859375, -8.79833984375, -7.62109375, -6.44384765625, -5.2666015625, -4.08935546875, -2.912109375, -1.73486328125, -0.5576171875, 0.61962890625, 1.796875, 2.97412109375, 4.1513671875, 5.32861328125, 6.505859375, 7.68310546875, 8.8603515625, 10.03759765625, 11.21484375, 12.39208984375, 13.5693359375, 14.74658203125, 15.923828125, 17.10107421875, 18.2783203125, 19.45556640625, 20.6328125, 21.81005859375, 22.9873046875, 24.16455078125, 25.341796875, 26.51904296875, 27.6962890625, 28.87353515625, 30.05078125, 31.22802734375, 32.4052734375, 33.58251953125, 34.759765625, 35.93701171875, 37.1142578125, 38.29150390625, 39.46875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 7.0, 3.0, 6.0, 7.0, 17.0, 14.0, 21.0, 27.0, 52.0, 74.0, 122.0, 236.0, 431.0, 826.0, 1669.0, 3635.0, 8360.0, 21701.0, 168678.0, 788722.0, 33316.0, 11337.0, 4845.0, 2171.0, 1033.0, 536.0, 279.0, 162.0, 86.0, 53.0, 43.0, 16.0, 16.0, 14.0, 10.0, 5.0, 5.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-44.15625, -42.8642578125, -41.572265625, -40.2802734375, -38.98828125, -37.6962890625, -36.404296875, -35.1123046875, -33.8203125, -32.5283203125, -31.236328125, -29.9443359375, -28.65234375, -27.3603515625, -26.068359375, -24.7763671875, -23.484375, -22.1923828125, -20.900390625, -19.6083984375, -18.31640625, -17.0244140625, -15.732421875, -14.4404296875, -13.1484375, -11.8564453125, -10.564453125, -9.2724609375, -7.98046875, -6.6884765625, -5.396484375, -4.1044921875, -2.8125, -1.5205078125, -0.228515625, 1.0634765625, 2.35546875, 3.6474609375, 4.939453125, 6.2314453125, 7.5234375, 8.8154296875, 10.107421875, 11.3994140625, 12.69140625, 13.9833984375, 15.275390625, 16.5673828125, 17.859375, 19.1513671875, 20.443359375, 21.7353515625, 23.02734375, 24.3193359375, 25.611328125, 26.9033203125, 28.1953125, 29.4873046875, 30.779296875, 32.0712890625, 33.36328125, 34.6552734375, 35.947265625, 37.2392578125, 38.53125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 4.0, 3.0, 9.0, 9.0, 7.0, 14.0, 9.0, 14.0, 11.0, 17.0, 17.0, 19.0, 11.0, 28.0, 23.0, 31.0, 26.0, 41.0, 40.0, 37.0, 36.0, 44.0, 40.0, 42.0, 38.0, 39.0, 35.0, 33.0, 34.0, 37.0, 37.0, 25.0, 23.0, 23.0, 21.0, 20.0, 11.0, 15.0, 9.0, 11.0, 13.0, 4.0, 13.0, 5.0, 6.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.140625, -23.35986328125, -22.5791015625, -21.79833984375, -21.017578125, -20.23681640625, -19.4560546875, -18.67529296875, -17.89453125, -17.11376953125, -16.3330078125, -15.55224609375, -14.771484375, -13.99072265625, -13.2099609375, -12.42919921875, -11.6484375, -10.86767578125, -10.0869140625, -9.30615234375, -8.525390625, -7.74462890625, -6.9638671875, -6.18310546875, -5.40234375, -4.62158203125, -3.8408203125, -3.06005859375, -2.279296875, -1.49853515625, -0.7177734375, 0.06298828125, 0.84375, 1.62451171875, 2.4052734375, 3.18603515625, 3.966796875, 4.74755859375, 5.5283203125, 6.30908203125, 7.08984375, 7.87060546875, 8.6513671875, 9.43212890625, 10.212890625, 10.99365234375, 11.7744140625, 12.55517578125, 13.3359375, 14.11669921875, 14.8974609375, 15.67822265625, 16.458984375, 17.23974609375, 18.0205078125, 18.80126953125, 19.58203125, 20.36279296875, 21.1435546875, 21.92431640625, 22.705078125, 23.48583984375, 24.2666015625, 25.04736328125, 25.828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 10.0, 6.0, 14.0, 23.0, 30.0, 43.0, 67.0, 89.0, 115.0, 204.0, 318.0, 532.0, 928.0, 1708.0, 3678.0, 8761.0, 26070.0, 678643.0, 290017.0, 22149.0, 7871.0, 3288.0, 1620.0, 926.0, 490.0, 312.0, 193.0, 138.0, 89.0, 64.0, 34.0, 25.0, 27.0, 23.0, 14.0, 6.0, 9.0, 5.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.751953125, -3.626617431640625, -3.50128173828125, -3.375946044921875, -3.2506103515625, -3.125274658203125, -2.99993896484375, -2.874603271484375, -2.749267578125, -2.623931884765625, -2.49859619140625, -2.373260498046875, -2.2479248046875, -2.122589111328125, -1.99725341796875, -1.871917724609375, -1.74658203125, -1.621246337890625, -1.49591064453125, -1.370574951171875, -1.2452392578125, -1.119903564453125, -0.99456787109375, -0.869232177734375, -0.743896484375, -0.618560791015625, -0.49322509765625, -0.367889404296875, -0.2425537109375, -0.117218017578125, 0.00811767578125, 0.133453369140625, 0.2587890625, 0.384124755859375, 0.50946044921875, 0.634796142578125, 0.7601318359375, 0.885467529296875, 1.01080322265625, 1.136138916015625, 1.261474609375, 1.386810302734375, 1.51214599609375, 1.637481689453125, 1.7628173828125, 1.888153076171875, 2.01348876953125, 2.138824462890625, 2.26416015625, 2.389495849609375, 2.51483154296875, 2.640167236328125, 2.7655029296875, 2.890838623046875, 3.01617431640625, 3.141510009765625, 3.266845703125, 3.392181396484375, 3.51751708984375, 3.642852783203125, 3.7681884765625, 3.893524169921875, 4.01885986328125, 4.144195556640625, 4.26953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 11.0, 13.0, 19.0, 24.0, 37.0, 41.0, 54.0, 115.0, 129.0, 139.0, 122.0, 77.0, 53.0, 51.0, 34.0, 33.0, 9.0, 13.0, 7.0, 4.0, 1.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005731582641601562, -0.0005593076348304749, -0.0005454570055007935, -0.0005316063761711121, -0.0005177557468414307, -0.0005039051175117493, -0.0004900544881820679, -0.0004762038588523865, -0.0004623532295227051, -0.0004485026001930237, -0.0004346519708633423, -0.0004208013415336609, -0.0004069507122039795, -0.0003931000828742981, -0.0003792494535446167, -0.0003653988242149353, -0.0003515481948852539, -0.0003376975655555725, -0.0003238469362258911, -0.0003099963068962097, -0.0002961456775665283, -0.0002822950482368469, -0.00026844441890716553, -0.00025459378957748413, -0.00024074316024780273, -0.00022689253091812134, -0.00021304190158843994, -0.00019919127225875854, -0.00018534064292907715, -0.00017149001359939575, -0.00015763938426971436, -0.00014378875494003296, -0.00012993812561035156, -0.00011608749628067017, -0.00010223686695098877, -8.838623762130737e-05, -7.453560829162598e-05, -6.068497896194458e-05, -4.6834349632263184e-05, -3.298372030258179e-05, -1.913309097290039e-05, -5.282461643218994e-06, 8.568167686462402e-06, 2.24187970161438e-05, 3.6269426345825195e-05, 5.012005567550659e-05, 6.397068500518799e-05, 7.782131433486938e-05, 9.167194366455078e-05, 0.00010552257299423218, 0.00011937320232391357, 0.00013322383165359497, 0.00014707446098327637, 0.00016092509031295776, 0.00017477571964263916, 0.00018862634897232056, 0.00020247697830200195, 0.00021632760763168335, 0.00023017823696136475, 0.00024402886629104614, 0.00025787949562072754, 0.00027173012495040894, 0.00028558075428009033, 0.00029943138360977173, 0.0003132820129394531]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 8.0, 12.0, 17.0, 29.0, 33.0, 44.0, 92.0, 99.0, 153.0, 217.0, 327.0, 475.0, 720.0, 1118.0, 1706.0, 2522.0, 3947.0, 6447.0, 10731.0, 18287.0, 33631.0, 67960.0, 158767.0, 338785.0, 215670.0, 88827.0, 41959.0, 22062.0, 12638.0, 7738.0, 4825.0, 2991.0, 1935.0, 1262.0, 810.0, 570.0, 347.0, 246.0, 165.0, 112.0, 80.0, 53.0, 44.0, 24.0, 20.0, 11.0, 12.0, 8.0, 6.0, 8.0, 2.0, 1.0, 2.0, 4.0], "bins": [-3.626953125, -3.51922607421875, -3.4114990234375, -3.30377197265625, -3.196044921875, -3.08831787109375, -2.9805908203125, -2.87286376953125, -2.76513671875, -2.65740966796875, -2.5496826171875, -2.44195556640625, -2.334228515625, -2.22650146484375, -2.1187744140625, -2.01104736328125, -1.9033203125, -1.79559326171875, -1.6878662109375, -1.58013916015625, -1.472412109375, -1.36468505859375, -1.2569580078125, -1.14923095703125, -1.04150390625, -0.93377685546875, -0.8260498046875, -0.71832275390625, -0.610595703125, -0.50286865234375, -0.3951416015625, -0.28741455078125, -0.1796875, -0.07196044921875, 0.0357666015625, 0.14349365234375, 0.251220703125, 0.35894775390625, 0.4666748046875, 0.57440185546875, 0.68212890625, 0.78985595703125, 0.8975830078125, 1.00531005859375, 1.113037109375, 1.22076416015625, 1.3284912109375, 1.43621826171875, 1.5439453125, 1.65167236328125, 1.7593994140625, 1.86712646484375, 1.974853515625, 2.08258056640625, 2.1903076171875, 2.29803466796875, 2.40576171875, 2.51348876953125, 2.6212158203125, 2.72894287109375, 2.836669921875, 2.94439697265625, 3.0521240234375, 3.15985107421875, 3.267578125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 11.0, 11.0, 12.0, 17.0, 10.0, 25.0, 35.0, 28.0, 28.0, 43.0, 55.0, 70.0, 59.0, 67.0, 82.0, 57.0, 59.0, 64.0, 42.0, 31.0, 42.0, 28.0, 21.0, 14.0, 13.0, 19.0, 10.0, 6.0, 9.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1142578125, -1.0807647705078125, -1.047271728515625, -1.0137786865234375, -0.98028564453125, -0.9467926025390625, -0.913299560546875, -0.8798065185546875, -0.8463134765625, -0.8128204345703125, -0.779327392578125, -0.7458343505859375, -0.71234130859375, -0.6788482666015625, -0.645355224609375, -0.6118621826171875, -0.578369140625, -0.5448760986328125, -0.511383056640625, -0.4778900146484375, -0.44439697265625, -0.4109039306640625, -0.377410888671875, -0.3439178466796875, -0.3104248046875, -0.2769317626953125, -0.243438720703125, -0.2099456787109375, -0.17645263671875, -0.1429595947265625, -0.109466552734375, -0.0759735107421875, -0.04248046875, -0.0089874267578125, 0.024505615234375, 0.0579986572265625, 0.09149169921875, 0.1249847412109375, 0.158477783203125, 0.1919708251953125, 0.2254638671875, 0.2589569091796875, 0.292449951171875, 0.3259429931640625, 0.35943603515625, 0.3929290771484375, 0.426422119140625, 0.4599151611328125, 0.493408203125, 0.5269012451171875, 0.560394287109375, 0.5938873291015625, 0.62738037109375, 0.6608734130859375, 0.694366455078125, 0.7278594970703125, 0.7613525390625, 0.7948455810546875, 0.828338623046875, 0.8618316650390625, 0.89532470703125, 0.9288177490234375, 0.962310791015625, 0.9958038330078125, 1.029296875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 7.0, 7.0, 9.0, 14.0, 22.0, 22.0, 30.0, 45.0, 43.0, 64.0, 57.0, 79.0, 86.0, 78.0, 74.0, 69.0, 61.0, 51.0, 29.0, 36.0, 19.0, 17.0, 25.0, 11.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 5.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.452972412109375, -41.96217727661133, -40.47138214111328, -38.9805908203125, -37.48979568481445, -35.999000549316406, -34.508209228515625, -33.01741409301758, -31.52661895751953, -30.035823822021484, -28.54503059387207, -27.054237365722656, -25.56344223022461, -24.072647094726562, -22.58185386657715, -21.091060638427734, -19.600265502929688, -18.10947036743164, -16.618677139282227, -15.127882957458496, -13.637088775634766, -12.146294593811035, -10.655500411987305, -9.164706230163574, -7.673912048339844, -6.183117866516113, -4.692323684692383, -3.2015295028686523, -1.7107353210449219, -0.2199411392211914, 1.270853042602539, 2.7616472244262695, 4.25244140625, 5.7432355880737305, 7.234029769897461, 8.724823951721191, 10.215618133544922, 11.706412315368652, 13.197206497192383, 14.688000679016113, 16.178794860839844, 17.66958999633789, 19.160383224487305, 20.65117645263672, 22.141971588134766, 23.632766723632812, 25.123559951782227, 26.61435317993164, 28.105148315429688, 29.595943450927734, 31.08673667907715, 32.57752990722656, 34.06832504272461, 35.559120178222656, 37.04991149902344, 38.540706634521484, 40.03150177001953, 41.52229690551758, 43.013092041015625, 44.503883361816406, 45.99467849731445, 47.4854736328125, 48.97626495361328, 50.46706008911133, 51.957855224609375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 7.0, 3.0, 1.0, 7.0, 6.0, 2.0, 13.0, 13.0, 16.0, 20.0, 23.0, 23.0, 31.0, 25.0, 28.0, 25.0, 29.0, 38.0, 40.0, 52.0, 39.0, 47.0, 42.0, 45.0, 49.0, 47.0, 45.0, 38.0, 33.0, 24.0, 21.0, 21.0, 23.0, 22.0, 16.0, 21.0, 21.0, 8.0, 9.0, 11.0, 2.0, 6.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.65187072753906, -31.42336082458496, -30.19485092163086, -28.966341018676758, -27.737831115722656, -26.509321212768555, -25.280811309814453, -24.05230140686035, -22.82379150390625, -21.59528160095215, -20.366771697998047, -19.138261795043945, -17.909751892089844, -16.681241989135742, -15.45273208618164, -14.224222183227539, -12.995712280273438, -11.767202377319336, -10.538692474365234, -9.310182571411133, -8.081672668457031, -6.85316276550293, -5.624652862548828, -4.396142959594727, -3.167633056640625, -1.9391231536865234, -0.7106132507324219, 0.5178966522216797, 1.7464065551757812, 2.974916458129883, 4.203426361083984, 5.431936264038086, 6.660442352294922, 7.888952255249023, 9.117462158203125, 10.345972061157227, 11.574481964111328, 12.80299186706543, 14.031501770019531, 15.260011672973633, 16.488521575927734, 17.717031478881836, 18.945541381835938, 20.17405128479004, 21.40256118774414, 22.631071090698242, 23.859580993652344, 25.088090896606445, 26.316600799560547, 27.54511070251465, 28.77362060546875, 30.00213050842285, 31.230640411376953, 32.45915222167969, 33.687660217285156, 34.916168212890625, 36.14468002319336, 37.373191833496094, 38.60169982910156, 39.83020782470703, 41.058719635009766, 42.2872314453125, 43.51573944091797, 44.74424743652344, 45.97275924682617]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 9.0, 10.0, 7.0, 33.0, 35.0, 64.0, 99.0, 167.0, 277.0, 435.0, 746.0, 1303.0, 2126.0, 4117.0, 7508.0, 14851.0, 30506.0, 66884.0, 154875.0, 322904.0, 243889.0, 105181.0, 46821.0, 22004.0, 10803.0, 5647.0, 3085.0, 1687.0, 1007.0, 575.0, 368.0, 197.0, 119.0, 81.0, 36.0, 26.0, 18.0, 14.0, 10.0, 6.0, 5.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-75.25, -73.20361328125, -71.1572265625, -69.11083984375, -67.064453125, -65.01806640625, -62.9716796875, -60.92529296875, -58.87890625, -56.83251953125, -54.7861328125, -52.73974609375, -50.693359375, -48.64697265625, -46.6005859375, -44.55419921875, -42.5078125, -40.46142578125, -38.4150390625, -36.36865234375, -34.322265625, -32.27587890625, -30.2294921875, -28.18310546875, -26.13671875, -24.09033203125, -22.0439453125, -19.99755859375, -17.951171875, -15.90478515625, -13.8583984375, -11.81201171875, -9.765625, -7.71923828125, -5.6728515625, -3.62646484375, -1.580078125, 0.46630859375, 2.5126953125, 4.55908203125, 6.60546875, 8.65185546875, 10.6982421875, 12.74462890625, 14.791015625, 16.83740234375, 18.8837890625, 20.93017578125, 22.9765625, 25.02294921875, 27.0693359375, 29.11572265625, 31.162109375, 33.20849609375, 35.2548828125, 37.30126953125, 39.34765625, 41.39404296875, 43.4404296875, 45.48681640625, 47.533203125, 49.57958984375, 51.6259765625, 53.67236328125, 55.71875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 5.0, 6.0, 6.0, 10.0, 15.0, 12.0, 25.0, 22.0, 36.0, 18.0, 26.0, 22.0, 34.0, 44.0, 35.0, 42.0, 47.0, 43.0, 48.0, 51.0, 55.0, 51.0, 55.0, 32.0, 27.0, 26.0, 29.0, 21.0, 21.0, 14.0, 19.0, 20.0, 16.0, 9.0, 15.0, 4.0, 7.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.8125, -33.560546875, -32.30859375, -31.056640625, -29.8046875, -28.552734375, -27.30078125, -26.048828125, -24.796875, -23.544921875, -22.29296875, -21.041015625, -19.7890625, -18.537109375, -17.28515625, -16.033203125, -14.78125, -13.529296875, -12.27734375, -11.025390625, -9.7734375, -8.521484375, -7.26953125, -6.017578125, -4.765625, -3.513671875, -2.26171875, -1.009765625, 0.2421875, 1.494140625, 2.74609375, 3.998046875, 5.25, 6.501953125, 7.75390625, 9.005859375, 10.2578125, 11.509765625, 12.76171875, 14.013671875, 15.265625, 16.517578125, 17.76953125, 19.021484375, 20.2734375, 21.525390625, 22.77734375, 24.029296875, 25.28125, 26.533203125, 27.78515625, 29.037109375, 30.2890625, 31.541015625, 32.79296875, 34.044921875, 35.296875, 36.548828125, 37.80078125, 39.052734375, 40.3046875, 41.556640625, 42.80859375, 44.060546875, 45.3125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 10.0, 2.0, 13.0, 7.0, 34.0, 30.0, 47.0, 74.0, 98.0, 166.0, 239.0, 387.0, 567.0, 890.0, 1241.0, 1929.0, 3060.0, 4689.0, 7419.0, 11180.0, 17479.0, 28533.0, 46317.0, 76366.0, 125803.0, 189591.0, 192491.0, 130976.0, 79728.0, 48235.0, 29572.0, 18356.0, 11687.0, 7439.0, 4729.0, 3115.0, 2044.0, 1422.0, 878.0, 593.0, 384.0, 266.0, 153.0, 116.0, 59.0, 51.0, 30.0, 17.0, 17.0, 15.0, 10.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-43.40625, -42.0078125, -40.609375, -39.2109375, -37.8125, -36.4140625, -35.015625, -33.6171875, -32.21875, -30.8203125, -29.421875, -28.0234375, -26.625, -25.2265625, -23.828125, -22.4296875, -21.03125, -19.6328125, -18.234375, -16.8359375, -15.4375, -14.0390625, -12.640625, -11.2421875, -9.84375, -8.4453125, -7.046875, -5.6484375, -4.25, -2.8515625, -1.453125, -0.0546875, 1.34375, 2.7421875, 4.140625, 5.5390625, 6.9375, 8.3359375, 9.734375, 11.1328125, 12.53125, 13.9296875, 15.328125, 16.7265625, 18.125, 19.5234375, 20.921875, 22.3203125, 23.71875, 25.1171875, 26.515625, 27.9140625, 29.3125, 30.7109375, 32.109375, 33.5078125, 34.90625, 36.3046875, 37.703125, 39.1015625, 40.5, 41.8984375, 43.296875, 44.6953125, 46.09375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 11.0, 8.0, 12.0, 14.0, 12.0, 19.0, 17.0, 20.0, 10.0, 25.0, 24.0, 28.0, 23.0, 33.0, 45.0, 49.0, 38.0, 32.0, 47.0, 36.0, 32.0, 46.0, 43.0, 49.0, 55.0, 35.0, 46.0, 24.0, 22.0, 27.0, 15.0, 20.0, 13.0, 15.0, 15.0, 10.0, 8.0, 10.0, 7.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.90625, -22.07373046875, -21.2412109375, -20.40869140625, -19.576171875, -18.74365234375, -17.9111328125, -17.07861328125, -16.24609375, -15.41357421875, -14.5810546875, -13.74853515625, -12.916015625, -12.08349609375, -11.2509765625, -10.41845703125, -9.5859375, -8.75341796875, -7.9208984375, -7.08837890625, -6.255859375, -5.42333984375, -4.5908203125, -3.75830078125, -2.92578125, -2.09326171875, -1.2607421875, -0.42822265625, 0.404296875, 1.23681640625, 2.0693359375, 2.90185546875, 3.734375, 4.56689453125, 5.3994140625, 6.23193359375, 7.064453125, 7.89697265625, 8.7294921875, 9.56201171875, 10.39453125, 11.22705078125, 12.0595703125, 12.89208984375, 13.724609375, 14.55712890625, 15.3896484375, 16.22216796875, 17.0546875, 17.88720703125, 18.7197265625, 19.55224609375, 20.384765625, 21.21728515625, 22.0498046875, 22.88232421875, 23.71484375, 24.54736328125, 25.3798828125, 26.21240234375, 27.044921875, 27.87744140625, 28.7099609375, 29.54248046875, 30.375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 4.0, 11.0, 12.0, 37.0, 30.0, 46.0, 78.0, 106.0, 149.0, 185.0, 279.0, 386.0, 575.0, 857.0, 1222.0, 1706.0, 2488.0, 3879.0, 5850.0, 9197.0, 14498.0, 23772.0, 40249.0, 69437.0, 124735.0, 219383.0, 222902.0, 127704.0, 70843.0, 41071.0, 24380.0, 14971.0, 9238.0, 5989.0, 3979.0, 2632.0, 1760.0, 1234.0, 846.0, 564.0, 374.0, 273.0, 186.0, 143.0, 104.0, 75.0, 34.0, 36.0, 17.0, 12.0, 8.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0], "bins": [-17.71875, -17.18212890625, -16.6455078125, -16.10888671875, -15.572265625, -15.03564453125, -14.4990234375, -13.96240234375, -13.42578125, -12.88916015625, -12.3525390625, -11.81591796875, -11.279296875, -10.74267578125, -10.2060546875, -9.66943359375, -9.1328125, -8.59619140625, -8.0595703125, -7.52294921875, -6.986328125, -6.44970703125, -5.9130859375, -5.37646484375, -4.83984375, -4.30322265625, -3.7666015625, -3.22998046875, -2.693359375, -2.15673828125, -1.6201171875, -1.08349609375, -0.546875, -0.01025390625, 0.5263671875, 1.06298828125, 1.599609375, 2.13623046875, 2.6728515625, 3.20947265625, 3.74609375, 4.28271484375, 4.8193359375, 5.35595703125, 5.892578125, 6.42919921875, 6.9658203125, 7.50244140625, 8.0390625, 8.57568359375, 9.1123046875, 9.64892578125, 10.185546875, 10.72216796875, 11.2587890625, 11.79541015625, 12.33203125, 12.86865234375, 13.4052734375, 13.94189453125, 14.478515625, 15.01513671875, 15.5517578125, 16.08837890625, 16.625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 10.0, 13.0, 17.0, 19.0, 13.0, 34.0, 44.0, 60.0, 66.0, 70.0, 87.0, 92.0, 91.0, 77.0, 58.0, 48.0, 29.0, 23.0, 18.0, 26.0, 19.0, 13.0, 8.0, 17.0, 6.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.001983642578125, -0.0019261986017227173, -0.0018687546253204346, -0.0018113106489181519, -0.0017538666725158691, -0.0016964226961135864, -0.0016389787197113037, -0.001581534743309021, -0.0015240907669067383, -0.0014666467905044556, -0.0014092028141021729, -0.0013517588376998901, -0.0012943148612976074, -0.0012368708848953247, -0.001179426908493042, -0.0011219829320907593, -0.0010645389556884766, -0.0010070949792861938, -0.0009496510028839111, -0.0008922070264816284, -0.0008347630500793457, -0.000777319073677063, -0.0007198750972747803, -0.0006624311208724976, -0.0006049871444702148, -0.0005475431680679321, -0.0004900991916656494, -0.0004326552152633667, -0.000375211238861084, -0.00031776726245880127, -0.00026032328605651855, -0.00020287930965423584, -0.00014543533325195312, -8.799135684967041e-05, -3.0547380447387695e-05, 2.689659595489502e-05, 8.434057235717773e-05, 0.00014178454875946045, 0.00019922852516174316, 0.0002566725015640259, 0.0003141164779663086, 0.0003715604543685913, 0.000429004430770874, 0.00048644840717315674, 0.0005438923835754395, 0.0006013363599777222, 0.0006587803363800049, 0.0007162243127822876, 0.0007736682891845703, 0.000831112265586853, 0.0008885562419891357, 0.0009460002183914185, 0.0010034441947937012, 0.0010608881711959839, 0.0011183321475982666, 0.0011757761240005493, 0.001233220100402832, 0.0012906640768051147, 0.0013481080532073975, 0.0014055520296096802, 0.0014629960060119629, 0.0015204399824142456, 0.0015778839588165283, 0.001635327935218811, 0.0016927719116210938]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 11.0, 9.0, 11.0, 18.0, 33.0, 40.0, 54.0, 83.0, 130.0, 198.0, 257.0, 390.0, 530.0, 745.0, 1139.0, 1624.0, 2386.0, 3608.0, 5544.0, 8858.0, 14470.0, 22705.0, 37390.0, 65170.0, 114721.0, 207505.0, 234563.0, 135806.0, 75393.0, 43949.0, 25900.0, 16053.0, 10165.0, 6343.0, 4095.0, 2758.0, 1825.0, 1352.0, 848.0, 553.0, 426.0, 269.0, 207.0, 121.0, 88.0, 72.0, 39.0, 28.0, 21.0, 18.0, 15.0, 5.0, 7.0, 2.0, 4.0, 0.0, 3.0, 2.0], "bins": [-16.328125, -15.820068359375, -15.31201171875, -14.803955078125, -14.2958984375, -13.787841796875, -13.27978515625, -12.771728515625, -12.263671875, -11.755615234375, -11.24755859375, -10.739501953125, -10.2314453125, -9.723388671875, -9.21533203125, -8.707275390625, -8.19921875, -7.691162109375, -7.18310546875, -6.675048828125, -6.1669921875, -5.658935546875, -5.15087890625, -4.642822265625, -4.134765625, -3.626708984375, -3.11865234375, -2.610595703125, -2.1025390625, -1.594482421875, -1.08642578125, -0.578369140625, -0.0703125, 0.437744140625, 0.94580078125, 1.453857421875, 1.9619140625, 2.469970703125, 2.97802734375, 3.486083984375, 3.994140625, 4.502197265625, 5.01025390625, 5.518310546875, 6.0263671875, 6.534423828125, 7.04248046875, 7.550537109375, 8.05859375, 8.566650390625, 9.07470703125, 9.582763671875, 10.0908203125, 10.598876953125, 11.10693359375, 11.614990234375, 12.123046875, 12.631103515625, 13.13916015625, 13.647216796875, 14.1552734375, 14.663330078125, 15.17138671875, 15.679443359375, 16.1875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 5.0, 12.0, 13.0, 7.0, 15.0, 15.0, 19.0, 17.0, 30.0, 33.0, 45.0, 30.0, 44.0, 38.0, 61.0, 65.0, 54.0, 63.0, 51.0, 55.0, 56.0, 39.0, 41.0, 37.0, 25.0, 21.0, 18.0, 21.0, 13.0, 12.0, 11.0, 0.0, 5.0, 2.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.90625, -6.70880126953125, -6.5113525390625, -6.31390380859375, -6.116455078125, -5.91900634765625, -5.7215576171875, -5.52410888671875, -5.32666015625, -5.12921142578125, -4.9317626953125, -4.73431396484375, -4.536865234375, -4.33941650390625, -4.1419677734375, -3.94451904296875, -3.7470703125, -3.54962158203125, -3.3521728515625, -3.15472412109375, -2.957275390625, -2.75982666015625, -2.5623779296875, -2.36492919921875, -2.16748046875, -1.97003173828125, -1.7725830078125, -1.57513427734375, -1.377685546875, -1.18023681640625, -0.9827880859375, -0.78533935546875, -0.587890625, -0.39044189453125, -0.1929931640625, 0.00445556640625, 0.201904296875, 0.39935302734375, 0.5968017578125, 0.79425048828125, 0.99169921875, 1.18914794921875, 1.3865966796875, 1.58404541015625, 1.781494140625, 1.97894287109375, 2.1763916015625, 2.37384033203125, 2.5712890625, 2.76873779296875, 2.9661865234375, 3.16363525390625, 3.361083984375, 3.55853271484375, 3.7559814453125, 3.95343017578125, 4.15087890625, 4.34832763671875, 4.5457763671875, 4.74322509765625, 4.940673828125, 5.13812255859375, 5.3355712890625, 5.53302001953125, 5.73046875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 6.0, 7.0, 12.0, 16.0, 16.0, 11.0, 27.0, 26.0, 41.0, 48.0, 54.0, 58.0, 63.0, 57.0, 72.0, 67.0, 67.0, 52.0, 61.0, 56.0, 28.0, 33.0, 29.0, 13.0, 14.0, 15.0, 10.0, 7.0, 4.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.03135299682617, -37.67646408081055, -36.32157516479492, -34.9666862487793, -33.61180114746094, -32.25691223144531, -30.902023315429688, -29.547134399414062, -28.192245483398438, -26.837356567382812, -25.482467651367188, -24.127580642700195, -22.77269172668457, -21.417802810668945, -20.062915802001953, -18.708026885986328, -17.353137969970703, -15.998249053955078, -14.64336109161377, -13.288473129272461, -11.933584213256836, -10.578695297241211, -9.223807334899902, -7.868919372558594, -6.514030456542969, -5.159142017364502, -3.804253578186035, -2.4493651390075684, -1.0944766998291016, 0.26041173934936523, 1.615300178527832, 2.9701881408691406, 4.3250732421875, 5.679961681365967, 7.034850120544434, 8.389738082885742, 9.744626998901367, 11.099515914916992, 12.4544038772583, 13.80929183959961, 15.164180755615234, 16.51906967163086, 17.873958587646484, 19.228845596313477, 20.5837345123291, 21.938623428344727, 23.29351043701172, 24.648399353027344, 26.00328826904297, 27.358177185058594, 28.71306610107422, 30.06795310974121, 31.422842025756836, 32.77772903442383, 34.13261795043945, 35.48750686645508, 36.8423957824707, 38.19728469848633, 39.55217361450195, 40.90706253051758, 42.26194763183594, 43.61683654785156, 44.97172546386719, 46.32661437988281, 47.68150329589844]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 6.0, 11.0, 8.0, 8.0, 11.0, 14.0, 20.0, 23.0, 19.0, 25.0, 24.0, 22.0, 34.0, 43.0, 46.0, 41.0, 33.0, 55.0, 44.0, 49.0, 40.0, 43.0, 41.0, 43.0, 39.0, 41.0, 30.0, 26.0, 26.0, 22.0, 14.0, 14.0, 12.0, 13.0, 14.0, 7.0, 8.0, 10.0, 7.0, 2.0, 7.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.6940803527832, -32.41613006591797, -31.138179779052734, -29.8602294921875, -28.582279205322266, -27.30432891845703, -26.026378631591797, -24.748428344726562, -23.470478057861328, -22.192527770996094, -20.91457748413086, -19.636627197265625, -18.35867691040039, -17.080726623535156, -15.802775382995605, -14.524825096130371, -13.24687385559082, -11.968923568725586, -10.690973281860352, -9.413022994995117, -8.135072708129883, -6.85712194442749, -5.579171180725098, -4.301220893859863, -3.023270606994629, -1.745320200920105, -0.46736979484558105, 0.8105807304382324, 2.088531017303467, 3.366481304168701, 4.644432067871094, 5.922382354736328, 7.2003326416015625, 8.478282928466797, 9.756233215332031, 11.034183502197266, 12.3121337890625, 13.590084075927734, 14.868035316467285, 16.145984649658203, 17.423934936523438, 18.701885223388672, 19.979835510253906, 21.25778579711914, 22.535736083984375, 23.81368637084961, 25.091636657714844, 26.369586944580078, 27.647539138793945, 28.92548942565918, 30.203439712524414, 31.48138999938965, 32.759342193603516, 34.03729248046875, 35.315242767333984, 36.59319305419922, 37.87114334106445, 39.14909362792969, 40.42704391479492, 41.704994201660156, 42.98294448852539, 44.260894775390625, 45.53884506225586, 46.816795349121094, 48.09474563598633]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 15.0, 10.0, 16.0, 30.0, 47.0, 54.0, 94.0, 118.0, 183.0, 271.0, 388.0, 546.0, 910.0, 1372.0, 2258.0, 3877.0, 6655.0, 12272.0, 24811.0, 55763.0, 170156.0, 673337.0, 1882934.0, 983074.0, 237535.0, 72358.0, 30041.0, 15019.0, 7973.0, 4540.0, 2740.0, 1664.0, 1062.0, 702.0, 467.0, 339.0, 212.0, 128.0, 100.0, 64.0, 42.0, 42.0, 20.0, 8.0, 9.0, 9.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-62.28125, -60.4296875, -58.578125, -56.7265625, -54.875, -53.0234375, -51.171875, -49.3203125, -47.46875, -45.6171875, -43.765625, -41.9140625, -40.0625, -38.2109375, -36.359375, -34.5078125, -32.65625, -30.8046875, -28.953125, -27.1015625, -25.25, -23.3984375, -21.546875, -19.6953125, -17.84375, -15.9921875, -14.140625, -12.2890625, -10.4375, -8.5859375, -6.734375, -4.8828125, -3.03125, -1.1796875, 0.671875, 2.5234375, 4.375, 6.2265625, 8.078125, 9.9296875, 11.78125, 13.6328125, 15.484375, 17.3359375, 19.1875, 21.0390625, 22.890625, 24.7421875, 26.59375, 28.4453125, 30.296875, 32.1484375, 34.0, 35.8515625, 37.703125, 39.5546875, 41.40625, 43.2578125, 45.109375, 46.9609375, 48.8125, 50.6640625, 52.515625, 54.3671875, 56.21875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 9.0, 12.0, 6.0, 12.0, 23.0, 27.0, 29.0, 24.0, 23.0, 32.0, 35.0, 40.0, 43.0, 56.0, 46.0, 57.0, 60.0, 56.0, 43.0, 39.0, 44.0, 46.0, 41.0, 35.0, 19.0, 28.0, 18.0, 17.0, 7.0, 12.0, 11.0, 11.0, 6.0, 11.0, 7.0, 0.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.359375, -30.170166015625, -28.98095703125, -27.791748046875, -26.6025390625, -25.413330078125, -24.22412109375, -23.034912109375, -21.845703125, -20.656494140625, -19.46728515625, -18.278076171875, -17.0888671875, -15.899658203125, -14.71044921875, -13.521240234375, -12.33203125, -11.142822265625, -9.95361328125, -8.764404296875, -7.5751953125, -6.385986328125, -5.19677734375, -4.007568359375, -2.818359375, -1.629150390625, -0.43994140625, 0.749267578125, 1.9384765625, 3.127685546875, 4.31689453125, 5.506103515625, 6.6953125, 7.884521484375, 9.07373046875, 10.262939453125, 11.4521484375, 12.641357421875, 13.83056640625, 15.019775390625, 16.208984375, 17.398193359375, 18.58740234375, 19.776611328125, 20.9658203125, 22.155029296875, 23.34423828125, 24.533447265625, 25.72265625, 26.911865234375, 28.10107421875, 29.290283203125, 30.4794921875, 31.668701171875, 32.85791015625, 34.047119140625, 35.236328125, 36.425537109375, 37.61474609375, 38.803955078125, 39.9931640625, 41.182373046875, 42.37158203125, 43.560791015625, 44.75]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 9.0, 12.0, 19.0, 21.0, 23.0, 46.0, 55.0, 67.0, 118.0, 155.0, 237.0, 341.0, 470.0, 807.0, 1080.0, 1692.0, 2515.0, 4055.0, 6663.0, 11179.0, 19277.0, 34181.0, 64264.0, 127191.0, 277685.0, 705874.0, 1558648.0, 780701.0, 303262.0, 137564.0, 68539.0, 36184.0, 20321.0, 11727.0, 6958.0, 4247.0, 2750.0, 1773.0, 1128.0, 760.0, 502.0, 349.0, 252.0, 165.0, 136.0, 76.0, 53.0, 54.0, 29.0, 24.0, 15.0, 15.0, 9.0, 3.0, 2.0, 2.0, 5.0], "bins": [-50.0625, -48.5703125, -47.078125, -45.5859375, -44.09375, -42.6015625, -41.109375, -39.6171875, -38.125, -36.6328125, -35.140625, -33.6484375, -32.15625, -30.6640625, -29.171875, -27.6796875, -26.1875, -24.6953125, -23.203125, -21.7109375, -20.21875, -18.7265625, -17.234375, -15.7421875, -14.25, -12.7578125, -11.265625, -9.7734375, -8.28125, -6.7890625, -5.296875, -3.8046875, -2.3125, -0.8203125, 0.671875, 2.1640625, 3.65625, 5.1484375, 6.640625, 8.1328125, 9.625, 11.1171875, 12.609375, 14.1015625, 15.59375, 17.0859375, 18.578125, 20.0703125, 21.5625, 23.0546875, 24.546875, 26.0390625, 27.53125, 29.0234375, 30.515625, 32.0078125, 33.5, 34.9921875, 36.484375, 37.9765625, 39.46875, 40.9609375, 42.453125, 43.9453125, 45.4375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 7.0, 8.0, 15.0, 16.0, 15.0, 22.0, 27.0, 35.0, 47.0, 43.0, 50.0, 58.0, 79.0, 99.0, 105.0, 150.0, 181.0, 216.0, 288.0, 351.0, 358.0, 338.0, 271.0, 236.0, 195.0, 155.0, 119.0, 107.0, 83.0, 79.0, 68.0, 45.0, 46.0, 31.0, 16.0, 30.0, 20.0, 15.0, 7.0, 10.0, 3.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.5703125, -15.1063232421875, -14.642333984375, -14.1783447265625, -13.71435546875, -13.2503662109375, -12.786376953125, -12.3223876953125, -11.8583984375, -11.3944091796875, -10.930419921875, -10.4664306640625, -10.00244140625, -9.5384521484375, -9.074462890625, -8.6104736328125, -8.146484375, -7.6824951171875, -7.218505859375, -6.7545166015625, -6.29052734375, -5.8265380859375, -5.362548828125, -4.8985595703125, -4.4345703125, -3.9705810546875, -3.506591796875, -3.0426025390625, -2.57861328125, -2.1146240234375, -1.650634765625, -1.1866455078125, -0.72265625, -0.2586669921875, 0.205322265625, 0.6693115234375, 1.13330078125, 1.5972900390625, 2.061279296875, 2.5252685546875, 2.9892578125, 3.4532470703125, 3.917236328125, 4.3812255859375, 4.84521484375, 5.3092041015625, 5.773193359375, 6.2371826171875, 6.701171875, 7.1651611328125, 7.629150390625, 8.0931396484375, 8.55712890625, 9.0211181640625, 9.485107421875, 9.9490966796875, 10.4130859375, 10.8770751953125, 11.341064453125, 11.8050537109375, 12.26904296875, 12.7330322265625, 13.197021484375, 13.6610107421875, 14.125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 8.0, 6.0, 8.0, 10.0, 5.0, 15.0, 16.0, 28.0, 25.0, 30.0, 36.0, 54.0, 49.0, 52.0, 54.0, 58.0, 68.0, 67.0, 57.0, 47.0, 48.0, 35.0, 40.0, 25.0, 21.0, 31.0, 19.0, 12.0, 16.0, 9.0, 6.0, 8.0, 7.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.71540832519531, -33.58159255981445, -32.447776794433594, -31.313961029052734, -30.180145263671875, -29.046329498291016, -27.912513732910156, -26.778697967529297, -25.644882202148438, -24.511066436767578, -23.37725067138672, -22.24343490600586, -21.109619140625, -19.97580337524414, -18.84198760986328, -17.708171844482422, -16.574356079101562, -15.440540313720703, -14.306724548339844, -13.172908782958984, -12.039093017578125, -10.905277252197266, -9.771461486816406, -8.637645721435547, -7.5038299560546875, -6.370014190673828, -5.236198425292969, -4.102382659912109, -2.96856689453125, -1.8347511291503906, -0.7009353637695312, 0.4328804016113281, 1.5666961669921875, 2.700511932373047, 3.8343276977539062, 4.968143463134766, 6.101959228515625, 7.235774993896484, 8.369590759277344, 9.503406524658203, 10.637222290039062, 11.771038055419922, 12.904853820800781, 14.03866958618164, 15.1724853515625, 16.30630111694336, 17.44011688232422, 18.573932647705078, 19.707748413085938, 20.841564178466797, 21.975379943847656, 23.109195709228516, 24.243011474609375, 25.376827239990234, 26.510643005371094, 27.644458770751953, 28.778274536132812, 29.912090301513672, 31.04590606689453, 32.17972183227539, 33.31353759765625, 34.44735336303711, 35.58116912841797, 36.71498489379883, 37.84880065917969]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 3.0, 3.0, 8.0, 14.0, 4.0, 14.0, 18.0, 13.0, 21.0, 19.0, 26.0, 27.0, 38.0, 31.0, 29.0, 39.0, 41.0, 39.0, 36.0, 48.0, 46.0, 43.0, 33.0, 41.0, 43.0, 31.0, 37.0, 28.0, 33.0, 24.0, 26.0, 20.0, 22.0, 12.0, 13.0, 14.0, 12.0, 6.0, 7.0, 3.0, 4.0, 9.0, 7.0, 6.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.75595474243164, -31.653465270996094, -30.550975799560547, -29.448486328125, -28.345996856689453, -27.243507385253906, -26.141016006469727, -25.03852653503418, -23.936037063598633, -22.833547592163086, -21.73105812072754, -20.628568649291992, -19.526077270507812, -18.423587799072266, -17.32109832763672, -16.218608856201172, -15.116119384765625, -14.013629913330078, -12.911140441894531, -11.808650016784668, -10.706160545349121, -9.603671073913574, -8.501180648803711, -7.398691177368164, -6.296201705932617, -5.19371223449707, -4.091222286224365, -2.9887325763702393, -1.8862428665161133, -0.7837533950805664, 0.31873655319213867, 1.4212265014648438, 2.5237159729003906, 3.6262056827545166, 4.728695392608643, 5.831185340881348, 6.9336748123168945, 8.036164283752441, 9.138654708862305, 10.241144180297852, 11.343633651733398, 12.446123123168945, 13.548612594604492, 14.651103019714355, 15.753592491149902, 16.856082916259766, 17.958572387695312, 19.06106185913086, 20.163551330566406, 21.266040802001953, 22.3685302734375, 23.471019744873047, 24.573509216308594, 25.67599868774414, 26.77849006652832, 27.880979537963867, 28.983469009399414, 30.08595848083496, 31.188447952270508, 32.29093933105469, 33.393428802490234, 34.49591827392578, 35.59840774536133, 36.700897216796875, 37.80338668823242]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 6.0, 6.0, 10.0, 8.0, 28.0, 27.0, 52.0, 63.0, 82.0, 139.0, 171.0, 251.0, 351.0, 451.0, 713.0, 1007.0, 1336.0, 1984.0, 2834.0, 4151.0, 5975.0, 8587.0, 13076.0, 19378.0, 29539.0, 46727.0, 75129.0, 126231.0, 211514.0, 192758.0, 113088.0, 67511.0, 42345.0, 27286.0, 17657.0, 11840.0, 8156.0, 5422.0, 3792.0, 2609.0, 1825.0, 1329.0, 889.0, 635.0, 475.0, 335.0, 242.0, 156.0, 124.0, 79.0, 42.0, 44.0, 41.0, 18.0, 19.0, 10.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-9.828125, -9.510009765625, -9.19189453125, -8.873779296875, -8.5556640625, -8.237548828125, -7.91943359375, -7.601318359375, -7.283203125, -6.965087890625, -6.64697265625, -6.328857421875, -6.0107421875, -5.692626953125, -5.37451171875, -5.056396484375, -4.73828125, -4.420166015625, -4.10205078125, -3.783935546875, -3.4658203125, -3.147705078125, -2.82958984375, -2.511474609375, -2.193359375, -1.875244140625, -1.55712890625, -1.239013671875, -0.9208984375, -0.602783203125, -0.28466796875, 0.033447265625, 0.3515625, 0.669677734375, 0.98779296875, 1.305908203125, 1.6240234375, 1.942138671875, 2.26025390625, 2.578369140625, 2.896484375, 3.214599609375, 3.53271484375, 3.850830078125, 4.1689453125, 4.487060546875, 4.80517578125, 5.123291015625, 5.44140625, 5.759521484375, 6.07763671875, 6.395751953125, 6.7138671875, 7.031982421875, 7.35009765625, 7.668212890625, 7.986328125, 8.304443359375, 8.62255859375, 8.940673828125, 9.2587890625, 9.576904296875, 9.89501953125, 10.213134765625, 10.53125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 7.0, 11.0, 8.0, 21.0, 10.0, 11.0, 19.0, 20.0, 27.0, 29.0, 31.0, 37.0, 28.0, 41.0, 29.0, 36.0, 47.0, 43.0, 47.0, 42.0, 35.0, 47.0, 27.0, 41.0, 39.0, 28.0, 40.0, 30.0, 19.0, 23.0, 15.0, 20.0, 15.0, 7.0, 12.0, 4.0, 8.0, 7.0, 6.0, 6.0, 6.0, 3.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.625, -34.5029296875, -33.380859375, -32.2587890625, -31.13671875, -30.0146484375, -28.892578125, -27.7705078125, -26.6484375, -25.5263671875, -24.404296875, -23.2822265625, -22.16015625, -21.0380859375, -19.916015625, -18.7939453125, -17.671875, -16.5498046875, -15.427734375, -14.3056640625, -13.18359375, -12.0615234375, -10.939453125, -9.8173828125, -8.6953125, -7.5732421875, -6.451171875, -5.3291015625, -4.20703125, -3.0849609375, -1.962890625, -0.8408203125, 0.28125, 1.4033203125, 2.525390625, 3.6474609375, 4.76953125, 5.8916015625, 7.013671875, 8.1357421875, 9.2578125, 10.3798828125, 11.501953125, 12.6240234375, 13.74609375, 14.8681640625, 15.990234375, 17.1123046875, 18.234375, 19.3564453125, 20.478515625, 21.6005859375, 22.72265625, 23.8447265625, 24.966796875, 26.0888671875, 27.2109375, 28.3330078125, 29.455078125, 30.5771484375, 31.69921875, 32.8212890625, 33.943359375, 35.0654296875, 36.1875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 8.0, 5.0, 6.0, 20.0, 21.0, 36.0, 40.0, 74.0, 100.0, 148.0, 193.0, 306.0, 454.0, 731.0, 1182.0, 2040.0, 3597.0, 6853.0, 13393.0, 32143.0, 527019.0, 401775.0, 30298.0, 12946.0, 6453.0, 3488.0, 1980.0, 1105.0, 699.0, 452.0, 292.0, 191.0, 135.0, 94.0, 80.0, 43.0, 29.0, 24.0, 28.0, 11.0, 9.0, 14.0, 7.0, 6.0, 2.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-26.296875, -25.474365234375, -24.65185546875, -23.829345703125, -23.0068359375, -22.184326171875, -21.36181640625, -20.539306640625, -19.716796875, -18.894287109375, -18.07177734375, -17.249267578125, -16.4267578125, -15.604248046875, -14.78173828125, -13.959228515625, -13.13671875, -12.314208984375, -11.49169921875, -10.669189453125, -9.8466796875, -9.024169921875, -8.20166015625, -7.379150390625, -6.556640625, -5.734130859375, -4.91162109375, -4.089111328125, -3.2666015625, -2.444091796875, -1.62158203125, -0.799072265625, 0.0234375, 0.845947265625, 1.66845703125, 2.490966796875, 3.3134765625, 4.135986328125, 4.95849609375, 5.781005859375, 6.603515625, 7.426025390625, 8.24853515625, 9.071044921875, 9.8935546875, 10.716064453125, 11.53857421875, 12.361083984375, 13.18359375, 14.006103515625, 14.82861328125, 15.651123046875, 16.4736328125, 17.296142578125, 18.11865234375, 18.941162109375, 19.763671875, 20.586181640625, 21.40869140625, 22.231201171875, 23.0537109375, 23.876220703125, 24.69873046875, 25.521240234375, 26.34375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 3.0, 5.0, 4.0, 5.0, 9.0, 4.0, 9.0, 10.0, 18.0, 14.0, 5.0, 27.0, 24.0, 20.0, 30.0, 22.0, 43.0, 48.0, 28.0, 45.0, 34.0, 40.0, 38.0, 39.0, 29.0, 29.0, 40.0, 35.0, 44.0, 25.0, 32.0, 28.0, 34.0, 22.0, 28.0, 19.0, 17.0, 13.0, 16.0, 18.0, 10.0, 12.0, 7.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-24.203125, -23.479248046875, -22.75537109375, -22.031494140625, -21.3076171875, -20.583740234375, -19.85986328125, -19.135986328125, -18.412109375, -17.688232421875, -16.96435546875, -16.240478515625, -15.5166015625, -14.792724609375, -14.06884765625, -13.344970703125, -12.62109375, -11.897216796875, -11.17333984375, -10.449462890625, -9.7255859375, -9.001708984375, -8.27783203125, -7.553955078125, -6.830078125, -6.106201171875, -5.38232421875, -4.658447265625, -3.9345703125, -3.210693359375, -2.48681640625, -1.762939453125, -1.0390625, -0.315185546875, 0.40869140625, 1.132568359375, 1.8564453125, 2.580322265625, 3.30419921875, 4.028076171875, 4.751953125, 5.475830078125, 6.19970703125, 6.923583984375, 7.6474609375, 8.371337890625, 9.09521484375, 9.819091796875, 10.54296875, 11.266845703125, 11.99072265625, 12.714599609375, 13.4384765625, 14.162353515625, 14.88623046875, 15.610107421875, 16.333984375, 17.057861328125, 17.78173828125, 18.505615234375, 19.2294921875, 19.953369140625, 20.67724609375, 21.401123046875, 22.125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 9.0, 6.0, 19.0, 22.0, 30.0, 44.0, 71.0, 62.0, 121.0, 146.0, 221.0, 365.0, 615.0, 1188.0, 2424.0, 5755.0, 15321.0, 67207.0, 892786.0, 40788.0, 12002.0, 4548.0, 2073.0, 1048.0, 624.0, 352.0, 248.0, 136.0, 87.0, 50.0, 43.0, 27.0, 26.0, 20.0, 15.0, 11.0, 13.0, 4.0, 4.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8046875, -2.709228515625, -2.61376953125, -2.518310546875, -2.4228515625, -2.327392578125, -2.23193359375, -2.136474609375, -2.041015625, -1.945556640625, -1.85009765625, -1.754638671875, -1.6591796875, -1.563720703125, -1.46826171875, -1.372802734375, -1.27734375, -1.181884765625, -1.08642578125, -0.990966796875, -0.8955078125, -0.800048828125, -0.70458984375, -0.609130859375, -0.513671875, -0.418212890625, -0.32275390625, -0.227294921875, -0.1318359375, -0.036376953125, 0.05908203125, 0.154541015625, 0.25, 0.345458984375, 0.44091796875, 0.536376953125, 0.6318359375, 0.727294921875, 0.82275390625, 0.918212890625, 1.013671875, 1.109130859375, 1.20458984375, 1.300048828125, 1.3955078125, 1.490966796875, 1.58642578125, 1.681884765625, 1.77734375, 1.872802734375, 1.96826171875, 2.063720703125, 2.1591796875, 2.254638671875, 2.35009765625, 2.445556640625, 2.541015625, 2.636474609375, 2.73193359375, 2.827392578125, 2.9228515625, 3.018310546875, 3.11376953125, 3.209228515625, 3.3046875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 2.0, 3.0, 5.0, 3.0, 7.0, 6.0, 2.0, 14.0, 9.0, 13.0, 13.0, 26.0, 26.0, 33.0, 41.0, 41.0, 62.0, 63.0, 83.0, 65.0, 68.0, 67.0, 66.0, 56.0, 44.0, 23.0, 32.0, 20.0, 17.0, 19.0, 13.0, 16.0, 13.0, 11.0, 8.0, 3.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016009807586669922, -0.00015516020357608795, -0.00015022233128547668, -0.00014528445899486542, -0.00014034658670425415, -0.00013540871441364288, -0.00013047084212303162, -0.00012553296983242035, -0.00012059509754180908, -0.00011565722525119781, -0.00011071935296058655, -0.00010578148066997528, -0.00010084360837936401, -9.590573608875275e-05, -9.096786379814148e-05, -8.602999150753021e-05, -8.109211921691895e-05, -7.615424692630768e-05, -7.121637463569641e-05, -6.627850234508514e-05, -6.134063005447388e-05, -5.640275776386261e-05, -5.146488547325134e-05, -4.6527013182640076e-05, -4.158914089202881e-05, -3.665126860141754e-05, -3.1713396310806274e-05, -2.6775524020195007e-05, -2.183765172958374e-05, -1.6899779438972473e-05, -1.1961907148361206e-05, -7.024034857749939e-06, -2.086162567138672e-06, 2.8517097234725952e-06, 7.789582014083862e-06, 1.272745430469513e-05, 1.7665326595306396e-05, 2.2603198885917664e-05, 2.754107117652893e-05, 3.24789434671402e-05, 3.7416815757751465e-05, 4.235468804836273e-05, 4.7292560338974e-05, 5.2230432629585266e-05, 5.716830492019653e-05, 6.21061772108078e-05, 6.704404950141907e-05, 7.198192179203033e-05, 7.69197940826416e-05, 8.185766637325287e-05, 8.679553866386414e-05, 9.17334109544754e-05, 9.667128324508667e-05, 0.00010160915553569794, 0.0001065470278263092, 0.00011148490011692047, 0.00011642277240753174, 0.000121360644698143, 0.00012629851698875427, 0.00013123638927936554, 0.0001361742615699768, 0.00014111213386058807, 0.00014605000615119934, 0.0001509878784418106, 0.00015592575073242188]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 10.0, 16.0, 32.0, 28.0, 36.0, 78.0, 101.0, 154.0, 204.0, 312.0, 414.0, 611.0, 919.0, 1348.0, 1906.0, 2783.0, 4188.0, 6459.0, 10162.0, 16405.0, 27944.0, 51127.0, 104035.0, 237867.0, 295683.0, 134853.0, 63588.0, 33994.0, 19064.0, 11764.0, 7418.0, 4847.0, 3389.0, 2160.0, 1511.0, 988.0, 624.0, 456.0, 329.0, 234.0, 163.0, 118.0, 59.0, 50.0, 49.0, 31.0, 11.0, 12.0, 2.0, 4.0, 5.0, 6.0, 0.0, 3.0], "bins": [-2.93359375, -2.84771728515625, -2.7618408203125, -2.67596435546875, -2.590087890625, -2.50421142578125, -2.4183349609375, -2.33245849609375, -2.24658203125, -2.16070556640625, -2.0748291015625, -1.98895263671875, -1.903076171875, -1.81719970703125, -1.7313232421875, -1.64544677734375, -1.5595703125, -1.47369384765625, -1.3878173828125, -1.30194091796875, -1.216064453125, -1.13018798828125, -1.0443115234375, -0.95843505859375, -0.87255859375, -0.78668212890625, -0.7008056640625, -0.61492919921875, -0.529052734375, -0.44317626953125, -0.3572998046875, -0.27142333984375, -0.185546875, -0.09967041015625, -0.0137939453125, 0.07208251953125, 0.157958984375, 0.24383544921875, 0.3297119140625, 0.41558837890625, 0.50146484375, 0.58734130859375, 0.6732177734375, 0.75909423828125, 0.844970703125, 0.93084716796875, 1.0167236328125, 1.10260009765625, 1.1884765625, 1.27435302734375, 1.3602294921875, 1.44610595703125, 1.531982421875, 1.61785888671875, 1.7037353515625, 1.78961181640625, 1.87548828125, 1.96136474609375, 2.0472412109375, 2.13311767578125, 2.218994140625, 2.30487060546875, 2.3907470703125, 2.47662353515625, 2.5625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 1.0, 4.0, 4.0, 8.0, 3.0, 4.0, 7.0, 7.0, 12.0, 12.0, 18.0, 25.0, 23.0, 37.0, 44.0, 63.0, 83.0, 111.0, 87.0, 96.0, 72.0, 47.0, 58.0, 41.0, 22.0, 27.0, 12.0, 12.0, 6.0, 9.0, 7.0, 4.0, 8.0, 6.0, 5.0, 1.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0361328125, -1.0007476806640625, -0.965362548828125, -0.9299774169921875, -0.89459228515625, -0.8592071533203125, -0.823822021484375, -0.7884368896484375, -0.7530517578125, -0.7176666259765625, -0.682281494140625, -0.6468963623046875, -0.61151123046875, -0.5761260986328125, -0.540740966796875, -0.5053558349609375, -0.469970703125, -0.4345855712890625, -0.399200439453125, -0.3638153076171875, -0.32843017578125, -0.2930450439453125, -0.257659912109375, -0.2222747802734375, -0.1868896484375, -0.1515045166015625, -0.116119384765625, -0.0807342529296875, -0.04534912109375, -0.0099639892578125, 0.025421142578125, 0.0608062744140625, 0.09619140625, 0.1315765380859375, 0.166961669921875, 0.2023468017578125, 0.23773193359375, 0.2731170654296875, 0.308502197265625, 0.3438873291015625, 0.3792724609375, 0.4146575927734375, 0.450042724609375, 0.4854278564453125, 0.52081298828125, 0.5561981201171875, 0.591583251953125, 0.6269683837890625, 0.662353515625, 0.6977386474609375, 0.733123779296875, 0.7685089111328125, 0.80389404296875, 0.8392791748046875, 0.874664306640625, 0.9100494384765625, 0.9454345703125, 0.9808197021484375, 1.016204833984375, 1.0515899658203125, 1.08697509765625, 1.1223602294921875, 1.157745361328125, 1.1931304931640625, 1.228515625]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 8.0, 8.0, 8.0, 7.0, 11.0, 17.0, 30.0, 27.0, 30.0, 38.0, 47.0, 61.0, 60.0, 62.0, 63.0, 55.0, 72.0, 68.0, 54.0, 43.0, 39.0, 29.0, 22.0, 24.0, 23.0, 17.0, 15.0, 6.0, 10.0, 12.0, 5.0, 6.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.98853302001953, -34.8026237487793, -33.61671447753906, -32.43080520629883, -31.244897842407227, -30.058988571166992, -28.87308120727539, -27.687171936035156, -26.501262664794922, -25.315353393554688, -24.129444122314453, -22.94353675842285, -21.757627487182617, -20.571718215942383, -19.38581085205078, -18.199901580810547, -17.013992309570312, -15.828083038330078, -14.64217472076416, -13.456266403198242, -12.270357131958008, -11.084447860717773, -9.898539543151855, -8.712631225585938, -7.526721954345703, -6.340813159942627, -5.154904365539551, -3.9689955711364746, -2.7830867767333984, -1.5971779823303223, -0.4112691879272461, 0.7746391296386719, 1.9605522155761719, 3.146461009979248, 4.332369804382324, 5.5182785987854, 6.704187393188477, 7.890096187591553, 9.076004981994629, 10.261913299560547, 11.447822570800781, 12.633731842041016, 13.819640159606934, 15.005548477172852, 16.191457748413086, 17.37736701965332, 18.563274383544922, 19.749183654785156, 20.93509292602539, 22.121002197265625, 23.30691146850586, 24.49281883239746, 25.678728103637695, 26.86463737487793, 28.05054473876953, 29.236454010009766, 30.42236328125, 31.608272552490234, 32.79418182373047, 33.9800910949707, 35.16600036621094, 36.351905822753906, 37.53781509399414, 38.723724365234375, 39.90963363647461]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 6.0, 4.0, 3.0, 5.0, 8.0, 12.0, 3.0, 14.0, 17.0, 18.0, 20.0, 20.0, 28.0, 26.0, 37.0, 30.0, 29.0, 37.0, 45.0, 37.0, 37.0, 45.0, 46.0, 38.0, 40.0, 41.0, 39.0, 34.0, 32.0, 30.0, 33.0, 22.0, 28.0, 21.0, 22.0, 13.0, 14.0, 13.0, 9.0, 9.0, 6.0, 4.0, 3.0, 9.0, 7.0, 4.0, 6.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.0479621887207, -30.97037124633789, -29.892780303955078, -28.815189361572266, -27.737598419189453, -26.66000747680664, -25.582416534423828, -24.504825592041016, -23.427234649658203, -22.34964370727539, -21.272052764892578, -20.194461822509766, -19.116870880126953, -18.03927993774414, -16.961688995361328, -15.884098052978516, -14.806507110595703, -13.72891616821289, -12.651325225830078, -11.573734283447266, -10.496143341064453, -9.41855239868164, -8.340961456298828, -7.263370513916016, -6.185779571533203, -5.108188629150391, -4.030597686767578, -2.9530067443847656, -1.8754158020019531, -0.7978248596191406, 0.2797660827636719, 1.3573570251464844, 2.4349517822265625, 3.512542724609375, 4.5901336669921875, 5.667724609375, 6.7453155517578125, 7.822906494140625, 8.900497436523438, 9.97808837890625, 11.055679321289062, 12.133270263671875, 13.210861206054688, 14.2884521484375, 15.366043090820312, 16.443634033203125, 17.521224975585938, 18.59881591796875, 19.676406860351562, 20.753997802734375, 21.831588745117188, 22.9091796875, 23.986770629882812, 25.064361572265625, 26.141952514648438, 27.21954345703125, 28.297134399414062, 29.374725341796875, 30.452316284179688, 31.5299072265625, 32.60749816894531, 33.685089111328125, 34.76268005371094, 35.84027099609375, 36.91786193847656]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 10.0, 14.0, 24.0, 25.0, 55.0, 78.0, 108.0, 181.0, 320.0, 542.0, 806.0, 1169.0, 1992.0, 2976.0, 4706.0, 7568.0, 12784.0, 21044.0, 36227.0, 63725.0, 112983.0, 195324.0, 231253.0, 151071.0, 85556.0, 47987.0, 27550.0, 16320.0, 9937.0, 5910.0, 3628.0, 2413.0, 1496.0, 1006.0, 643.0, 437.0, 240.0, 153.0, 97.0, 85.0, 42.0, 25.0, 21.0, 14.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-49.625, -48.21728515625, -46.8095703125, -45.40185546875, -43.994140625, -42.58642578125, -41.1787109375, -39.77099609375, -38.36328125, -36.95556640625, -35.5478515625, -34.14013671875, -32.732421875, -31.32470703125, -29.9169921875, -28.50927734375, -27.1015625, -25.69384765625, -24.2861328125, -22.87841796875, -21.470703125, -20.06298828125, -18.6552734375, -17.24755859375, -15.83984375, -14.43212890625, -13.0244140625, -11.61669921875, -10.208984375, -8.80126953125, -7.3935546875, -5.98583984375, -4.578125, -3.17041015625, -1.7626953125, -0.35498046875, 1.052734375, 2.46044921875, 3.8681640625, 5.27587890625, 6.68359375, 8.09130859375, 9.4990234375, 10.90673828125, 12.314453125, 13.72216796875, 15.1298828125, 16.53759765625, 17.9453125, 19.35302734375, 20.7607421875, 22.16845703125, 23.576171875, 24.98388671875, 26.3916015625, 27.79931640625, 29.20703125, 30.61474609375, 32.0224609375, 33.43017578125, 34.837890625, 36.24560546875, 37.6533203125, 39.06103515625, 40.46875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 6.0, 6.0, 4.0, 5.0, 9.0, 14.0, 12.0, 17.0, 14.0, 19.0, 25.0, 33.0, 31.0, 26.0, 26.0, 40.0, 33.0, 51.0, 47.0, 54.0, 38.0, 42.0, 47.0, 28.0, 51.0, 38.0, 33.0, 30.0, 30.0, 29.0, 24.0, 19.0, 23.0, 16.0, 10.0, 11.0, 10.0, 9.0, 3.0, 10.0, 2.0, 3.0, 7.0, 6.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.296875, -29.207763671875, -28.11865234375, -27.029541015625, -25.9404296875, -24.851318359375, -23.76220703125, -22.673095703125, -21.583984375, -20.494873046875, -19.40576171875, -18.316650390625, -17.2275390625, -16.138427734375, -15.04931640625, -13.960205078125, -12.87109375, -11.781982421875, -10.69287109375, -9.603759765625, -8.5146484375, -7.425537109375, -6.33642578125, -5.247314453125, -4.158203125, -3.069091796875, -1.97998046875, -0.890869140625, 0.1982421875, 1.287353515625, 2.37646484375, 3.465576171875, 4.5546875, 5.643798828125, 6.73291015625, 7.822021484375, 8.9111328125, 10.000244140625, 11.08935546875, 12.178466796875, 13.267578125, 14.356689453125, 15.44580078125, 16.534912109375, 17.6240234375, 18.713134765625, 19.80224609375, 20.891357421875, 21.98046875, 23.069580078125, 24.15869140625, 25.247802734375, 26.3369140625, 27.426025390625, 28.51513671875, 29.604248046875, 30.693359375, 31.782470703125, 32.87158203125, 33.960693359375, 35.0498046875, 36.138916015625, 37.22802734375, 38.317138671875, 39.40625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 8.0, 4.0, 5.0, 10.0, 11.0, 25.0, 27.0, 41.0, 68.0, 85.0, 142.0, 162.0, 252.0, 392.0, 595.0, 894.0, 1332.0, 2003.0, 3028.0, 4697.0, 7156.0, 11090.0, 17479.0, 28178.0, 46157.0, 76520.0, 124968.0, 185068.0, 190530.0, 133524.0, 81537.0, 49319.0, 30399.0, 18855.0, 11763.0, 7711.0, 4899.0, 3253.0, 2141.0, 1379.0, 940.0, 635.0, 402.0, 255.0, 177.0, 143.0, 92.0, 62.0, 54.0, 39.0, 16.0, 12.0, 9.0, 5.0, 4.0, 5.0, 2.0, 4.0, 5.0], "bins": [-40.59375, -39.3662109375, -38.138671875, -36.9111328125, -35.68359375, -34.4560546875, -33.228515625, -32.0009765625, -30.7734375, -29.5458984375, -28.318359375, -27.0908203125, -25.86328125, -24.6357421875, -23.408203125, -22.1806640625, -20.953125, -19.7255859375, -18.498046875, -17.2705078125, -16.04296875, -14.8154296875, -13.587890625, -12.3603515625, -11.1328125, -9.9052734375, -8.677734375, -7.4501953125, -6.22265625, -4.9951171875, -3.767578125, -2.5400390625, -1.3125, -0.0849609375, 1.142578125, 2.3701171875, 3.59765625, 4.8251953125, 6.052734375, 7.2802734375, 8.5078125, 9.7353515625, 10.962890625, 12.1904296875, 13.41796875, 14.6455078125, 15.873046875, 17.1005859375, 18.328125, 19.5556640625, 20.783203125, 22.0107421875, 23.23828125, 24.4658203125, 25.693359375, 26.9208984375, 28.1484375, 29.3759765625, 30.603515625, 31.8310546875, 33.05859375, 34.2861328125, 35.513671875, 36.7412109375, 37.96875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 5.0, 6.0, 10.0, 9.0, 11.0, 15.0, 11.0, 17.0, 21.0, 26.0, 14.0, 25.0, 32.0, 28.0, 33.0, 33.0, 33.0, 33.0, 50.0, 48.0, 35.0, 43.0, 43.0, 36.0, 37.0, 33.0, 45.0, 30.0, 31.0, 43.0, 17.0, 16.0, 13.0, 18.0, 23.0, 12.0, 9.0, 6.0, 11.0, 7.0, 9.0, 3.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-20.5, -19.858642578125, -19.21728515625, -18.575927734375, -17.9345703125, -17.293212890625, -16.65185546875, -16.010498046875, -15.369140625, -14.727783203125, -14.08642578125, -13.445068359375, -12.8037109375, -12.162353515625, -11.52099609375, -10.879638671875, -10.23828125, -9.596923828125, -8.95556640625, -8.314208984375, -7.6728515625, -7.031494140625, -6.39013671875, -5.748779296875, -5.107421875, -4.466064453125, -3.82470703125, -3.183349609375, -2.5419921875, -1.900634765625, -1.25927734375, -0.617919921875, 0.0234375, 0.664794921875, 1.30615234375, 1.947509765625, 2.5888671875, 3.230224609375, 3.87158203125, 4.512939453125, 5.154296875, 5.795654296875, 6.43701171875, 7.078369140625, 7.7197265625, 8.361083984375, 9.00244140625, 9.643798828125, 10.28515625, 10.926513671875, 11.56787109375, 12.209228515625, 12.8505859375, 13.491943359375, 14.13330078125, 14.774658203125, 15.416015625, 16.057373046875, 16.69873046875, 17.340087890625, 17.9814453125, 18.622802734375, 19.26416015625, 19.905517578125, 20.546875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 9.0, 13.0, 21.0, 29.0, 40.0, 73.0, 88.0, 120.0, 150.0, 246.0, 308.0, 486.0, 674.0, 955.0, 1317.0, 1961.0, 2640.0, 4087.0, 6266.0, 9471.0, 14908.0, 24482.0, 42440.0, 77394.0, 146513.0, 253581.0, 204876.0, 108618.0, 58063.0, 33170.0, 19460.0, 12057.0, 7731.0, 5004.0, 3416.0, 2349.0, 1635.0, 1165.0, 814.0, 550.0, 419.0, 266.0, 199.0, 139.0, 100.0, 69.0, 57.0, 48.0, 24.0, 18.0, 13.0, 9.0, 3.0, 6.0, 4.0, 1.0, 3.0, 1.0], "bins": [-14.0234375, -13.58203125, -13.140625, -12.69921875, -12.2578125, -11.81640625, -11.375, -10.93359375, -10.4921875, -10.05078125, -9.609375, -9.16796875, -8.7265625, -8.28515625, -7.84375, -7.40234375, -6.9609375, -6.51953125, -6.078125, -5.63671875, -5.1953125, -4.75390625, -4.3125, -3.87109375, -3.4296875, -2.98828125, -2.546875, -2.10546875, -1.6640625, -1.22265625, -0.78125, -0.33984375, 0.1015625, 0.54296875, 0.984375, 1.42578125, 1.8671875, 2.30859375, 2.75, 3.19140625, 3.6328125, 4.07421875, 4.515625, 4.95703125, 5.3984375, 5.83984375, 6.28125, 6.72265625, 7.1640625, 7.60546875, 8.046875, 8.48828125, 8.9296875, 9.37109375, 9.8125, 10.25390625, 10.6953125, 11.13671875, 11.578125, 12.01953125, 12.4609375, 12.90234375, 13.34375, 13.78515625, 14.2265625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 11.0, 14.0, 13.0, 26.0, 28.0, 45.0, 43.0, 70.0, 84.0, 108.0, 139.0, 105.0, 79.0, 55.0, 51.0, 32.0, 18.0, 16.0, 13.0, 9.0, 7.0, 4.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.002300262451171875, -0.002229154109954834, -0.002158045768737793, -0.002086937427520752, -0.002015829086303711, -0.00194472074508667, -0.001873612403869629, -0.0018025040626525879, -0.0017313957214355469, -0.0016602873802185059, -0.0015891790390014648, -0.0015180706977844238, -0.0014469623565673828, -0.0013758540153503418, -0.0013047456741333008, -0.0012336373329162598, -0.0011625289916992188, -0.0010914206504821777, -0.0010203123092651367, -0.0009492039680480957, -0.0008780956268310547, -0.0008069872856140137, -0.0007358789443969727, -0.0006647706031799316, -0.0005936622619628906, -0.0005225539207458496, -0.0004514455795288086, -0.0003803372383117676, -0.00030922889709472656, -0.00023812055587768555, -0.00016701221466064453, -9.590387344360352e-05, -2.47955322265625e-05, 4.6312808990478516e-05, 0.00011742115020751953, 0.00018852949142456055, 0.00025963783264160156, 0.0003307461738586426, 0.0004018545150756836, 0.0004729628562927246, 0.0005440711975097656, 0.0006151795387268066, 0.0006862878799438477, 0.0007573962211608887, 0.0008285045623779297, 0.0008996129035949707, 0.0009707212448120117, 0.0010418295860290527, 0.0011129379272460938, 0.0011840462684631348, 0.0012551546096801758, 0.0013262629508972168, 0.0013973712921142578, 0.0014684796333312988, 0.0015395879745483398, 0.0016106963157653809, 0.0016818046569824219, 0.0017529129981994629, 0.001824021339416504, 0.001895129680633545, 0.001966238021850586, 0.002037346363067627, 0.002108454704284668, 0.002179563045501709, 0.00225067138671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 0.0, 8.0, 10.0, 7.0, 9.0, 22.0, 32.0, 41.0, 63.0, 99.0, 124.0, 185.0, 285.0, 393.0, 609.0, 860.0, 1255.0, 1855.0, 2970.0, 4642.0, 7141.0, 11557.0, 18840.0, 32022.0, 57034.0, 106907.0, 207248.0, 261874.0, 148407.0, 77263.0, 42258.0, 24262.0, 14575.0, 9013.0, 5682.0, 3669.0, 2422.0, 1612.0, 1083.0, 670.0, 490.0, 344.0, 222.0, 148.0, 111.0, 83.0, 52.0, 28.0, 24.0, 16.0, 14.0, 6.0, 5.0, 5.0, 8.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-14.5703125, -14.10400390625, -13.6376953125, -13.17138671875, -12.705078125, -12.23876953125, -11.7724609375, -11.30615234375, -10.83984375, -10.37353515625, -9.9072265625, -9.44091796875, -8.974609375, -8.50830078125, -8.0419921875, -7.57568359375, -7.109375, -6.64306640625, -6.1767578125, -5.71044921875, -5.244140625, -4.77783203125, -4.3115234375, -3.84521484375, -3.37890625, -2.91259765625, -2.4462890625, -1.97998046875, -1.513671875, -1.04736328125, -0.5810546875, -0.11474609375, 0.3515625, 0.81787109375, 1.2841796875, 1.75048828125, 2.216796875, 2.68310546875, 3.1494140625, 3.61572265625, 4.08203125, 4.54833984375, 5.0146484375, 5.48095703125, 5.947265625, 6.41357421875, 6.8798828125, 7.34619140625, 7.8125, 8.27880859375, 8.7451171875, 9.21142578125, 9.677734375, 10.14404296875, 10.6103515625, 11.07666015625, 11.54296875, 12.00927734375, 12.4755859375, 12.94189453125, 13.408203125, 13.87451171875, 14.3408203125, 14.80712890625, 15.2734375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 6.0, 9.0, 8.0, 7.0, 11.0, 11.0, 16.0, 25.0, 16.0, 22.0, 31.0, 35.0, 72.0, 53.0, 80.0, 89.0, 79.0, 73.0, 55.0, 56.0, 55.0, 32.0, 18.0, 25.0, 24.0, 19.0, 17.0, 10.0, 5.0, 6.0, 10.0, 7.0, 5.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.26171875, -6.05865478515625, -5.8555908203125, -5.65252685546875, -5.449462890625, -5.24639892578125, -5.0433349609375, -4.84027099609375, -4.63720703125, -4.43414306640625, -4.2310791015625, -4.02801513671875, -3.824951171875, -3.62188720703125, -3.4188232421875, -3.21575927734375, -3.0126953125, -2.80963134765625, -2.6065673828125, -2.40350341796875, -2.200439453125, -1.99737548828125, -1.7943115234375, -1.59124755859375, -1.38818359375, -1.18511962890625, -0.9820556640625, -0.77899169921875, -0.575927734375, -0.37286376953125, -0.1697998046875, 0.03326416015625, 0.236328125, 0.43939208984375, 0.6424560546875, 0.84552001953125, 1.048583984375, 1.25164794921875, 1.4547119140625, 1.65777587890625, 1.86083984375, 2.06390380859375, 2.2669677734375, 2.47003173828125, 2.673095703125, 2.87615966796875, 3.0792236328125, 3.28228759765625, 3.4853515625, 3.68841552734375, 3.8914794921875, 4.09454345703125, 4.297607421875, 4.50067138671875, 4.7037353515625, 4.90679931640625, 5.10986328125, 5.31292724609375, 5.5159912109375, 5.71905517578125, 5.922119140625, 6.12518310546875, 6.3282470703125, 6.53131103515625, 6.734375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 12.0, 12.0, 13.0, 24.0, 23.0, 33.0, 50.0, 48.0, 69.0, 70.0, 67.0, 75.0, 96.0, 72.0, 58.0, 60.0, 49.0, 30.0, 23.0, 23.0, 22.0, 13.0, 17.0, 7.0, 7.0, 4.0, 2.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.99857711791992, -38.51227951049805, -37.02598571777344, -35.53968811035156, -34.05339431762695, -32.56709671020508, -31.080801010131836, -29.594505310058594, -28.10820770263672, -26.621912002563477, -25.135616302490234, -23.64931869506836, -22.163022994995117, -20.676727294921875, -19.190431594848633, -17.70413589477539, -16.21784019470215, -14.731544494628906, -13.245247840881348, -11.758952140808105, -10.272655487060547, -8.786359786987305, -7.3000640869140625, -5.813767433166504, -4.327471733093262, -2.8411755561828613, -1.35487961769104, 0.13141632080078125, 1.6177124977111816, 3.104008674621582, 4.590304374694824, 6.076601028442383, 7.562896728515625, 9.049192428588867, 10.535489082336426, 12.021784782409668, 13.508081436157227, 14.994377136230469, 16.48067283630371, 17.966968536376953, 19.453266143798828, 20.93956184387207, 22.425857543945312, 23.912155151367188, 25.39845085144043, 26.884746551513672, 28.371042251586914, 29.857337951660156, 31.3436336517334, 32.82992935180664, 34.316226959228516, 35.802520751953125, 37.288818359375, 38.775115966796875, 40.261409759521484, 41.74770736694336, 43.23400115966797, 44.720298767089844, 46.20659255981445, 47.69289016723633, 49.17918395996094, 50.66548156738281, 52.15177917480469, 53.6380729675293, 55.12437057495117]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 5.0, 8.0, 9.0, 12.0, 13.0, 12.0, 12.0, 17.0, 23.0, 20.0, 30.0, 24.0, 36.0, 34.0, 36.0, 29.0, 33.0, 43.0, 39.0, 47.0, 34.0, 41.0, 52.0, 46.0, 32.0, 30.0, 32.0, 32.0, 27.0, 20.0, 23.0, 21.0, 14.0, 15.0, 26.0, 12.0, 11.0, 4.0, 6.0, 6.0, 6.0, 9.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.39145851135254, -28.269893646240234, -27.14832878112793, -26.026763916015625, -24.905197143554688, -23.783632278442383, -22.662067413330078, -21.540502548217773, -20.41893768310547, -19.297372817993164, -18.17580795288086, -17.054241180419922, -15.932676315307617, -14.811111450195312, -13.689546585083008, -12.567981719970703, -11.446414947509766, -10.324850082397461, -9.20328426361084, -8.081719398498535, -6.960154056549072, -5.838588714599609, -4.717023849487305, -3.595458507537842, -2.473893165588379, -1.3523279428482056, -0.23076272010803223, 0.8908023834228516, 2.0123677253723145, 3.1339330673217773, 4.255497932434082, 5.377063274383545, 6.498630523681641, 7.6201958656311035, 8.741761207580566, 9.863326072692871, 10.984891891479492, 12.106456756591797, 13.228021621704102, 14.349586486816406, 15.471152305603027, 16.59271812438965, 17.714282989501953, 18.835847854614258, 19.957412719726562, 21.0789794921875, 22.200542449951172, 23.32210922241211, 24.443674087524414, 25.56523895263672, 26.686803817749023, 27.808368682861328, 28.929935455322266, 30.05150032043457, 31.173065185546875, 32.29463195800781, 33.416194915771484, 34.53776168823242, 35.659324645996094, 36.78089141845703, 37.9024543762207, 39.02402114868164, 40.14558410644531, 41.26715087890625, 42.38871765136719]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 9.0, 3.0, 10.0, 14.0, 17.0, 28.0, 54.0, 59.0, 111.0, 131.0, 240.0, 398.0, 649.0, 1057.0, 1780.0, 3201.0, 5966.0, 11605.0, 23979.0, 57151.0, 172535.0, 697435.0, 1882726.0, 964660.0, 232681.0, 73740.0, 30838.0, 15012.0, 7865.0, 4300.0, 2431.0, 1439.0, 829.0, 498.0, 299.0, 194.0, 107.0, 79.0, 58.0, 31.0, 23.0, 10.0, 9.0, 3.0, 7.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 3.0], "bins": [-62.90625, -61.08935546875, -59.2724609375, -57.45556640625, -55.638671875, -53.82177734375, -52.0048828125, -50.18798828125, -48.37109375, -46.55419921875, -44.7373046875, -42.92041015625, -41.103515625, -39.28662109375, -37.4697265625, -35.65283203125, -33.8359375, -32.01904296875, -30.2021484375, -28.38525390625, -26.568359375, -24.75146484375, -22.9345703125, -21.11767578125, -19.30078125, -17.48388671875, -15.6669921875, -13.85009765625, -12.033203125, -10.21630859375, -8.3994140625, -6.58251953125, -4.765625, -2.94873046875, -1.1318359375, 0.68505859375, 2.501953125, 4.31884765625, 6.1357421875, 7.95263671875, 9.76953125, 11.58642578125, 13.4033203125, 15.22021484375, 17.037109375, 18.85400390625, 20.6708984375, 22.48779296875, 24.3046875, 26.12158203125, 27.9384765625, 29.75537109375, 31.572265625, 33.38916015625, 35.2060546875, 37.02294921875, 38.83984375, 40.65673828125, 42.4736328125, 44.29052734375, 46.107421875, 47.92431640625, 49.7412109375, 51.55810546875, 53.375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 9.0, 6.0, 13.0, 9.0, 14.0, 11.0, 18.0, 15.0, 26.0, 22.0, 19.0, 30.0, 42.0, 38.0, 33.0, 35.0, 35.0, 47.0, 57.0, 47.0, 36.0, 45.0, 51.0, 36.0, 41.0, 29.0, 24.0, 33.0, 14.0, 23.0, 21.0, 18.0, 19.0, 12.0, 10.0, 15.0, 6.0, 10.0, 4.0, 3.0, 9.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.609375, -25.604736328125, -24.60009765625, -23.595458984375, -22.5908203125, -21.586181640625, -20.58154296875, -19.576904296875, -18.572265625, -17.567626953125, -16.56298828125, -15.558349609375, -14.5537109375, -13.549072265625, -12.54443359375, -11.539794921875, -10.53515625, -9.530517578125, -8.52587890625, -7.521240234375, -6.5166015625, -5.511962890625, -4.50732421875, -3.502685546875, -2.498046875, -1.493408203125, -0.48876953125, 0.515869140625, 1.5205078125, 2.525146484375, 3.52978515625, 4.534423828125, 5.5390625, 6.543701171875, 7.54833984375, 8.552978515625, 9.5576171875, 10.562255859375, 11.56689453125, 12.571533203125, 13.576171875, 14.580810546875, 15.58544921875, 16.590087890625, 17.5947265625, 18.599365234375, 19.60400390625, 20.608642578125, 21.61328125, 22.617919921875, 23.62255859375, 24.627197265625, 25.6318359375, 26.636474609375, 27.64111328125, 28.645751953125, 29.650390625, 30.655029296875, 31.65966796875, 32.664306640625, 33.6689453125, 34.673583984375, 35.67822265625, 36.682861328125, 37.6875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 9.0, 11.0, 18.0, 36.0, 37.0, 50.0, 110.0, 157.0, 239.0, 350.0, 545.0, 836.0, 1234.0, 2072.0, 3244.0, 5231.0, 8815.0, 15605.0, 27678.0, 52944.0, 108112.0, 238694.0, 588532.0, 1465872.0, 978704.0, 371943.0, 159102.0, 75622.0, 38080.0, 20755.0, 11826.0, 6758.0, 4001.0, 2492.0, 1606.0, 964.0, 678.0, 436.0, 282.0, 214.0, 132.0, 91.0, 59.0, 35.0, 33.0, 19.0, 9.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0], "bins": [-51.875, -50.38232421875, -48.8896484375, -47.39697265625, -45.904296875, -44.41162109375, -42.9189453125, -41.42626953125, -39.93359375, -38.44091796875, -36.9482421875, -35.45556640625, -33.962890625, -32.47021484375, -30.9775390625, -29.48486328125, -27.9921875, -26.49951171875, -25.0068359375, -23.51416015625, -22.021484375, -20.52880859375, -19.0361328125, -17.54345703125, -16.05078125, -14.55810546875, -13.0654296875, -11.57275390625, -10.080078125, -8.58740234375, -7.0947265625, -5.60205078125, -4.109375, -2.61669921875, -1.1240234375, 0.36865234375, 1.861328125, 3.35400390625, 4.8466796875, 6.33935546875, 7.83203125, 9.32470703125, 10.8173828125, 12.31005859375, 13.802734375, 15.29541015625, 16.7880859375, 18.28076171875, 19.7734375, 21.26611328125, 22.7587890625, 24.25146484375, 25.744140625, 27.23681640625, 28.7294921875, 30.22216796875, 31.71484375, 33.20751953125, 34.7001953125, 36.19287109375, 37.685546875, 39.17822265625, 40.6708984375, 42.16357421875, 43.65625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 3.0, 3.0, 5.0, 5.0, 13.0, 12.0, 28.0, 21.0, 26.0, 37.0, 62.0, 65.0, 97.0, 122.0, 149.0, 213.0, 248.0, 317.0, 373.0, 437.0, 376.0, 326.0, 248.0, 192.0, 147.0, 121.0, 107.0, 62.0, 60.0, 51.0, 47.0, 16.0, 23.0, 15.0, 17.0, 9.0, 5.0, 5.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-20.03125, -19.4810791015625, -18.930908203125, -18.3807373046875, -17.83056640625, -17.2803955078125, -16.730224609375, -16.1800537109375, -15.6298828125, -15.0797119140625, -14.529541015625, -13.9793701171875, -13.42919921875, -12.8790283203125, -12.328857421875, -11.7786865234375, -11.228515625, -10.6783447265625, -10.128173828125, -9.5780029296875, -9.02783203125, -8.4776611328125, -7.927490234375, -7.3773193359375, -6.8271484375, -6.2769775390625, -5.726806640625, -5.1766357421875, -4.62646484375, -4.0762939453125, -3.526123046875, -2.9759521484375, -2.42578125, -1.8756103515625, -1.325439453125, -0.7752685546875, -0.22509765625, 0.3250732421875, 0.875244140625, 1.4254150390625, 1.9755859375, 2.5257568359375, 3.075927734375, 3.6260986328125, 4.17626953125, 4.7264404296875, 5.276611328125, 5.8267822265625, 6.376953125, 6.9271240234375, 7.477294921875, 8.0274658203125, 8.57763671875, 9.1278076171875, 9.677978515625, 10.2281494140625, 10.7783203125, 11.3284912109375, 11.878662109375, 12.4288330078125, 12.97900390625, 13.5291748046875, 14.079345703125, 14.6295166015625, 15.1796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 1.0, 7.0, 8.0, 11.0, 11.0, 9.0, 26.0, 22.0, 28.0, 30.0, 32.0, 39.0, 52.0, 87.0, 66.0, 60.0, 69.0, 64.0, 63.0, 55.0, 43.0, 34.0, 34.0, 33.0, 21.0, 26.0, 12.0, 14.0, 10.0, 10.0, 7.0, 1.0, 4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.72513961791992, -40.499412536621094, -39.27368927001953, -38.0479621887207, -36.822235107421875, -35.59650802612305, -34.37078094482422, -33.145057678222656, -31.919330596923828, -30.693603515625, -29.467878341674805, -28.24215316772461, -27.01642608642578, -25.790699005126953, -24.564973831176758, -23.339248657226562, -22.113521575927734, -20.887794494628906, -19.66206932067871, -18.436344146728516, -17.210617065429688, -15.984890937805176, -14.759164810180664, -13.533438682556152, -12.30771255493164, -11.081986427307129, -9.856260299682617, -8.630534172058105, -7.404808044433594, -6.179081916809082, -4.95335578918457, -3.7276296615600586, -2.5019073486328125, -1.2761812210083008, -0.05045509338378906, 1.1752710342407227, 2.4009971618652344, 3.626723289489746, 4.852449417114258, 6.0781755447387695, 7.303901672363281, 8.529627799987793, 9.755353927612305, 10.981080055236816, 12.206806182861328, 13.43253231048584, 14.658258438110352, 15.883984565734863, 17.109710693359375, 18.335437774658203, 19.5611629486084, 20.786888122558594, 22.012615203857422, 23.23834228515625, 24.464067459106445, 25.68979263305664, 26.91551971435547, 28.141246795654297, 29.366971969604492, 30.592697143554688, 31.818424224853516, 33.044151306152344, 34.269874572753906, 35.495601654052734, 36.72132873535156]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 8.0, 2.0, 11.0, 10.0, 9.0, 9.0, 15.0, 26.0, 14.0, 19.0, 22.0, 30.0, 24.0, 21.0, 33.0, 32.0, 38.0, 44.0, 41.0, 45.0, 42.0, 51.0, 37.0, 29.0, 37.0, 45.0, 32.0, 34.0, 22.0, 23.0, 34.0, 25.0, 22.0, 21.0, 14.0, 15.0, 11.0, 10.0, 7.0, 8.0, 9.0, 4.0, 4.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.4442024230957, -32.367523193359375, -31.290842056274414, -30.214160919189453, -29.137481689453125, -28.060800552368164, -26.984119415283203, -25.907440185546875, -24.830759048461914, -23.754077911376953, -22.677398681640625, -21.600717544555664, -20.524036407470703, -19.447357177734375, -18.370676040649414, -17.293994903564453, -16.217315673828125, -15.14063549041748, -14.063955307006836, -12.987274169921875, -11.91059398651123, -10.833913803100586, -9.757232666015625, -8.68055248260498, -7.603872299194336, -6.527192115783691, -5.450511455535889, -4.373830795288086, -3.2971506118774414, -2.220470428466797, -1.1437897682189941, -0.0671091079711914, 1.0095710754394531, 2.0862514972686768, 3.1629319190979004, 4.239612579345703, 5.316292762756348, 6.392972946166992, 7.469653606414795, 8.546334266662598, 9.623014450073242, 10.699694633483887, 11.776374816894531, 12.853055953979492, 13.929736137390137, 15.006416320800781, 16.083097457885742, 17.159778594970703, 18.23645782470703, 19.313138961791992, 20.38981819152832, 21.46649932861328, 22.54317855834961, 23.61985969543457, 24.69654083251953, 25.77322006225586, 26.84990119934082, 27.92658233642578, 29.00326156616211, 30.07994270324707, 31.15662384033203, 32.23330307006836, 33.30998229980469, 34.38666534423828, 35.46334457397461]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 4.0, 5.0, 9.0, 12.0, 28.0, 43.0, 45.0, 61.0, 85.0, 146.0, 187.0, 264.0, 357.0, 563.0, 780.0, 1068.0, 1600.0, 2360.0, 3190.0, 4899.0, 6851.0, 10342.0, 15147.0, 22040.0, 33851.0, 52644.0, 89955.0, 167896.0, 259128.0, 148390.0, 80809.0, 48776.0, 31460.0, 20803.0, 14027.0, 9450.0, 6466.0, 4618.0, 3112.0, 2110.0, 1592.0, 1015.0, 736.0, 508.0, 346.0, 259.0, 166.0, 105.0, 82.0, 61.0, 41.0, 24.0, 17.0, 12.0, 6.0, 1.0, 4.0, 5.0, 4.0, 1.0], "bins": [-10.4921875, -10.16845703125, -9.8447265625, -9.52099609375, -9.197265625, -8.87353515625, -8.5498046875, -8.22607421875, -7.90234375, -7.57861328125, -7.2548828125, -6.93115234375, -6.607421875, -6.28369140625, -5.9599609375, -5.63623046875, -5.3125, -4.98876953125, -4.6650390625, -4.34130859375, -4.017578125, -3.69384765625, -3.3701171875, -3.04638671875, -2.72265625, -2.39892578125, -2.0751953125, -1.75146484375, -1.427734375, -1.10400390625, -0.7802734375, -0.45654296875, -0.1328125, 0.19091796875, 0.5146484375, 0.83837890625, 1.162109375, 1.48583984375, 1.8095703125, 2.13330078125, 2.45703125, 2.78076171875, 3.1044921875, 3.42822265625, 3.751953125, 4.07568359375, 4.3994140625, 4.72314453125, 5.046875, 5.37060546875, 5.6943359375, 6.01806640625, 6.341796875, 6.66552734375, 6.9892578125, 7.31298828125, 7.63671875, 7.96044921875, 8.2841796875, 8.60791015625, 8.931640625, 9.25537109375, 9.5791015625, 9.90283203125, 10.2265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 4.0, 1.0, 13.0, 7.0, 8.0, 14.0, 15.0, 17.0, 21.0, 25.0, 26.0, 26.0, 28.0, 32.0, 36.0, 37.0, 60.0, 32.0, 44.0, 37.0, 56.0, 48.0, 42.0, 37.0, 47.0, 27.0, 32.0, 25.0, 25.0, 39.0, 27.0, 19.0, 18.0, 7.0, 12.0, 13.0, 7.0, 7.0, 6.0, 10.0, 6.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.125, -35.939453125, -34.75390625, -33.568359375, -32.3828125, -31.197265625, -30.01171875, -28.826171875, -27.640625, -26.455078125, -25.26953125, -24.083984375, -22.8984375, -21.712890625, -20.52734375, -19.341796875, -18.15625, -16.970703125, -15.78515625, -14.599609375, -13.4140625, -12.228515625, -11.04296875, -9.857421875, -8.671875, -7.486328125, -6.30078125, -5.115234375, -3.9296875, -2.744140625, -1.55859375, -0.373046875, 0.8125, 1.998046875, 3.18359375, 4.369140625, 5.5546875, 6.740234375, 7.92578125, 9.111328125, 10.296875, 11.482421875, 12.66796875, 13.853515625, 15.0390625, 16.224609375, 17.41015625, 18.595703125, 19.78125, 20.966796875, 22.15234375, 23.337890625, 24.5234375, 25.708984375, 26.89453125, 28.080078125, 29.265625, 30.451171875, 31.63671875, 32.822265625, 34.0078125, 35.193359375, 36.37890625, 37.564453125, 38.75]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 5.0, 9.0, 12.0, 27.0, 33.0, 37.0, 59.0, 74.0, 99.0, 151.0, 214.0, 317.0, 436.0, 561.0, 893.0, 1172.0, 1701.0, 2447.0, 3698.0, 5478.0, 8944.0, 16383.0, 43908.0, 325356.0, 535731.0, 53791.0, 18494.0, 9942.0, 5951.0, 3834.0, 2616.0, 1791.0, 1267.0, 909.0, 653.0, 463.0, 296.0, 236.0, 169.0, 112.0, 86.0, 55.0, 51.0, 15.0, 35.0, 17.0, 9.0, 2.0, 4.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0], "bins": [-15.1015625, -14.64501953125, -14.1884765625, -13.73193359375, -13.275390625, -12.81884765625, -12.3623046875, -11.90576171875, -11.44921875, -10.99267578125, -10.5361328125, -10.07958984375, -9.623046875, -9.16650390625, -8.7099609375, -8.25341796875, -7.796875, -7.34033203125, -6.8837890625, -6.42724609375, -5.970703125, -5.51416015625, -5.0576171875, -4.60107421875, -4.14453125, -3.68798828125, -3.2314453125, -2.77490234375, -2.318359375, -1.86181640625, -1.4052734375, -0.94873046875, -0.4921875, -0.03564453125, 0.4208984375, 0.87744140625, 1.333984375, 1.79052734375, 2.2470703125, 2.70361328125, 3.16015625, 3.61669921875, 4.0732421875, 4.52978515625, 4.986328125, 5.44287109375, 5.8994140625, 6.35595703125, 6.8125, 7.26904296875, 7.7255859375, 8.18212890625, 8.638671875, 9.09521484375, 9.5517578125, 10.00830078125, 10.46484375, 10.92138671875, 11.3779296875, 11.83447265625, 12.291015625, 12.74755859375, 13.2041015625, 13.66064453125, 14.1171875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 6.0, 3.0, 4.0, 8.0, 9.0, 10.0, 19.0, 14.0, 26.0, 14.0, 26.0, 22.0, 20.0, 25.0, 30.0, 41.0, 40.0, 41.0, 34.0, 33.0, 42.0, 47.0, 51.0, 34.0, 33.0, 41.0, 26.0, 28.0, 39.0, 36.0, 21.0, 25.0, 25.0, 20.0, 16.0, 15.0, 12.0, 14.0, 9.0, 4.0, 5.0, 10.0, 5.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.953125, -23.225830078125, -22.49853515625, -21.771240234375, -21.0439453125, -20.316650390625, -19.58935546875, -18.862060546875, -18.134765625, -17.407470703125, -16.68017578125, -15.952880859375, -15.2255859375, -14.498291015625, -13.77099609375, -13.043701171875, -12.31640625, -11.589111328125, -10.86181640625, -10.134521484375, -9.4072265625, -8.679931640625, -7.95263671875, -7.225341796875, -6.498046875, -5.770751953125, -5.04345703125, -4.316162109375, -3.5888671875, -2.861572265625, -2.13427734375, -1.406982421875, -0.6796875, 0.047607421875, 0.77490234375, 1.502197265625, 2.2294921875, 2.956787109375, 3.68408203125, 4.411376953125, 5.138671875, 5.865966796875, 6.59326171875, 7.320556640625, 8.0478515625, 8.775146484375, 9.50244140625, 10.229736328125, 10.95703125, 11.684326171875, 12.41162109375, 13.138916015625, 13.8662109375, 14.593505859375, 15.32080078125, 16.048095703125, 16.775390625, 17.502685546875, 18.22998046875, 18.957275390625, 19.6845703125, 20.411865234375, 21.13916015625, 21.866455078125, 22.59375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 8.0, 10.0, 15.0, 20.0, 33.0, 53.0, 91.0, 112.0, 194.0, 330.0, 668.0, 1188.0, 2726.0, 6881.0, 21547.0, 314818.0, 661284.0, 24870.0, 7757.0, 3002.0, 1327.0, 645.0, 394.0, 201.0, 129.0, 72.0, 51.0, 30.0, 29.0, 18.0, 18.0, 9.0, 5.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.451171875, -2.363800048828125, -2.27642822265625, -2.189056396484375, -2.1016845703125, -2.014312744140625, -1.92694091796875, -1.839569091796875, -1.752197265625, -1.664825439453125, -1.57745361328125, -1.490081787109375, -1.4027099609375, -1.315338134765625, -1.22796630859375, -1.140594482421875, -1.05322265625, -0.965850830078125, -0.87847900390625, -0.791107177734375, -0.7037353515625, -0.616363525390625, -0.52899169921875, -0.441619873046875, -0.354248046875, -0.266876220703125, -0.17950439453125, -0.092132568359375, -0.0047607421875, 0.082611083984375, 0.16998291015625, 0.257354736328125, 0.3447265625, 0.432098388671875, 0.51947021484375, 0.606842041015625, 0.6942138671875, 0.781585693359375, 0.86895751953125, 0.956329345703125, 1.043701171875, 1.131072998046875, 1.21844482421875, 1.305816650390625, 1.3931884765625, 1.480560302734375, 1.56793212890625, 1.655303955078125, 1.74267578125, 1.830047607421875, 1.91741943359375, 2.004791259765625, 2.0921630859375, 2.179534912109375, 2.26690673828125, 2.354278564453125, 2.441650390625, 2.529022216796875, 2.61639404296875, 2.703765869140625, 2.7911376953125, 2.878509521484375, 2.96588134765625, 3.053253173828125, 3.140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 9.0, 4.0, 4.0, 7.0, 15.0, 27.0, 25.0, 23.0, 31.0, 48.0, 51.0, 68.0, 85.0, 81.0, 88.0, 92.0, 68.0, 60.0, 46.0, 35.0, 24.0, 20.0, 20.0, 14.0, 11.0, 8.0, 13.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00017261505126953125, -0.00016794726252555847, -0.0001632794737815857, -0.00015861168503761292, -0.00015394389629364014, -0.00014927610754966736, -0.00014460831880569458, -0.0001399405300617218, -0.00013527274131774902, -0.00013060495257377625, -0.00012593716382980347, -0.00012126937508583069, -0.00011660158634185791, -0.00011193379759788513, -0.00010726600885391235, -0.00010259822010993958, -9.79304313659668e-05, -9.326264262199402e-05, -8.859485387802124e-05, -8.392706513404846e-05, -7.925927639007568e-05, -7.45914876461029e-05, -6.992369890213013e-05, -6.525591015815735e-05, -6.058812141418457e-05, -5.592033267021179e-05, -5.1252543926239014e-05, -4.6584755182266235e-05, -4.191696643829346e-05, -3.724917769432068e-05, -3.25813889503479e-05, -2.7913600206375122e-05, -2.3245811462402344e-05, -1.8578022718429565e-05, -1.3910233974456787e-05, -9.242445230484009e-06, -4.5746564865112305e-06, 9.313225746154785e-08, 4.760921001434326e-06, 9.428709745407104e-06, 1.4096498489379883e-05, 1.876428723335266e-05, 2.343207597732544e-05, 2.8099864721298218e-05, 3.2767653465270996e-05, 3.7435442209243774e-05, 4.210323095321655e-05, 4.677101969718933e-05, 5.143880844116211e-05, 5.610659718513489e-05, 6.0774385929107666e-05, 6.544217467308044e-05, 7.010996341705322e-05, 7.4777752161026e-05, 7.944554090499878e-05, 8.411332964897156e-05, 8.878111839294434e-05, 9.344890713691711e-05, 9.811669588088989e-05, 0.00010278448462486267, 0.00010745227336883545, 0.00011212006211280823, 0.000116787850856781, 0.00012145563960075378, 0.00012612342834472656]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 8.0, 21.0, 26.0, 25.0, 45.0, 75.0, 101.0, 152.0, 205.0, 312.0, 547.0, 944.0, 1485.0, 2440.0, 4211.0, 7593.0, 13712.0, 26913.0, 55674.0, 121926.0, 261450.0, 286208.0, 137120.0, 62686.0, 29945.0, 15111.0, 8252.0, 4533.0, 2641.0, 1567.0, 907.0, 578.0, 386.0, 234.0, 189.0, 114.0, 66.0, 54.0, 29.0, 24.0, 12.0, 10.0, 3.0, 7.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.93359375, -1.871368408203125, -1.80914306640625, -1.746917724609375, -1.6846923828125, -1.622467041015625, -1.56024169921875, -1.498016357421875, -1.435791015625, -1.373565673828125, -1.31134033203125, -1.249114990234375, -1.1868896484375, -1.124664306640625, -1.06243896484375, -1.000213623046875, -0.93798828125, -0.875762939453125, -0.81353759765625, -0.751312255859375, -0.6890869140625, -0.626861572265625, -0.56463623046875, -0.502410888671875, -0.440185546875, -0.377960205078125, -0.31573486328125, -0.253509521484375, -0.1912841796875, -0.129058837890625, -0.06683349609375, -0.004608154296875, 0.0576171875, 0.119842529296875, 0.18206787109375, 0.244293212890625, 0.3065185546875, 0.368743896484375, 0.43096923828125, 0.493194580078125, 0.555419921875, 0.617645263671875, 0.67987060546875, 0.742095947265625, 0.8043212890625, 0.866546630859375, 0.92877197265625, 0.990997314453125, 1.05322265625, 1.115447998046875, 1.17767333984375, 1.239898681640625, 1.3021240234375, 1.364349365234375, 1.42657470703125, 1.488800048828125, 1.551025390625, 1.613250732421875, 1.67547607421875, 1.737701416015625, 1.7999267578125, 1.862152099609375, 1.92437744140625, 1.986602783203125, 2.048828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 7.0, 8.0, 6.0, 10.0, 13.0, 12.0, 13.0, 28.0, 28.0, 41.0, 43.0, 49.0, 53.0, 57.0, 60.0, 68.0, 51.0, 56.0, 61.0, 45.0, 52.0, 49.0, 41.0, 29.0, 36.0, 20.0, 16.0, 11.0, 10.0, 10.0, 4.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44873046875, -0.431121826171875, -0.41351318359375, -0.395904541015625, -0.3782958984375, -0.360687255859375, -0.34307861328125, -0.325469970703125, -0.307861328125, -0.290252685546875, -0.27264404296875, -0.255035400390625, -0.2374267578125, -0.219818115234375, -0.20220947265625, -0.184600830078125, -0.1669921875, -0.149383544921875, -0.13177490234375, -0.114166259765625, -0.0965576171875, -0.078948974609375, -0.06134033203125, -0.043731689453125, -0.026123046875, -0.008514404296875, 0.00909423828125, 0.026702880859375, 0.0443115234375, 0.061920166015625, 0.07952880859375, 0.097137451171875, 0.11474609375, 0.132354736328125, 0.14996337890625, 0.167572021484375, 0.1851806640625, 0.202789306640625, 0.22039794921875, 0.238006591796875, 0.255615234375, 0.273223876953125, 0.29083251953125, 0.308441162109375, 0.3260498046875, 0.343658447265625, 0.36126708984375, 0.378875732421875, 0.396484375, 0.414093017578125, 0.43170166015625, 0.449310302734375, 0.4669189453125, 0.484527587890625, 0.50213623046875, 0.519744873046875, 0.537353515625, 0.554962158203125, 0.57257080078125, 0.590179443359375, 0.6077880859375, 0.625396728515625, 0.64300537109375, 0.660614013671875, 0.67822265625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 5.0, 3.0, 6.0, 13.0, 10.0, 15.0, 15.0, 19.0, 34.0, 29.0, 27.0, 45.0, 44.0, 73.0, 74.0, 54.0, 73.0, 61.0, 61.0, 57.0, 53.0, 38.0, 36.0, 27.0, 24.0, 25.0, 22.0, 11.0, 11.0, 8.0, 5.0, 6.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-41.68342590332031, -40.505332946777344, -39.327239990234375, -38.149147033691406, -36.97105407714844, -35.79296112060547, -34.6148681640625, -33.436771392822266, -32.2586784362793, -31.080585479736328, -29.90249252319336, -28.72439956665039, -27.54630470275879, -26.36821174621582, -25.19011878967285, -24.01202392578125, -22.833932876586914, -21.655839920043945, -20.477746963500977, -19.299652099609375, -18.121559143066406, -16.943466186523438, -15.765373229980469, -14.587279319763184, -13.409186363220215, -12.231093406677246, -11.052999496459961, -9.874906539916992, -8.696813583374023, -7.518719673156738, -6.3406267166137695, -5.162532806396484, -3.9844398498535156, -2.8063464164733887, -1.6282532215118408, -0.45016002655029297, 0.727933406829834, 1.906026840209961, 3.0841197967529297, 4.262213706970215, 5.440306663513184, 6.6184000968933105, 7.7964935302734375, 8.974586486816406, 10.152679443359375, 11.33077335357666, 12.508866310119629, 13.686960220336914, 14.865053176879883, 16.04314613342285, 17.22123908996582, 18.399333953857422, 19.57742691040039, 20.75551986694336, 21.933612823486328, 23.111705780029297, 24.289798736572266, 25.467891693115234, 26.645984649658203, 27.824077606201172, 29.002172470092773, 30.180265426635742, 31.35835838317871, 32.53645324707031, 33.71454620361328]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 8.0, 3.0, 10.0, 7.0, 13.0, 8.0, 18.0, 23.0, 15.0, 20.0, 21.0, 30.0, 22.0, 24.0, 29.0, 36.0, 38.0, 45.0, 42.0, 44.0, 43.0, 51.0, 34.0, 31.0, 40.0, 41.0, 36.0, 33.0, 19.0, 27.0, 30.0, 25.0, 22.0, 21.0, 12.0, 16.0, 12.0, 9.0, 8.0, 6.0, 10.0, 3.0, 6.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.25746536254883, -32.19170379638672, -31.125944137573242, -30.060182571411133, -28.994422912597656, -27.928661346435547, -26.862899780273438, -25.797138214111328, -24.73137855529785, -23.665616989135742, -22.599857330322266, -21.534095764160156, -20.468334197998047, -19.40257453918457, -18.33681297302246, -17.271053314208984, -16.205291748046875, -15.139531135559082, -14.073770523071289, -13.00800895690918, -11.942248344421387, -10.876487731933594, -9.810726165771484, -8.744965553283691, -7.679204940795898, -6.6134443283081055, -5.547683238983154, -4.481922149658203, -3.41616153717041, -2.350400924682617, -1.284639835357666, -0.21887874603271484, 0.8468818664550781, 1.9126427173614502, 2.9784035682678223, 4.044164657592773, 5.109925270080566, 6.175685882568359, 7.2414469718933105, 8.307208061218262, 9.372968673706055, 10.438729286193848, 11.50448989868164, 12.57025146484375, 13.636012077331543, 14.701772689819336, 15.767534255981445, 16.833293914794922, 17.89905548095703, 18.96481704711914, 20.030576705932617, 21.096338272094727, 22.162097930908203, 23.227859497070312, 24.293621063232422, 25.35938262939453, 26.425142288208008, 27.490903854370117, 28.556663513183594, 29.622425079345703, 30.688186645507812, 31.75394630432129, 32.819705963134766, 33.885467529296875, 34.951229095458984]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 11.0, 10.0, 23.0, 32.0, 38.0, 53.0, 67.0, 110.0, 156.0, 259.0, 379.0, 543.0, 809.0, 1284.0, 2078.0, 2982.0, 4781.0, 7460.0, 11775.0, 18716.0, 29679.0, 48776.0, 80301.0, 131647.0, 195806.0, 189278.0, 123607.0, 75086.0, 45860.0, 28325.0, 17684.0, 11063.0, 7063.0, 4359.0, 2944.0, 1880.0, 1214.0, 788.0, 561.0, 357.0, 238.0, 151.0, 105.0, 64.0, 50.0, 31.0, 31.0, 13.0, 11.0, 8.0, 5.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.78125, -36.56005859375, -35.3388671875, -34.11767578125, -32.896484375, -31.67529296875, -30.4541015625, -29.23291015625, -28.01171875, -26.79052734375, -25.5693359375, -24.34814453125, -23.126953125, -21.90576171875, -20.6845703125, -19.46337890625, -18.2421875, -17.02099609375, -15.7998046875, -14.57861328125, -13.357421875, -12.13623046875, -10.9150390625, -9.69384765625, -8.47265625, -7.25146484375, -6.0302734375, -4.80908203125, -3.587890625, -2.36669921875, -1.1455078125, 0.07568359375, 1.296875, 2.51806640625, 3.7392578125, 4.96044921875, 6.181640625, 7.40283203125, 8.6240234375, 9.84521484375, 11.06640625, 12.28759765625, 13.5087890625, 14.72998046875, 15.951171875, 17.17236328125, 18.3935546875, 19.61474609375, 20.8359375, 22.05712890625, 23.2783203125, 24.49951171875, 25.720703125, 26.94189453125, 28.1630859375, 29.38427734375, 30.60546875, 31.82666015625, 33.0478515625, 34.26904296875, 35.490234375, 36.71142578125, 37.9326171875, 39.15380859375, 40.375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 5.0, 6.0, 3.0, 5.0, 9.0, 14.0, 17.0, 18.0, 18.0, 18.0, 20.0, 32.0, 23.0, 29.0, 31.0, 33.0, 35.0, 43.0, 41.0, 47.0, 38.0, 48.0, 42.0, 49.0, 38.0, 48.0, 43.0, 35.0, 29.0, 26.0, 24.0, 20.0, 24.0, 17.0, 14.0, 8.0, 11.0, 7.0, 8.0, 7.0, 4.0, 7.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.53125, -34.4287109375, -33.326171875, -32.2236328125, -31.12109375, -30.0185546875, -28.916015625, -27.8134765625, -26.7109375, -25.6083984375, -24.505859375, -23.4033203125, -22.30078125, -21.1982421875, -20.095703125, -18.9931640625, -17.890625, -16.7880859375, -15.685546875, -14.5830078125, -13.48046875, -12.3779296875, -11.275390625, -10.1728515625, -9.0703125, -7.9677734375, -6.865234375, -5.7626953125, -4.66015625, -3.5576171875, -2.455078125, -1.3525390625, -0.25, 0.8525390625, 1.955078125, 3.0576171875, 4.16015625, 5.2626953125, 6.365234375, 7.4677734375, 8.5703125, 9.6728515625, 10.775390625, 11.8779296875, 12.98046875, 14.0830078125, 15.185546875, 16.2880859375, 17.390625, 18.4931640625, 19.595703125, 20.6982421875, 21.80078125, 22.9033203125, 24.005859375, 25.1083984375, 26.2109375, 27.3134765625, 28.416015625, 29.5185546875, 30.62109375, 31.7236328125, 32.826171875, 33.9287109375, 35.03125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 7.0, 20.0, 15.0, 29.0, 48.0, 79.0, 125.0, 215.0, 361.0, 549.0, 1014.0, 1725.0, 2846.0, 4721.0, 8072.0, 13563.0, 23207.0, 39727.0, 66573.0, 110994.0, 176970.0, 210911.0, 154943.0, 94981.0, 55834.0, 33490.0, 19159.0, 11608.0, 6909.0, 3992.0, 2421.0, 1373.0, 851.0, 469.0, 316.0, 165.0, 112.0, 58.0, 37.0, 22.0, 15.0, 11.0, 9.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.65625, -38.2568359375, -36.857421875, -35.4580078125, -34.05859375, -32.6591796875, -31.259765625, -29.8603515625, -28.4609375, -27.0615234375, -25.662109375, -24.2626953125, -22.86328125, -21.4638671875, -20.064453125, -18.6650390625, -17.265625, -15.8662109375, -14.466796875, -13.0673828125, -11.66796875, -10.2685546875, -8.869140625, -7.4697265625, -6.0703125, -4.6708984375, -3.271484375, -1.8720703125, -0.47265625, 0.9267578125, 2.326171875, 3.7255859375, 5.125, 6.5244140625, 7.923828125, 9.3232421875, 10.72265625, 12.1220703125, 13.521484375, 14.9208984375, 16.3203125, 17.7197265625, 19.119140625, 20.5185546875, 21.91796875, 23.3173828125, 24.716796875, 26.1162109375, 27.515625, 28.9150390625, 30.314453125, 31.7138671875, 33.11328125, 34.5126953125, 35.912109375, 37.3115234375, 38.7109375, 40.1103515625, 41.509765625, 42.9091796875, 44.30859375, 45.7080078125, 47.107421875, 48.5068359375, 49.90625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 3.0, 6.0, 9.0, 6.0, 7.0, 10.0, 14.0, 18.0, 12.0, 26.0, 17.0, 17.0, 22.0, 20.0, 29.0, 23.0, 29.0, 33.0, 34.0, 37.0, 28.0, 30.0, 21.0, 24.0, 32.0, 28.0, 34.0, 41.0, 36.0, 39.0, 39.0, 38.0, 29.0, 27.0, 22.0, 23.0, 20.0, 19.0, 17.0, 14.0, 11.0, 8.0, 6.0, 7.0, 8.0, 3.0, 9.0, 7.0, 4.0, 0.0, 4.0, 1.0, 3.0, 2.0], "bins": [-19.796875, -19.20751953125, -18.6181640625, -18.02880859375, -17.439453125, -16.85009765625, -16.2607421875, -15.67138671875, -15.08203125, -14.49267578125, -13.9033203125, -13.31396484375, -12.724609375, -12.13525390625, -11.5458984375, -10.95654296875, -10.3671875, -9.77783203125, -9.1884765625, -8.59912109375, -8.009765625, -7.42041015625, -6.8310546875, -6.24169921875, -5.65234375, -5.06298828125, -4.4736328125, -3.88427734375, -3.294921875, -2.70556640625, -2.1162109375, -1.52685546875, -0.9375, -0.34814453125, 0.2412109375, 0.83056640625, 1.419921875, 2.00927734375, 2.5986328125, 3.18798828125, 3.77734375, 4.36669921875, 4.9560546875, 5.54541015625, 6.134765625, 6.72412109375, 7.3134765625, 7.90283203125, 8.4921875, 9.08154296875, 9.6708984375, 10.26025390625, 10.849609375, 11.43896484375, 12.0283203125, 12.61767578125, 13.20703125, 13.79638671875, 14.3857421875, 14.97509765625, 15.564453125, 16.15380859375, 16.7431640625, 17.33251953125, 17.921875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 7.0, 18.0, 14.0, 16.0, 43.0, 48.0, 63.0, 124.0, 201.0, 276.0, 449.0, 648.0, 1215.0, 1803.0, 2890.0, 4934.0, 8529.0, 15266.0, 28317.0, 54122.0, 109481.0, 212633.0, 269052.0, 164224.0, 81927.0, 41280.0, 21710.0, 11869.0, 6807.0, 4105.0, 2418.0, 1516.0, 913.0, 551.0, 373.0, 261.0, 170.0, 88.0, 69.0, 30.0, 22.0, 26.0, 13.0, 8.0, 11.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-16.296875, -15.792236328125, -15.28759765625, -14.782958984375, -14.2783203125, -13.773681640625, -13.26904296875, -12.764404296875, -12.259765625, -11.755126953125, -11.25048828125, -10.745849609375, -10.2412109375, -9.736572265625, -9.23193359375, -8.727294921875, -8.22265625, -7.718017578125, -7.21337890625, -6.708740234375, -6.2041015625, -5.699462890625, -5.19482421875, -4.690185546875, -4.185546875, -3.680908203125, -3.17626953125, -2.671630859375, -2.1669921875, -1.662353515625, -1.15771484375, -0.653076171875, -0.1484375, 0.356201171875, 0.86083984375, 1.365478515625, 1.8701171875, 2.374755859375, 2.87939453125, 3.384033203125, 3.888671875, 4.393310546875, 4.89794921875, 5.402587890625, 5.9072265625, 6.411865234375, 6.91650390625, 7.421142578125, 7.92578125, 8.430419921875, 8.93505859375, 9.439697265625, 9.9443359375, 10.448974609375, 10.95361328125, 11.458251953125, 11.962890625, 12.467529296875, 12.97216796875, 13.476806640625, 13.9814453125, 14.486083984375, 14.99072265625, 15.495361328125, 16.0]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 8.0, 16.0, 20.0, 25.0, 34.0, 55.0, 71.0, 106.0, 137.0, 134.0, 123.0, 89.0, 62.0, 40.0, 28.0, 23.0, 8.0, 4.0, 1.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028667449951171875, -0.0027831196784973145, -0.0026994943618774414, -0.0026158690452575684, -0.0025322437286376953, -0.0024486184120178223, -0.0023649930953979492, -0.002281367778778076, -0.002197742462158203, -0.00211411714553833, -0.002030491828918457, -0.001946866512298584, -0.001863241195678711, -0.0017796158790588379, -0.0016959905624389648, -0.0016123652458190918, -0.0015287399291992188, -0.0014451146125793457, -0.0013614892959594727, -0.0012778639793395996, -0.0011942386627197266, -0.0011106133460998535, -0.0010269880294799805, -0.0009433627128601074, -0.0008597373962402344, -0.0007761120796203613, -0.0006924867630004883, -0.0006088614463806152, -0.0005252361297607422, -0.00044161081314086914, -0.0003579854965209961, -0.00027436017990112305, -0.00019073486328125, -0.00010710954666137695, -2.3484230041503906e-05, 6.014108657836914e-05, 0.0001437664031982422, 0.00022739171981811523, 0.0003110170364379883, 0.00039464235305786133, 0.0004782676696777344, 0.0005618929862976074, 0.0006455183029174805, 0.0007291436195373535, 0.0008127689361572266, 0.0008963942527770996, 0.0009800195693969727, 0.0010636448860168457, 0.0011472702026367188, 0.0012308955192565918, 0.0013145208358764648, 0.0013981461524963379, 0.001481771469116211, 0.001565396785736084, 0.001649022102355957, 0.00173264741897583, 0.0018162727355957031, 0.0018998980522155762, 0.0019835233688354492, 0.0020671486854553223, 0.0021507740020751953, 0.0022343993186950684, 0.0023180246353149414, 0.0024016499519348145, 0.0024852752685546875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 11.0, 14.0, 14.0, 18.0, 34.0, 49.0, 94.0, 136.0, 176.0, 299.0, 476.0, 889.0, 1398.0, 2365.0, 4209.0, 7195.0, 13135.0, 24536.0, 47046.0, 92638.0, 184090.0, 279658.0, 189629.0, 95699.0, 48234.0, 25263.0, 13455.0, 7481.0, 4198.0, 2382.0, 1452.0, 873.0, 528.0, 325.0, 214.0, 115.0, 81.0, 50.0, 38.0, 18.0, 14.0, 7.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.59375, -18.0390625, -17.484375, -16.9296875, -16.375, -15.8203125, -15.265625, -14.7109375, -14.15625, -13.6015625, -13.046875, -12.4921875, -11.9375, -11.3828125, -10.828125, -10.2734375, -9.71875, -9.1640625, -8.609375, -8.0546875, -7.5, -6.9453125, -6.390625, -5.8359375, -5.28125, -4.7265625, -4.171875, -3.6171875, -3.0625, -2.5078125, -1.953125, -1.3984375, -0.84375, -0.2890625, 0.265625, 0.8203125, 1.375, 1.9296875, 2.484375, 3.0390625, 3.59375, 4.1484375, 4.703125, 5.2578125, 5.8125, 6.3671875, 6.921875, 7.4765625, 8.03125, 8.5859375, 9.140625, 9.6953125, 10.25, 10.8046875, 11.359375, 11.9140625, 12.46875, 13.0234375, 13.578125, 14.1328125, 14.6875, 15.2421875, 15.796875, 16.3515625, 16.90625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 9.0, 7.0, 10.0, 5.0, 12.0, 13.0, 16.0, 25.0, 24.0, 18.0, 35.0, 42.0, 37.0, 54.0, 60.0, 54.0, 65.0, 62.0, 52.0, 70.0, 41.0, 39.0, 37.0, 27.0, 28.0, 29.0, 24.0, 27.0, 13.0, 13.0, 7.0, 7.0, 6.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.734375, -4.58251953125, -4.4306640625, -4.27880859375, -4.126953125, -3.97509765625, -3.8232421875, -3.67138671875, -3.51953125, -3.36767578125, -3.2158203125, -3.06396484375, -2.912109375, -2.76025390625, -2.6083984375, -2.45654296875, -2.3046875, -2.15283203125, -2.0009765625, -1.84912109375, -1.697265625, -1.54541015625, -1.3935546875, -1.24169921875, -1.08984375, -0.93798828125, -0.7861328125, -0.63427734375, -0.482421875, -0.33056640625, -0.1787109375, -0.02685546875, 0.125, 0.27685546875, 0.4287109375, 0.58056640625, 0.732421875, 0.88427734375, 1.0361328125, 1.18798828125, 1.33984375, 1.49169921875, 1.6435546875, 1.79541015625, 1.947265625, 2.09912109375, 2.2509765625, 2.40283203125, 2.5546875, 2.70654296875, 2.8583984375, 3.01025390625, 3.162109375, 3.31396484375, 3.4658203125, 3.61767578125, 3.76953125, 3.92138671875, 4.0732421875, 4.22509765625, 4.376953125, 4.52880859375, 4.6806640625, 4.83251953125, 4.984375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 0.0, 4.0, 3.0, 3.0, 9.0, 5.0, 3.0, 9.0, 14.0, 12.0, 8.0, 13.0, 26.0, 20.0, 33.0, 37.0, 35.0, 45.0, 68.0, 56.0, 50.0, 69.0, 69.0, 46.0, 47.0, 54.0, 40.0, 38.0, 29.0, 23.0, 25.0, 18.0, 21.0, 17.0, 14.0, 4.0, 8.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-35.427425384521484, -34.3779411315918, -33.32845687866211, -32.278968811035156, -31.2294864654541, -30.18000030517578, -29.130516052246094, -28.081031799316406, -27.03154754638672, -25.98206329345703, -24.93257713317871, -23.883092880249023, -22.833608627319336, -21.784122467041016, -20.734638214111328, -19.68515396118164, -18.63566780090332, -17.586183547973633, -16.536697387695312, -15.487213134765625, -14.437728881835938, -13.388243675231934, -12.33875846862793, -11.289274215698242, -10.239789009094238, -9.190303802490234, -8.140819549560547, -7.091334342956543, -6.041849613189697, -4.992364883422852, -3.9428796768188477, -2.893394947052002, -1.843912124633789, -0.7944272756576538, 0.25505757331848145, 1.3045425415039062, 2.354027271270752, 3.4035120010375977, 4.452997207641602, 5.502481937408447, 6.551966667175293, 7.601451396942139, 8.650936126708984, 9.700421333312988, 10.749906539916992, 11.79939079284668, 12.848875999450684, 13.898361206054688, 14.947845458984375, 15.997330665588379, 17.046815872192383, 18.09630012512207, 19.145784378051758, 20.195270538330078, 21.244754791259766, 22.294239044189453, 23.34372329711914, 24.393207550048828, 25.44269371032715, 26.492177963256836, 27.541662216186523, 28.591148376464844, 29.64063262939453, 30.69011688232422, 31.73960304260254]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 10.0, 4.0, 5.0, 7.0, 8.0, 12.0, 13.0, 13.0, 24.0, 19.0, 26.0, 26.0, 30.0, 29.0, 24.0, 39.0, 36.0, 43.0, 46.0, 26.0, 44.0, 54.0, 36.0, 49.0, 44.0, 27.0, 45.0, 28.0, 29.0, 29.0, 26.0, 23.0, 27.0, 17.0, 11.0, 12.0, 13.0, 10.0, 8.0, 5.0, 8.0, 1.0, 8.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.69272232055664, -34.54065704345703, -33.38859176635742, -32.23652648925781, -31.084461212158203, -29.932395935058594, -28.780332565307617, -27.628267288208008, -26.4762020111084, -25.32413673400879, -24.17207145690918, -23.02000617980957, -21.867942810058594, -20.715877532958984, -19.563812255859375, -18.411746978759766, -17.259681701660156, -16.107616424560547, -14.955551147460938, -13.803486824035645, -12.651421546936035, -11.499356269836426, -10.347291946411133, -9.195226669311523, -8.043161392211914, -6.891096115112305, -5.7390313148498535, -4.586966514587402, -3.434901237487793, -2.2828359603881836, -1.1307711601257324, 0.02129364013671875, 1.1733627319335938, 2.325427770614624, 3.4774928092956543, 4.6295576095581055, 5.781622886657715, 6.933688163757324, 8.085752487182617, 9.237817764282227, 10.389883041381836, 11.541948318481445, 12.694013595581055, 13.846077919006348, 14.998143196105957, 16.15020751953125, 17.30227279663086, 18.45433807373047, 19.606403350830078, 20.758468627929688, 21.910533905029297, 23.062599182128906, 24.214664459228516, 25.366729736328125, 26.5187931060791, 27.67085838317871, 28.82292366027832, 29.97498893737793, 31.12705421447754, 32.279117584228516, 33.431182861328125, 34.583248138427734, 35.735313415527344, 36.88737869262695, 38.03944396972656]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [6.0, 4.0, 1.0, 6.0, 10.0, 9.0, 9.0, 19.0, 19.0, 33.0, 49.0, 69.0, 92.0, 174.0, 243.0, 373.0, 595.0, 895.0, 1286.0, 2006.0, 3065.0, 4840.0, 8058.0, 14009.0, 24995.0, 50342.0, 118007.0, 335318.0, 944276.0, 1478702.0, 754540.0, 258088.0, 95391.0, 42832.0, 22583.0, 12591.0, 7594.0, 4630.0, 2943.0, 1893.0, 1278.0, 833.0, 525.0, 352.0, 221.0, 165.0, 108.0, 68.0, 54.0, 23.0, 19.0, 15.0, 14.0, 8.0, 10.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.375, -38.03515625, -36.6953125, -35.35546875, -34.015625, -32.67578125, -31.3359375, -29.99609375, -28.65625, -27.31640625, -25.9765625, -24.63671875, -23.296875, -21.95703125, -20.6171875, -19.27734375, -17.9375, -16.59765625, -15.2578125, -13.91796875, -12.578125, -11.23828125, -9.8984375, -8.55859375, -7.21875, -5.87890625, -4.5390625, -3.19921875, -1.859375, -0.51953125, 0.8203125, 2.16015625, 3.5, 4.83984375, 6.1796875, 7.51953125, 8.859375, 10.19921875, 11.5390625, 12.87890625, 14.21875, 15.55859375, 16.8984375, 18.23828125, 19.578125, 20.91796875, 22.2578125, 23.59765625, 24.9375, 26.27734375, 27.6171875, 28.95703125, 30.296875, 31.63671875, 32.9765625, 34.31640625, 35.65625, 36.99609375, 38.3359375, 39.67578125, 41.015625, 42.35546875, 43.6953125, 45.03515625, 46.375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 7.0, 3.0, 7.0, 6.0, 10.0, 8.0, 5.0, 14.0, 19.0, 13.0, 26.0, 26.0, 26.0, 25.0, 26.0, 27.0, 31.0, 37.0, 41.0, 47.0, 47.0, 44.0, 46.0, 45.0, 42.0, 46.0, 50.0, 36.0, 24.0, 29.0, 31.0, 24.0, 22.0, 18.0, 18.0, 11.0, 16.0, 13.0, 7.0, 7.0, 5.0, 4.0, 3.0, 3.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-33.5, -32.45068359375, -31.4013671875, -30.35205078125, -29.302734375, -28.25341796875, -27.2041015625, -26.15478515625, -25.10546875, -24.05615234375, -23.0068359375, -21.95751953125, -20.908203125, -19.85888671875, -18.8095703125, -17.76025390625, -16.7109375, -15.66162109375, -14.6123046875, -13.56298828125, -12.513671875, -11.46435546875, -10.4150390625, -9.36572265625, -8.31640625, -7.26708984375, -6.2177734375, -5.16845703125, -4.119140625, -3.06982421875, -2.0205078125, -0.97119140625, 0.078125, 1.12744140625, 2.1767578125, 3.22607421875, 4.275390625, 5.32470703125, 6.3740234375, 7.42333984375, 8.47265625, 9.52197265625, 10.5712890625, 11.62060546875, 12.669921875, 13.71923828125, 14.7685546875, 15.81787109375, 16.8671875, 17.91650390625, 18.9658203125, 20.01513671875, 21.064453125, 22.11376953125, 23.1630859375, 24.21240234375, 25.26171875, 26.31103515625, 27.3603515625, 28.40966796875, 29.458984375, 30.50830078125, 31.5576171875, 32.60693359375, 33.65625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 6.0, 23.0, 17.0, 35.0, 46.0, 90.0, 123.0, 179.0, 268.0, 415.0, 691.0, 1131.0, 1746.0, 2961.0, 5265.0, 8998.0, 16391.0, 31611.0, 63654.0, 134770.0, 316016.0, 841564.0, 1580156.0, 688738.0, 265503.0, 116633.0, 55129.0, 27653.0, 14738.0, 8049.0, 4574.0, 2725.0, 1616.0, 1015.0, 606.0, 391.0, 242.0, 166.0, 111.0, 84.0, 56.0, 27.0, 17.0, 12.0, 13.0, 11.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0], "bins": [-54.125, -52.5517578125, -50.978515625, -49.4052734375, -47.83203125, -46.2587890625, -44.685546875, -43.1123046875, -41.5390625, -39.9658203125, -38.392578125, -36.8193359375, -35.24609375, -33.6728515625, -32.099609375, -30.5263671875, -28.953125, -27.3798828125, -25.806640625, -24.2333984375, -22.66015625, -21.0869140625, -19.513671875, -17.9404296875, -16.3671875, -14.7939453125, -13.220703125, -11.6474609375, -10.07421875, -8.5009765625, -6.927734375, -5.3544921875, -3.78125, -2.2080078125, -0.634765625, 0.9384765625, 2.51171875, 4.0849609375, 5.658203125, 7.2314453125, 8.8046875, 10.3779296875, 11.951171875, 13.5244140625, 15.09765625, 16.6708984375, 18.244140625, 19.8173828125, 21.390625, 22.9638671875, 24.537109375, 26.1103515625, 27.68359375, 29.2568359375, 30.830078125, 32.4033203125, 33.9765625, 35.5498046875, 37.123046875, 38.6962890625, 40.26953125, 41.8427734375, 43.416015625, 44.9892578125, 46.5625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 7.0, 6.0, 9.0, 15.0, 12.0, 10.0, 20.0, 21.0, 29.0, 44.0, 52.0, 61.0, 86.0, 98.0, 113.0, 167.0, 182.0, 215.0, 281.0, 314.0, 351.0, 354.0, 309.0, 234.0, 233.0, 161.0, 138.0, 119.0, 100.0, 67.0, 59.0, 49.0, 34.0, 30.0, 23.0, 17.0, 19.0, 12.0, 11.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0], "bins": [-18.09375, -17.6011962890625, -17.108642578125, -16.6160888671875, -16.12353515625, -15.6309814453125, -15.138427734375, -14.6458740234375, -14.1533203125, -13.6607666015625, -13.168212890625, -12.6756591796875, -12.18310546875, -11.6905517578125, -11.197998046875, -10.7054443359375, -10.212890625, -9.7203369140625, -9.227783203125, -8.7352294921875, -8.24267578125, -7.7501220703125, -7.257568359375, -6.7650146484375, -6.2724609375, -5.7799072265625, -5.287353515625, -4.7947998046875, -4.30224609375, -3.8096923828125, -3.317138671875, -2.8245849609375, -2.33203125, -1.8394775390625, -1.346923828125, -0.8543701171875, -0.36181640625, 0.1307373046875, 0.623291015625, 1.1158447265625, 1.6083984375, 2.1009521484375, 2.593505859375, 3.0860595703125, 3.57861328125, 4.0711669921875, 4.563720703125, 5.0562744140625, 5.548828125, 6.0413818359375, 6.533935546875, 7.0264892578125, 7.51904296875, 8.0115966796875, 8.504150390625, 8.9967041015625, 9.4892578125, 9.9818115234375, 10.474365234375, 10.9669189453125, 11.45947265625, 11.9520263671875, 12.444580078125, 12.9371337890625, 13.4296875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 9.0, 6.0, 10.0, 7.0, 9.0, 14.0, 12.0, 14.0, 19.0, 29.0, 42.0, 43.0, 44.0, 64.0, 72.0, 74.0, 73.0, 64.0, 60.0, 50.0, 48.0, 41.0, 29.0, 25.0, 38.0, 19.0, 18.0, 18.0, 9.0, 5.0, 8.0, 9.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.86423110961914, -39.64664840698242, -38.42906188964844, -37.21147918701172, -35.993896484375, -34.77631378173828, -33.5587272644043, -32.34114456176758, -31.123559951782227, -29.905975341796875, -28.688392639160156, -27.470808029174805, -26.253223419189453, -25.035640716552734, -23.818056106567383, -22.60047149658203, -21.382888793945312, -20.16530418395996, -18.947721481323242, -17.73013687133789, -16.512554168701172, -15.29496955871582, -14.077384948730469, -12.859801292419434, -11.642217636108398, -10.424633979797363, -9.207050323486328, -7.989465713500977, -6.771882057189941, -5.554298400878906, -4.336714267730713, -3.1191301345825195, -1.9015426635742188, -0.6839587688446045, 0.5336251258850098, 1.751209020614624, 2.9687929153442383, 4.186376571655273, 5.403960704803467, 6.62154483795166, 7.839128494262695, 9.05671215057373, 10.274295806884766, 11.491880416870117, 12.709464073181152, 13.927047729492188, 15.144632339477539, 16.36221694946289, 17.57979965209961, 18.79738426208496, 20.01496696472168, 21.23255157470703, 22.45013427734375, 23.6677188873291, 24.885303497314453, 26.102886199951172, 27.320470809936523, 28.538055419921875, 29.755638122558594, 30.973222732543945, 32.1908073425293, 33.408390045166016, 34.625972747802734, 35.84355926513672, 37.06114196777344]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 8.0, 9.0, 8.0, 10.0, 18.0, 19.0, 32.0, 19.0, 27.0, 33.0, 29.0, 26.0, 37.0, 30.0, 40.0, 46.0, 41.0, 43.0, 41.0, 37.0, 51.0, 37.0, 44.0, 40.0, 27.0, 31.0, 43.0, 21.0, 30.0, 17.0, 16.0, 19.0, 15.0, 7.0, 14.0, 10.0, 4.0, 3.0, 8.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-42.64574432373047, -41.444091796875, -40.24243927001953, -39.04078674316406, -37.839134216308594, -36.63748550415039, -35.43583297729492, -34.23418045043945, -33.032527923583984, -31.830875396728516, -30.629222869873047, -29.42757225036621, -28.225919723510742, -27.024267196655273, -25.822616577148438, -24.62096405029297, -23.4193115234375, -22.21765899658203, -21.016006469726562, -19.814355850219727, -18.612703323364258, -17.41105079650879, -16.209400177001953, -15.007747650146484, -13.806095123291016, -12.604442596435547, -11.402791023254395, -10.201139450073242, -8.999486923217773, -7.797834873199463, -6.596182823181152, -5.39453125, -4.192882537841797, -2.9912304878234863, -1.7895784378051758, -0.5879263877868652, 0.6137256622314453, 1.8153777122497559, 3.0170297622680664, 4.218681335449219, 5.4203338623046875, 6.621985912322998, 7.823637962341309, 9.025289535522461, 10.22694206237793, 11.428594589233398, 12.63024616241455, 13.831897735595703, 15.033550262451172, 16.23520278930664, 17.43685531616211, 18.638505935668945, 19.840158462524414, 21.041810989379883, 22.24346160888672, 23.445114135742188, 24.646766662597656, 25.848419189453125, 27.050071716308594, 28.25172233581543, 29.4533748626709, 30.655027389526367, 31.856678009033203, 33.05833053588867, 34.25998306274414]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 11.0, 16.0, 22.0, 27.0, 28.0, 48.0, 89.0, 122.0, 177.0, 284.0, 360.0, 544.0, 813.0, 1276.0, 1832.0, 2682.0, 4327.0, 6478.0, 9975.0, 15518.0, 24432.0, 39346.0, 67176.0, 128860.0, 295937.0, 210478.0, 95300.0, 53253.0, 31746.0, 20216.0, 12879.0, 8318.0, 5354.0, 3552.0, 2350.0, 1562.0, 1010.0, 692.0, 474.0, 342.0, 217.0, 152.0, 95.0, 63.0, 44.0, 35.0, 15.0, 13.0, 11.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.25, -11.8387451171875, -11.427490234375, -11.0162353515625, -10.60498046875, -10.1937255859375, -9.782470703125, -9.3712158203125, -8.9599609375, -8.5487060546875, -8.137451171875, -7.7261962890625, -7.31494140625, -6.9036865234375, -6.492431640625, -6.0811767578125, -5.669921875, -5.2586669921875, -4.847412109375, -4.4361572265625, -4.02490234375, -3.6136474609375, -3.202392578125, -2.7911376953125, -2.3798828125, -1.9686279296875, -1.557373046875, -1.1461181640625, -0.73486328125, -0.3236083984375, 0.087646484375, 0.4989013671875, 0.91015625, 1.3214111328125, 1.732666015625, 2.1439208984375, 2.55517578125, 2.9664306640625, 3.377685546875, 3.7889404296875, 4.2001953125, 4.6114501953125, 5.022705078125, 5.4339599609375, 5.84521484375, 6.2564697265625, 6.667724609375, 7.0789794921875, 7.490234375, 7.9014892578125, 8.312744140625, 8.7239990234375, 9.13525390625, 9.5465087890625, 9.957763671875, 10.3690185546875, 10.7802734375, 11.1915283203125, 11.602783203125, 12.0140380859375, 12.42529296875, 12.8365478515625, 13.247802734375, 13.6590576171875, 14.0703125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 8.0, 4.0, 5.0, 7.0, 7.0, 13.0, 23.0, 18.0, 26.0, 21.0, 34.0, 27.0, 30.0, 32.0, 33.0, 37.0, 52.0, 47.0, 42.0, 47.0, 47.0, 47.0, 47.0, 30.0, 44.0, 29.0, 31.0, 34.0, 33.0, 20.0, 26.0, 20.0, 15.0, 10.0, 6.0, 13.0, 12.0, 9.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-44.8125, -43.5634765625, -42.314453125, -41.0654296875, -39.81640625, -38.5673828125, -37.318359375, -36.0693359375, -34.8203125, -33.5712890625, -32.322265625, -31.0732421875, -29.82421875, -28.5751953125, -27.326171875, -26.0771484375, -24.828125, -23.5791015625, -22.330078125, -21.0810546875, -19.83203125, -18.5830078125, -17.333984375, -16.0849609375, -14.8359375, -13.5869140625, -12.337890625, -11.0888671875, -9.83984375, -8.5908203125, -7.341796875, -6.0927734375, -4.84375, -3.5947265625, -2.345703125, -1.0966796875, 0.15234375, 1.4013671875, 2.650390625, 3.8994140625, 5.1484375, 6.3974609375, 7.646484375, 8.8955078125, 10.14453125, 11.3935546875, 12.642578125, 13.8916015625, 15.140625, 16.3896484375, 17.638671875, 18.8876953125, 20.13671875, 21.3857421875, 22.634765625, 23.8837890625, 25.1328125, 26.3818359375, 27.630859375, 28.8798828125, 30.12890625, 31.3779296875, 32.626953125, 33.8759765625, 35.125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 12.0, 11.0, 12.0, 32.0, 50.0, 59.0, 96.0, 129.0, 199.0, 288.0, 414.0, 613.0, 798.0, 1133.0, 1679.0, 2429.0, 3723.0, 5706.0, 9704.0, 18688.0, 59409.0, 621852.0, 246602.0, 36917.0, 14574.0, 8017.0, 5032.0, 3252.0, 2215.0, 1476.0, 1023.0, 740.0, 529.0, 357.0, 258.0, 181.0, 115.0, 79.0, 54.0, 30.0, 19.0, 18.0, 13.0, 9.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1875, -14.678466796875, -14.16943359375, -13.660400390625, -13.1513671875, -12.642333984375, -12.13330078125, -11.624267578125, -11.115234375, -10.606201171875, -10.09716796875, -9.588134765625, -9.0791015625, -8.570068359375, -8.06103515625, -7.552001953125, -7.04296875, -6.533935546875, -6.02490234375, -5.515869140625, -5.0068359375, -4.497802734375, -3.98876953125, -3.479736328125, -2.970703125, -2.461669921875, -1.95263671875, -1.443603515625, -0.9345703125, -0.425537109375, 0.08349609375, 0.592529296875, 1.1015625, 1.610595703125, 2.11962890625, 2.628662109375, 3.1376953125, 3.646728515625, 4.15576171875, 4.664794921875, 5.173828125, 5.682861328125, 6.19189453125, 6.700927734375, 7.2099609375, 7.718994140625, 8.22802734375, 8.737060546875, 9.24609375, 9.755126953125, 10.26416015625, 10.773193359375, 11.2822265625, 11.791259765625, 12.30029296875, 12.809326171875, 13.318359375, 13.827392578125, 14.33642578125, 14.845458984375, 15.3544921875, 15.863525390625, 16.37255859375, 16.881591796875, 17.390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 9.0, 11.0, 3.0, 14.0, 11.0, 14.0, 12.0, 16.0, 20.0, 28.0, 28.0, 26.0, 25.0, 35.0, 32.0, 32.0, 39.0, 40.0, 43.0, 42.0, 49.0, 44.0, 29.0, 37.0, 40.0, 33.0, 39.0, 29.0, 26.0, 39.0, 15.0, 28.0, 10.0, 19.0, 19.0, 14.0, 12.0, 11.0, 9.0, 9.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.625, -23.810546875, -22.99609375, -22.181640625, -21.3671875, -20.552734375, -19.73828125, -18.923828125, -18.109375, -17.294921875, -16.48046875, -15.666015625, -14.8515625, -14.037109375, -13.22265625, -12.408203125, -11.59375, -10.779296875, -9.96484375, -9.150390625, -8.3359375, -7.521484375, -6.70703125, -5.892578125, -5.078125, -4.263671875, -3.44921875, -2.634765625, -1.8203125, -1.005859375, -0.19140625, 0.623046875, 1.4375, 2.251953125, 3.06640625, 3.880859375, 4.6953125, 5.509765625, 6.32421875, 7.138671875, 7.953125, 8.767578125, 9.58203125, 10.396484375, 11.2109375, 12.025390625, 12.83984375, 13.654296875, 14.46875, 15.283203125, 16.09765625, 16.912109375, 17.7265625, 18.541015625, 19.35546875, 20.169921875, 20.984375, 21.798828125, 22.61328125, 23.427734375, 24.2421875, 25.056640625, 25.87109375, 26.685546875, 27.5]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 6.0, 10.0, 19.0, 21.0, 38.0, 62.0, 66.0, 105.0, 166.0, 266.0, 403.0, 643.0, 1162.0, 2042.0, 3844.0, 8198.0, 19319.0, 78904.0, 850255.0, 52076.0, 16106.0, 7026.0, 3387.0, 1750.0, 1024.0, 561.0, 408.0, 213.0, 159.0, 102.0, 53.0, 48.0, 40.0, 20.0, 21.0, 12.0, 3.0, 4.0, 3.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.3671875, -2.300323486328125, -2.23345947265625, -2.166595458984375, -2.0997314453125, -2.032867431640625, -1.96600341796875, -1.899139404296875, -1.832275390625, -1.765411376953125, -1.69854736328125, -1.631683349609375, -1.5648193359375, -1.497955322265625, -1.43109130859375, -1.364227294921875, -1.29736328125, -1.230499267578125, -1.16363525390625, -1.096771240234375, -1.0299072265625, -0.963043212890625, -0.89617919921875, -0.829315185546875, -0.762451171875, -0.695587158203125, -0.62872314453125, -0.561859130859375, -0.4949951171875, -0.428131103515625, -0.36126708984375, -0.294403076171875, -0.2275390625, -0.160675048828125, -0.09381103515625, -0.026947021484375, 0.0399169921875, 0.106781005859375, 0.17364501953125, 0.240509033203125, 0.307373046875, 0.374237060546875, 0.44110107421875, 0.507965087890625, 0.5748291015625, 0.641693115234375, 0.70855712890625, 0.775421142578125, 0.84228515625, 0.909149169921875, 0.97601318359375, 1.042877197265625, 1.1097412109375, 1.176605224609375, 1.24346923828125, 1.310333251953125, 1.377197265625, 1.444061279296875, 1.51092529296875, 1.577789306640625, 1.6446533203125, 1.711517333984375, 1.77838134765625, 1.845245361328125, 1.912109375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 8.0, 6.0, 6.0, 10.0, 15.0, 16.0, 24.0, 30.0, 39.0, 44.0, 45.0, 55.0, 55.0, 57.0, 57.0, 68.0, 61.0, 67.0, 46.0, 56.0, 30.0, 33.0, 31.0, 27.0, 17.0, 13.0, 17.0, 15.0, 7.0, 2.0, 6.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00010657310485839844, -0.00010285340249538422, -9.913370013237e-05, -9.541399776935577e-05, -9.169429540634155e-05, -8.797459304332733e-05, -8.425489068031311e-05, -8.053518831729889e-05, -7.681548595428467e-05, -7.309578359127045e-05, -6.937608122825623e-05, -6.5656378865242e-05, -6.193667650222778e-05, -5.821697413921356e-05, -5.449727177619934e-05, -5.077756941318512e-05, -4.70578670501709e-05, -4.333816468715668e-05, -3.9618462324142456e-05, -3.5898759961128235e-05, -3.2179057598114014e-05, -2.8459355235099792e-05, -2.473965287208557e-05, -2.101995050907135e-05, -1.730024814605713e-05, -1.3580545783042908e-05, -9.860843420028687e-06, -6.141141057014465e-06, -2.421438694000244e-06, 1.298263669013977e-06, 5.017966032028198e-06, 8.73766839504242e-06, 1.245737075805664e-05, 1.6177073121070862e-05, 1.9896775484085083e-05, 2.3616477847099304e-05, 2.7336180210113525e-05, 3.1055882573127747e-05, 3.477558493614197e-05, 3.849528729915619e-05, 4.221498966217041e-05, 4.593469202518463e-05, 4.965439438819885e-05, 5.3374096751213074e-05, 5.7093799114227295e-05, 6.0813501477241516e-05, 6.453320384025574e-05, 6.825290620326996e-05, 7.197260856628418e-05, 7.56923109292984e-05, 7.941201329231262e-05, 8.313171565532684e-05, 8.685141801834106e-05, 9.057112038135529e-05, 9.429082274436951e-05, 9.801052510738373e-05, 0.00010173022747039795, 0.00010544992983341217, 0.00010916963219642639, 0.00011288933455944061, 0.00011660903692245483, 0.00012032873928546906, 0.00012404844164848328, 0.0001277681440114975, 0.00013148784637451172]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 10.0, 7.0, 14.0, 21.0, 33.0, 57.0, 69.0, 101.0, 175.0, 284.0, 389.0, 588.0, 910.0, 1406.0, 2179.0, 3305.0, 5198.0, 8086.0, 12698.0, 20802.0, 35033.0, 62811.0, 115887.0, 212500.0, 240877.0, 141461.0, 76049.0, 42261.0, 24416.0, 15040.0, 9361.0, 5685.0, 3701.0, 2439.0, 1545.0, 1097.0, 713.0, 492.0, 295.0, 191.0, 130.0, 87.0, 48.0, 33.0, 28.0, 21.0, 9.0, 6.0, 6.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.197265625, -1.1600341796875, -1.122802734375, -1.0855712890625, -1.04833984375, -1.0111083984375, -0.973876953125, -0.9366455078125, -0.8994140625, -0.8621826171875, -0.824951171875, -0.7877197265625, -0.75048828125, -0.7132568359375, -0.676025390625, -0.6387939453125, -0.6015625, -0.5643310546875, -0.527099609375, -0.4898681640625, -0.45263671875, -0.4154052734375, -0.378173828125, -0.3409423828125, -0.3037109375, -0.2664794921875, -0.229248046875, -0.1920166015625, -0.15478515625, -0.1175537109375, -0.080322265625, -0.0430908203125, -0.005859375, 0.0313720703125, 0.068603515625, 0.1058349609375, 0.14306640625, 0.1802978515625, 0.217529296875, 0.2547607421875, 0.2919921875, 0.3292236328125, 0.366455078125, 0.4036865234375, 0.44091796875, 0.4781494140625, 0.515380859375, 0.5526123046875, 0.58984375, 0.6270751953125, 0.664306640625, 0.7015380859375, 0.73876953125, 0.7760009765625, 0.813232421875, 0.8504638671875, 0.8876953125, 0.9249267578125, 0.962158203125, 0.9993896484375, 1.03662109375, 1.0738525390625, 1.111083984375, 1.1483154296875, 1.185546875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 4.0, 6.0, 10.0, 5.0, 10.0, 10.0, 12.0, 16.0, 11.0, 19.0, 28.0, 21.0, 40.0, 26.0, 39.0, 45.0, 61.0, 60.0, 55.0, 66.0, 47.0, 64.0, 40.0, 43.0, 35.0, 39.0, 24.0, 30.0, 18.0, 14.0, 18.0, 15.0, 15.0, 8.0, 11.0, 12.0, 4.0, 8.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43115234375, -0.416015625, -0.40087890625, -0.3857421875, -0.37060546875, -0.35546875, -0.34033203125, -0.3251953125, -0.31005859375, -0.294921875, -0.27978515625, -0.2646484375, -0.24951171875, -0.234375, -0.21923828125, -0.2041015625, -0.18896484375, -0.173828125, -0.15869140625, -0.1435546875, -0.12841796875, -0.11328125, -0.09814453125, -0.0830078125, -0.06787109375, -0.052734375, -0.03759765625, -0.0224609375, -0.00732421875, 0.0078125, 0.02294921875, 0.0380859375, 0.05322265625, 0.068359375, 0.08349609375, 0.0986328125, 0.11376953125, 0.12890625, 0.14404296875, 0.1591796875, 0.17431640625, 0.189453125, 0.20458984375, 0.2197265625, 0.23486328125, 0.25, 0.26513671875, 0.2802734375, 0.29541015625, 0.310546875, 0.32568359375, 0.3408203125, 0.35595703125, 0.37109375, 0.38623046875, 0.4013671875, 0.41650390625, 0.431640625, 0.44677734375, 0.4619140625, 0.47705078125, 0.4921875, 0.50732421875, 0.5224609375, 0.53759765625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 5.0, 11.0, 6.0, 7.0, 11.0, 15.0, 18.0, 19.0, 28.0, 25.0, 48.0, 60.0, 59.0, 75.0, 73.0, 72.0, 56.0, 67.0, 62.0, 45.0, 32.0, 40.0, 32.0, 32.0, 18.0, 20.0, 15.0, 12.0, 6.0, 6.0, 9.0, 8.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.30769729614258, -44.071327209472656, -42.834957122802734, -41.59859085083008, -40.362220764160156, -39.125850677490234, -37.88948059082031, -36.65311050415039, -35.41674041748047, -34.18037033081055, -32.944000244140625, -31.707632064819336, -30.471263885498047, -29.234893798828125, -27.998523712158203, -26.76215362548828, -25.525787353515625, -24.289417266845703, -23.053049087524414, -21.816679000854492, -20.580310821533203, -19.34394073486328, -18.10757064819336, -16.871200561523438, -15.634832382202148, -14.398463249206543, -13.162094116210938, -11.925724029541016, -10.68935489654541, -9.452985763549805, -8.216615676879883, -6.980246543884277, -5.743877410888672, -4.507508277893066, -3.2711386680603027, -2.034769296646118, -0.7983999252319336, 0.4379692077636719, 1.6743388175964355, 2.910708427429199, 4.147077560424805, 5.38344669342041, 6.619816303253174, 7.8561859130859375, 9.092555046081543, 10.328924179077148, 11.56529426574707, 12.801663398742676, 14.038032531738281, 15.274401664733887, 16.510770797729492, 17.747140884399414, 18.983509063720703, 20.219879150390625, 21.456249237060547, 22.69261932373047, 23.928987503051758, 25.16535758972168, 26.40172576904297, 27.63809585571289, 28.874465942382812, 30.1108341217041, 31.347204208374023, 32.58357238769531, 33.819942474365234]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 6.0, 11.0, 8.0, 9.0, 16.0, 22.0, 31.0, 21.0, 25.0, 35.0, 27.0, 27.0, 37.0, 27.0, 39.0, 49.0, 42.0, 40.0, 45.0, 35.0, 48.0, 41.0, 42.0, 43.0, 25.0, 32.0, 42.0, 23.0, 25.0, 23.0, 15.0, 17.0, 15.0, 11.0, 11.0, 10.0, 5.0, 3.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-41.921695709228516, -40.73655319213867, -39.55141067504883, -38.36627197265625, -37.181129455566406, -35.99598693847656, -34.81084442138672, -33.625701904296875, -32.44055938720703, -31.255416870117188, -30.070276260375977, -28.885133743286133, -27.699993133544922, -26.514850616455078, -25.329708099365234, -24.14456558227539, -22.959426879882812, -21.77428436279297, -20.589143753051758, -19.404001235961914, -18.218860626220703, -17.03371810913086, -15.848575592041016, -14.663434028625488, -13.478292465209961, -12.293150901794434, -11.108009338378906, -9.922866821289062, -8.737725257873535, -7.552583694458008, -6.367441654205322, -5.182299613952637, -3.9971580505371094, -2.812016248703003, -1.6268744468688965, -0.44173264503479004, 0.7434091567993164, 1.9285507202148438, 3.1136927604675293, 4.298834800720215, 5.483976364135742, 6.6691179275512695, 7.854259967803955, 9.03940200805664, 10.224543571472168, 11.409685134887695, 12.594827651977539, 13.779969215393066, 14.965110778808594, 16.150253295898438, 17.33539390563965, 18.520536422729492, 19.705677032470703, 20.890819549560547, 22.07596206665039, 23.261104583740234, 24.446245193481445, 25.63138771057129, 26.8165283203125, 28.001670837402344, 29.186813354492188, 30.3719539642334, 31.557096481323242, 32.74223709106445, 33.9273796081543]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 7.0, 11.0, 28.0, 30.0, 46.0, 86.0, 103.0, 153.0, 284.0, 450.0, 749.0, 1223.0, 1894.0, 3098.0, 5300.0, 9160.0, 15612.0, 27023.0, 47604.0, 84836.0, 149208.0, 225623.0, 198985.0, 119578.0, 67377.0, 37616.0, 21401.0, 12438.0, 7308.0, 4448.0, 2627.0, 1613.0, 945.0, 606.0, 393.0, 245.0, 159.0, 107.0, 64.0, 31.0, 43.0, 15.0, 10.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-52.5625, -51.09423828125, -49.6259765625, -48.15771484375, -46.689453125, -45.22119140625, -43.7529296875, -42.28466796875, -40.81640625, -39.34814453125, -37.8798828125, -36.41162109375, -34.943359375, -33.47509765625, -32.0068359375, -30.53857421875, -29.0703125, -27.60205078125, -26.1337890625, -24.66552734375, -23.197265625, -21.72900390625, -20.2607421875, -18.79248046875, -17.32421875, -15.85595703125, -14.3876953125, -12.91943359375, -11.451171875, -9.98291015625, -8.5146484375, -7.04638671875, -5.578125, -4.10986328125, -2.6416015625, -1.17333984375, 0.294921875, 1.76318359375, 3.2314453125, 4.69970703125, 6.16796875, 7.63623046875, 9.1044921875, 10.57275390625, 12.041015625, 13.50927734375, 14.9775390625, 16.44580078125, 17.9140625, 19.38232421875, 20.8505859375, 22.31884765625, 23.787109375, 25.25537109375, 26.7236328125, 28.19189453125, 29.66015625, 31.12841796875, 32.5966796875, 34.06494140625, 35.533203125, 37.00146484375, 38.4697265625, 39.93798828125, 41.40625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 6.0, 11.0, 14.0, 19.0, 21.0, 29.0, 21.0, 31.0, 27.0, 34.0, 42.0, 31.0, 41.0, 53.0, 43.0, 50.0, 42.0, 33.0, 52.0, 46.0, 45.0, 47.0, 27.0, 33.0, 28.0, 33.0, 27.0, 20.0, 15.0, 13.0, 10.0, 16.0, 10.0, 5.0, 3.0, 0.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-44.40625, -43.1826171875, -41.958984375, -40.7353515625, -39.51171875, -38.2880859375, -37.064453125, -35.8408203125, -34.6171875, -33.3935546875, -32.169921875, -30.9462890625, -29.72265625, -28.4990234375, -27.275390625, -26.0517578125, -24.828125, -23.6044921875, -22.380859375, -21.1572265625, -19.93359375, -18.7099609375, -17.486328125, -16.2626953125, -15.0390625, -13.8154296875, -12.591796875, -11.3681640625, -10.14453125, -8.9208984375, -7.697265625, -6.4736328125, -5.25, -4.0263671875, -2.802734375, -1.5791015625, -0.35546875, 0.8681640625, 2.091796875, 3.3154296875, 4.5390625, 5.7626953125, 6.986328125, 8.2099609375, 9.43359375, 10.6572265625, 11.880859375, 13.1044921875, 14.328125, 15.5517578125, 16.775390625, 17.9990234375, 19.22265625, 20.4462890625, 21.669921875, 22.8935546875, 24.1171875, 25.3408203125, 26.564453125, 27.7880859375, 29.01171875, 30.2353515625, 31.458984375, 32.6826171875, 33.90625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 10.0, 10.0, 16.0, 22.0, 31.0, 54.0, 70.0, 123.0, 175.0, 286.0, 418.0, 762.0, 1185.0, 2068.0, 3155.0, 5330.0, 8860.0, 14698.0, 25547.0, 43898.0, 75236.0, 128402.0, 202312.0, 208056.0, 135677.0, 79535.0, 46112.0, 26705.0, 15945.0, 9351.0, 5766.0, 3419.0, 2060.0, 1287.0, 748.0, 488.0, 272.0, 166.0, 118.0, 71.0, 42.0, 34.0, 18.0, 10.0, 11.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-48.21875, -46.71435546875, -45.2099609375, -43.70556640625, -42.201171875, -40.69677734375, -39.1923828125, -37.68798828125, -36.18359375, -34.67919921875, -33.1748046875, -31.67041015625, -30.166015625, -28.66162109375, -27.1572265625, -25.65283203125, -24.1484375, -22.64404296875, -21.1396484375, -19.63525390625, -18.130859375, -16.62646484375, -15.1220703125, -13.61767578125, -12.11328125, -10.60888671875, -9.1044921875, -7.60009765625, -6.095703125, -4.59130859375, -3.0869140625, -1.58251953125, -0.078125, 1.42626953125, 2.9306640625, 4.43505859375, 5.939453125, 7.44384765625, 8.9482421875, 10.45263671875, 11.95703125, 13.46142578125, 14.9658203125, 16.47021484375, 17.974609375, 19.47900390625, 20.9833984375, 22.48779296875, 23.9921875, 25.49658203125, 27.0009765625, 28.50537109375, 30.009765625, 31.51416015625, 33.0185546875, 34.52294921875, 36.02734375, 37.53173828125, 39.0361328125, 40.54052734375, 42.044921875, 43.54931640625, 45.0537109375, 46.55810546875, 48.0625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 4.0, 5.0, 13.0, 11.0, 12.0, 20.0, 19.0, 23.0, 22.0, 31.0, 29.0, 39.0, 36.0, 36.0, 46.0, 35.0, 48.0, 41.0, 51.0, 43.0, 40.0, 47.0, 43.0, 39.0, 43.0, 30.0, 31.0, 26.0, 22.0, 18.0, 19.0, 13.0, 9.0, 8.0, 8.0, 5.0, 11.0, 5.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.046875, -24.247314453125, -23.44775390625, -22.648193359375, -21.8486328125, -21.049072265625, -20.24951171875, -19.449951171875, -18.650390625, -17.850830078125, -17.05126953125, -16.251708984375, -15.4521484375, -14.652587890625, -13.85302734375, -13.053466796875, -12.25390625, -11.454345703125, -10.65478515625, -9.855224609375, -9.0556640625, -8.256103515625, -7.45654296875, -6.656982421875, -5.857421875, -5.057861328125, -4.25830078125, -3.458740234375, -2.6591796875, -1.859619140625, -1.06005859375, -0.260498046875, 0.5390625, 1.338623046875, 2.13818359375, 2.937744140625, 3.7373046875, 4.536865234375, 5.33642578125, 6.135986328125, 6.935546875, 7.735107421875, 8.53466796875, 9.334228515625, 10.1337890625, 10.933349609375, 11.73291015625, 12.532470703125, 13.33203125, 14.131591796875, 14.93115234375, 15.730712890625, 16.5302734375, 17.329833984375, 18.12939453125, 18.928955078125, 19.728515625, 20.528076171875, 21.32763671875, 22.127197265625, 22.9267578125, 23.726318359375, 24.52587890625, 25.325439453125, 26.125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 6.0, 5.0, 7.0, 15.0, 14.0, 12.0, 34.0, 41.0, 82.0, 117.0, 134.0, 233.0, 335.0, 496.0, 784.0, 1164.0, 1878.0, 2988.0, 4936.0, 8175.0, 13709.0, 24187.0, 42858.0, 78231.0, 145393.0, 243020.0, 212395.0, 117993.0, 64116.0, 35448.0, 19949.0, 11413.0, 7003.0, 4056.0, 2606.0, 1584.0, 1101.0, 682.0, 443.0, 288.0, 195.0, 136.0, 102.0, 59.0, 34.0, 38.0, 22.0, 21.0, 14.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-16.28125, -15.800048828125, -15.31884765625, -14.837646484375, -14.3564453125, -13.875244140625, -13.39404296875, -12.912841796875, -12.431640625, -11.950439453125, -11.46923828125, -10.988037109375, -10.5068359375, -10.025634765625, -9.54443359375, -9.063232421875, -8.58203125, -8.100830078125, -7.61962890625, -7.138427734375, -6.6572265625, -6.176025390625, -5.69482421875, -5.213623046875, -4.732421875, -4.251220703125, -3.77001953125, -3.288818359375, -2.8076171875, -2.326416015625, -1.84521484375, -1.364013671875, -0.8828125, -0.401611328125, 0.07958984375, 0.560791015625, 1.0419921875, 1.523193359375, 2.00439453125, 2.485595703125, 2.966796875, 3.447998046875, 3.92919921875, 4.410400390625, 4.8916015625, 5.372802734375, 5.85400390625, 6.335205078125, 6.81640625, 7.297607421875, 7.77880859375, 8.260009765625, 8.7412109375, 9.222412109375, 9.70361328125, 10.184814453125, 10.666015625, 11.147216796875, 11.62841796875, 12.109619140625, 12.5908203125, 13.072021484375, 13.55322265625, 14.034423828125, 14.515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 10.0, 10.0, 9.0, 28.0, 37.0, 24.0, 54.0, 61.0, 83.0, 101.0, 131.0, 123.0, 74.0, 62.0, 39.0, 45.0, 24.0, 26.0, 13.0, 10.0, 6.0, 8.0, 9.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00222015380859375, -0.0021537840366363525, -0.002087414264678955, -0.0020210444927215576, -0.00195467472076416, -0.0018883049488067627, -0.0018219351768493652, -0.0017555654048919678, -0.0016891956329345703, -0.0016228258609771729, -0.0015564560890197754, -0.001490086317062378, -0.0014237165451049805, -0.001357346773147583, -0.0012909770011901855, -0.001224607229232788, -0.0011582374572753906, -0.0010918676853179932, -0.0010254979133605957, -0.0009591281414031982, -0.0008927583694458008, -0.0008263885974884033, -0.0007600188255310059, -0.0006936490535736084, -0.0006272792816162109, -0.0005609095096588135, -0.000494539737701416, -0.00042816996574401855, -0.0003618001937866211, -0.00029543042182922363, -0.00022906064987182617, -0.0001626908779144287, -9.632110595703125e-05, -2.995133399963379e-05, 3.641843795776367e-05, 0.00010278820991516113, 0.0001691579818725586, 0.00023552775382995605, 0.0003018975257873535, 0.000368267297744751, 0.00043463706970214844, 0.0005010068416595459, 0.0005673766136169434, 0.0006337463855743408, 0.0007001161575317383, 0.0007664859294891357, 0.0008328557014465332, 0.0008992254734039307, 0.0009655952453613281, 0.0010319650173187256, 0.001098334789276123, 0.0011647045612335205, 0.001231074333190918, 0.0012974441051483154, 0.0013638138771057129, 0.0014301836490631104, 0.0014965534210205078, 0.0015629231929779053, 0.0016292929649353027, 0.0016956627368927002, 0.0017620325088500977, 0.0018284022808074951, 0.0018947720527648926, 0.00196114182472229, 0.0020275115966796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 10.0, 8.0, 11.0, 15.0, 19.0, 32.0, 56.0, 92.0, 123.0, 134.0, 208.0, 345.0, 441.0, 683.0, 972.0, 1431.0, 2027.0, 3102.0, 4467.0, 6479.0, 9991.0, 14856.0, 23054.0, 36585.0, 58885.0, 96033.0, 151804.0, 195102.0, 161571.0, 104013.0, 63434.0, 39148.0, 25054.0, 15894.0, 10520.0, 7157.0, 4816.0, 3151.0, 2089.0, 1517.0, 1065.0, 693.0, 467.0, 314.0, 203.0, 158.0, 114.0, 79.0, 42.0, 28.0, 20.0, 17.0, 15.0, 9.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.2578125, -11.8433837890625, -11.428955078125, -11.0145263671875, -10.60009765625, -10.1856689453125, -9.771240234375, -9.3568115234375, -8.9423828125, -8.5279541015625, -8.113525390625, -7.6990966796875, -7.28466796875, -6.8702392578125, -6.455810546875, -6.0413818359375, -5.626953125, -5.2125244140625, -4.798095703125, -4.3836669921875, -3.96923828125, -3.5548095703125, -3.140380859375, -2.7259521484375, -2.3115234375, -1.8970947265625, -1.482666015625, -1.0682373046875, -0.65380859375, -0.2393798828125, 0.175048828125, 0.5894775390625, 1.00390625, 1.4183349609375, 1.832763671875, 2.2471923828125, 2.66162109375, 3.0760498046875, 3.490478515625, 3.9049072265625, 4.3193359375, 4.7337646484375, 5.148193359375, 5.5626220703125, 5.97705078125, 6.3914794921875, 6.805908203125, 7.2203369140625, 7.634765625, 8.0491943359375, 8.463623046875, 8.8780517578125, 9.29248046875, 9.7069091796875, 10.121337890625, 10.5357666015625, 10.9501953125, 11.3646240234375, 11.779052734375, 12.1934814453125, 12.60791015625, 13.0223388671875, 13.436767578125, 13.8511962890625, 14.265625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 6.0, 3.0, 5.0, 8.0, 18.0, 10.0, 20.0, 22.0, 25.0, 23.0, 27.0, 31.0, 44.0, 53.0, 48.0, 48.0, 36.0, 55.0, 40.0, 62.0, 54.0, 44.0, 34.0, 52.0, 33.0, 31.0, 29.0, 20.0, 25.0, 14.0, 15.0, 9.0, 6.0, 8.0, 10.0, 5.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.27734375, -5.10687255859375, -4.9364013671875, -4.76593017578125, -4.595458984375, -4.42498779296875, -4.2545166015625, -4.08404541015625, -3.91357421875, -3.74310302734375, -3.5726318359375, -3.40216064453125, -3.231689453125, -3.06121826171875, -2.8907470703125, -2.72027587890625, -2.5498046875, -2.37933349609375, -2.2088623046875, -2.03839111328125, -1.867919921875, -1.69744873046875, -1.5269775390625, -1.35650634765625, -1.18603515625, -1.01556396484375, -0.8450927734375, -0.67462158203125, -0.504150390625, -0.33367919921875, -0.1632080078125, 0.00726318359375, 0.177734375, 0.34820556640625, 0.5186767578125, 0.68914794921875, 0.859619140625, 1.03009033203125, 1.2005615234375, 1.37103271484375, 1.54150390625, 1.71197509765625, 1.8824462890625, 2.05291748046875, 2.223388671875, 2.39385986328125, 2.5643310546875, 2.73480224609375, 2.9052734375, 3.07574462890625, 3.2462158203125, 3.41668701171875, 3.587158203125, 3.75762939453125, 3.9281005859375, 4.09857177734375, 4.26904296875, 4.43951416015625, 4.6099853515625, 4.78045654296875, 4.950927734375, 5.12139892578125, 5.2918701171875, 5.46234130859375, 5.6328125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 5.0, 2.0, 4.0, 8.0, 6.0, 8.0, 6.0, 12.0, 15.0, 18.0, 27.0, 43.0, 39.0, 39.0, 42.0, 61.0, 61.0, 53.0, 72.0, 70.0, 50.0, 50.0, 48.0, 45.0, 31.0, 40.0, 32.0, 20.0, 17.0, 13.0, 12.0, 9.0, 9.0, 10.0, 4.0, 4.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-41.44779968261719, -40.31585693359375, -39.18391418457031, -38.051971435546875, -36.9200325012207, -35.788089752197266, -34.65614700317383, -33.52420425415039, -32.39226150512695, -31.260318756103516, -30.12837791442871, -28.996435165405273, -27.864492416381836, -26.73255157470703, -25.600608825683594, -24.468666076660156, -23.33672523498535, -22.204782485961914, -21.07284164428711, -19.940898895263672, -18.808956146240234, -17.677013397216797, -16.545072555541992, -15.413129806518555, -14.281188011169434, -13.149246215820312, -12.017303466796875, -10.885361671447754, -9.753419876098633, -8.621477127075195, -7.489535331726074, -6.357593059539795, -5.225648880004883, -4.0937066078186035, -2.9617645740509033, -1.8298225402832031, -0.6978802680969238, 0.43406200408935547, 1.5660037994384766, 2.697946071624756, 3.829888343811035, 4.9618306159973145, 6.093772888183594, 7.225714683532715, 8.357656478881836, 9.489599227905273, 10.621541023254395, 11.753482818603516, 12.885425567626953, 14.017367362976074, 15.149310111999512, 16.281251907348633, 17.41319465637207, 18.545135498046875, 19.677078247070312, 20.80902099609375, 21.940963745117188, 23.072906494140625, 24.20484733581543, 25.336790084838867, 26.468732833862305, 27.60067367553711, 28.732616424560547, 29.864559173583984, 30.99650001525879]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 0.0, 6.0, 8.0, 7.0, 14.0, 10.0, 14.0, 14.0, 22.0, 21.0, 20.0, 27.0, 26.0, 43.0, 40.0, 33.0, 36.0, 47.0, 36.0, 42.0, 37.0, 49.0, 26.0, 43.0, 39.0, 40.0, 44.0, 30.0, 27.0, 31.0, 21.0, 22.0, 20.0, 20.0, 15.0, 7.0, 11.0, 14.0, 11.0, 9.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0], "bins": [-44.825984954833984, -43.59872055053711, -42.3714599609375, -41.144195556640625, -39.91693115234375, -38.689666748046875, -37.46240234375, -36.23514175415039, -35.007877349853516, -33.78061294555664, -32.55335235595703, -31.326087951660156, -30.09882354736328, -28.871559143066406, -27.644296646118164, -26.417034149169922, -25.189769744873047, -23.962505340576172, -22.73524284362793, -21.507980346679688, -20.280715942382812, -19.053451538085938, -17.826189041137695, -16.598926544189453, -15.371662139892578, -14.14439868927002, -12.917135238647461, -11.689871788024902, -10.462608337402344, -9.235344886779785, -8.008081436157227, -6.780817985534668, -5.553554534912109, -4.326291084289551, -3.099027633666992, -1.8717641830444336, -0.644500732421875, 0.5827627182006836, 1.8100261688232422, 3.037289619445801, 4.264553070068359, 5.491816520690918, 6.719079971313477, 7.946343421936035, 9.173606872558594, 10.400870323181152, 11.628133773803711, 12.85539722442627, 14.082660675048828, 15.309924125671387, 16.537187576293945, 17.764450073242188, 18.991714477539062, 20.218978881835938, 21.44624137878418, 22.673503875732422, 23.900768280029297, 25.128032684326172, 26.355295181274414, 27.582557678222656, 28.80982208251953, 30.037086486816406, 31.26434898376465, 32.49161148071289, 33.718875885009766]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 2.0, 7.0, 10.0, 14.0, 14.0, 26.0, 29.0, 60.0, 80.0, 148.0, 197.0, 313.0, 540.0, 907.0, 1627.0, 2678.0, 4898.0, 9039.0, 17128.0, 33968.0, 74075.0, 198409.0, 624795.0, 1512840.0, 1116349.0, 370514.0, 122305.0, 51243.0, 24210.0, 12264.0, 6486.0, 3693.0, 2086.0, 1214.0, 748.0, 483.0, 299.0, 206.0, 116.0, 97.0, 49.0, 30.0, 30.0, 14.0, 14.0, 10.0, 12.0, 5.0, 1.0, 2.0, 0.0, 3.0], "bins": [-55.84375, -54.28271484375, -52.7216796875, -51.16064453125, -49.599609375, -48.03857421875, -46.4775390625, -44.91650390625, -43.35546875, -41.79443359375, -40.2333984375, -38.67236328125, -37.111328125, -35.55029296875, -33.9892578125, -32.42822265625, -30.8671875, -29.30615234375, -27.7451171875, -26.18408203125, -24.623046875, -23.06201171875, -21.5009765625, -19.93994140625, -18.37890625, -16.81787109375, -15.2568359375, -13.69580078125, -12.134765625, -10.57373046875, -9.0126953125, -7.45166015625, -5.890625, -4.32958984375, -2.7685546875, -1.20751953125, 0.353515625, 1.91455078125, 3.4755859375, 5.03662109375, 6.59765625, 8.15869140625, 9.7197265625, 11.28076171875, 12.841796875, 14.40283203125, 15.9638671875, 17.52490234375, 19.0859375, 20.64697265625, 22.2080078125, 23.76904296875, 25.330078125, 26.89111328125, 28.4521484375, 30.01318359375, 31.57421875, 33.13525390625, 34.6962890625, 36.25732421875, 37.818359375, 39.37939453125, 40.9404296875, 42.50146484375, 44.0625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 6.0, 6.0, 6.0, 11.0, 8.0, 14.0, 11.0, 19.0, 15.0, 19.0, 23.0, 27.0, 35.0, 36.0, 42.0, 26.0, 43.0, 44.0, 55.0, 36.0, 37.0, 40.0, 50.0, 44.0, 46.0, 36.0, 40.0, 29.0, 25.0, 18.0, 30.0, 22.0, 19.0, 8.0, 15.0, 13.0, 10.0, 9.0, 6.0, 8.0, 4.0, 4.0, 4.0, 3.0, 1.0, 3.0, 4.0, 1.0], "bins": [-41.90625, -40.759765625, -39.61328125, -38.466796875, -37.3203125, -36.173828125, -35.02734375, -33.880859375, -32.734375, -31.587890625, -30.44140625, -29.294921875, -28.1484375, -27.001953125, -25.85546875, -24.708984375, -23.5625, -22.416015625, -21.26953125, -20.123046875, -18.9765625, -17.830078125, -16.68359375, -15.537109375, -14.390625, -13.244140625, -12.09765625, -10.951171875, -9.8046875, -8.658203125, -7.51171875, -6.365234375, -5.21875, -4.072265625, -2.92578125, -1.779296875, -0.6328125, 0.513671875, 1.66015625, 2.806640625, 3.953125, 5.099609375, 6.24609375, 7.392578125, 8.5390625, 9.685546875, 10.83203125, 11.978515625, 13.125, 14.271484375, 15.41796875, 16.564453125, 17.7109375, 18.857421875, 20.00390625, 21.150390625, 22.296875, 23.443359375, 24.58984375, 25.736328125, 26.8828125, 28.029296875, 29.17578125, 30.322265625, 31.46875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 5.0, 5.0, 6.0, 11.0, 13.0, 20.0, 31.0, 41.0, 56.0, 85.0, 123.0, 149.0, 234.0, 361.0, 461.0, 691.0, 1043.0, 1515.0, 2126.0, 3273.0, 4918.0, 7572.0, 11573.0, 18861.0, 30677.0, 51646.0, 88587.0, 160155.0, 302681.0, 604025.0, 1131380.0, 847756.0, 419416.0, 216546.0, 117259.0, 66427.0, 39167.0, 23342.0, 14690.0, 9328.0, 5910.0, 3900.0, 2585.0, 1753.0, 1168.0, 831.0, 583.0, 382.0, 279.0, 211.0, 138.0, 88.0, 68.0, 38.0, 35.0, 25.0, 19.0, 15.0, 6.0, 9.0, 1.0, 2.0, 2.0], "bins": [-37.90625, -36.7119140625, -35.517578125, -34.3232421875, -33.12890625, -31.9345703125, -30.740234375, -29.5458984375, -28.3515625, -27.1572265625, -25.962890625, -24.7685546875, -23.57421875, -22.3798828125, -21.185546875, -19.9912109375, -18.796875, -17.6025390625, -16.408203125, -15.2138671875, -14.01953125, -12.8251953125, -11.630859375, -10.4365234375, -9.2421875, -8.0478515625, -6.853515625, -5.6591796875, -4.46484375, -3.2705078125, -2.076171875, -0.8818359375, 0.3125, 1.5068359375, 2.701171875, 3.8955078125, 5.08984375, 6.2841796875, 7.478515625, 8.6728515625, 9.8671875, 11.0615234375, 12.255859375, 13.4501953125, 14.64453125, 15.8388671875, 17.033203125, 18.2275390625, 19.421875, 20.6162109375, 21.810546875, 23.0048828125, 24.19921875, 25.3935546875, 26.587890625, 27.7822265625, 28.9765625, 30.1708984375, 31.365234375, 32.5595703125, 33.75390625, 34.9482421875, 36.142578125, 37.3369140625, 38.53125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 7.0, 9.0, 6.0, 13.0, 17.0, 23.0, 39.0, 50.0, 66.0, 58.0, 86.0, 97.0, 106.0, 174.0, 184.0, 230.0, 269.0, 302.0, 339.0, 335.0, 296.0, 258.0, 220.0, 185.0, 149.0, 115.0, 79.0, 75.0, 52.0, 50.0, 38.0, 31.0, 29.0, 13.0, 19.0, 16.0, 6.0, 7.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.40625, -15.877197265625, -15.34814453125, -14.819091796875, -14.2900390625, -13.760986328125, -13.23193359375, -12.702880859375, -12.173828125, -11.644775390625, -11.11572265625, -10.586669921875, -10.0576171875, -9.528564453125, -8.99951171875, -8.470458984375, -7.94140625, -7.412353515625, -6.88330078125, -6.354248046875, -5.8251953125, -5.296142578125, -4.76708984375, -4.238037109375, -3.708984375, -3.179931640625, -2.65087890625, -2.121826171875, -1.5927734375, -1.063720703125, -0.53466796875, -0.005615234375, 0.5234375, 1.052490234375, 1.58154296875, 2.110595703125, 2.6396484375, 3.168701171875, 3.69775390625, 4.226806640625, 4.755859375, 5.284912109375, 5.81396484375, 6.343017578125, 6.8720703125, 7.401123046875, 7.93017578125, 8.459228515625, 8.98828125, 9.517333984375, 10.04638671875, 10.575439453125, 11.1044921875, 11.633544921875, 12.16259765625, 12.691650390625, 13.220703125, 13.749755859375, 14.27880859375, 14.807861328125, 15.3369140625, 15.865966796875, 16.39501953125, 16.924072265625, 17.453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 2.0, 6.0, 5.0, 8.0, 7.0, 19.0, 20.0, 24.0, 24.0, 54.0, 43.0, 54.0, 73.0, 78.0, 74.0, 69.0, 72.0, 69.0, 56.0, 43.0, 43.0, 42.0, 25.0, 21.0, 19.0, 14.0, 8.0, 7.0, 4.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.03807830810547, -48.57343292236328, -47.108787536621094, -45.64413833618164, -44.17949295043945, -42.714847564697266, -41.25020217895508, -39.785552978515625, -38.32090759277344, -36.85626220703125, -35.39161682128906, -33.92696762084961, -32.46232223510742, -30.997676849365234, -29.533031463623047, -28.068384170532227, -26.60373878479004, -25.13909339904785, -23.67444610595703, -22.209800720214844, -20.745153427124023, -19.280508041381836, -17.815860748291016, -16.351215362548828, -14.886569023132324, -13.42192268371582, -11.957276344299316, -10.492630004882812, -9.027984619140625, -7.563337802886963, -6.098691940307617, -4.634045600891113, -3.1693992614746094, -1.704753041267395, -0.24010682106018066, 1.2245392799377441, 2.689185619354248, 4.153831958770752, 5.618477821350098, 7.083124160766602, 8.547770500183105, 10.01241683959961, 11.477063179016113, 12.941709518432617, 14.406354904174805, 15.871002197265625, 17.335647583007812, 18.80029296875, 20.26494026184082, 21.729585647583008, 23.194232940673828, 24.658878326416016, 26.123525619506836, 27.588171005249023, 29.052818298339844, 30.51746368408203, 31.98210906982422, 33.446754455566406, 34.911399841308594, 36.37604904174805, 37.840694427490234, 39.30533981323242, 40.76998519897461, 42.23463439941406, 43.69927978515625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 10.0, 4.0, 5.0, 7.0, 11.0, 12.0, 20.0, 27.0, 17.0, 24.0, 23.0, 36.0, 30.0, 34.0, 51.0, 40.0, 49.0, 47.0, 35.0, 44.0, 53.0, 31.0, 44.0, 41.0, 32.0, 37.0, 39.0, 25.0, 31.0, 21.0, 16.0, 25.0, 12.0, 13.0, 13.0, 6.0, 8.0, 6.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.723575592041016, -45.40193176269531, -44.080284118652344, -42.75864028930664, -41.43699645996094, -40.11534881591797, -38.793704986572266, -37.47206115722656, -36.150413513183594, -34.82876968383789, -33.50712203979492, -32.18547821044922, -30.863832473754883, -29.542186737060547, -28.220542907714844, -26.898897171020508, -25.577251434326172, -24.255605697631836, -22.9339599609375, -21.612316131591797, -20.29067039489746, -18.969024658203125, -17.647380828857422, -16.325735092163086, -15.00408935546875, -13.682443618774414, -12.360798835754395, -11.039154052734375, -9.717508316040039, -8.395862579345703, -7.074217796325684, -5.752573013305664, -4.430927276611328, -3.1092820167541504, -1.7876367568969727, -0.4659914970397949, 0.8556537628173828, 2.1772990226745605, 3.4989442825317383, 4.820589065551758, 6.142234802246094, 7.4638800621032715, 8.78552532196045, 10.107170104980469, 11.428815841674805, 12.75046157836914, 14.07210636138916, 15.39375114440918, 16.715396881103516, 18.03704261779785, 19.358688354492188, 20.68033218383789, 22.001977920532227, 23.323623657226562, 24.645267486572266, 25.9669132232666, 27.288558959960938, 28.610204696655273, 29.93185043334961, 31.253494262695312, 32.57514190673828, 33.896785736083984, 35.21842956542969, 36.540077209472656, 37.86172103881836]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 9.0, 25.0, 42.0, 46.0, 84.0, 113.0, 184.0, 274.0, 356.0, 562.0, 839.0, 1156.0, 1726.0, 2677.0, 3825.0, 6068.0, 9015.0, 13955.0, 21518.0, 34111.0, 56055.0, 97308.0, 200437.0, 281695.0, 128603.0, 70444.0, 41743.0, 26286.0, 16918.0, 11019.0, 7100.0, 4709.0, 3232.0, 2114.0, 1396.0, 955.0, 640.0, 407.0, 280.0, 204.0, 153.0, 83.0, 48.0, 47.0, 32.0, 21.0, 10.0, 10.0, 12.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-13.8984375, -13.467041015625, -13.03564453125, -12.604248046875, -12.1728515625, -11.741455078125, -11.31005859375, -10.878662109375, -10.447265625, -10.015869140625, -9.58447265625, -9.153076171875, -8.7216796875, -8.290283203125, -7.85888671875, -7.427490234375, -6.99609375, -6.564697265625, -6.13330078125, -5.701904296875, -5.2705078125, -4.839111328125, -4.40771484375, -3.976318359375, -3.544921875, -3.113525390625, -2.68212890625, -2.250732421875, -1.8193359375, -1.387939453125, -0.95654296875, -0.525146484375, -0.09375, 0.337646484375, 0.76904296875, 1.200439453125, 1.6318359375, 2.063232421875, 2.49462890625, 2.926025390625, 3.357421875, 3.788818359375, 4.22021484375, 4.651611328125, 5.0830078125, 5.514404296875, 5.94580078125, 6.377197265625, 6.80859375, 7.239990234375, 7.67138671875, 8.102783203125, 8.5341796875, 8.965576171875, 9.39697265625, 9.828369140625, 10.259765625, 10.691162109375, 11.12255859375, 11.553955078125, 11.9853515625, 12.416748046875, 12.84814453125, 13.279541015625, 13.7109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 7.0, 2.0, 11.0, 8.0, 12.0, 9.0, 22.0, 14.0, 21.0, 30.0, 31.0, 26.0, 33.0, 48.0, 50.0, 39.0, 37.0, 47.0, 44.0, 53.0, 43.0, 37.0, 44.0, 39.0, 33.0, 33.0, 32.0, 30.0, 23.0, 27.0, 15.0, 13.0, 30.0, 8.0, 9.0, 14.0, 4.0, 5.0, 3.0, 5.0, 4.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.5, -43.150390625, -41.80078125, -40.451171875, -39.1015625, -37.751953125, -36.40234375, -35.052734375, -33.703125, -32.353515625, -31.00390625, -29.654296875, -28.3046875, -26.955078125, -25.60546875, -24.255859375, -22.90625, -21.556640625, -20.20703125, -18.857421875, -17.5078125, -16.158203125, -14.80859375, -13.458984375, -12.109375, -10.759765625, -9.41015625, -8.060546875, -6.7109375, -5.361328125, -4.01171875, -2.662109375, -1.3125, 0.037109375, 1.38671875, 2.736328125, 4.0859375, 5.435546875, 6.78515625, 8.134765625, 9.484375, 10.833984375, 12.18359375, 13.533203125, 14.8828125, 16.232421875, 17.58203125, 18.931640625, 20.28125, 21.630859375, 22.98046875, 24.330078125, 25.6796875, 27.029296875, 28.37890625, 29.728515625, 31.078125, 32.427734375, 33.77734375, 35.126953125, 36.4765625, 37.826171875, 39.17578125, 40.525390625, 41.875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 8.0, 9.0, 13.0, 24.0, 31.0, 35.0, 58.0, 78.0, 125.0, 186.0, 245.0, 367.0, 525.0, 733.0, 1113.0, 1473.0, 2089.0, 3191.0, 4721.0, 7489.0, 13357.0, 31792.0, 191990.0, 675553.0, 65966.0, 19531.0, 9653.0, 5928.0, 3753.0, 2610.0, 1790.0, 1235.0, 832.0, 596.0, 464.0, 281.0, 228.0, 160.0, 106.0, 58.0, 41.0, 39.0, 21.0, 13.0, 13.0, 8.0, 3.0, 7.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-18.1875, -17.62353515625, -17.0595703125, -16.49560546875, -15.931640625, -15.36767578125, -14.8037109375, -14.23974609375, -13.67578125, -13.11181640625, -12.5478515625, -11.98388671875, -11.419921875, -10.85595703125, -10.2919921875, -9.72802734375, -9.1640625, -8.60009765625, -8.0361328125, -7.47216796875, -6.908203125, -6.34423828125, -5.7802734375, -5.21630859375, -4.65234375, -4.08837890625, -3.5244140625, -2.96044921875, -2.396484375, -1.83251953125, -1.2685546875, -0.70458984375, -0.140625, 0.42333984375, 0.9873046875, 1.55126953125, 2.115234375, 2.67919921875, 3.2431640625, 3.80712890625, 4.37109375, 4.93505859375, 5.4990234375, 6.06298828125, 6.626953125, 7.19091796875, 7.7548828125, 8.31884765625, 8.8828125, 9.44677734375, 10.0107421875, 10.57470703125, 11.138671875, 11.70263671875, 12.2666015625, 12.83056640625, 13.39453125, 13.95849609375, 14.5224609375, 15.08642578125, 15.650390625, 16.21435546875, 16.7783203125, 17.34228515625, 17.90625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 7.0, 5.0, 8.0, 9.0, 13.0, 15.0, 19.0, 17.0, 29.0, 24.0, 19.0, 39.0, 25.0, 38.0, 29.0, 26.0, 40.0, 42.0, 51.0, 54.0, 45.0, 48.0, 38.0, 46.0, 46.0, 45.0, 29.0, 40.0, 15.0, 33.0, 23.0, 16.0, 13.0, 15.0, 15.0, 8.0, 7.0, 9.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.6875, -33.719482421875, -32.75146484375, -31.783447265625, -30.8154296875, -29.847412109375, -28.87939453125, -27.911376953125, -26.943359375, -25.975341796875, -25.00732421875, -24.039306640625, -23.0712890625, -22.103271484375, -21.13525390625, -20.167236328125, -19.19921875, -18.231201171875, -17.26318359375, -16.295166015625, -15.3271484375, -14.359130859375, -13.39111328125, -12.423095703125, -11.455078125, -10.487060546875, -9.51904296875, -8.551025390625, -7.5830078125, -6.614990234375, -5.64697265625, -4.678955078125, -3.7109375, -2.742919921875, -1.77490234375, -0.806884765625, 0.1611328125, 1.129150390625, 2.09716796875, 3.065185546875, 4.033203125, 5.001220703125, 5.96923828125, 6.937255859375, 7.9052734375, 8.873291015625, 9.84130859375, 10.809326171875, 11.77734375, 12.745361328125, 13.71337890625, 14.681396484375, 15.6494140625, 16.617431640625, 17.58544921875, 18.553466796875, 19.521484375, 20.489501953125, 21.45751953125, 22.425537109375, 23.3935546875, 24.361572265625, 25.32958984375, 26.297607421875, 27.265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 7.0, 3.0, 9.0, 14.0, 23.0, 21.0, 38.0, 64.0, 99.0, 126.0, 163.0, 251.0, 413.0, 721.0, 1159.0, 1961.0, 3722.0, 7814.0, 20096.0, 126214.0, 824091.0, 38130.0, 11957.0, 5081.0, 2701.0, 1416.0, 806.0, 518.0, 311.0, 193.0, 119.0, 111.0, 61.0, 27.0, 34.0, 14.0, 14.0, 10.0, 9.0, 10.0, 3.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.517578125, -3.408477783203125, -3.29937744140625, -3.190277099609375, -3.0811767578125, -2.972076416015625, -2.86297607421875, -2.753875732421875, -2.644775390625, -2.535675048828125, -2.42657470703125, -2.317474365234375, -2.2083740234375, -2.099273681640625, -1.99017333984375, -1.881072998046875, -1.77197265625, -1.662872314453125, -1.55377197265625, -1.444671630859375, -1.3355712890625, -1.226470947265625, -1.11737060546875, -1.008270263671875, -0.899169921875, -0.790069580078125, -0.68096923828125, -0.571868896484375, -0.4627685546875, -0.353668212890625, -0.24456787109375, -0.135467529296875, -0.0263671875, 0.082733154296875, 0.19183349609375, 0.300933837890625, 0.4100341796875, 0.519134521484375, 0.62823486328125, 0.737335205078125, 0.846435546875, 0.955535888671875, 1.06463623046875, 1.173736572265625, 1.2828369140625, 1.391937255859375, 1.50103759765625, 1.610137939453125, 1.71923828125, 1.828338623046875, 1.93743896484375, 2.046539306640625, 2.1556396484375, 2.264739990234375, 2.37384033203125, 2.482940673828125, 2.592041015625, 2.701141357421875, 2.81024169921875, 2.919342041015625, 3.0284423828125, 3.137542724609375, 3.24664306640625, 3.355743408203125, 3.46484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 10.0, 9.0, 4.0, 9.0, 22.0, 20.0, 38.0, 43.0, 36.0, 54.0, 79.0, 85.0, 90.0, 87.0, 81.0, 77.0, 58.0, 41.0, 39.0, 27.0, 17.0, 18.0, 5.0, 14.0, 6.0, 5.0, 2.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019788742065429688, -0.0001916550099849701, -0.0001854225993156433, -0.00017919018864631653, -0.00017295777797698975, -0.00016672536730766296, -0.00016049295663833618, -0.0001542605459690094, -0.00014802813529968262, -0.00014179572463035583, -0.00013556331396102905, -0.00012933090329170227, -0.0001230984926223755, -0.0001168660819530487, -0.00011063367128372192, -0.00010440126061439514, -9.816884994506836e-05, -9.193643927574158e-05, -8.57040286064148e-05, -7.947161793708801e-05, -7.323920726776123e-05, -6.700679659843445e-05, -6.0774385929107666e-05, -5.4541975259780884e-05, -4.83095645904541e-05, -4.207715392112732e-05, -3.584474325180054e-05, -2.9612332582473755e-05, -2.3379921913146973e-05, -1.714751124382019e-05, -1.0915100574493408e-05, -4.682689905166626e-06, 1.5497207641601562e-06, 7.782131433486938e-06, 1.401454210281372e-05, 2.0246952772140503e-05, 2.6479363441467285e-05, 3.271177411079407e-05, 3.894418478012085e-05, 4.517659544944763e-05, 5.1409006118774414e-05, 5.7641416788101196e-05, 6.387382745742798e-05, 7.010623812675476e-05, 7.633864879608154e-05, 8.257105946540833e-05, 8.880347013473511e-05, 9.503588080406189e-05, 0.00010126829147338867, 0.00010750070214271545, 0.00011373311281204224, 0.00011996552348136902, 0.0001261979341506958, 0.00013243034482002258, 0.00013866275548934937, 0.00014489516615867615, 0.00015112757682800293, 0.0001573599874973297, 0.0001635923981666565, 0.00016982480883598328, 0.00017605721950531006, 0.00018228963017463684, 0.00018852204084396362, 0.0001947544515132904, 0.0002009868621826172]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 6.0, 8.0, 15.0, 23.0, 34.0, 44.0, 71.0, 90.0, 136.0, 197.0, 283.0, 440.0, 566.0, 844.0, 1170.0, 1743.0, 2607.0, 4139.0, 6503.0, 10932.0, 18743.0, 34814.0, 69799.0, 155098.0, 305974.0, 224936.0, 99869.0, 47487.0, 24759.0, 13782.0, 8351.0, 5129.0, 3224.0, 2162.0, 1373.0, 995.0, 649.0, 500.0, 313.0, 240.0, 150.0, 109.0, 83.0, 58.0, 45.0, 18.0, 12.0, 12.0, 8.0, 9.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7236328125, -1.6693115234375, -1.614990234375, -1.5606689453125, -1.50634765625, -1.4520263671875, -1.397705078125, -1.3433837890625, -1.2890625, -1.2347412109375, -1.180419921875, -1.1260986328125, -1.07177734375, -1.0174560546875, -0.963134765625, -0.9088134765625, -0.8544921875, -0.8001708984375, -0.745849609375, -0.6915283203125, -0.63720703125, -0.5828857421875, -0.528564453125, -0.4742431640625, -0.419921875, -0.3656005859375, -0.311279296875, -0.2569580078125, -0.20263671875, -0.1483154296875, -0.093994140625, -0.0396728515625, 0.0146484375, 0.0689697265625, 0.123291015625, 0.1776123046875, 0.23193359375, 0.2862548828125, 0.340576171875, 0.3948974609375, 0.44921875, 0.5035400390625, 0.557861328125, 0.6121826171875, 0.66650390625, 0.7208251953125, 0.775146484375, 0.8294677734375, 0.8837890625, 0.9381103515625, 0.992431640625, 1.0467529296875, 1.10107421875, 1.1553955078125, 1.209716796875, 1.2640380859375, 1.318359375, 1.3726806640625, 1.427001953125, 1.4813232421875, 1.53564453125, 1.5899658203125, 1.644287109375, 1.6986083984375, 1.7529296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 6.0, 4.0, 6.0, 4.0, 9.0, 14.0, 10.0, 14.0, 25.0, 29.0, 28.0, 38.0, 45.0, 62.0, 98.0, 87.0, 86.0, 73.0, 61.0, 54.0, 46.0, 37.0, 29.0, 25.0, 14.0, 15.0, 7.0, 5.0, 8.0, 9.0, 3.0, 2.0, 0.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5869140625, -0.5678863525390625, -0.548858642578125, -0.5298309326171875, -0.51080322265625, -0.4917755126953125, -0.472747802734375, -0.4537200927734375, -0.4346923828125, -0.4156646728515625, -0.396636962890625, -0.3776092529296875, -0.35858154296875, -0.3395538330078125, -0.320526123046875, -0.3014984130859375, -0.282470703125, -0.2634429931640625, -0.244415283203125, -0.2253875732421875, -0.20635986328125, -0.1873321533203125, -0.168304443359375, -0.1492767333984375, -0.1302490234375, -0.1112213134765625, -0.092193603515625, -0.0731658935546875, -0.05413818359375, -0.0351104736328125, -0.016082763671875, 0.0029449462890625, 0.02197265625, 0.0410003662109375, 0.060028076171875, 0.0790557861328125, 0.09808349609375, 0.1171112060546875, 0.136138916015625, 0.1551666259765625, 0.1741943359375, 0.1932220458984375, 0.212249755859375, 0.2312774658203125, 0.25030517578125, 0.2693328857421875, 0.288360595703125, 0.3073883056640625, 0.326416015625, 0.3454437255859375, 0.364471435546875, 0.3834991455078125, 0.40252685546875, 0.4215545654296875, 0.440582275390625, 0.4596099853515625, 0.4786376953125, 0.4976654052734375, 0.516693115234375, 0.5357208251953125, 0.55474853515625, 0.5737762451171875, 0.592803955078125, 0.6118316650390625, 0.630859375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 6.0, 8.0, 13.0, 10.0, 24.0, 20.0, 29.0, 41.0, 52.0, 57.0, 67.0, 65.0, 89.0, 75.0, 74.0, 73.0, 38.0, 56.0, 49.0, 47.0, 18.0, 16.0, 15.0, 16.0, 10.0, 5.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.29299545288086, -48.8133430480957, -47.33369064331055, -45.85403823852539, -44.3743896484375, -42.894737243652344, -41.41508483886719, -39.93543243408203, -38.455780029296875, -36.97612762451172, -35.49647521972656, -34.016822814941406, -32.53717041015625, -31.057519912719727, -29.577869415283203, -28.098217010498047, -26.61856460571289, -25.138912200927734, -23.659259796142578, -22.179609298706055, -20.6999568939209, -19.220304489135742, -17.74065399169922, -16.261001586914062, -14.781349182128906, -13.30169677734375, -11.82204532623291, -10.34239387512207, -8.862741470336914, -7.383089542388916, -5.903437614440918, -4.423786163330078, -2.9441299438476562, -1.4644780158996582, 0.015173912048339844, 1.494825839996338, 2.974477767944336, 4.454129695892334, 5.933781623840332, 7.413433074951172, 8.893085479736328, 10.372737884521484, 11.852389335632324, 13.332040786743164, 14.81169319152832, 16.291345596313477, 17.77099609375, 19.250648498535156, 20.730300903320312, 22.20995330810547, 23.689605712890625, 25.16925621032715, 26.648908615112305, 28.12856101989746, 29.608211517333984, 31.08786392211914, 32.5675163269043, 34.04716873168945, 35.52682113647461, 37.006473541259766, 38.486122131347656, 39.96577453613281, 41.44542694091797, 42.925079345703125, 44.40473175048828]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 3.0, 7.0, 6.0, 12.0, 16.0, 15.0, 32.0, 14.0, 22.0, 27.0, 36.0, 33.0, 30.0, 50.0, 42.0, 50.0, 47.0, 35.0, 45.0, 48.0, 35.0, 42.0, 42.0, 27.0, 42.0, 39.0, 26.0, 28.0, 20.0, 15.0, 24.0, 13.0, 13.0, 13.0, 5.0, 8.0, 6.0, 8.0, 4.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.716773986816406, -44.41510009765625, -43.11343002319336, -41.8117561340332, -40.51008605957031, -39.208412170410156, -37.906742095947266, -36.60506820678711, -35.30339813232422, -34.00172424316406, -32.70005416870117, -31.39838218688965, -30.096710205078125, -28.79503631591797, -27.493364334106445, -26.191692352294922, -24.890018463134766, -23.588346481323242, -22.28667449951172, -20.985002517700195, -19.683330535888672, -18.381656646728516, -17.079984664916992, -15.778312683105469, -14.476640701293945, -13.174968719482422, -11.873296737670898, -10.571623802185059, -9.269951820373535, -7.968279838562012, -6.66660737991333, -5.364934921264648, -4.063266754150391, -2.761594533920288, -1.4599223136901855, -0.158250093460083, 1.1434221267700195, 2.445094108581543, 3.7467665672302246, 5.048439025878906, 6.35011100769043, 7.651782989501953, 8.953454971313477, 10.255127906799316, 11.55679988861084, 12.858471870422363, 14.160144805908203, 15.461816787719727, 16.76348876953125, 18.065160751342773, 19.366832733154297, 20.66850471496582, 21.970176696777344, 23.2718505859375, 24.573522567749023, 25.875194549560547, 27.17686653137207, 28.478538513183594, 29.780210494995117, 31.08188247680664, 32.3835563659668, 33.68522644042969, 34.986900329589844, 36.28857421875, 37.59024429321289]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 6.0, 6.0, 12.0, 13.0, 17.0, 27.0, 62.0, 74.0, 109.0, 168.0, 216.0, 371.0, 515.0, 757.0, 1153.0, 1754.0, 2619.0, 3931.0, 6070.0, 9270.0, 14060.0, 21993.0, 33861.0, 52554.0, 81888.0, 124907.0, 173497.0, 171500.0, 122420.0, 79538.0, 50797.0, 32959.0, 21097.0, 13755.0, 9133.0, 5828.0, 3899.0, 2632.0, 1640.0, 1176.0, 765.0, 504.0, 341.0, 217.0, 142.0, 111.0, 68.0, 49.0, 28.0, 21.0, 12.0, 6.0, 9.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.03125, -35.83544921875, -34.6396484375, -33.44384765625, -32.248046875, -31.05224609375, -29.8564453125, -28.66064453125, -27.46484375, -26.26904296875, -25.0732421875, -23.87744140625, -22.681640625, -21.48583984375, -20.2900390625, -19.09423828125, -17.8984375, -16.70263671875, -15.5068359375, -14.31103515625, -13.115234375, -11.91943359375, -10.7236328125, -9.52783203125, -8.33203125, -7.13623046875, -5.9404296875, -4.74462890625, -3.548828125, -2.35302734375, -1.1572265625, 0.03857421875, 1.234375, 2.43017578125, 3.6259765625, 4.82177734375, 6.017578125, 7.21337890625, 8.4091796875, 9.60498046875, 10.80078125, 11.99658203125, 13.1923828125, 14.38818359375, 15.583984375, 16.77978515625, 17.9755859375, 19.17138671875, 20.3671875, 21.56298828125, 22.7587890625, 23.95458984375, 25.150390625, 26.34619140625, 27.5419921875, 28.73779296875, 29.93359375, 31.12939453125, 32.3251953125, 33.52099609375, 34.716796875, 35.91259765625, 37.1083984375, 38.30419921875, 39.5]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 2.0, 7.0, 3.0, 12.0, 11.0, 11.0, 14.0, 14.0, 14.0, 27.0, 18.0, 31.0, 35.0, 34.0, 40.0, 39.0, 31.0, 49.0, 43.0, 43.0, 49.0, 51.0, 38.0, 37.0, 38.0, 25.0, 33.0, 38.0, 37.0, 23.0, 24.0, 19.0, 12.0, 24.0, 16.0, 10.0, 9.0, 7.0, 8.0, 2.0, 6.0, 1.0, 5.0, 5.0, 1.0, 1.0, 2.0], "bins": [-43.65625, -42.4814453125, -41.306640625, -40.1318359375, -38.95703125, -37.7822265625, -36.607421875, -35.4326171875, -34.2578125, -33.0830078125, -31.908203125, -30.7333984375, -29.55859375, -28.3837890625, -27.208984375, -26.0341796875, -24.859375, -23.6845703125, -22.509765625, -21.3349609375, -20.16015625, -18.9853515625, -17.810546875, -16.6357421875, -15.4609375, -14.2861328125, -13.111328125, -11.9365234375, -10.76171875, -9.5869140625, -8.412109375, -7.2373046875, -6.0625, -4.8876953125, -3.712890625, -2.5380859375, -1.36328125, -0.1884765625, 0.986328125, 2.1611328125, 3.3359375, 4.5107421875, 5.685546875, 6.8603515625, 8.03515625, 9.2099609375, 10.384765625, 11.5595703125, 12.734375, 13.9091796875, 15.083984375, 16.2587890625, 17.43359375, 18.6083984375, 19.783203125, 20.9580078125, 22.1328125, 23.3076171875, 24.482421875, 25.6572265625, 26.83203125, 28.0068359375, 29.181640625, 30.3564453125, 31.53125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 9.0, 12.0, 17.0, 26.0, 32.0, 59.0, 94.0, 150.0, 227.0, 280.0, 501.0, 617.0, 1071.0, 1510.0, 2258.0, 3380.0, 4949.0, 7716.0, 11658.0, 17576.0, 27036.0, 41552.0, 64477.0, 98818.0, 144514.0, 175056.0, 148534.0, 103082.0, 67525.0, 43488.0, 28000.0, 18402.0, 11843.0, 7944.0, 5378.0, 3574.0, 2429.0, 1545.0, 1038.0, 731.0, 514.0, 325.0, 201.0, 136.0, 94.0, 74.0, 38.0, 18.0, 24.0, 17.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0], "bins": [-44.65625, -43.3251953125, -41.994140625, -40.6630859375, -39.33203125, -38.0009765625, -36.669921875, -35.3388671875, -34.0078125, -32.6767578125, -31.345703125, -30.0146484375, -28.68359375, -27.3525390625, -26.021484375, -24.6904296875, -23.359375, -22.0283203125, -20.697265625, -19.3662109375, -18.03515625, -16.7041015625, -15.373046875, -14.0419921875, -12.7109375, -11.3798828125, -10.048828125, -8.7177734375, -7.38671875, -6.0556640625, -4.724609375, -3.3935546875, -2.0625, -0.7314453125, 0.599609375, 1.9306640625, 3.26171875, 4.5927734375, 5.923828125, 7.2548828125, 8.5859375, 9.9169921875, 11.248046875, 12.5791015625, 13.91015625, 15.2412109375, 16.572265625, 17.9033203125, 19.234375, 20.5654296875, 21.896484375, 23.2275390625, 24.55859375, 25.8896484375, 27.220703125, 28.5517578125, 29.8828125, 31.2138671875, 32.544921875, 33.8759765625, 35.20703125, 36.5380859375, 37.869140625, 39.2001953125, 40.53125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 8.0, 1.0, 7.0, 7.0, 12.0, 18.0, 12.0, 19.0, 16.0, 19.0, 21.0, 32.0, 24.0, 32.0, 43.0, 41.0, 34.0, 47.0, 38.0, 45.0, 49.0, 45.0, 35.0, 39.0, 30.0, 28.0, 47.0, 32.0, 29.0, 29.0, 17.0, 17.0, 24.0, 17.0, 14.0, 16.0, 13.0, 13.0, 8.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-25.25, -24.47705078125, -23.7041015625, -22.93115234375, -22.158203125, -21.38525390625, -20.6123046875, -19.83935546875, -19.06640625, -18.29345703125, -17.5205078125, -16.74755859375, -15.974609375, -15.20166015625, -14.4287109375, -13.65576171875, -12.8828125, -12.10986328125, -11.3369140625, -10.56396484375, -9.791015625, -9.01806640625, -8.2451171875, -7.47216796875, -6.69921875, -5.92626953125, -5.1533203125, -4.38037109375, -3.607421875, -2.83447265625, -2.0615234375, -1.28857421875, -0.515625, 0.25732421875, 1.0302734375, 1.80322265625, 2.576171875, 3.34912109375, 4.1220703125, 4.89501953125, 5.66796875, 6.44091796875, 7.2138671875, 7.98681640625, 8.759765625, 9.53271484375, 10.3056640625, 11.07861328125, 11.8515625, 12.62451171875, 13.3974609375, 14.17041015625, 14.943359375, 15.71630859375, 16.4892578125, 17.26220703125, 18.03515625, 18.80810546875, 19.5810546875, 20.35400390625, 21.126953125, 21.89990234375, 22.6728515625, 23.44580078125, 24.21875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 10.0, 9.0, 18.0, 16.0, 38.0, 55.0, 71.0, 99.0, 109.0, 199.0, 303.0, 424.0, 726.0, 954.0, 1564.0, 2464.0, 3856.0, 6246.0, 10394.0, 17899.0, 32796.0, 62548.0, 125794.0, 244406.0, 254918.0, 133708.0, 66270.0, 34733.0, 19134.0, 10890.0, 6554.0, 3963.0, 2515.0, 1599.0, 1099.0, 701.0, 470.0, 332.0, 198.0, 149.0, 90.0, 80.0, 42.0, 36.0, 29.0, 20.0, 11.0, 7.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-25.703125, -24.92529296875, -24.1474609375, -23.36962890625, -22.591796875, -21.81396484375, -21.0361328125, -20.25830078125, -19.48046875, -18.70263671875, -17.9248046875, -17.14697265625, -16.369140625, -15.59130859375, -14.8134765625, -14.03564453125, -13.2578125, -12.47998046875, -11.7021484375, -10.92431640625, -10.146484375, -9.36865234375, -8.5908203125, -7.81298828125, -7.03515625, -6.25732421875, -5.4794921875, -4.70166015625, -3.923828125, -3.14599609375, -2.3681640625, -1.59033203125, -0.8125, -0.03466796875, 0.7431640625, 1.52099609375, 2.298828125, 3.07666015625, 3.8544921875, 4.63232421875, 5.41015625, 6.18798828125, 6.9658203125, 7.74365234375, 8.521484375, 9.29931640625, 10.0771484375, 10.85498046875, 11.6328125, 12.41064453125, 13.1884765625, 13.96630859375, 14.744140625, 15.52197265625, 16.2998046875, 17.07763671875, 17.85546875, 18.63330078125, 19.4111328125, 20.18896484375, 20.966796875, 21.74462890625, 22.5224609375, 23.30029296875, 24.078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 11.0, 14.0, 20.0, 15.0, 28.0, 46.0, 52.0, 81.0, 118.0, 131.0, 151.0, 97.0, 81.0, 42.0, 29.0, 18.0, 14.0, 10.0, 6.0, 4.0, 2.0, 9.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004322052001953125, -0.004204541444778442, -0.00408703088760376, -0.003969520330429077, -0.0038520097732543945, -0.003734499216079712, -0.0036169886589050293, -0.0034994781017303467, -0.003381967544555664, -0.0032644569873809814, -0.003146946430206299, -0.003029435873031616, -0.0029119253158569336, -0.002794414758682251, -0.0026769042015075684, -0.0025593936443328857, -0.002441883087158203, -0.0023243725299835205, -0.002206861972808838, -0.0020893514156341553, -0.0019718408584594727, -0.00185433030128479, -0.0017368197441101074, -0.0016193091869354248, -0.0015017986297607422, -0.0013842880725860596, -0.001266777515411377, -0.0011492669582366943, -0.0010317564010620117, -0.0009142458438873291, -0.0007967352867126465, -0.0006792247295379639, -0.0005617141723632812, -0.00044420361518859863, -0.000326693058013916, -0.0002091825008392334, -9.167194366455078e-05, 2.5838613510131836e-05, 0.00014334917068481445, 0.00026085972785949707, 0.0003783702850341797, 0.0004958808422088623, 0.0006133913993835449, 0.0007309019565582275, 0.0008484125137329102, 0.0009659230709075928, 0.0010834336280822754, 0.001200944185256958, 0.0013184547424316406, 0.0014359652996063232, 0.0015534758567810059, 0.0016709864139556885, 0.001788496971130371, 0.0019060075283050537, 0.0020235180854797363, 0.002141028642654419, 0.0022585391998291016, 0.002376049757003784, 0.002493560314178467, 0.0026110708713531494, 0.002728581428527832, 0.0028460919857025146, 0.0029636025428771973, 0.00308111310005188, 0.0031986236572265625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 2.0, 6.0, 15.0, 11.0, 25.0, 41.0, 48.0, 64.0, 107.0, 146.0, 226.0, 316.0, 502.0, 756.0, 1224.0, 1670.0, 2751.0, 4186.0, 6598.0, 10827.0, 18028.0, 31444.0, 57096.0, 107765.0, 206597.0, 262466.0, 151374.0, 79394.0, 42589.0, 24149.0, 14105.0, 8718.0, 5441.0, 3466.0, 2206.0, 1403.0, 959.0, 599.0, 392.0, 281.0, 180.0, 136.0, 79.0, 53.0, 38.0, 29.0, 17.0, 12.0, 4.0, 8.0, 4.0, 3.0, 1.0, 0.0, 3.0], "bins": [-25.203125, -24.467529296875, -23.73193359375, -22.996337890625, -22.2607421875, -21.525146484375, -20.78955078125, -20.053955078125, -19.318359375, -18.582763671875, -17.84716796875, -17.111572265625, -16.3759765625, -15.640380859375, -14.90478515625, -14.169189453125, -13.43359375, -12.697998046875, -11.96240234375, -11.226806640625, -10.4912109375, -9.755615234375, -9.02001953125, -8.284423828125, -7.548828125, -6.813232421875, -6.07763671875, -5.342041015625, -4.6064453125, -3.870849609375, -3.13525390625, -2.399658203125, -1.6640625, -0.928466796875, -0.19287109375, 0.542724609375, 1.2783203125, 2.013916015625, 2.74951171875, 3.485107421875, 4.220703125, 4.956298828125, 5.69189453125, 6.427490234375, 7.1630859375, 7.898681640625, 8.63427734375, 9.369873046875, 10.10546875, 10.841064453125, 11.57666015625, 12.312255859375, 13.0478515625, 13.783447265625, 14.51904296875, 15.254638671875, 15.990234375, 16.725830078125, 17.46142578125, 18.197021484375, 18.9326171875, 19.668212890625, 20.40380859375, 21.139404296875, 21.875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 8.0, 4.0, 11.0, 19.0, 13.0, 16.0, 27.0, 32.0, 25.0, 36.0, 56.0, 63.0, 70.0, 75.0, 63.0, 66.0, 81.0, 60.0, 58.0, 51.0, 37.0, 28.0, 16.0, 15.0, 10.0, 18.0, 12.0, 6.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.875, -9.5443115234375, -9.213623046875, -8.8829345703125, -8.55224609375, -8.2215576171875, -7.890869140625, -7.5601806640625, -7.2294921875, -6.8988037109375, -6.568115234375, -6.2374267578125, -5.90673828125, -5.5760498046875, -5.245361328125, -4.9146728515625, -4.583984375, -4.2532958984375, -3.922607421875, -3.5919189453125, -3.26123046875, -2.9305419921875, -2.599853515625, -2.2691650390625, -1.9384765625, -1.6077880859375, -1.277099609375, -0.9464111328125, -0.61572265625, -0.2850341796875, 0.045654296875, 0.3763427734375, 0.70703125, 1.0377197265625, 1.368408203125, 1.6990966796875, 2.02978515625, 2.3604736328125, 2.691162109375, 3.0218505859375, 3.3525390625, 3.6832275390625, 4.013916015625, 4.3446044921875, 4.67529296875, 5.0059814453125, 5.336669921875, 5.6673583984375, 5.998046875, 6.3287353515625, 6.659423828125, 6.9901123046875, 7.32080078125, 7.6514892578125, 7.982177734375, 8.3128662109375, 8.6435546875, 8.9742431640625, 9.304931640625, 9.6356201171875, 9.96630859375, 10.2969970703125, 10.627685546875, 10.9583740234375, 11.2890625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 6.0, 8.0, 17.0, 16.0, 12.0, 23.0, 24.0, 34.0, 28.0, 31.0, 40.0, 50.0, 57.0, 61.0, 55.0, 78.0, 70.0, 60.0, 53.0, 42.0, 44.0, 36.0, 26.0, 25.0, 23.0, 16.0, 9.0, 10.0, 11.0, 6.0, 4.0, 6.0, 0.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.91347885131836, -45.59896469116211, -44.284454345703125, -42.969940185546875, -41.655426025390625, -40.34091567993164, -39.02640151977539, -37.711891174316406, -36.397377014160156, -35.082862854003906, -33.76835250854492, -32.45383834838867, -31.139326095581055, -29.824813842773438, -28.510299682617188, -27.19578742980957, -25.881275177001953, -24.566762924194336, -23.25225067138672, -21.93773651123047, -20.62322425842285, -19.308712005615234, -17.994197845458984, -16.679685592651367, -15.36517333984375, -14.050661087036133, -12.7361478805542, -11.421634674072266, -10.107122421264648, -8.792610168457031, -7.478096961975098, -6.163583755493164, -4.849067687988281, -3.534554958343506, -2.2200422286987305, -0.9055294990539551, 0.4089832305908203, 1.7234959602355957, 3.038008689880371, 4.352521896362305, 5.667034149169922, 6.981546878814697, 8.296059608459473, 9.610572814941406, 10.925085067749023, 12.23959732055664, 13.554110527038574, 14.868623733520508, 16.183135986328125, 17.497648239135742, 18.81216049194336, 20.12667465209961, 21.441186904907227, 22.755699157714844, 24.070213317871094, 25.38472557067871, 26.699237823486328, 28.013750076293945, 29.328262329101562, 30.642776489257812, 31.95728874206543, 33.27180099487305, 34.5863151550293, 35.90082550048828, 37.21533966064453]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 6.0, 7.0, 11.0, 4.0, 10.0, 9.0, 17.0, 15.0, 19.0, 22.0, 21.0, 21.0, 39.0, 35.0, 38.0, 38.0, 32.0, 43.0, 48.0, 32.0, 45.0, 45.0, 49.0, 45.0, 33.0, 41.0, 34.0, 22.0, 36.0, 32.0, 17.0, 30.0, 16.0, 16.0, 14.0, 12.0, 10.0, 8.0, 3.0, 3.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-45.423152923583984, -44.04756546020508, -42.67197799682617, -41.296390533447266, -39.92080307006836, -38.54521560668945, -37.16962814331055, -35.79404067993164, -34.418453216552734, -33.04286575317383, -31.667278289794922, -30.291690826416016, -28.91610336303711, -27.540515899658203, -26.164928436279297, -24.78934097290039, -23.413755416870117, -22.03816795349121, -20.662580490112305, -19.2869930267334, -17.911405563354492, -16.535818099975586, -15.160231590270996, -13.78464412689209, -12.409056663513184, -11.033469200134277, -9.657881736755371, -8.282295227050781, -6.906707286834717, -5.5311198234558105, -4.1555328369140625, -2.7799453735351562, -1.40435791015625, -0.0287705659866333, 1.3468167781829834, 2.7224040031433105, 4.097991466522217, 5.473578929901123, 6.849165916442871, 8.224753379821777, 9.600340843200684, 10.97592830657959, 12.351515769958496, 13.727102279663086, 15.102689743041992, 16.4782772064209, 17.853864669799805, 19.22945213317871, 20.605039596557617, 21.980627059936523, 23.35621452331543, 24.731801986694336, 26.107389450073242, 27.48297691345215, 28.858562469482422, 30.234149932861328, 31.609737396240234, 32.98532485961914, 34.36091232299805, 35.73649978637695, 37.11208724975586, 38.487674713134766, 39.86326217651367, 41.23884963989258, 42.614437103271484]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 9.0, 8.0, 16.0, 17.0, 16.0, 28.0, 26.0, 25.0, 41.0, 53.0, 63.0, 85.0, 100.0, 134.0, 166.0, 202.0, 286.0, 359.0, 450.0, 589.0, 697.0, 1043945.0, 730.0, 582.0, 455.0, 347.0, 225.0, 197.0, 147.0, 109.0, 96.0, 78.0, 61.0, 58.0, 50.0, 25.0, 28.0, 26.0, 26.0, 7.0, 4.0, 7.0, 6.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-714.0451049804688, -691.9876708984375, -669.9302368164062, -647.872802734375, -625.8153686523438, -603.7579345703125, -581.7005004882812, -559.64306640625, -537.5856323242188, -515.5281982421875, -493.47076416015625, -471.413330078125, -449.35589599609375, -427.2984619140625, -405.24102783203125, -383.18359375, -361.12615966796875, -339.0687255859375, -317.01129150390625, -294.953857421875, -272.89642333984375, -250.8389892578125, -228.78155517578125, -206.72412109375, -184.66668701171875, -162.6092529296875, -140.55181884765625, -118.494384765625, -96.43695068359375, -74.3795166015625, -52.32208251953125, -30.2646484375, -8.207275390625, 13.85015869140625, 35.9075927734375, 57.96502685546875, 80.0224609375, 102.07989501953125, 124.1373291015625, 146.19476318359375, 168.252197265625, 190.30963134765625, 212.3670654296875, 234.42449951171875, 256.48193359375, 278.53936767578125, 300.5968017578125, 322.65423583984375, 344.711669921875, 366.76910400390625, 388.8265380859375, 410.88397216796875, 432.94140625, 454.99884033203125, 477.0562744140625, 499.11370849609375, 521.171142578125, 543.2285766601562, 565.2860107421875, 587.3434448242188, 609.40087890625, 631.4583129882812, 653.5157470703125, 675.5731811523438, 697.630615234375]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 1.0, 7.0, 7.0, 14.0, 18.0, 13.0, 17.0, 35.0, 27.0, 48.0, 57.0, 54.0, 78.0, 85.0, 121.0, 143.0, 154.0, 176.0, 230.0, 241.0, 380.0, 625.0, 1301.0, 51318996.0, 144589.0, 1306.0, 646.0, 394.0, 290.0, 221.0, 193.0, 155.0, 106.0, 118.0, 75.0, 81.0, 53.0, 48.0, 45.0, 41.0, 24.0, 26.0, 21.0, 13.0, 14.0, 4.0, 6.0, 7.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1786.1605224609375, -1730.3333740234375, -1674.5062255859375, -1618.6790771484375, -1562.8519287109375, -1507.0247802734375, -1451.1976318359375, -1395.3704833984375, -1339.5433349609375, -1283.7161865234375, -1227.8890380859375, -1172.0618896484375, -1116.2347412109375, -1060.4075927734375, -1004.5804443359375, -948.7532958984375, -892.9261474609375, -837.0989990234375, -781.2718505859375, -725.4447021484375, -669.6175537109375, -613.7904052734375, -557.9632568359375, -502.1361083984375, -446.3089599609375, -390.4818115234375, -334.6546630859375, -278.8275146484375, -223.0003662109375, -167.1732177734375, -111.3460693359375, -55.5189208984375, 0.308349609375, 56.135498046875, 111.962646484375, 167.789794921875, 223.616943359375, 279.444091796875, 335.271240234375, 391.098388671875, 446.925537109375, 502.752685546875, 558.579833984375, 614.406982421875, 670.234130859375, 726.061279296875, 781.888427734375, 837.715576171875, 893.542724609375, 949.369873046875, 1005.197021484375, 1061.024169921875, 1116.851318359375, 1172.678466796875, 1228.505615234375, 1284.332763671875, 1340.159912109375, 1395.987060546875, 1451.814208984375, 1507.641357421875, 1563.468505859375, 1619.295654296875, 1675.122802734375, 1730.949951171875, 1786.777099609375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 3.0, 6.0, 6.0, 11.0, 10.0, 20.0, 22.0, 21.0, 28.0, 35.0, 51.0, 73.0, 127.0, 123.0, 100.0, 78.0, 62.0, 47.0, 31.0, 33.0, 18.0, 14.0, 12.0, 12.0, 7.0, 8.0, 8.0, 6.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1279.698486328125, -1233.0745849609375, -1186.4508056640625, -1139.826904296875, -1093.203125, -1046.5792236328125, -999.955322265625, -953.3314819335938, -906.7076416015625, -860.0838012695312, -813.4599609375, -766.8360595703125, -720.2122192382812, -673.58837890625, -626.9644775390625, -580.3406372070312, -533.716796875, -487.09295654296875, -440.4690856933594, -393.84521484375, -347.22137451171875, -300.5975341796875, -253.97366333007812, -207.34979248046875, -160.7259521484375, -114.10209655761719, -67.47824096679688, -20.854385375976562, 25.76947021484375, 72.39332580566406, 119.01718139648438, 165.64105224609375, 212.2647705078125, 258.88861083984375, 305.5124816894531, 352.1363525390625, 398.76019287109375, 445.384033203125, 492.0079040527344, 538.6317749023438, 585.255615234375, 631.8794555664062, 678.5032958984375, 725.127197265625, 771.7510375976562, 818.3748779296875, 864.998779296875, 911.6226196289062, 958.2464599609375, 1004.8703002929688, 1051.494140625, 1098.1180419921875, 1144.741943359375, 1191.36572265625, 1237.9896240234375, 1284.613525390625, 1331.2373046875, 1377.8612060546875, 1424.4849853515625, 1471.10888671875, 1517.732666015625, 1564.3565673828125, 1610.98046875, 1657.604248046875, 1704.2281494140625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 8.0, 14.0, 15.0, 16.0, 20.0, 26.0, 23.0, 39.0, 27.0, 30.0, 38.0, 46.0, 55.0, 75.0, 64.0, 62.0, 55.0, 65.0, 38.0, 30.0, 31.0, 23.0, 24.0, 20.0, 24.0, 16.0, 15.0, 21.0, 7.0, 11.0, 7.0, 8.0, 9.0, 3.0, 3.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1612.0467529296875, -1564.2908935546875, -1516.534912109375, -1468.779052734375, -1421.023193359375, -1373.267333984375, -1325.511474609375, -1277.7554931640625, -1229.9996337890625, -1182.2437744140625, -1134.48779296875, -1086.73193359375, -1038.97607421875, -991.22021484375, -943.4642944335938, -895.7083740234375, -847.9525146484375, -800.1966552734375, -752.4407348632812, -704.684814453125, -656.928955078125, -609.173095703125, -561.4171752929688, -513.6612548828125, -465.9053955078125, -418.1495056152344, -370.39361572265625, -322.6377258300781, -274.8818359375, -227.12594604492188, -179.37005615234375, -131.61416625976562, -83.858154296875, -36.102264404296875, 11.65362548828125, 59.409515380859375, 107.1654052734375, 154.92129516601562, 202.67718505859375, 250.43307495117188, 298.18896484375, 345.9448547363281, 393.70074462890625, 441.4566345214844, 489.2125244140625, 536.9683837890625, 584.7243041992188, 632.480224609375, 680.236083984375, 727.991943359375, 775.7478637695312, 823.5037841796875, 871.2596435546875, 919.0155029296875, 966.7714233398438, 1014.52734375, 1062.283203125, 1110.0390625, 1157.794921875, 1205.5509033203125, 1253.3067626953125, 1301.0626220703125, 1348.818603515625, 1396.574462890625, 1444.330322265625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 9.0, 10.0, 12.0, 26.0, 34.0, 66.0, 92.0, 108.0, 177.0, 281.0, 415.0, 580.0, 932.0, 1343.0, 2071.0, 3285.0, 4980.0, 8122.0, 13395.0, 23531.0, 43091.0, 85659.0, 197450.0, 777587.0, 2531208.0, 270571.0, 105972.0, 51615.0, 28025.0, 15711.0, 9598.0, 6047.0, 3863.0, 2543.0, 1789.0, 1216.0, 827.0, 569.0, 410.0, 316.0, 211.0, 144.0, 116.0, 88.0, 52.0, 45.0, 30.0, 18.0, 20.0, 11.0, 10.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.578125, -25.634521484375, -24.69091796875, -23.747314453125, -22.8037109375, -21.860107421875, -20.91650390625, -19.972900390625, -19.029296875, -18.085693359375, -17.14208984375, -16.198486328125, -15.2548828125, -14.311279296875, -13.36767578125, -12.424072265625, -11.48046875, -10.536865234375, -9.59326171875, -8.649658203125, -7.7060546875, -6.762451171875, -5.81884765625, -4.875244140625, -3.931640625, -2.988037109375, -2.04443359375, -1.100830078125, -0.1572265625, 0.786376953125, 1.72998046875, 2.673583984375, 3.6171875, 4.560791015625, 5.50439453125, 6.447998046875, 7.3916015625, 8.335205078125, 9.27880859375, 10.222412109375, 11.166015625, 12.109619140625, 13.05322265625, 13.996826171875, 14.9404296875, 15.884033203125, 16.82763671875, 17.771240234375, 18.71484375, 19.658447265625, 20.60205078125, 21.545654296875, 22.4892578125, 23.432861328125, 24.37646484375, 25.320068359375, 26.263671875, 27.207275390625, 28.15087890625, 29.094482421875, 30.0380859375, 30.981689453125, 31.92529296875, 32.868896484375, 33.8125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 7.0, 2.0, 5.0, 4.0, 7.0, 9.0, 8.0, 12.0, 12.0, 18.0, 25.0, 25.0, 32.0, 39.0, 53.0, 60.0, 48.0, 65.0, 74.0, 73.0, 72.0, 55.0, 45.0, 56.0, 40.0, 36.0, 29.0, 16.0, 13.0, 15.0, 10.0, 10.0, 7.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.617706298828125, -2.52056884765625, -2.423431396484375, -2.3262939453125, -2.229156494140625, -2.13201904296875, -2.034881591796875, -1.937744140625, -1.840606689453125, -1.74346923828125, -1.646331787109375, -1.5491943359375, -1.452056884765625, -1.35491943359375, -1.257781982421875, -1.16064453125, -1.063507080078125, -0.96636962890625, -0.869232177734375, -0.7720947265625, -0.674957275390625, -0.57781982421875, -0.480682373046875, -0.383544921875, -0.286407470703125, -0.18927001953125, -0.092132568359375, 0.0050048828125, 0.102142333984375, 0.19927978515625, 0.296417236328125, 0.3935546875, 0.490692138671875, 0.58782958984375, 0.684967041015625, 0.7821044921875, 0.879241943359375, 0.97637939453125, 1.073516845703125, 1.170654296875, 1.267791748046875, 1.36492919921875, 1.462066650390625, 1.5592041015625, 1.656341552734375, 1.75347900390625, 1.850616455078125, 1.94775390625, 2.044891357421875, 2.14202880859375, 2.239166259765625, 2.3363037109375, 2.433441162109375, 2.53057861328125, 2.627716064453125, 2.724853515625, 2.821990966796875, 2.91912841796875, 3.016265869140625, 3.1134033203125, 3.210540771484375, 3.30767822265625, 3.404815673828125, 3.501953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 11.0, 21.0, 19.0, 20.0, 49.0, 66.0, 102.0, 256.0, 387.0, 670.0, 1250.0, 2367.0, 4601.0, 9543.0, 20680.0, 48211.0, 121742.0, 389460.0, 2598060.0, 699974.0, 177450.0, 66995.0, 27795.0, 12508.0, 5726.0, 2896.0, 1482.0, 843.0, 433.0, 257.0, 152.0, 103.0, 49.0, 35.0, 23.0, 19.0, 7.0, 14.0, 3.0, 1.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.90625, -22.18310546875, -21.4599609375, -20.73681640625, -20.013671875, -19.29052734375, -18.5673828125, -17.84423828125, -17.12109375, -16.39794921875, -15.6748046875, -14.95166015625, -14.228515625, -13.50537109375, -12.7822265625, -12.05908203125, -11.3359375, -10.61279296875, -9.8896484375, -9.16650390625, -8.443359375, -7.72021484375, -6.9970703125, -6.27392578125, -5.55078125, -4.82763671875, -4.1044921875, -3.38134765625, -2.658203125, -1.93505859375, -1.2119140625, -0.48876953125, 0.234375, 0.95751953125, 1.6806640625, 2.40380859375, 3.126953125, 3.85009765625, 4.5732421875, 5.29638671875, 6.01953125, 6.74267578125, 7.4658203125, 8.18896484375, 8.912109375, 9.63525390625, 10.3583984375, 11.08154296875, 11.8046875, 12.52783203125, 13.2509765625, 13.97412109375, 14.697265625, 15.42041015625, 16.1435546875, 16.86669921875, 17.58984375, 18.31298828125, 19.0361328125, 19.75927734375, 20.482421875, 21.20556640625, 21.9287109375, 22.65185546875, 23.375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 7.0, 9.0, 13.0, 13.0, 19.0, 29.0, 26.0, 31.0, 43.0, 50.0, 62.0, 80.0, 85.0, 100.0, 144.0, 182.0, 270.0, 489.0, 902.0, 387.0, 241.0, 174.0, 144.0, 93.0, 92.0, 74.0, 68.0, 54.0, 43.0, 52.0, 28.0, 17.0, 11.0, 15.0, 14.0, 4.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5703125, -6.353515625, -6.13671875, -5.919921875, -5.703125, -5.486328125, -5.26953125, -5.052734375, -4.8359375, -4.619140625, -4.40234375, -4.185546875, -3.96875, -3.751953125, -3.53515625, -3.318359375, -3.1015625, -2.884765625, -2.66796875, -2.451171875, -2.234375, -2.017578125, -1.80078125, -1.583984375, -1.3671875, -1.150390625, -0.93359375, -0.716796875, -0.5, -0.283203125, -0.06640625, 0.150390625, 0.3671875, 0.583984375, 0.80078125, 1.017578125, 1.234375, 1.451171875, 1.66796875, 1.884765625, 2.1015625, 2.318359375, 2.53515625, 2.751953125, 2.96875, 3.185546875, 3.40234375, 3.619140625, 3.8359375, 4.052734375, 4.26953125, 4.486328125, 4.703125, 4.919921875, 5.13671875, 5.353515625, 5.5703125, 5.787109375, 6.00390625, 6.220703125, 6.4375, 6.654296875, 6.87109375, 7.087890625, 7.3046875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 1.0, 3.0, 8.0, 11.0, 20.0, 36.0, 56.0, 100.0, 157.0, 213.0, 152.0, 111.0, 51.0, 42.0, 18.0, 9.0, 9.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.82499694824219, -104.59039306640625, -101.35578155517578, -98.12117767333984, -94.88656616210938, -91.65196228027344, -88.4173583984375, -85.18275451660156, -81.9481430053711, -78.71353912353516, -75.47892761230469, -72.24432373046875, -69.00971984863281, -65.77510833740234, -62.540504455566406, -59.3058967590332, -56.0712890625, -52.8366813659668, -49.602073669433594, -46.367469787597656, -43.13286209106445, -39.89825439453125, -36.66365051269531, -33.42904281616211, -30.194435119628906, -26.959827423095703, -23.725221633911133, -20.490615844726562, -17.25600814819336, -14.021400451660156, -10.786794662475586, -7.552188873291016, -4.3175811767578125, -1.0829744338989258, 2.151632308959961, 5.386239051818848, 8.620845794677734, 11.855453491210938, 15.090059280395508, 18.324665069580078, 21.55927276611328, 24.793880462646484, 28.028486251831055, 31.263092041015625, 34.49769973754883, 37.73230743408203, 40.96691131591797, 44.20151901245117, 47.436126708984375, 50.67073440551758, 53.90534210205078, 57.13994598388672, 60.37455368041992, 63.609161376953125, 66.84376525878906, 70.078369140625, 73.31298065185547, 76.5475845336914, 79.78219604492188, 83.01679992675781, 86.25140380859375, 89.48601531982422, 92.72061920166016, 95.95523071289062, 99.18983459472656]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 7.0, 13.0, 8.0, 15.0, 18.0, 11.0, 25.0, 29.0, 26.0, 36.0, 41.0, 45.0, 40.0, 50.0, 44.0, 58.0, 54.0, 60.0, 54.0, 46.0, 63.0, 50.0, 33.0, 33.0, 29.0, 25.0, 11.0, 15.0, 17.0, 12.0, 6.0, 8.0, 9.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.41141128540039, -38.95561218261719, -37.499813079833984, -36.04401397705078, -34.58821487426758, -33.132415771484375, -31.676616668701172, -30.22081756591797, -28.765018463134766, -27.309219360351562, -25.85342025756836, -24.397621154785156, -22.941822052001953, -21.48602294921875, -20.030223846435547, -18.574424743652344, -17.11862564086914, -15.662826538085938, -14.207027435302734, -12.751228332519531, -11.295429229736328, -9.839630126953125, -8.383831024169922, -6.928031921386719, -5.472232818603516, -4.0164337158203125, -2.5606346130371094, -1.1048355102539062, 0.3509635925292969, 1.8067626953125, 3.262561798095703, 4.718360900878906, 6.174163818359375, 7.629962921142578, 9.085762023925781, 10.541561126708984, 11.997360229492188, 13.45315933227539, 14.908958435058594, 16.364757537841797, 17.820556640625, 19.276355743408203, 20.732154846191406, 22.18795394897461, 23.643753051757812, 25.099552154541016, 26.55535125732422, 28.011150360107422, 29.466949462890625, 30.922748565673828, 32.37854766845703, 33.834346771240234, 35.29014587402344, 36.74594497680664, 38.201744079589844, 39.65754318237305, 41.11334228515625, 42.56914138793945, 44.024940490722656, 45.48073959350586, 46.93653869628906, 48.392337799072266, 49.84813690185547, 51.30393600463867, 52.759735107421875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 8.0, 9.0, 17.0, 19.0, 20.0, 37.0, 47.0, 68.0, 88.0, 109.0, 172.0, 238.0, 340.0, 538.0, 817.0, 1243.0, 2010.0, 3153.0, 5321.0, 9482.0, 17515.0, 34945.0, 74938.0, 206868.0, 435783.0, 137241.0, 56600.0, 27080.0, 14057.0, 7682.0, 4527.0, 2677.0, 1634.0, 1068.0, 682.0, 465.0, 312.0, 208.0, 146.0, 117.0, 65.0, 56.0, 51.0, 26.0, 22.0, 14.0, 14.0, 6.0, 4.0, 12.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-12.71875, -12.29931640625, -11.8798828125, -11.46044921875, -11.041015625, -10.62158203125, -10.2021484375, -9.78271484375, -9.36328125, -8.94384765625, -8.5244140625, -8.10498046875, -7.685546875, -7.26611328125, -6.8466796875, -6.42724609375, -6.0078125, -5.58837890625, -5.1689453125, -4.74951171875, -4.330078125, -3.91064453125, -3.4912109375, -3.07177734375, -2.65234375, -2.23291015625, -1.8134765625, -1.39404296875, -0.974609375, -0.55517578125, -0.1357421875, 0.28369140625, 0.703125, 1.12255859375, 1.5419921875, 1.96142578125, 2.380859375, 2.80029296875, 3.2197265625, 3.63916015625, 4.05859375, 4.47802734375, 4.8974609375, 5.31689453125, 5.736328125, 6.15576171875, 6.5751953125, 6.99462890625, 7.4140625, 7.83349609375, 8.2529296875, 8.67236328125, 9.091796875, 9.51123046875, 9.9306640625, 10.35009765625, 10.76953125, 11.18896484375, 11.6083984375, 12.02783203125, 12.447265625, 12.86669921875, 13.2861328125, 13.70556640625, 14.125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 11.0, 10.0, 13.0, 11.0, 30.0, 22.0, 33.0, 49.0, 32.0, 39.0, 68.0, 53.0, 63.0, 65.0, 74.0, 74.0, 59.0, 40.0, 54.0, 37.0, 29.0, 22.0, 23.0, 26.0, 7.0, 6.0, 8.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.16015625, -3.053375244140625, -2.94659423828125, -2.839813232421875, -2.7330322265625, -2.626251220703125, -2.51947021484375, -2.412689208984375, -2.305908203125, -2.199127197265625, -2.09234619140625, -1.985565185546875, -1.8787841796875, -1.772003173828125, -1.66522216796875, -1.558441162109375, -1.45166015625, -1.344879150390625, -1.23809814453125, -1.131317138671875, -1.0245361328125, -0.917755126953125, -0.81097412109375, -0.704193115234375, -0.597412109375, -0.490631103515625, -0.38385009765625, -0.277069091796875, -0.1702880859375, -0.063507080078125, 0.04327392578125, 0.150054931640625, 0.2568359375, 0.363616943359375, 0.47039794921875, 0.577178955078125, 0.6839599609375, 0.790740966796875, 0.89752197265625, 1.004302978515625, 1.111083984375, 1.217864990234375, 1.32464599609375, 1.431427001953125, 1.5382080078125, 1.644989013671875, 1.75177001953125, 1.858551025390625, 1.96533203125, 2.072113037109375, 2.17889404296875, 2.285675048828125, 2.3924560546875, 2.499237060546875, 2.60601806640625, 2.712799072265625, 2.819580078125, 2.926361083984375, 3.03314208984375, 3.139923095703125, 3.2467041015625, 3.353485107421875, 3.46026611328125, 3.567047119140625, 3.673828125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 11.0, 13.0, 21.0, 20.0, 23.0, 36.0, 64.0, 83.0, 156.0, 297.0, 728.0, 1693.0, 5409.0, 22065.0, 161376.0, 763423.0, 74016.0, 13141.0, 3522.0, 1315.0, 499.0, 243.0, 126.0, 85.0, 49.0, 41.0, 18.0, 18.0, 11.0, 11.0, 8.0, 3.0, 6.0, 1.0, 5.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-31.34375, -30.374267578125, -29.40478515625, -28.435302734375, -27.4658203125, -26.496337890625, -25.52685546875, -24.557373046875, -23.587890625, -22.618408203125, -21.64892578125, -20.679443359375, -19.7099609375, -18.740478515625, -17.77099609375, -16.801513671875, -15.83203125, -14.862548828125, -13.89306640625, -12.923583984375, -11.9541015625, -10.984619140625, -10.01513671875, -9.045654296875, -8.076171875, -7.106689453125, -6.13720703125, -5.167724609375, -4.1982421875, -3.228759765625, -2.25927734375, -1.289794921875, -0.3203125, 0.649169921875, 1.61865234375, 2.588134765625, 3.5576171875, 4.527099609375, 5.49658203125, 6.466064453125, 7.435546875, 8.405029296875, 9.37451171875, 10.343994140625, 11.3134765625, 12.282958984375, 13.25244140625, 14.221923828125, 15.19140625, 16.160888671875, 17.13037109375, 18.099853515625, 19.0693359375, 20.038818359375, 21.00830078125, 21.977783203125, 22.947265625, 23.916748046875, 24.88623046875, 25.855712890625, 26.8251953125, 27.794677734375, 28.76416015625, 29.733642578125, 30.703125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 2.0, 2.0, 6.0, 3.0, 10.0, 13.0, 6.0, 9.0, 16.0, 13.0, 12.0, 17.0, 25.0, 20.0, 19.0, 37.0, 24.0, 31.0, 46.0, 45.0, 46.0, 35.0, 44.0, 43.0, 36.0, 46.0, 40.0, 44.0, 40.0, 30.0, 34.0, 22.0, 24.0, 21.0, 22.0, 26.0, 21.0, 12.0, 13.0, 10.0, 8.0, 3.0, 5.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.3203125, -10.96435546875, -10.6083984375, -10.25244140625, -9.896484375, -9.54052734375, -9.1845703125, -8.82861328125, -8.47265625, -8.11669921875, -7.7607421875, -7.40478515625, -7.048828125, -6.69287109375, -6.3369140625, -5.98095703125, -5.625, -5.26904296875, -4.9130859375, -4.55712890625, -4.201171875, -3.84521484375, -3.4892578125, -3.13330078125, -2.77734375, -2.42138671875, -2.0654296875, -1.70947265625, -1.353515625, -0.99755859375, -0.6416015625, -0.28564453125, 0.0703125, 0.42626953125, 0.7822265625, 1.13818359375, 1.494140625, 1.85009765625, 2.2060546875, 2.56201171875, 2.91796875, 3.27392578125, 3.6298828125, 3.98583984375, 4.341796875, 4.69775390625, 5.0537109375, 5.40966796875, 5.765625, 6.12158203125, 6.4775390625, 6.83349609375, 7.189453125, 7.54541015625, 7.9013671875, 8.25732421875, 8.61328125, 8.96923828125, 9.3251953125, 9.68115234375, 10.037109375, 10.39306640625, 10.7490234375, 11.10498046875, 11.4609375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 4.0, 10.0, 9.0, 22.0, 30.0, 38.0, 91.0, 132.0, 326.0, 786.0, 2562.0, 15816.0, 771468.0, 244392.0, 9695.0, 1934.0, 625.0, 276.0, 124.0, 78.0, 43.0, 28.0, 19.0, 11.0, 15.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.8125, -41.27734375, -39.7421875, -38.20703125, -36.671875, -35.13671875, -33.6015625, -32.06640625, -30.53125, -28.99609375, -27.4609375, -25.92578125, -24.390625, -22.85546875, -21.3203125, -19.78515625, -18.25, -16.71484375, -15.1796875, -13.64453125, -12.109375, -10.57421875, -9.0390625, -7.50390625, -5.96875, -4.43359375, -2.8984375, -1.36328125, 0.171875, 1.70703125, 3.2421875, 4.77734375, 6.3125, 7.84765625, 9.3828125, 10.91796875, 12.453125, 13.98828125, 15.5234375, 17.05859375, 18.59375, 20.12890625, 21.6640625, 23.19921875, 24.734375, 26.26953125, 27.8046875, 29.33984375, 30.875, 32.41015625, 33.9453125, 35.48046875, 37.015625, 38.55078125, 40.0859375, 41.62109375, 43.15625, 44.69140625, 46.2265625, 47.76171875, 49.296875, 50.83203125, 52.3671875, 53.90234375, 55.4375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 2.0, 6.0, 5.0, 4.0, 3.0, 5.0, 15.0, 9.0, 5.0, 17.0, 18.0, 28.0, 42.0, 30.0, 54.0, 70.0, 64.0, 88.0, 84.0, 81.0, 73.0, 50.0, 69.0, 32.0, 30.0, 23.0, 23.0, 11.0, 8.0, 10.0, 3.0, 6.0, 10.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008544921875, -0.0008272528648376465, -0.000800013542175293, -0.0007727742195129395, -0.0007455348968505859, -0.0007182955741882324, -0.0006910562515258789, -0.0006638169288635254, -0.0006365776062011719, -0.0006093382835388184, -0.0005820989608764648, -0.0005548596382141113, -0.0005276203155517578, -0.0005003809928894043, -0.0004731416702270508, -0.00044590234756469727, -0.00041866302490234375, -0.00039142370223999023, -0.0003641843795776367, -0.0003369450569152832, -0.0003097057342529297, -0.00028246641159057617, -0.00025522708892822266, -0.00022798776626586914, -0.00020074844360351562, -0.0001735091209411621, -0.0001462697982788086, -0.00011903047561645508, -9.179115295410156e-05, -6.455183029174805e-05, -3.731250762939453e-05, -1.0073184967041016e-05, 1.71661376953125e-05, 4.4405460357666016e-05, 7.164478302001953e-05, 9.888410568237305e-05, 0.00012612342834472656, 0.00015336275100708008, 0.0001806020736694336, 0.0002078413963317871, 0.00023508071899414062, 0.00026232004165649414, 0.00028955936431884766, 0.00031679868698120117, 0.0003440380096435547, 0.0003712773323059082, 0.0003985166549682617, 0.00042575597763061523, 0.00045299530029296875, 0.00048023462295532227, 0.0005074739456176758, 0.0005347132682800293, 0.0005619525909423828, 0.0005891919136047363, 0.0006164312362670898, 0.0006436705589294434, 0.0006709098815917969, 0.0006981492042541504, 0.0007253885269165039, 0.0007526278495788574, 0.0007798671722412109, 0.0008071064949035645, 0.000834345817565918, 0.0008615851402282715, 0.000888824462890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 8.0, 13.0, 17.0, 25.0, 22.0, 41.0, 52.0, 78.0, 130.0, 198.0, 310.0, 487.0, 807.0, 1364.0, 2474.0, 4792.0, 10393.0, 26000.0, 87835.0, 505057.0, 310596.0, 60742.0, 19642.0, 8292.0, 3913.0, 2083.0, 1214.0, 738.0, 421.0, 264.0, 166.0, 121.0, 72.0, 61.0, 39.0, 27.0, 15.0, 13.0, 7.0, 10.0, 2.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-16.234375, -15.7550048828125, -15.275634765625, -14.7962646484375, -14.31689453125, -13.8375244140625, -13.358154296875, -12.8787841796875, -12.3994140625, -11.9200439453125, -11.440673828125, -10.9613037109375, -10.48193359375, -10.0025634765625, -9.523193359375, -9.0438232421875, -8.564453125, -8.0850830078125, -7.605712890625, -7.1263427734375, -6.64697265625, -6.1676025390625, -5.688232421875, -5.2088623046875, -4.7294921875, -4.2501220703125, -3.770751953125, -3.2913818359375, -2.81201171875, -2.3326416015625, -1.853271484375, -1.3739013671875, -0.89453125, -0.4151611328125, 0.064208984375, 0.5435791015625, 1.02294921875, 1.5023193359375, 1.981689453125, 2.4610595703125, 2.9404296875, 3.4197998046875, 3.899169921875, 4.3785400390625, 4.85791015625, 5.3372802734375, 5.816650390625, 6.2960205078125, 6.775390625, 7.2547607421875, 7.734130859375, 8.2135009765625, 8.69287109375, 9.1722412109375, 9.651611328125, 10.1309814453125, 10.6103515625, 11.0897216796875, 11.569091796875, 12.0484619140625, 12.52783203125, 13.0072021484375, 13.486572265625, 13.9659423828125, 14.4453125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 5.0, 5.0, 2.0, 7.0, 10.0, 12.0, 10.0, 13.0, 20.0, 21.0, 27.0, 38.0, 36.0, 42.0, 50.0, 43.0, 60.0, 68.0, 64.0, 64.0, 63.0, 52.0, 55.0, 47.0, 28.0, 30.0, 21.0, 11.0, 18.0, 8.0, 9.0, 12.0, 9.0, 8.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.76953125, -7.52935791015625, -7.2891845703125, -7.04901123046875, -6.808837890625, -6.56866455078125, -6.3284912109375, -6.08831787109375, -5.84814453125, -5.60797119140625, -5.3677978515625, -5.12762451171875, -4.887451171875, -4.64727783203125, -4.4071044921875, -4.16693115234375, -3.9267578125, -3.68658447265625, -3.4464111328125, -3.20623779296875, -2.966064453125, -2.72589111328125, -2.4857177734375, -2.24554443359375, -2.00537109375, -1.76519775390625, -1.5250244140625, -1.28485107421875, -1.044677734375, -0.80450439453125, -0.5643310546875, -0.32415771484375, -0.083984375, 0.15618896484375, 0.3963623046875, 0.63653564453125, 0.876708984375, 1.11688232421875, 1.3570556640625, 1.59722900390625, 1.83740234375, 2.07757568359375, 2.3177490234375, 2.55792236328125, 2.798095703125, 3.03826904296875, 3.2784423828125, 3.51861572265625, 3.7587890625, 3.99896240234375, 4.2391357421875, 4.47930908203125, 4.719482421875, 4.95965576171875, 5.1998291015625, 5.44000244140625, 5.68017578125, 5.92034912109375, 6.1605224609375, 6.40069580078125, 6.640869140625, 6.88104248046875, 7.1212158203125, 7.36138916015625, 7.6015625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 9.0, 8.0, 9.0, 18.0, 35.0, 57.0, 137.0, 234.0, 227.0, 136.0, 61.0, 26.0, 17.0, 14.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-256.1457824707031, -249.74057006835938, -243.33535766601562, -236.93014526367188, -230.52491760253906, -224.1197052001953, -217.71449279785156, -211.3092803955078, -204.904052734375, -198.49884033203125, -192.0936279296875, -185.68841552734375, -179.28318786621094, -172.8779754638672, -166.47276306152344, -160.0675506591797, -153.66233825683594, -147.2571258544922, -140.85191345214844, -134.44668579101562, -128.04147338867188, -121.63626098632812, -115.23104858398438, -108.82583618164062, -102.42061614990234, -96.0154037475586, -89.61018371582031, -83.20497131347656, -76.79975891113281, -70.39453887939453, -63.98932647705078, -57.584110260009766, -51.17890930175781, -44.7736930847168, -38.36847686767578, -31.96326446533203, -25.558048248291016, -19.15283203125, -12.74761962890625, -6.342403411865234, 0.06281280517578125, 6.4680280685424805, 12.87324333190918, 19.278457641601562, 25.683673858642578, 32.088890075683594, 38.494102478027344, 44.89931869506836, 51.304534912109375, 57.70975112915039, 64.1149673461914, 70.52017974853516, 76.92539978027344, 83.33061218261719, 89.73582458496094, 96.14103698730469, 102.54625701904297, 108.95146942138672, 115.356689453125, 121.76190185546875, 128.1671142578125, 134.57232666015625, 140.9775390625, 147.3827667236328, 153.78797912597656]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 1.0, 9.0, 4.0, 9.0, 10.0, 12.0, 32.0, 42.0, 74.0, 88.0, 110.0, 137.0, 127.0, 99.0, 73.0, 48.0, 38.0, 16.0, 15.0, 5.0, 6.0, 5.0, 7.0, 5.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-273.7947692871094, -266.71441650390625, -259.6340637207031, -252.55369567871094, -245.47332763671875, -238.39297485351562, -231.31260681152344, -224.2322540283203, -217.15188598632812, -210.071533203125, -202.9911651611328, -195.9108123779297, -188.8304443359375, -181.75009155273438, -174.6697235107422, -167.58937072753906, -160.50900268554688, -153.42864990234375, -146.34828186035156, -139.26792907714844, -132.18756103515625, -125.10720825195312, -118.02684020996094, -110.94648742675781, -103.86613464355469, -96.78577423095703, -89.70541381835938, -82.62505340576172, -75.54469299316406, -68.46434020996094, -61.383975982666016, -54.30361557006836, -47.22325134277344, -40.14289093017578, -33.062530517578125, -25.9821720123291, -18.901811599731445, -11.821453094482422, -4.741092681884766, 2.3392677307128906, 9.419628143310547, 16.499988555908203, 23.58034896850586, 30.660707473754883, 37.741065979003906, 44.82142639160156, 51.90178680419922, 58.982147216796875, 66.06250762939453, 73.14286804199219, 80.22322845458984, 87.3035888671875, 94.38394927978516, 101.46430969238281, 108.54466247558594, 115.62503051757812, 122.70538330078125, 129.78573608398438, 136.86610412597656, 143.9464569091797, 151.02682495117188, 158.107177734375, 165.1875457763672, 172.2678985595703, 179.3482666015625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 7.0, 6.0, 18.0, 12.0, 16.0, 38.0, 46.0, 58.0, 95.0, 153.0, 252.0, 461.0, 793.0, 1527.0, 3276.0, 7821.0, 22855.0, 97458.0, 3759496.0, 241640.0, 36912.0, 11739.0, 4654.0, 2159.0, 1094.0, 641.0, 351.0, 210.0, 164.0, 105.0, 70.0, 43.0, 27.0, 18.0, 16.0, 18.0, 9.0, 7.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-72.0625, -69.71484375, -67.3671875, -65.01953125, -62.671875, -60.32421875, -57.9765625, -55.62890625, -53.28125, -50.93359375, -48.5859375, -46.23828125, -43.890625, -41.54296875, -39.1953125, -36.84765625, -34.5, -32.15234375, -29.8046875, -27.45703125, -25.109375, -22.76171875, -20.4140625, -18.06640625, -15.71875, -13.37109375, -11.0234375, -8.67578125, -6.328125, -3.98046875, -1.6328125, 0.71484375, 3.0625, 5.41015625, 7.7578125, 10.10546875, 12.453125, 14.80078125, 17.1484375, 19.49609375, 21.84375, 24.19140625, 26.5390625, 28.88671875, 31.234375, 33.58203125, 35.9296875, 38.27734375, 40.625, 42.97265625, 45.3203125, 47.66796875, 50.015625, 52.36328125, 54.7109375, 57.05859375, 59.40625, 61.75390625, 64.1015625, 66.44921875, 68.796875, 71.14453125, 73.4921875, 75.83984375, 78.1875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 6.0, 5.0, 9.0, 10.0, 8.0, 5.0, 10.0, 16.0, 14.0, 20.0, 33.0, 42.0, 29.0, 38.0, 50.0, 48.0, 56.0, 64.0, 52.0, 68.0, 67.0, 61.0, 37.0, 48.0, 30.0, 32.0, 31.0, 25.0, 18.0, 11.0, 17.0, 7.0, 10.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.01953125, -2.920623779296875, -2.82171630859375, -2.722808837890625, -2.6239013671875, -2.524993896484375, -2.42608642578125, -2.327178955078125, -2.228271484375, -2.129364013671875, -2.03045654296875, -1.931549072265625, -1.8326416015625, -1.733734130859375, -1.63482666015625, -1.535919189453125, -1.43701171875, -1.338104248046875, -1.23919677734375, -1.140289306640625, -1.0413818359375, -0.942474365234375, -0.84356689453125, -0.744659423828125, -0.645751953125, -0.546844482421875, -0.44793701171875, -0.349029541015625, -0.2501220703125, -0.151214599609375, -0.05230712890625, 0.046600341796875, 0.1455078125, 0.244415283203125, 0.34332275390625, 0.442230224609375, 0.5411376953125, 0.640045166015625, 0.73895263671875, 0.837860107421875, 0.936767578125, 1.035675048828125, 1.13458251953125, 1.233489990234375, 1.3323974609375, 1.431304931640625, 1.53021240234375, 1.629119873046875, 1.72802734375, 1.826934814453125, 1.92584228515625, 2.024749755859375, 2.1236572265625, 2.222564697265625, 2.32147216796875, 2.420379638671875, 2.519287109375, 2.618194580078125, 2.71710205078125, 2.816009521484375, 2.9149169921875, 3.013824462890625, 3.11273193359375, 3.211639404296875, 3.310546875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 5.0, 9.0, 12.0, 7.0, 27.0, 42.0, 55.0, 81.0, 139.0, 205.0, 344.0, 502.0, 829.0, 1393.0, 2390.0, 4198.0, 7750.0, 14968.0, 31671.0, 78155.0, 297245.0, 3331789.0, 282929.0, 76400.0, 30783.0, 14610.0, 7694.0, 4100.0, 2391.0, 1363.0, 812.0, 521.0, 327.0, 174.0, 122.0, 77.0, 61.0, 29.0, 25.0, 20.0, 9.0, 6.0, 8.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.03125, -33.84326171875, -32.6552734375, -31.46728515625, -30.279296875, -29.09130859375, -27.9033203125, -26.71533203125, -25.52734375, -24.33935546875, -23.1513671875, -21.96337890625, -20.775390625, -19.58740234375, -18.3994140625, -17.21142578125, -16.0234375, -14.83544921875, -13.6474609375, -12.45947265625, -11.271484375, -10.08349609375, -8.8955078125, -7.70751953125, -6.51953125, -5.33154296875, -4.1435546875, -2.95556640625, -1.767578125, -0.57958984375, 0.6083984375, 1.79638671875, 2.984375, 4.17236328125, 5.3603515625, 6.54833984375, 7.736328125, 8.92431640625, 10.1123046875, 11.30029296875, 12.48828125, 13.67626953125, 14.8642578125, 16.05224609375, 17.240234375, 18.42822265625, 19.6162109375, 20.80419921875, 21.9921875, 23.18017578125, 24.3681640625, 25.55615234375, 26.744140625, 27.93212890625, 29.1201171875, 30.30810546875, 31.49609375, 32.68408203125, 33.8720703125, 35.06005859375, 36.248046875, 37.43603515625, 38.6240234375, 39.81201171875, 41.0]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 2.0, 4.0, 6.0, 3.0, 9.0, 8.0, 10.0, 22.0, 6.0, 11.0, 21.0, 30.0, 28.0, 50.0, 60.0, 77.0, 116.0, 188.0, 334.0, 2009.0, 411.0, 196.0, 111.0, 73.0, 43.0, 51.0, 39.0, 26.0, 20.0, 21.0, 21.0, 8.0, 9.0, 8.0, 11.0, 7.0, 5.0, 10.0, 0.0, 4.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.47265625, -5.29412841796875, -5.1156005859375, -4.93707275390625, -4.758544921875, -4.58001708984375, -4.4014892578125, -4.22296142578125, -4.04443359375, -3.86590576171875, -3.6873779296875, -3.50885009765625, -3.330322265625, -3.15179443359375, -2.9732666015625, -2.79473876953125, -2.6162109375, -2.43768310546875, -2.2591552734375, -2.08062744140625, -1.902099609375, -1.72357177734375, -1.5450439453125, -1.36651611328125, -1.18798828125, -1.00946044921875, -0.8309326171875, -0.65240478515625, -0.473876953125, -0.29534912109375, -0.1168212890625, 0.06170654296875, 0.240234375, 0.41876220703125, 0.5972900390625, 0.77581787109375, 0.954345703125, 1.13287353515625, 1.3114013671875, 1.48992919921875, 1.66845703125, 1.84698486328125, 2.0255126953125, 2.20404052734375, 2.382568359375, 2.56109619140625, 2.7396240234375, 2.91815185546875, 3.0966796875, 3.27520751953125, 3.4537353515625, 3.63226318359375, 3.810791015625, 3.98931884765625, 4.1678466796875, 4.34637451171875, 4.52490234375, 4.70343017578125, 4.8819580078125, 5.06048583984375, 5.239013671875, 5.41754150390625, 5.5960693359375, 5.77459716796875, 5.953125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 3.0, 12.0, 25.0, 50.0, 85.0, 130.0, 201.0, 201.0, 140.0, 70.0, 34.0, 22.0, 8.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.876670837402344, -35.98329162597656, -34.08991241455078, -32.196533203125, -30.303150177001953, -28.409770965576172, -26.51639175415039, -24.62301254272461, -22.729631423950195, -20.836252212524414, -18.94287109375, -17.04949188232422, -15.156111717224121, -13.262731552124023, -11.369352340698242, -9.475972175598145, -7.582592010498047, -5.689211845397949, -3.7958321571350098, -1.9024524688720703, -0.009072303771972656, 1.884307861328125, 3.7776870727539062, 5.671067237854004, 7.564447402954102, 9.4578275680542, 11.351207733154297, 13.244586944580078, 15.137967109680176, 17.031347274780273, 18.924726486206055, 20.81810760498047, 22.71148681640625, 24.60486602783203, 26.498247146606445, 28.391626358032227, 30.28500747680664, 32.17838668823242, 34.0717658996582, 35.965145111083984, 37.85852813720703, 39.75190734863281, 41.645286560058594, 43.538665771484375, 45.43204879760742, 47.3254280090332, 49.218807220458984, 51.112186431884766, 53.00556564331055, 54.89894485473633, 56.79232406616211, 58.685707092285156, 60.57908630371094, 62.47246551513672, 64.3658447265625, 66.25922393798828, 68.15260314941406, 70.04598236083984, 71.93936157226562, 73.8327407836914, 75.72611999511719, 77.6195068359375, 79.51287841796875, 81.40626525878906, 83.29964447021484]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 7.0, 6.0, 7.0, 11.0, 10.0, 11.0, 17.0, 18.0, 21.0, 36.0, 26.0, 30.0, 41.0, 36.0, 37.0, 46.0, 45.0, 55.0, 51.0, 42.0, 50.0, 40.0, 54.0, 40.0, 43.0, 27.0, 31.0, 31.0, 24.0, 20.0, 22.0, 18.0, 8.0, 6.0, 4.0, 3.0, 9.0, 4.0, 4.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.90411949157715, -18.21017837524414, -17.516237258911133, -16.822296142578125, -16.128353118896484, -15.434412956237793, -14.740470886230469, -14.046529769897461, -13.352588653564453, -12.658647537231445, -11.964706420898438, -11.270764350891113, -10.576823234558105, -9.882882118225098, -9.188940048217773, -8.494998931884766, -7.801057815551758, -7.10711669921875, -6.413175106048584, -5.719233512878418, -5.02529239654541, -4.331351280212402, -3.6374096870422363, -2.9434680938720703, -2.2495269775390625, -1.5555856227874756, -0.8616442680358887, -0.16770291328430176, 0.5262384414672852, 1.220179796218872, 1.914121150970459, 2.608062744140625, 3.302003860473633, 3.9959452152252197, 4.689886569976807, 5.383828163146973, 6.0777692794799805, 6.771710395812988, 7.465651988983154, 8.15959358215332, 8.853534698486328, 9.547475814819336, 10.241416931152344, 10.935359001159668, 11.629300117492676, 12.323241233825684, 13.017183303833008, 13.711124420166016, 14.405065536499023, 15.099006652832031, 15.792947769165039, 16.486888885498047, 17.180831909179688, 17.874773025512695, 18.568714141845703, 19.26265525817871, 19.95659637451172, 20.650537490844727, 21.344478607177734, 22.038419723510742, 22.73236083984375, 23.42630386352539, 24.1202449798584, 24.814186096191406, 25.508127212524414]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 6.0, 6.0, 9.0, 9.0, 9.0, 23.0, 14.0, 31.0, 61.0, 77.0, 98.0, 132.0, 243.0, 372.0, 639.0, 1041.0, 1825.0, 3468.0, 6497.0, 13271.0, 29266.0, 68498.0, 208904.0, 462752.0, 149587.0, 54525.0, 23738.0, 10975.0, 5549.0, 2899.0, 1535.0, 950.0, 546.0, 343.0, 243.0, 140.0, 99.0, 67.0, 34.0, 24.0, 17.0, 10.0, 12.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-29.3125, -28.279296875, -27.24609375, -26.212890625, -25.1796875, -24.146484375, -23.11328125, -22.080078125, -21.046875, -20.013671875, -18.98046875, -17.947265625, -16.9140625, -15.880859375, -14.84765625, -13.814453125, -12.78125, -11.748046875, -10.71484375, -9.681640625, -8.6484375, -7.615234375, -6.58203125, -5.548828125, -4.515625, -3.482421875, -2.44921875, -1.416015625, -0.3828125, 0.650390625, 1.68359375, 2.716796875, 3.75, 4.783203125, 5.81640625, 6.849609375, 7.8828125, 8.916015625, 9.94921875, 10.982421875, 12.015625, 13.048828125, 14.08203125, 15.115234375, 16.1484375, 17.181640625, 18.21484375, 19.248046875, 20.28125, 21.314453125, 22.34765625, 23.380859375, 24.4140625, 25.447265625, 26.48046875, 27.513671875, 28.546875, 29.580078125, 30.61328125, 31.646484375, 32.6796875, 33.712890625, 34.74609375, 35.779296875, 36.8125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 6.0, 9.0, 5.0, 6.0, 6.0, 13.0, 13.0, 21.0, 22.0, 29.0, 28.0, 33.0, 39.0, 42.0, 32.0, 60.0, 59.0, 64.0, 67.0, 57.0, 52.0, 57.0, 47.0, 34.0, 25.0, 31.0, 24.0, 26.0, 20.0, 23.0, 8.0, 7.0, 12.0, 13.0, 3.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.79296875, -2.693695068359375, -2.59442138671875, -2.495147705078125, -2.3958740234375, -2.296600341796875, -2.19732666015625, -2.098052978515625, -1.998779296875, -1.899505615234375, -1.80023193359375, -1.700958251953125, -1.6016845703125, -1.502410888671875, -1.40313720703125, -1.303863525390625, -1.20458984375, -1.105316162109375, -1.00604248046875, -0.906768798828125, -0.8074951171875, -0.708221435546875, -0.60894775390625, -0.509674072265625, -0.410400390625, -0.311126708984375, -0.21185302734375, -0.112579345703125, -0.0133056640625, 0.085968017578125, 0.18524169921875, 0.284515380859375, 0.3837890625, 0.483062744140625, 0.58233642578125, 0.681610107421875, 0.7808837890625, 0.880157470703125, 0.97943115234375, 1.078704833984375, 1.177978515625, 1.277252197265625, 1.37652587890625, 1.475799560546875, 1.5750732421875, 1.674346923828125, 1.77362060546875, 1.872894287109375, 1.97216796875, 2.071441650390625, 2.17071533203125, 2.269989013671875, 2.3692626953125, 2.468536376953125, 2.56781005859375, 2.667083740234375, 2.766357421875, 2.865631103515625, 2.96490478515625, 3.064178466796875, 3.1634521484375, 3.262725830078125, 3.36199951171875, 3.461273193359375, 3.560546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 7.0, 11.0, 11.0, 20.0, 15.0, 36.0, 46.0, 66.0, 102.0, 131.0, 187.0, 299.0, 498.0, 860.0, 1506.0, 2996.0, 6423.0, 14908.0, 39402.0, 123822.0, 493835.0, 253832.0, 66643.0, 23659.0, 9687.0, 4401.0, 2153.0, 1158.0, 677.0, 386.0, 221.0, 164.0, 107.0, 75.0, 57.0, 46.0, 27.0, 29.0, 14.0, 9.0, 3.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-31.375, -30.4453125, -29.515625, -28.5859375, -27.65625, -26.7265625, -25.796875, -24.8671875, -23.9375, -23.0078125, -22.078125, -21.1484375, -20.21875, -19.2890625, -18.359375, -17.4296875, -16.5, -15.5703125, -14.640625, -13.7109375, -12.78125, -11.8515625, -10.921875, -9.9921875, -9.0625, -8.1328125, -7.203125, -6.2734375, -5.34375, -4.4140625, -3.484375, -2.5546875, -1.625, -0.6953125, 0.234375, 1.1640625, 2.09375, 3.0234375, 3.953125, 4.8828125, 5.8125, 6.7421875, 7.671875, 8.6015625, 9.53125, 10.4609375, 11.390625, 12.3203125, 13.25, 14.1796875, 15.109375, 16.0390625, 16.96875, 17.8984375, 18.828125, 19.7578125, 20.6875, 21.6171875, 22.546875, 23.4765625, 24.40625, 25.3359375, 26.265625, 27.1953125, 28.125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 11.0, 7.0, 7.0, 10.0, 29.0, 22.0, 34.0, 48.0, 51.0, 43.0, 48.0, 55.0, 63.0, 59.0, 72.0, 69.0, 71.0, 53.0, 48.0, 41.0, 40.0, 20.0, 24.0, 24.0, 10.0, 9.0, 11.0, 7.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.796875, -17.200439453125, -16.60400390625, -16.007568359375, -15.4111328125, -14.814697265625, -14.21826171875, -13.621826171875, -13.025390625, -12.428955078125, -11.83251953125, -11.236083984375, -10.6396484375, -10.043212890625, -9.44677734375, -8.850341796875, -8.25390625, -7.657470703125, -7.06103515625, -6.464599609375, -5.8681640625, -5.271728515625, -4.67529296875, -4.078857421875, -3.482421875, -2.885986328125, -2.28955078125, -1.693115234375, -1.0966796875, -0.500244140625, 0.09619140625, 0.692626953125, 1.2890625, 1.885498046875, 2.48193359375, 3.078369140625, 3.6748046875, 4.271240234375, 4.86767578125, 5.464111328125, 6.060546875, 6.656982421875, 7.25341796875, 7.849853515625, 8.4462890625, 9.042724609375, 9.63916015625, 10.235595703125, 10.83203125, 11.428466796875, 12.02490234375, 12.621337890625, 13.2177734375, 13.814208984375, 14.41064453125, 15.007080078125, 15.603515625, 16.199951171875, 16.79638671875, 17.392822265625, 17.9892578125, 18.585693359375, 19.18212890625, 19.778564453125, 20.375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 8.0, 8.0, 15.0, 21.0, 24.0, 44.0, 88.0, 160.0, 335.0, 830.0, 2244.0, 7429.0, 36664.0, 523613.0, 434304.0, 32318.0, 6910.0, 2114.0, 723.0, 353.0, 141.0, 81.0, 49.0, 32.0, 14.0, 13.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-59.40625, -57.919921875, -56.43359375, -54.947265625, -53.4609375, -51.974609375, -50.48828125, -49.001953125, -47.515625, -46.029296875, -44.54296875, -43.056640625, -41.5703125, -40.083984375, -38.59765625, -37.111328125, -35.625, -34.138671875, -32.65234375, -31.166015625, -29.6796875, -28.193359375, -26.70703125, -25.220703125, -23.734375, -22.248046875, -20.76171875, -19.275390625, -17.7890625, -16.302734375, -14.81640625, -13.330078125, -11.84375, -10.357421875, -8.87109375, -7.384765625, -5.8984375, -4.412109375, -2.92578125, -1.439453125, 0.046875, 1.533203125, 3.01953125, 4.505859375, 5.9921875, 7.478515625, 8.96484375, 10.451171875, 11.9375, 13.423828125, 14.91015625, 16.396484375, 17.8828125, 19.369140625, 20.85546875, 22.341796875, 23.828125, 25.314453125, 26.80078125, 28.287109375, 29.7734375, 31.259765625, 32.74609375, 34.232421875, 35.71875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 10.0, 11.0, 11.0, 24.0, 22.0, 42.0, 65.0, 93.0, 134.0, 145.0, 148.0, 90.0, 52.0, 32.0, 23.0, 17.0, 13.0, 12.0, 11.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0031375885009765625, -0.003019005060195923, -0.002900421619415283, -0.0027818381786346436, -0.002663254737854004, -0.0025446712970733643, -0.0024260878562927246, -0.002307504415512085, -0.0021889209747314453, -0.0020703375339508057, -0.001951754093170166, -0.0018331706523895264, -0.0017145872116088867, -0.001596003770828247, -0.0014774203300476074, -0.0013588368892669678, -0.0012402534484863281, -0.0011216700077056885, -0.0010030865669250488, -0.0008845031261444092, -0.0007659196853637695, -0.0006473362445831299, -0.0005287528038024902, -0.0004101693630218506, -0.00029158592224121094, -0.0001730024814605713, -5.441904067993164e-05, 6.416440010070801e-05, 0.00018274784088134766, 0.0003013312816619873, 0.00041991472244262695, 0.0005384981632232666, 0.0006570816040039062, 0.0007756650447845459, 0.0008942484855651855, 0.0010128319263458252, 0.0011314153671264648, 0.0012499988079071045, 0.0013685822486877441, 0.0014871656894683838, 0.0016057491302490234, 0.001724332571029663, 0.0018429160118103027, 0.0019614994525909424, 0.002080082893371582, 0.0021986663341522217, 0.0023172497749328613, 0.002435833215713501, 0.0025544166564941406, 0.0026730000972747803, 0.00279158353805542, 0.0029101669788360596, 0.0030287504196166992, 0.003147333860397339, 0.0032659173011779785, 0.003384500741958618, 0.003503084182739258, 0.0036216676235198975, 0.003740251064300537, 0.0038588345050811768, 0.003977417945861816, 0.004096001386642456, 0.004214584827423096, 0.004333168268203735, 0.004451751708984375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 9.0, 4.0, 18.0, 19.0, 32.0, 35.0, 72.0, 84.0, 153.0, 246.0, 443.0, 815.0, 1517.0, 3084.0, 6899.0, 18638.0, 65528.0, 362233.0, 468622.0, 83452.0, 21955.0, 7858.0, 3379.0, 1543.0, 802.0, 470.0, 235.0, 145.0, 95.0, 64.0, 36.0, 25.0, 11.0, 13.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.734375, -25.92626953125, -25.1181640625, -24.31005859375, -23.501953125, -22.69384765625, -21.8857421875, -21.07763671875, -20.26953125, -19.46142578125, -18.6533203125, -17.84521484375, -17.037109375, -16.22900390625, -15.4208984375, -14.61279296875, -13.8046875, -12.99658203125, -12.1884765625, -11.38037109375, -10.572265625, -9.76416015625, -8.9560546875, -8.14794921875, -7.33984375, -6.53173828125, -5.7236328125, -4.91552734375, -4.107421875, -3.29931640625, -2.4912109375, -1.68310546875, -0.875, -0.06689453125, 0.7412109375, 1.54931640625, 2.357421875, 3.16552734375, 3.9736328125, 4.78173828125, 5.58984375, 6.39794921875, 7.2060546875, 8.01416015625, 8.822265625, 9.63037109375, 10.4384765625, 11.24658203125, 12.0546875, 12.86279296875, 13.6708984375, 14.47900390625, 15.287109375, 16.09521484375, 16.9033203125, 17.71142578125, 18.51953125, 19.32763671875, 20.1357421875, 20.94384765625, 21.751953125, 22.56005859375, 23.3681640625, 24.17626953125, 24.984375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 7.0, 4.0, 4.0, 5.0, 15.0, 15.0, 17.0, 20.0, 27.0, 30.0, 59.0, 56.0, 64.0, 74.0, 79.0, 73.0, 87.0, 74.0, 63.0, 49.0, 43.0, 27.0, 26.0, 20.0, 9.0, 19.0, 3.0, 6.0, 5.0, 8.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.6796875, -13.3135986328125, -12.947509765625, -12.5814208984375, -12.21533203125, -11.8492431640625, -11.483154296875, -11.1170654296875, -10.7509765625, -10.3848876953125, -10.018798828125, -9.6527099609375, -9.28662109375, -8.9205322265625, -8.554443359375, -8.1883544921875, -7.822265625, -7.4561767578125, -7.090087890625, -6.7239990234375, -6.35791015625, -5.9918212890625, -5.625732421875, -5.2596435546875, -4.8935546875, -4.5274658203125, -4.161376953125, -3.7952880859375, -3.42919921875, -3.0631103515625, -2.697021484375, -2.3309326171875, -1.96484375, -1.5987548828125, -1.232666015625, -0.8665771484375, -0.50048828125, -0.1343994140625, 0.231689453125, 0.5977783203125, 0.9638671875, 1.3299560546875, 1.696044921875, 2.0621337890625, 2.42822265625, 2.7943115234375, 3.160400390625, 3.5264892578125, 3.892578125, 4.2586669921875, 4.624755859375, 4.9908447265625, 5.35693359375, 5.7230224609375, 6.089111328125, 6.4552001953125, 6.8212890625, 7.1873779296875, 7.553466796875, 7.9195556640625, 8.28564453125, 8.6517333984375, 9.017822265625, 9.3839111328125, 9.75]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 12.0, 16.0, 21.0, 61.0, 130.0, 285.0, 246.0, 101.0, 61.0, 30.0, 14.0, 13.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-263.111572265625, -253.68032836914062, -244.24908447265625, -234.81784057617188, -225.3865966796875, -215.95535278320312, -206.52410888671875, -197.09286499023438, -187.66162109375, -178.23037719726562, -168.79913330078125, -159.36788940429688, -149.9366455078125, -140.50540161132812, -131.07415771484375, -121.64290618896484, -112.21165466308594, -102.78041076660156, -93.34916687011719, -83.91792297363281, -74.48667907714844, -65.05543518066406, -55.624183654785156, -46.19293975830078, -36.761695861816406, -27.33045196533203, -17.899206161499023, -8.467960357666016, 0.9632835388183594, 10.394527435302734, 19.825775146484375, 29.25701904296875, 38.688262939453125, 48.1195068359375, 57.550750732421875, 66.98199462890625, 76.41323852539062, 85.844482421875, 95.2757339477539, 104.70697784423828, 114.13822174072266, 123.56946563720703, 133.00071716308594, 142.4319610595703, 151.8632049560547, 161.29444885253906, 170.72569274902344, 180.1569366455078, 189.5881805419922, 199.01942443847656, 208.45066833496094, 217.8819122314453, 227.3131561279297, 236.74440002441406, 246.1756591796875, 255.60690307617188, 265.03814697265625, 274.4693908691406, 283.900634765625, 293.3318786621094, 302.76312255859375, 312.1943664550781, 321.6256103515625, 331.0568542480469, 340.48809814453125]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 5.0, 7.0, 4.0, 11.0, 18.0, 18.0, 23.0, 40.0, 45.0, 44.0, 58.0, 64.0, 55.0, 65.0, 77.0, 69.0, 69.0, 49.0, 50.0, 50.0, 47.0, 32.0, 16.0, 16.0, 12.0, 14.0, 11.0, 3.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-147.695556640625, -143.18995666503906, -138.68435668945312, -134.1787567138672, -129.67315673828125, -125.16755676269531, -120.66195678710938, -116.15635681152344, -111.6507568359375, -107.14515686035156, -102.63955688476562, -98.13395690917969, -93.62835693359375, -89.12275695800781, -84.61715698242188, -80.11155700683594, -75.60596466064453, -71.1003646850586, -66.59476470947266, -62.08916473388672, -57.58356475830078, -53.077964782714844, -48.57236862182617, -44.066768646240234, -39.5611686706543, -35.05556869506836, -30.549968719482422, -26.044370651245117, -21.53877067565918, -17.033170700073242, -12.527572631835938, -8.02197265625, -3.5163726806640625, 0.9892268180847168, 5.494826316833496, 10.000425338745117, 14.506025314331055, 19.011625289916992, 23.517223358154297, 28.022823333740234, 32.52842330932617, 37.03402328491211, 41.53962326049805, 46.04521942138672, 50.550819396972656, 55.056419372558594, 59.56201934814453, 64.06761932373047, 68.5732192993164, 73.07881927490234, 77.58441925048828, 82.09001922607422, 86.59561920166016, 91.1012191772461, 95.6068115234375, 100.11241149902344, 104.61801147460938, 109.12361145019531, 113.62921142578125, 118.13481140136719, 122.64041137695312, 127.14601135253906, 131.651611328125, 136.15721130371094, 140.66281127929688]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 7.0, 2.0, 7.0, 8.0, 20.0, 24.0, 38.0, 57.0, 91.0, 170.0, 250.0, 417.0, 739.0, 1304.0, 2416.0, 4483.0, 8787.0, 18481.0, 45212.0, 161359.0, 3551847.0, 291888.0, 60603.0, 22537.0, 10469.0, 5368.0, 2867.0, 1713.0, 965.0, 636.0, 433.0, 295.0, 203.0, 144.0, 110.0, 61.0, 63.0, 54.0, 32.0, 26.0, 21.0, 13.0, 27.0, 7.0, 4.0, 7.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-51.28125, -49.11279296875, -46.9443359375, -44.77587890625, -42.607421875, -40.43896484375, -38.2705078125, -36.10205078125, -33.93359375, -31.76513671875, -29.5966796875, -27.42822265625, -25.259765625, -23.09130859375, -20.9228515625, -18.75439453125, -16.5859375, -14.41748046875, -12.2490234375, -10.08056640625, -7.912109375, -5.74365234375, -3.5751953125, -1.40673828125, 0.76171875, 2.93017578125, 5.0986328125, 7.26708984375, 9.435546875, 11.60400390625, 13.7724609375, 15.94091796875, 18.109375, 20.27783203125, 22.4462890625, 24.61474609375, 26.783203125, 28.95166015625, 31.1201171875, 33.28857421875, 35.45703125, 37.62548828125, 39.7939453125, 41.96240234375, 44.130859375, 46.29931640625, 48.4677734375, 50.63623046875, 52.8046875, 54.97314453125, 57.1416015625, 59.31005859375, 61.478515625, 63.64697265625, 65.8154296875, 67.98388671875, 70.15234375, 72.32080078125, 74.4892578125, 76.65771484375, 78.826171875, 80.99462890625, 83.1630859375, 85.33154296875, 87.5]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 12.0, 14.0, 21.0, 20.0, 32.0, 48.0, 51.0, 56.0, 69.0, 83.0, 94.0, 90.0, 72.0, 81.0, 54.0, 52.0, 52.0, 32.0, 18.0, 18.0, 13.0, 7.0, 4.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.66796875, -3.5091552734375, -3.350341796875, -3.1915283203125, -3.03271484375, -2.8739013671875, -2.715087890625, -2.5562744140625, -2.3974609375, -2.2386474609375, -2.079833984375, -1.9210205078125, -1.76220703125, -1.6033935546875, -1.444580078125, -1.2857666015625, -1.126953125, -0.9681396484375, -0.809326171875, -0.6505126953125, -0.49169921875, -0.3328857421875, -0.174072265625, -0.0152587890625, 0.1435546875, 0.3023681640625, 0.461181640625, 0.6199951171875, 0.77880859375, 0.9376220703125, 1.096435546875, 1.2552490234375, 1.4140625, 1.5728759765625, 1.731689453125, 1.8905029296875, 2.04931640625, 2.2081298828125, 2.366943359375, 2.5257568359375, 2.6845703125, 2.8433837890625, 3.002197265625, 3.1610107421875, 3.31982421875, 3.4786376953125, 3.637451171875, 3.7962646484375, 3.955078125, 4.1138916015625, 4.272705078125, 4.4315185546875, 4.59033203125, 4.7491455078125, 4.907958984375, 5.0667724609375, 5.2255859375, 5.3843994140625, 5.543212890625, 5.7020263671875, 5.86083984375, 6.0196533203125, 6.178466796875, 6.3372802734375, 6.49609375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 9.0, 10.0, 20.0, 23.0, 31.0, 50.0, 105.0, 189.0, 346.0, 897.0, 2348.0, 7774.0, 34785.0, 348887.0, 3681356.0, 94429.0, 16271.0, 4238.0, 1412.0, 525.0, 247.0, 123.0, 61.0, 42.0, 33.0, 13.0, 7.0, 11.0, 9.0, 7.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.4375, -99.3427734375, -95.248046875, -91.1533203125, -87.05859375, -82.9638671875, -78.869140625, -74.7744140625, -70.6796875, -66.5849609375, -62.490234375, -58.3955078125, -54.30078125, -50.2060546875, -46.111328125, -42.0166015625, -37.921875, -33.8271484375, -29.732421875, -25.6376953125, -21.54296875, -17.4482421875, -13.353515625, -9.2587890625, -5.1640625, -1.0693359375, 3.025390625, 7.1201171875, 11.21484375, 15.3095703125, 19.404296875, 23.4990234375, 27.59375, 31.6884765625, 35.783203125, 39.8779296875, 43.97265625, 48.0673828125, 52.162109375, 56.2568359375, 60.3515625, 64.4462890625, 68.541015625, 72.6357421875, 76.73046875, 80.8251953125, 84.919921875, 89.0146484375, 93.109375, 97.2041015625, 101.298828125, 105.3935546875, 109.48828125, 113.5830078125, 117.677734375, 121.7724609375, 125.8671875, 129.9619140625, 134.056640625, 138.1513671875, 142.24609375, 146.3408203125, 150.435546875, 154.5302734375, 158.625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 8.0, 8.0, 3.0, 8.0, 18.0, 15.0, 17.0, 22.0, 45.0, 38.0, 49.0, 84.0, 113.0, 185.0, 424.0, 1924.0, 469.0, 204.0, 125.0, 81.0, 54.0, 43.0, 30.0, 22.0, 20.0, 12.0, 14.0, 9.0, 7.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-13.328125, -12.9730224609375, -12.617919921875, -12.2628173828125, -11.90771484375, -11.5526123046875, -11.197509765625, -10.8424072265625, -10.4873046875, -10.1322021484375, -9.777099609375, -9.4219970703125, -9.06689453125, -8.7117919921875, -8.356689453125, -8.0015869140625, -7.646484375, -7.2913818359375, -6.936279296875, -6.5811767578125, -6.22607421875, -5.8709716796875, -5.515869140625, -5.1607666015625, -4.8056640625, -4.4505615234375, -4.095458984375, -3.7403564453125, -3.38525390625, -3.0301513671875, -2.675048828125, -2.3199462890625, -1.96484375, -1.6097412109375, -1.254638671875, -0.8995361328125, -0.54443359375, -0.1893310546875, 0.165771484375, 0.5208740234375, 0.8759765625, 1.2310791015625, 1.586181640625, 1.9412841796875, 2.29638671875, 2.6514892578125, 3.006591796875, 3.3616943359375, 3.716796875, 4.0718994140625, 4.427001953125, 4.7821044921875, 5.13720703125, 5.4923095703125, 5.847412109375, 6.2025146484375, 6.5576171875, 6.9127197265625, 7.267822265625, 7.6229248046875, 7.97802734375, 8.3331298828125, 8.688232421875, 9.0433349609375, 9.3984375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 9.0, 11.0, 20.0, 34.0, 67.0, 128.0, 209.0, 225.0, 120.0, 70.0, 36.0, 22.0, 19.0, 15.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.61849594116211, -58.402278900146484, -55.186065673828125, -51.9698486328125, -48.753631591796875, -45.53741455078125, -42.32120132446289, -39.104984283447266, -35.888771057128906, -32.67255401611328, -29.45633888244629, -26.240123748779297, -23.023906707763672, -19.80769157409668, -16.591476440429688, -13.375259399414062, -10.159042358398438, -6.942826271057129, -3.7266106605529785, -0.5103950500488281, 2.7058210372924805, 5.922037124633789, 9.138252258300781, 12.354469299316406, 15.570684432983398, 18.78689956665039, 22.003116607666016, 25.219331741333008, 28.435546875, 31.651763916015625, 34.86798095703125, 38.084197998046875, 41.30040740966797, 44.516624450683594, 47.73283767700195, 50.94905471801758, 54.1652717590332, 57.38148498535156, 60.59770202636719, 63.81391906738281, 67.03013610839844, 70.24635314941406, 73.46257019042969, 76.67878723144531, 79.8949966430664, 83.11121368408203, 86.32743072509766, 89.54364776611328, 92.75985717773438, 95.97607421875, 99.19229125976562, 102.40850830078125, 105.62471771240234, 108.84093475341797, 112.0571517944336, 115.27336883544922, 118.48958587646484, 121.70580291748047, 124.9220199584961, 128.1382293701172, 131.3544464111328, 134.57066345214844, 137.78688049316406, 141.0030975341797, 144.2193145751953]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 9.0, 10.0, 9.0, 13.0, 13.0, 16.0, 26.0, 29.0, 40.0, 43.0, 49.0, 39.0, 46.0, 48.0, 45.0, 40.0, 59.0, 62.0, 43.0, 47.0, 48.0, 43.0, 39.0, 29.0, 37.0, 30.0, 20.0, 19.0, 13.0, 14.0, 11.0, 6.0, 2.0, 7.0, 2.0, 2.0], "bins": [-67.78295135498047, -66.23178100585938, -64.68061828613281, -63.12944793701172, -61.578277587890625, -60.02710723876953, -58.4759407043457, -56.924774169921875, -55.37360382080078, -53.82243347167969, -52.27126693725586, -50.72010040283203, -49.16893005371094, -47.617759704589844, -46.066593170166016, -44.51542663574219, -42.964256286621094, -41.4130859375, -39.86191940307617, -38.310752868652344, -36.75958251953125, -35.208412170410156, -33.65724563598633, -32.1060791015625, -30.554908752441406, -29.003740310668945, -27.452571868896484, -25.901403427124023, -24.350234985351562, -22.7990665435791, -21.24789810180664, -19.69672966003418, -18.14556121826172, -16.594392776489258, -15.043224334716797, -13.492055892944336, -11.940887451171875, -10.389719009399414, -8.838550567626953, -7.287382125854492, -5.736213684082031, -4.18504524230957, -2.6338768005371094, -1.0827083587646484, 0.4684600830078125, 2.0196285247802734, 3.5707969665527344, 5.121965408325195, 6.673133850097656, 8.224302291870117, 9.775470733642578, 11.326639175415039, 12.8778076171875, 14.428976058959961, 15.980144500732422, 17.531312942504883, 19.082481384277344, 20.633649826049805, 22.184818267822266, 23.735986709594727, 25.287155151367188, 26.83832359313965, 28.38949203491211, 29.94066047668457, 31.49182891845703]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 4.0, 6.0, 6.0, 10.0, 12.0, 14.0, 22.0, 31.0, 46.0, 50.0, 79.0, 112.0, 170.0, 278.0, 434.0, 663.0, 1080.0, 1748.0, 2998.0, 4979.0, 8993.0, 17210.0, 33552.0, 69483.0, 157766.0, 333117.0, 225723.0, 95642.0, 44482.0, 22300.0, 11601.0, 6476.0, 3563.0, 2251.0, 1306.0, 822.0, 509.0, 339.0, 205.0, 136.0, 93.0, 69.0, 46.0, 36.0, 28.0, 19.0, 12.0, 14.0, 9.0, 4.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.28125, -30.32470703125, -29.3681640625, -28.41162109375, -27.455078125, -26.49853515625, -25.5419921875, -24.58544921875, -23.62890625, -22.67236328125, -21.7158203125, -20.75927734375, -19.802734375, -18.84619140625, -17.8896484375, -16.93310546875, -15.9765625, -15.02001953125, -14.0634765625, -13.10693359375, -12.150390625, -11.19384765625, -10.2373046875, -9.28076171875, -8.32421875, -7.36767578125, -6.4111328125, -5.45458984375, -4.498046875, -3.54150390625, -2.5849609375, -1.62841796875, -0.671875, 0.28466796875, 1.2412109375, 2.19775390625, 3.154296875, 4.11083984375, 5.0673828125, 6.02392578125, 6.98046875, 7.93701171875, 8.8935546875, 9.85009765625, 10.806640625, 11.76318359375, 12.7197265625, 13.67626953125, 14.6328125, 15.58935546875, 16.5458984375, 17.50244140625, 18.458984375, 19.41552734375, 20.3720703125, 21.32861328125, 22.28515625, 23.24169921875, 24.1982421875, 25.15478515625, 26.111328125, 27.06787109375, 28.0244140625, 28.98095703125, 29.9375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 11.0, 6.0, 5.0, 19.0, 21.0, 26.0, 23.0, 38.0, 33.0, 39.0, 48.0, 45.0, 58.0, 54.0, 58.0, 45.0, 50.0, 51.0, 60.0, 54.0, 47.0, 36.0, 27.0, 31.0, 23.0, 19.0, 17.0, 13.0, 8.0, 11.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.568359375, -3.450469970703125, -3.33258056640625, -3.214691162109375, -3.0968017578125, -2.978912353515625, -2.86102294921875, -2.743133544921875, -2.625244140625, -2.507354736328125, -2.38946533203125, -2.271575927734375, -2.1536865234375, -2.035797119140625, -1.91790771484375, -1.800018310546875, -1.68212890625, -1.564239501953125, -1.44635009765625, -1.328460693359375, -1.2105712890625, -1.092681884765625, -0.97479248046875, -0.856903076171875, -0.739013671875, -0.621124267578125, -0.50323486328125, -0.385345458984375, -0.2674560546875, -0.149566650390625, -0.03167724609375, 0.086212158203125, 0.2041015625, 0.321990966796875, 0.43988037109375, 0.557769775390625, 0.6756591796875, 0.793548583984375, 0.91143798828125, 1.029327392578125, 1.147216796875, 1.265106201171875, 1.38299560546875, 1.500885009765625, 1.6187744140625, 1.736663818359375, 1.85455322265625, 1.972442626953125, 2.09033203125, 2.208221435546875, 2.32611083984375, 2.444000244140625, 2.5618896484375, 2.679779052734375, 2.79766845703125, 2.915557861328125, 3.033447265625, 3.151336669921875, 3.26922607421875, 3.387115478515625, 3.5050048828125, 3.622894287109375, 3.74078369140625, 3.858673095703125, 3.9765625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 6.0, 4.0, 12.0, 14.0, 34.0, 23.0, 35.0, 58.0, 79.0, 130.0, 199.0, 309.0, 569.0, 1181.0, 2152.0, 4854.0, 11649.0, 31397.0, 104597.0, 480432.0, 301607.0, 70087.0, 22683.0, 8738.0, 3729.0, 1815.0, 907.0, 438.0, 283.0, 182.0, 107.0, 75.0, 45.0, 33.0, 24.0, 24.0, 10.0, 10.0, 9.0, 2.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-51.25, -49.58837890625, -47.9267578125, -46.26513671875, -44.603515625, -42.94189453125, -41.2802734375, -39.61865234375, -37.95703125, -36.29541015625, -34.6337890625, -32.97216796875, -31.310546875, -29.64892578125, -27.9873046875, -26.32568359375, -24.6640625, -23.00244140625, -21.3408203125, -19.67919921875, -18.017578125, -16.35595703125, -14.6943359375, -13.03271484375, -11.37109375, -9.70947265625, -8.0478515625, -6.38623046875, -4.724609375, -3.06298828125, -1.4013671875, 0.26025390625, 1.921875, 3.58349609375, 5.2451171875, 6.90673828125, 8.568359375, 10.22998046875, 11.8916015625, 13.55322265625, 15.21484375, 16.87646484375, 18.5380859375, 20.19970703125, 21.861328125, 23.52294921875, 25.1845703125, 26.84619140625, 28.5078125, 30.16943359375, 31.8310546875, 33.49267578125, 35.154296875, 36.81591796875, 38.4775390625, 40.13916015625, 41.80078125, 43.46240234375, 45.1240234375, 46.78564453125, 48.447265625, 50.10888671875, 51.7705078125, 53.43212890625, 55.09375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 4.0, 15.0, 6.0, 11.0, 4.0, 16.0, 15.0, 25.0, 24.0, 23.0, 32.0, 41.0, 42.0, 45.0, 47.0, 49.0, 52.0, 54.0, 56.0, 44.0, 66.0, 41.0, 33.0, 40.0, 50.0, 27.0, 18.0, 22.0, 8.0, 14.0, 23.0, 11.0, 9.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.46875, -21.705322265625, -20.94189453125, -20.178466796875, -19.4150390625, -18.651611328125, -17.88818359375, -17.124755859375, -16.361328125, -15.597900390625, -14.83447265625, -14.071044921875, -13.3076171875, -12.544189453125, -11.78076171875, -11.017333984375, -10.25390625, -9.490478515625, -8.72705078125, -7.963623046875, -7.2001953125, -6.436767578125, -5.67333984375, -4.909912109375, -4.146484375, -3.383056640625, -2.61962890625, -1.856201171875, -1.0927734375, -0.329345703125, 0.43408203125, 1.197509765625, 1.9609375, 2.724365234375, 3.48779296875, 4.251220703125, 5.0146484375, 5.778076171875, 6.54150390625, 7.304931640625, 8.068359375, 8.831787109375, 9.59521484375, 10.358642578125, 11.1220703125, 11.885498046875, 12.64892578125, 13.412353515625, 14.17578125, 14.939208984375, 15.70263671875, 16.466064453125, 17.2294921875, 17.992919921875, 18.75634765625, 19.519775390625, 20.283203125, 21.046630859375, 21.81005859375, 22.573486328125, 23.3369140625, 24.100341796875, 24.86376953125, 25.627197265625, 26.390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 7.0, 8.0, 8.0, 16.0, 32.0, 35.0, 61.0, 90.0, 151.0, 257.0, 434.0, 879.0, 1670.0, 3308.0, 7394.0, 18929.0, 56520.0, 228179.0, 512420.0, 150862.0, 40918.0, 14502.0, 5977.0, 2804.0, 1420.0, 701.0, 382.0, 208.0, 124.0, 83.0, 53.0, 42.0, 24.0, 17.0, 11.0, 10.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.5625, -26.65478515625, -25.7470703125, -24.83935546875, -23.931640625, -23.02392578125, -22.1162109375, -21.20849609375, -20.30078125, -19.39306640625, -18.4853515625, -17.57763671875, -16.669921875, -15.76220703125, -14.8544921875, -13.94677734375, -13.0390625, -12.13134765625, -11.2236328125, -10.31591796875, -9.408203125, -8.50048828125, -7.5927734375, -6.68505859375, -5.77734375, -4.86962890625, -3.9619140625, -3.05419921875, -2.146484375, -1.23876953125, -0.3310546875, 0.57666015625, 1.484375, 2.39208984375, 3.2998046875, 4.20751953125, 5.115234375, 6.02294921875, 6.9306640625, 7.83837890625, 8.74609375, 9.65380859375, 10.5615234375, 11.46923828125, 12.376953125, 13.28466796875, 14.1923828125, 15.10009765625, 16.0078125, 16.91552734375, 17.8232421875, 18.73095703125, 19.638671875, 20.54638671875, 21.4541015625, 22.36181640625, 23.26953125, 24.17724609375, 25.0849609375, 25.99267578125, 26.900390625, 27.80810546875, 28.7158203125, 29.62353515625, 30.53125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 4.0, 6.0, 3.0, 3.0, 17.0, 8.0, 20.0, 19.0, 31.0, 48.0, 79.0, 102.0, 122.0, 140.0, 113.0, 79.0, 45.0, 53.0, 24.0, 18.0, 14.0, 13.0, 7.0, 7.0, 7.0, 3.0, 7.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00626373291015625, -0.006099998950958252, -0.005936264991760254, -0.005772531032562256, -0.005608797073364258, -0.00544506311416626, -0.005281329154968262, -0.005117595195770264, -0.004953861236572266, -0.004790127277374268, -0.0046263933181762695, -0.0044626593589782715, -0.0042989253997802734, -0.004135191440582275, -0.003971457481384277, -0.0038077235221862793, -0.0036439895629882812, -0.003480255603790283, -0.003316521644592285, -0.003152787685394287, -0.002989053726196289, -0.002825319766998291, -0.002661585807800293, -0.002497851848602295, -0.002334117889404297, -0.002170383930206299, -0.0020066499710083008, -0.0018429160118103027, -0.0016791820526123047, -0.0015154480934143066, -0.0013517141342163086, -0.0011879801750183105, -0.0010242462158203125, -0.0008605122566223145, -0.0006967782974243164, -0.0005330443382263184, -0.0003693103790283203, -0.00020557641983032227, -4.184246063232422e-05, 0.00012189149856567383, 0.0002856254577636719, 0.0004493594169616699, 0.000613093376159668, 0.000776827335357666, 0.0009405612945556641, 0.0011042952537536621, 0.0012680292129516602, 0.0014317631721496582, 0.0015954971313476562, 0.0017592310905456543, 0.0019229650497436523, 0.0020866990089416504, 0.0022504329681396484, 0.0024141669273376465, 0.0025779008865356445, 0.0027416348457336426, 0.0029053688049316406, 0.0030691027641296387, 0.0032328367233276367, 0.0033965706825256348, 0.003560304641723633, 0.003724038600921631, 0.003887772560119629, 0.004051506519317627, 0.004215240478515625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 7.0, 7.0, 8.0, 27.0, 22.0, 51.0, 52.0, 74.0, 88.0, 178.0, 258.0, 487.0, 922.0, 1789.0, 3825.0, 8999.0, 23856.0, 76512.0, 310262.0, 448964.0, 116729.0, 33715.0, 12092.0, 4969.0, 2208.0, 1015.0, 548.0, 337.0, 185.0, 117.0, 68.0, 55.0, 40.0, 20.0, 16.0, 13.0, 10.0, 10.0, 6.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.03125, -29.152099609375, -28.27294921875, -27.393798828125, -26.5146484375, -25.635498046875, -24.75634765625, -23.877197265625, -22.998046875, -22.118896484375, -21.23974609375, -20.360595703125, -19.4814453125, -18.602294921875, -17.72314453125, -16.843994140625, -15.96484375, -15.085693359375, -14.20654296875, -13.327392578125, -12.4482421875, -11.569091796875, -10.68994140625, -9.810791015625, -8.931640625, -8.052490234375, -7.17333984375, -6.294189453125, -5.4150390625, -4.535888671875, -3.65673828125, -2.777587890625, -1.8984375, -1.019287109375, -0.14013671875, 0.739013671875, 1.6181640625, 2.497314453125, 3.37646484375, 4.255615234375, 5.134765625, 6.013916015625, 6.89306640625, 7.772216796875, 8.6513671875, 9.530517578125, 10.40966796875, 11.288818359375, 12.16796875, 13.047119140625, 13.92626953125, 14.805419921875, 15.6845703125, 16.563720703125, 17.44287109375, 18.322021484375, 19.201171875, 20.080322265625, 20.95947265625, 21.838623046875, 22.7177734375, 23.596923828125, 24.47607421875, 25.355224609375, 26.234375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 10.0, 11.0, 6.0, 7.0, 9.0, 9.0, 11.0, 26.0, 20.0, 20.0, 28.0, 38.0, 43.0, 57.0, 51.0, 52.0, 53.0, 62.0, 53.0, 39.0, 55.0, 49.0, 51.0, 45.0, 46.0, 27.0, 18.0, 18.0, 9.0, 13.0, 19.0, 9.0, 8.0, 4.0, 8.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.75, -11.392578125, -11.03515625, -10.677734375, -10.3203125, -9.962890625, -9.60546875, -9.248046875, -8.890625, -8.533203125, -8.17578125, -7.818359375, -7.4609375, -7.103515625, -6.74609375, -6.388671875, -6.03125, -5.673828125, -5.31640625, -4.958984375, -4.6015625, -4.244140625, -3.88671875, -3.529296875, -3.171875, -2.814453125, -2.45703125, -2.099609375, -1.7421875, -1.384765625, -1.02734375, -0.669921875, -0.3125, 0.044921875, 0.40234375, 0.759765625, 1.1171875, 1.474609375, 1.83203125, 2.189453125, 2.546875, 2.904296875, 3.26171875, 3.619140625, 3.9765625, 4.333984375, 4.69140625, 5.048828125, 5.40625, 5.763671875, 6.12109375, 6.478515625, 6.8359375, 7.193359375, 7.55078125, 7.908203125, 8.265625, 8.623046875, 8.98046875, 9.337890625, 9.6953125, 10.052734375, 10.41015625, 10.767578125, 11.125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 5.0, 2.0, 7.0, 11.0, 13.0, 23.0, 26.0, 52.0, 75.0, 110.0, 153.0, 148.0, 133.0, 83.0, 54.0, 37.0, 23.0, 14.0, 7.0, 8.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-220.2195587158203, -211.78562927246094, -203.3516845703125, -194.91775512695312, -186.48382568359375, -178.04989624023438, -169.615966796875, -161.18202209472656, -152.7480926513672, -144.3141632080078, -135.88021850585938, -127.4462890625, -119.01235961914062, -110.57843017578125, -102.14449310302734, -93.71055603027344, -85.27662658691406, -76.84269714355469, -68.40876007080078, -59.97482681274414, -51.5408935546875, -43.10696029663086, -34.67302703857422, -26.239093780517578, -17.805160522460938, -9.371227264404297, -0.9372940063476562, 7.496639251708984, 15.930572509765625, 24.364505767822266, 32.798439025878906, 41.23237228393555, 49.66632080078125, 58.10025405883789, 66.53418731689453, 74.96812438964844, 83.40205383300781, 91.83598327636719, 100.2699203491211, 108.703857421875, 117.13778686523438, 125.57171630859375, 134.00564575195312, 142.43959045410156, 150.87351989746094, 159.3074493408203, 167.74139404296875, 176.17532348632812, 184.6092529296875, 193.04318237304688, 201.47711181640625, 209.9110565185547, 218.34498596191406, 226.77891540527344, 235.21286010742188, 243.64678955078125, 252.08071899414062, 260.5146484375, 268.9485778808594, 277.38250732421875, 285.81646728515625, 294.2503967285156, 302.684326171875, 311.1182556152344, 319.55218505859375]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 8.0, 12.0, 13.0, 16.0, 26.0, 20.0, 21.0, 26.0, 29.0, 33.0, 42.0, 52.0, 48.0, 48.0, 64.0, 46.0, 68.0, 47.0, 46.0, 55.0, 44.0, 38.0, 34.0, 22.0, 28.0, 29.0, 13.0, 10.0, 10.0, 7.0, 9.0, 6.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-193.78839111328125, -187.7338409423828, -181.6792755126953, -175.62472534179688, -169.57017517089844, -163.515625, -157.4610595703125, -151.40650939941406, -145.35195922851562, -139.2974090576172, -133.2428436279297, -127.18829345703125, -121.13374328613281, -115.07918548583984, -109.02462768554688, -102.97007751464844, -96.91551208496094, -90.86095428466797, -84.80640411376953, -78.75184631347656, -72.69729614257812, -66.64273834228516, -60.58818054199219, -54.533626556396484, -48.47907257080078, -42.42451858520508, -36.369964599609375, -30.315406799316406, -24.260852813720703, -18.206298828125, -12.151741027832031, -6.097187042236328, -0.0426483154296875, 6.011906623840332, 12.066461563110352, 18.121017456054688, 24.17557144165039, 30.230125427246094, 36.28468322753906, 42.339237213134766, 48.39379119873047, 54.44834518432617, 60.502899169921875, 66.55745697021484, 72.61201477050781, 78.66656494140625, 84.72112274169922, 90.77568054199219, 96.83023071289062, 102.8847885131836, 108.93933868408203, 114.993896484375, 121.04844665527344, 127.1030044555664, 133.15756225585938, 139.2121124267578, 145.26666259765625, 151.3212127685547, 157.3757781982422, 163.43032836914062, 169.48487854003906, 175.5394287109375, 181.593994140625, 187.64854431152344, 193.70310974121094]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 7.0, 3.0, 10.0, 12.0, 11.0, 18.0, 27.0, 36.0, 49.0, 67.0, 85.0, 129.0, 182.0, 263.0, 431.0, 747.0, 1235.0, 2362.0, 4338.0, 9233.0, 21611.0, 61188.0, 313240.0, 3540044.0, 164641.0, 42470.0, 16342.0, 7225.0, 3539.0, 1930.0, 1032.0, 618.0, 391.0, 249.0, 166.0, 93.0, 81.0, 46.0, 32.0, 24.0, 15.0, 19.0, 10.0, 6.0, 5.0, 5.0, 2.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-78.3125, -75.9638671875, -73.615234375, -71.2666015625, -68.91796875, -66.5693359375, -64.220703125, -61.8720703125, -59.5234375, -57.1748046875, -54.826171875, -52.4775390625, -50.12890625, -47.7802734375, -45.431640625, -43.0830078125, -40.734375, -38.3857421875, -36.037109375, -33.6884765625, -31.33984375, -28.9912109375, -26.642578125, -24.2939453125, -21.9453125, -19.5966796875, -17.248046875, -14.8994140625, -12.55078125, -10.2021484375, -7.853515625, -5.5048828125, -3.15625, -0.8076171875, 1.541015625, 3.8896484375, 6.23828125, 8.5869140625, 10.935546875, 13.2841796875, 15.6328125, 17.9814453125, 20.330078125, 22.6787109375, 25.02734375, 27.3759765625, 29.724609375, 32.0732421875, 34.421875, 36.7705078125, 39.119140625, 41.4677734375, 43.81640625, 46.1650390625, 48.513671875, 50.8623046875, 53.2109375, 55.5595703125, 57.908203125, 60.2568359375, 62.60546875, 64.9541015625, 67.302734375, 69.6513671875, 72.0]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 6.0, 5.0, 6.0, 19.0, 23.0, 22.0, 26.0, 39.0, 48.0, 60.0, 65.0, 54.0, 70.0, 71.0, 68.0, 53.0, 61.0, 56.0, 44.0, 50.0, 33.0, 30.0, 22.0, 17.0, 15.0, 4.0, 7.0, 4.0, 6.0, 5.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.67578125, -5.4912109375, -5.306640625, -5.1220703125, -4.9375, -4.7529296875, -4.568359375, -4.3837890625, -4.19921875, -4.0146484375, -3.830078125, -3.6455078125, -3.4609375, -3.2763671875, -3.091796875, -2.9072265625, -2.72265625, -2.5380859375, -2.353515625, -2.1689453125, -1.984375, -1.7998046875, -1.615234375, -1.4306640625, -1.24609375, -1.0615234375, -0.876953125, -0.6923828125, -0.5078125, -0.3232421875, -0.138671875, 0.0458984375, 0.23046875, 0.4150390625, 0.599609375, 0.7841796875, 0.96875, 1.1533203125, 1.337890625, 1.5224609375, 1.70703125, 1.8916015625, 2.076171875, 2.2607421875, 2.4453125, 2.6298828125, 2.814453125, 2.9990234375, 3.18359375, 3.3681640625, 3.552734375, 3.7373046875, 3.921875, 4.1064453125, 4.291015625, 4.4755859375, 4.66015625, 4.8447265625, 5.029296875, 5.2138671875, 5.3984375, 5.5830078125, 5.767578125, 5.9521484375, 6.13671875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 8.0, 10.0, 14.0, 9.0, 19.0, 28.0, 34.0, 46.0, 80.0, 130.0, 264.0, 710.0, 2404.0, 12377.0, 135029.0, 3906469.0, 121727.0, 11303.0, 2300.0, 735.0, 259.0, 125.0, 66.0, 36.0, 24.0, 25.0, 16.0, 6.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 0.0, 0.0, 2.0, 1.0], "bins": [-229.625, -223.658203125, -217.69140625, -211.724609375, -205.7578125, -199.791015625, -193.82421875, -187.857421875, -181.890625, -175.923828125, -169.95703125, -163.990234375, -158.0234375, -152.056640625, -146.08984375, -140.123046875, -134.15625, -128.189453125, -122.22265625, -116.255859375, -110.2890625, -104.322265625, -98.35546875, -92.388671875, -86.421875, -80.455078125, -74.48828125, -68.521484375, -62.5546875, -56.587890625, -50.62109375, -44.654296875, -38.6875, -32.720703125, -26.75390625, -20.787109375, -14.8203125, -8.853515625, -2.88671875, 3.080078125, 9.046875, 15.013671875, 20.98046875, 26.947265625, 32.9140625, 38.880859375, 44.84765625, 50.814453125, 56.78125, 62.748046875, 68.71484375, 74.681640625, 80.6484375, 86.615234375, 92.58203125, 98.548828125, 104.515625, 110.482421875, 116.44921875, 122.416015625, 128.3828125, 134.349609375, 140.31640625, 146.283203125, 152.25]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 14.0, 20.0, 32.0, 45.0, 76.0, 127.0, 245.0, 989.0, 1902.0, 270.0, 137.0, 86.0, 52.0, 24.0, 14.0, 16.0, 9.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.5625, -34.674560546875, -33.78662109375, -32.898681640625, -32.0107421875, -31.122802734375, -30.23486328125, -29.346923828125, -28.458984375, -27.571044921875, -26.68310546875, -25.795166015625, -24.9072265625, -24.019287109375, -23.13134765625, -22.243408203125, -21.35546875, -20.467529296875, -19.57958984375, -18.691650390625, -17.8037109375, -16.915771484375, -16.02783203125, -15.139892578125, -14.251953125, -13.364013671875, -12.47607421875, -11.588134765625, -10.7001953125, -9.812255859375, -8.92431640625, -8.036376953125, -7.1484375, -6.260498046875, -5.37255859375, -4.484619140625, -3.5966796875, -2.708740234375, -1.82080078125, -0.932861328125, -0.044921875, 0.843017578125, 1.73095703125, 2.618896484375, 3.5068359375, 4.394775390625, 5.28271484375, 6.170654296875, 7.05859375, 7.946533203125, 8.83447265625, 9.722412109375, 10.6103515625, 11.498291015625, 12.38623046875, 13.274169921875, 14.162109375, 15.050048828125, 15.93798828125, 16.825927734375, 17.7138671875, 18.601806640625, 19.48974609375, 20.377685546875, 21.265625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 8.0, 10.0, 15.0, 14.0, 26.0, 46.0, 88.0, 117.0, 192.0, 187.0, 143.0, 64.0, 34.0, 24.0, 15.0, 9.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-189.19717407226562, -184.57598876953125, -179.95480346679688, -175.33363342285156, -170.7124481201172, -166.0912628173828, -161.47007751464844, -156.84890747070312, -152.22772216796875, -147.60653686523438, -142.9853515625, -138.3641815185547, -133.7429962158203, -129.12181091308594, -124.50062561035156, -119.87944793701172, -115.25826263427734, -110.63707733154297, -106.01589965820312, -101.39471435546875, -96.7735366821289, -92.15235137939453, -87.53117370605469, -82.90998840332031, -78.28880310058594, -73.66761779785156, -69.04644012451172, -64.42525482177734, -59.8040771484375, -55.182891845703125, -50.561710357666016, -45.940528869628906, -41.31934356689453, -36.69816207885742, -32.07698059082031, -27.45579719543457, -22.83461570739746, -18.21343421936035, -13.59225082397461, -8.9710693359375, -4.349887847900391, 0.27129411697387695, 4.8924760818481445, 9.51365852355957, 14.13484001159668, 18.75602149963379, 23.37720489501953, 27.99838638305664, 32.61956787109375, 37.24074935913086, 41.86193084716797, 46.483116149902344, 51.10429382324219, 55.72547912597656, 60.34666061401367, 64.96784210205078, 69.58901977539062, 74.210205078125, 78.83138275146484, 83.45256805419922, 88.07374572753906, 92.69493103027344, 97.31611633300781, 101.93729400634766, 106.55847930908203]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 12.0, 12.0, 19.0, 13.0, 24.0, 24.0, 31.0, 27.0, 44.0, 45.0, 48.0, 52.0, 62.0, 67.0, 61.0, 53.0, 53.0, 48.0, 41.0, 45.0, 40.0, 24.0, 27.0, 19.0, 24.0, 17.0, 18.0, 10.0, 10.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.23884582519531, -61.92860412597656, -59.61836624145508, -57.30812454223633, -54.997886657714844, -52.687644958496094, -50.377403259277344, -48.06716537475586, -45.756927490234375, -43.446685791015625, -41.13644790649414, -38.82620620727539, -36.515968322753906, -34.205726623535156, -31.89548683166504, -29.585247039794922, -27.275005340576172, -24.964765548706055, -22.654525756835938, -20.344284057617188, -18.034046173095703, -15.72380542755127, -13.413564682006836, -11.103324890136719, -8.793085098266602, -6.482845306396484, -4.172605037689209, -1.8623647689819336, 0.4478750228881836, 2.758114814758301, 5.068355560302734, 7.378595352172852, 9.688835144042969, 11.999074935913086, 14.309314727783203, 16.619556427001953, 18.929794311523438, 21.240036010742188, 23.550275802612305, 25.860515594482422, 28.17075538635254, 30.480995178222656, 32.791236877441406, 35.10147476196289, 37.41171646118164, 39.721954345703125, 42.032196044921875, 44.342437744140625, 46.65267562866211, 48.96291732788086, 51.273155212402344, 53.583396911621094, 55.89363479614258, 58.20387649536133, 60.51411437988281, 62.82435607910156, 65.13459777832031, 67.44483947753906, 69.75508117675781, 72.06531524658203, 74.37555694580078, 76.68579864501953, 78.99604034423828, 81.3062744140625, 83.61651611328125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 7.0, 9.0, 18.0, 22.0, 22.0, 48.0, 53.0, 61.0, 91.0, 164.0, 248.0, 378.0, 607.0, 1041.0, 1806.0, 3371.0, 6296.0, 13200.0, 30055.0, 78474.0, 231757.0, 413005.0, 164919.0, 57597.0, 23030.0, 10364.0, 5231.0, 2783.0, 1497.0, 871.0, 521.0, 346.0, 193.0, 141.0, 91.0, 61.0, 42.0, 36.0, 28.0, 16.0, 12.0, 10.0, 11.0, 3.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-42.71875, -41.35595703125, -39.9931640625, -38.63037109375, -37.267578125, -35.90478515625, -34.5419921875, -33.17919921875, -31.81640625, -30.45361328125, -29.0908203125, -27.72802734375, -26.365234375, -25.00244140625, -23.6396484375, -22.27685546875, -20.9140625, -19.55126953125, -18.1884765625, -16.82568359375, -15.462890625, -14.10009765625, -12.7373046875, -11.37451171875, -10.01171875, -8.64892578125, -7.2861328125, -5.92333984375, -4.560546875, -3.19775390625, -1.8349609375, -0.47216796875, 0.890625, 2.25341796875, 3.6162109375, 4.97900390625, 6.341796875, 7.70458984375, 9.0673828125, 10.43017578125, 11.79296875, 13.15576171875, 14.5185546875, 15.88134765625, 17.244140625, 18.60693359375, 19.9697265625, 21.33251953125, 22.6953125, 24.05810546875, 25.4208984375, 26.78369140625, 28.146484375, 29.50927734375, 30.8720703125, 32.23486328125, 33.59765625, 34.96044921875, 36.3232421875, 37.68603515625, 39.048828125, 40.41162109375, 41.7744140625, 43.13720703125, 44.5]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 10.0, 12.0, 16.0, 16.0, 17.0, 23.0, 32.0, 45.0, 54.0, 43.0, 55.0, 57.0, 85.0, 79.0, 59.0, 62.0, 62.0, 53.0, 52.0, 38.0, 24.0, 22.0, 23.0, 14.0, 8.0, 8.0, 10.0, 6.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.06640625, -6.85394287109375, -6.6414794921875, -6.42901611328125, -6.216552734375, -6.00408935546875, -5.7916259765625, -5.57916259765625, -5.36669921875, -5.15423583984375, -4.9417724609375, -4.72930908203125, -4.516845703125, -4.30438232421875, -4.0919189453125, -3.87945556640625, -3.6669921875, -3.45452880859375, -3.2420654296875, -3.02960205078125, -2.817138671875, -2.60467529296875, -2.3922119140625, -2.17974853515625, -1.96728515625, -1.75482177734375, -1.5423583984375, -1.32989501953125, -1.117431640625, -0.90496826171875, -0.6925048828125, -0.48004150390625, -0.267578125, -0.05511474609375, 0.1573486328125, 0.36981201171875, 0.582275390625, 0.79473876953125, 1.0072021484375, 1.21966552734375, 1.43212890625, 1.64459228515625, 1.8570556640625, 2.06951904296875, 2.281982421875, 2.49444580078125, 2.7069091796875, 2.91937255859375, 3.1318359375, 3.34429931640625, 3.5567626953125, 3.76922607421875, 3.981689453125, 4.19415283203125, 4.4066162109375, 4.61907958984375, 4.83154296875, 5.04400634765625, 5.2564697265625, 5.46893310546875, 5.681396484375, 5.89385986328125, 6.1063232421875, 6.31878662109375, 6.53125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 7.0, 5.0, 12.0, 10.0, 18.0, 9.0, 13.0, 19.0, 36.0, 43.0, 61.0, 116.0, 119.0, 210.0, 334.0, 543.0, 971.0, 1737.0, 3297.0, 6617.0, 14642.0, 36731.0, 110571.0, 393290.0, 330548.0, 92059.0, 31317.0, 12744.0, 5808.0, 2957.0, 1529.0, 842.0, 508.0, 282.0, 175.0, 106.0, 73.0, 54.0, 38.0, 28.0, 28.0, 18.0, 14.0, 8.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.53125, -52.875, -51.21875, -49.5625, -47.90625, -46.25, -44.59375, -42.9375, -41.28125, -39.625, -37.96875, -36.3125, -34.65625, -33.0, -31.34375, -29.6875, -28.03125, -26.375, -24.71875, -23.0625, -21.40625, -19.75, -18.09375, -16.4375, -14.78125, -13.125, -11.46875, -9.8125, -8.15625, -6.5, -4.84375, -3.1875, -1.53125, 0.125, 1.78125, 3.4375, 5.09375, 6.75, 8.40625, 10.0625, 11.71875, 13.375, 15.03125, 16.6875, 18.34375, 20.0, 21.65625, 23.3125, 24.96875, 26.625, 28.28125, 29.9375, 31.59375, 33.25, 34.90625, 36.5625, 38.21875, 39.875, 41.53125, 43.1875, 44.84375, 46.5, 48.15625, 49.8125, 51.46875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 3.0, 6.0, 6.0, 8.0, 9.0, 13.0, 17.0, 12.0, 12.0, 23.0, 20.0, 31.0, 34.0, 33.0, 43.0, 34.0, 47.0, 44.0, 39.0, 33.0, 43.0, 41.0, 53.0, 52.0, 38.0, 38.0, 31.0, 39.0, 35.0, 31.0, 18.0, 23.0, 9.0, 10.0, 16.0, 7.0, 11.0, 9.0, 2.0, 9.0, 2.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.40625, -30.4423828125, -29.478515625, -28.5146484375, -27.55078125, -26.5869140625, -25.623046875, -24.6591796875, -23.6953125, -22.7314453125, -21.767578125, -20.8037109375, -19.83984375, -18.8759765625, -17.912109375, -16.9482421875, -15.984375, -15.0205078125, -14.056640625, -13.0927734375, -12.12890625, -11.1650390625, -10.201171875, -9.2373046875, -8.2734375, -7.3095703125, -6.345703125, -5.3818359375, -4.41796875, -3.4541015625, -2.490234375, -1.5263671875, -0.5625, 0.4013671875, 1.365234375, 2.3291015625, 3.29296875, 4.2568359375, 5.220703125, 6.1845703125, 7.1484375, 8.1123046875, 9.076171875, 10.0400390625, 11.00390625, 11.9677734375, 12.931640625, 13.8955078125, 14.859375, 15.8232421875, 16.787109375, 17.7509765625, 18.71484375, 19.6787109375, 20.642578125, 21.6064453125, 22.5703125, 23.5341796875, 24.498046875, 25.4619140625, 26.42578125, 27.3896484375, 28.353515625, 29.3173828125, 30.28125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 11.0, 20.0, 31.0, 49.0, 44.0, 67.0, 106.0, 153.0, 232.0, 324.0, 457.0, 695.0, 1035.0, 1460.0, 2100.0, 3271.0, 5364.0, 9288.0, 20146.0, 60397.0, 291035.0, 487473.0, 104811.0, 29304.0, 12501.0, 6425.0, 3953.0, 2465.0, 1744.0, 1118.0, 762.0, 506.0, 380.0, 260.0, 171.0, 128.0, 96.0, 64.0, 34.0, 33.0, 13.0, 13.0, 6.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.109375, -24.21875, -23.328125, -22.4375, -21.546875, -20.65625, -19.765625, -18.875, -17.984375, -17.09375, -16.203125, -15.3125, -14.421875, -13.53125, -12.640625, -11.75, -10.859375, -9.96875, -9.078125, -8.1875, -7.296875, -6.40625, -5.515625, -4.625, -3.734375, -2.84375, -1.953125, -1.0625, -0.171875, 0.71875, 1.609375, 2.5, 3.390625, 4.28125, 5.171875, 6.0625, 6.953125, 7.84375, 8.734375, 9.625, 10.515625, 11.40625, 12.296875, 13.1875, 14.078125, 14.96875, 15.859375, 16.75, 17.640625, 18.53125, 19.421875, 20.3125, 21.203125, 22.09375, 22.984375, 23.875, 24.765625, 25.65625, 26.546875, 27.4375, 28.328125, 29.21875, 30.109375, 31.0, 31.890625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 11.0, 7.0, 18.0, 20.0, 25.0, 53.0, 113.0, 162.0, 201.0, 156.0, 86.0, 54.0, 26.0, 20.0, 11.0, 11.0, 6.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00714111328125, -0.006860613822937012, -0.0065801143646240234, -0.006299614906311035, -0.006019115447998047, -0.005738615989685059, -0.00545811653137207, -0.005177617073059082, -0.004897117614746094, -0.0046166181564331055, -0.004336118698120117, -0.004055619239807129, -0.0037751197814941406, -0.0034946203231811523, -0.003214120864868164, -0.0029336214065551758, -0.0026531219482421875, -0.0023726224899291992, -0.002092123031616211, -0.0018116235733032227, -0.0015311241149902344, -0.001250624656677246, -0.0009701251983642578, -0.0006896257400512695, -0.00040912628173828125, -0.00012862682342529297, 0.0001518726348876953, 0.0004323720932006836, 0.0007128715515136719, 0.0009933710098266602, 0.0012738704681396484, 0.0015543699264526367, 0.001834869384765625, 0.0021153688430786133, 0.0023958683013916016, 0.00267636775970459, 0.002956867218017578, 0.0032373666763305664, 0.0035178661346435547, 0.003798365592956543, 0.004078865051269531, 0.0043593645095825195, 0.004639863967895508, 0.004920363426208496, 0.005200862884521484, 0.005481362342834473, 0.005761861801147461, 0.006042361259460449, 0.0063228607177734375, 0.006603360176086426, 0.006883859634399414, 0.007164359092712402, 0.007444858551025391, 0.007725358009338379, 0.008005857467651367, 0.008286356925964355, 0.008566856384277344, 0.008847355842590332, 0.00912785530090332, 0.009408354759216309, 0.009688854217529297, 0.009969353675842285, 0.010249853134155273, 0.010530352592468262, 0.01081085205078125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 9.0, 13.0, 13.0, 13.0, 24.0, 42.0, 46.0, 93.0, 120.0, 201.0, 409.0, 640.0, 1258.0, 2463.0, 5335.0, 14037.0, 68065.0, 754202.0, 165265.0, 22428.0, 7191.0, 3109.0, 1591.0, 825.0, 480.0, 251.0, 160.0, 88.0, 50.0, 42.0, 23.0, 24.0, 10.0, 5.0, 4.0, 3.0, 8.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.40625, -58.5576171875, -56.708984375, -54.8603515625, -53.01171875, -51.1630859375, -49.314453125, -47.4658203125, -45.6171875, -43.7685546875, -41.919921875, -40.0712890625, -38.22265625, -36.3740234375, -34.525390625, -32.6767578125, -30.828125, -28.9794921875, -27.130859375, -25.2822265625, -23.43359375, -21.5849609375, -19.736328125, -17.8876953125, -16.0390625, -14.1904296875, -12.341796875, -10.4931640625, -8.64453125, -6.7958984375, -4.947265625, -3.0986328125, -1.25, 0.5986328125, 2.447265625, 4.2958984375, 6.14453125, 7.9931640625, 9.841796875, 11.6904296875, 13.5390625, 15.3876953125, 17.236328125, 19.0849609375, 20.93359375, 22.7822265625, 24.630859375, 26.4794921875, 28.328125, 30.1767578125, 32.025390625, 33.8740234375, 35.72265625, 37.5712890625, 39.419921875, 41.2685546875, 43.1171875, 44.9658203125, 46.814453125, 48.6630859375, 50.51171875, 52.3603515625, 54.208984375, 56.0576171875, 57.90625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 9.0, 2.0, 13.0, 15.0, 27.0, 46.0, 64.0, 92.0, 158.0, 144.0, 139.0, 80.0, 54.0, 30.0, 18.0, 12.0, 13.0, 13.0, 9.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.890625, -28.9658203125, -28.041015625, -27.1162109375, -26.19140625, -25.2666015625, -24.341796875, -23.4169921875, -22.4921875, -21.5673828125, -20.642578125, -19.7177734375, -18.79296875, -17.8681640625, -16.943359375, -16.0185546875, -15.09375, -14.1689453125, -13.244140625, -12.3193359375, -11.39453125, -10.4697265625, -9.544921875, -8.6201171875, -7.6953125, -6.7705078125, -5.845703125, -4.9208984375, -3.99609375, -3.0712890625, -2.146484375, -1.2216796875, -0.296875, 0.6279296875, 1.552734375, 2.4775390625, 3.40234375, 4.3271484375, 5.251953125, 6.1767578125, 7.1015625, 8.0263671875, 8.951171875, 9.8759765625, 10.80078125, 11.7255859375, 12.650390625, 13.5751953125, 14.5, 15.4248046875, 16.349609375, 17.2744140625, 18.19921875, 19.1240234375, 20.048828125, 20.9736328125, 21.8984375, 22.8232421875, 23.748046875, 24.6728515625, 25.59765625, 26.5224609375, 27.447265625, 28.3720703125, 29.296875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 8.0, 8.0, 5.0, 10.0, 14.0, 36.0, 44.0, 92.0, 101.0, 141.0, 186.0, 126.0, 71.0, 55.0, 39.0, 16.0, 14.0, 19.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-296.50390625, -284.24200439453125, -271.9801330566406, -259.7182312011719, -247.4563446044922, -235.1944580078125, -222.93255615234375, -210.67066955566406, -198.40878295898438, -186.1468963623047, -173.88499450683594, -161.62310791015625, -149.36122131347656, -137.09933471679688, -124.83743286132812, -112.57554626464844, -100.31364440917969, -88.05175018310547, -75.78986358642578, -63.52796936035156, -51.26607894897461, -39.004188537597656, -26.742294311523438, -14.48040771484375, -2.2185134887695312, 10.043377876281738, 22.305269241333008, 34.567161560058594, 46.82905197143555, 59.0909423828125, 71.35283660888672, 83.6147232055664, 95.87661743164062, 108.13851165771484, 120.40039825439453, 132.66229248046875, 144.92417907714844, 157.18606567382812, 169.44796752929688, 181.70985412597656, 193.97174072265625, 206.23362731933594, 218.4955291748047, 230.75741577148438, 243.01930236816406, 255.28118896484375, 267.5430908203125, 279.80499267578125, 292.06689453125, 304.32879638671875, 316.5906677246094, 328.8525695800781, 341.1144714355469, 353.3763427734375, 365.63824462890625, 377.900146484375, 390.1620178222656, 402.4239196777344, 414.685791015625, 426.94769287109375, 439.2095947265625, 451.4714660644531, 463.7333679199219, 475.9952392578125, 488.25714111328125]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 1.0, 3.0, 7.0, 11.0, 6.0, 11.0, 9.0, 12.0, 14.0, 19.0, 13.0, 28.0, 26.0, 31.0, 26.0, 32.0, 35.0, 28.0, 41.0, 51.0, 46.0, 36.0, 34.0, 41.0, 51.0, 48.0, 41.0, 42.0, 34.0, 29.0, 35.0, 33.0, 14.0, 27.0, 14.0, 9.0, 16.0, 16.0, 8.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-254.588623046875, -247.61636352539062, -240.64410400390625, -233.67184448242188, -226.69956970214844, -219.72731018066406, -212.7550506591797, -205.7827911376953, -198.81051635742188, -191.8382568359375, -184.86599731445312, -177.89373779296875, -170.9214630126953, -163.94920349121094, -156.97694396972656, -150.0046844482422, -143.0324249267578, -136.06016540527344, -129.08790588378906, -122.11563873291016, -115.14337158203125, -108.17111206054688, -101.1988525390625, -94.22659301757812, -87.25432586669922, -80.28206634521484, -73.30979919433594, -66.33753967285156, -59.36527633666992, -52.39301300048828, -45.420753479003906, -38.448490142822266, -31.476242065429688, -24.503978729248047, -17.53171730041504, -10.559455871582031, -3.5871925354003906, 3.38507080078125, 10.357330322265625, 17.329593658447266, 24.301856994628906, 31.274120330810547, 38.24638366699219, 45.21864318847656, 52.1909065246582, 59.163169860839844, 66.13542938232422, 73.10769653320312, 80.0799560546875, 87.05221557617188, 94.02448272705078, 100.99674224853516, 107.96900939941406, 114.94126892089844, 121.91352844238281, 128.8857879638672, 135.85806274414062, 142.830322265625, 149.80258178710938, 156.77484130859375, 163.7471160888672, 170.71937561035156, 177.69163513183594, 184.6638946533203, 191.6361541748047]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 8.0, 5.0, 3.0, 7.0, 6.0, 9.0, 15.0, 22.0, 17.0, 47.0, 61.0, 79.0, 104.0, 180.0, 262.0, 416.0, 730.0, 1196.0, 2180.0, 4479.0, 10078.0, 26491.0, 97076.0, 3627172.0, 341345.0, 50854.0, 16644.0, 6961.0, 3430.0, 1742.0, 993.0, 619.0, 350.0, 229.0, 152.0, 103.0, 70.0, 49.0, 36.0, 19.0, 10.0, 9.0, 2.0, 5.0, 4.0, 5.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-68.6875, -66.5263671875, -64.365234375, -62.2041015625, -60.04296875, -57.8818359375, -55.720703125, -53.5595703125, -51.3984375, -49.2373046875, -47.076171875, -44.9150390625, -42.75390625, -40.5927734375, -38.431640625, -36.2705078125, -34.109375, -31.9482421875, -29.787109375, -27.6259765625, -25.46484375, -23.3037109375, -21.142578125, -18.9814453125, -16.8203125, -14.6591796875, -12.498046875, -10.3369140625, -8.17578125, -6.0146484375, -3.853515625, -1.6923828125, 0.46875, 2.6298828125, 4.791015625, 6.9521484375, 9.11328125, 11.2744140625, 13.435546875, 15.5966796875, 17.7578125, 19.9189453125, 22.080078125, 24.2412109375, 26.40234375, 28.5634765625, 30.724609375, 32.8857421875, 35.046875, 37.2080078125, 39.369140625, 41.5302734375, 43.69140625, 45.8525390625, 48.013671875, 50.1748046875, 52.3359375, 54.4970703125, 56.658203125, 58.8193359375, 60.98046875, 63.1416015625, 65.302734375, 67.4638671875, 69.625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 10.0, 8.0, 13.0, 12.0, 23.0, 29.0, 36.0, 36.0, 30.0, 49.0, 50.0, 56.0, 65.0, 57.0, 59.0, 54.0, 61.0, 43.0, 43.0, 35.0, 50.0, 32.0, 33.0, 27.0, 17.0, 13.0, 9.0, 9.0, 10.0, 10.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.046875, -5.825927734375, -5.60498046875, -5.384033203125, -5.1630859375, -4.942138671875, -4.72119140625, -4.500244140625, -4.279296875, -4.058349609375, -3.83740234375, -3.616455078125, -3.3955078125, -3.174560546875, -2.95361328125, -2.732666015625, -2.51171875, -2.290771484375, -2.06982421875, -1.848876953125, -1.6279296875, -1.406982421875, -1.18603515625, -0.965087890625, -0.744140625, -0.523193359375, -0.30224609375, -0.081298828125, 0.1396484375, 0.360595703125, 0.58154296875, 0.802490234375, 1.0234375, 1.244384765625, 1.46533203125, 1.686279296875, 1.9072265625, 2.128173828125, 2.34912109375, 2.570068359375, 2.791015625, 3.011962890625, 3.23291015625, 3.453857421875, 3.6748046875, 3.895751953125, 4.11669921875, 4.337646484375, 4.55859375, 4.779541015625, 5.00048828125, 5.221435546875, 5.4423828125, 5.663330078125, 5.88427734375, 6.105224609375, 6.326171875, 6.547119140625, 6.76806640625, 6.989013671875, 7.2099609375, 7.430908203125, 7.65185546875, 7.872802734375, 8.09375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 5.0, 9.0, 8.0, 18.0, 35.0, 23.0, 36.0, 40.0, 75.0, 112.0, 205.0, 343.0, 651.0, 1324.0, 2777.0, 6446.0, 18874.0, 83110.0, 3353880.0, 644200.0, 57770.0, 14358.0, 5254.0, 2252.0, 1094.0, 581.0, 287.0, 179.0, 105.0, 69.0, 52.0, 38.0, 22.0, 22.0, 10.0, 9.0, 5.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.25, -90.4150390625, -87.580078125, -84.7451171875, -81.91015625, -79.0751953125, -76.240234375, -73.4052734375, -70.5703125, -67.7353515625, -64.900390625, -62.0654296875, -59.23046875, -56.3955078125, -53.560546875, -50.7255859375, -47.890625, -45.0556640625, -42.220703125, -39.3857421875, -36.55078125, -33.7158203125, -30.880859375, -28.0458984375, -25.2109375, -22.3759765625, -19.541015625, -16.7060546875, -13.87109375, -11.0361328125, -8.201171875, -5.3662109375, -2.53125, 0.3037109375, 3.138671875, 5.9736328125, 8.80859375, 11.6435546875, 14.478515625, 17.3134765625, 20.1484375, 22.9833984375, 25.818359375, 28.6533203125, 31.48828125, 34.3232421875, 37.158203125, 39.9931640625, 42.828125, 45.6630859375, 48.498046875, 51.3330078125, 54.16796875, 57.0029296875, 59.837890625, 62.6728515625, 65.5078125, 68.3427734375, 71.177734375, 74.0126953125, 76.84765625, 79.6826171875, 82.517578125, 85.3525390625, 88.1875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 12.0, 12.0, 15.0, 19.0, 27.0, 53.0, 79.0, 157.0, 415.0, 2587.0, 327.0, 156.0, 81.0, 40.0, 34.0, 15.0, 12.0, 7.0, 6.0, 2.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.5625, -27.732666015625, -26.90283203125, -26.072998046875, -25.2431640625, -24.413330078125, -23.58349609375, -22.753662109375, -21.923828125, -21.093994140625, -20.26416015625, -19.434326171875, -18.6044921875, -17.774658203125, -16.94482421875, -16.114990234375, -15.28515625, -14.455322265625, -13.62548828125, -12.795654296875, -11.9658203125, -11.135986328125, -10.30615234375, -9.476318359375, -8.646484375, -7.816650390625, -6.98681640625, -6.156982421875, -5.3271484375, -4.497314453125, -3.66748046875, -2.837646484375, -2.0078125, -1.177978515625, -0.34814453125, 0.481689453125, 1.3115234375, 2.141357421875, 2.97119140625, 3.801025390625, 4.630859375, 5.460693359375, 6.29052734375, 7.120361328125, 7.9501953125, 8.780029296875, 9.60986328125, 10.439697265625, 11.26953125, 12.099365234375, 12.92919921875, 13.759033203125, 14.5888671875, 15.418701171875, 16.24853515625, 17.078369140625, 17.908203125, 18.738037109375, 19.56787109375, 20.397705078125, 21.2275390625, 22.057373046875, 22.88720703125, 23.717041015625, 24.546875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 11.0, 22.0, 27.0, 36.0, 61.0, 104.0, 132.0, 155.0, 143.0, 125.0, 70.0, 45.0, 25.0, 19.0, 10.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.69446563720703, -111.07264709472656, -107.45083618164062, -103.82901763916016, -100.20720672607422, -96.58538818359375, -92.96357727050781, -89.34175872802734, -85.7199478149414, -82.09812927246094, -78.476318359375, -74.85449981689453, -71.2326889038086, -67.61087036132812, -63.98905944824219, -60.36724090576172, -56.745426177978516, -53.12361145019531, -49.50179672241211, -45.879981994628906, -42.2581672668457, -38.6363525390625, -35.01453399658203, -31.39272117614746, -27.770906448364258, -24.149091720581055, -20.52727699279785, -16.905460357666016, -13.283646583557129, -9.66183090209961, -6.040016174316406, -2.418201446533203, 1.20361328125, 4.825428009033203, 8.447242736816406, 12.069058418273926, 15.690873146057129, 19.31268882751465, 22.93450355529785, 26.556318283081055, 30.178133010864258, 33.799949645996094, 37.4217643737793, 41.0435791015625, 44.6653938293457, 48.287208557128906, 51.90902328491211, 55.53083801269531, 59.152652740478516, 62.77446746826172, 66.39628601074219, 70.01809692382812, 73.6399154663086, 77.26172637939453, 80.883544921875, 84.50535583496094, 88.1271743774414, 91.74899291992188, 95.37080383300781, 98.99262237548828, 102.61443328857422, 106.23625183105469, 109.85806274414062, 113.4798812866211, 117.10169219970703]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 6.0, 2.0, 1.0, 2.0, 3.0, 6.0, 7.0, 8.0, 8.0, 18.0, 16.0, 18.0, 23.0, 28.0, 25.0, 22.0, 21.0, 34.0, 31.0, 38.0, 38.0, 37.0, 39.0, 34.0, 41.0, 27.0, 38.0, 41.0, 51.0, 35.0, 30.0, 38.0, 21.0, 29.0, 27.0, 17.0, 28.0, 26.0, 17.0, 10.0, 16.0, 12.0, 12.0, 6.0, 4.0, 2.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.5582389831543, -44.98756408691406, -43.41688537597656, -41.84620666503906, -40.27553176879883, -38.704856872558594, -37.134178161621094, -35.563499450683594, -33.99282455444336, -32.422149658203125, -30.851470947265625, -29.280794143676758, -27.71011734008789, -26.139440536499023, -24.568763732910156, -22.99808692932129, -21.427410125732422, -19.856733322143555, -18.286056518554688, -16.71537971496582, -15.144702911376953, -13.574026107788086, -12.003349304199219, -10.432672500610352, -8.861995697021484, -7.291318893432617, -5.72064208984375, -4.149965286254883, -2.5792884826660156, -1.0086116790771484, 0.5620651245117188, 2.132741928100586, 3.7034225463867188, 5.274099349975586, 6.844776153564453, 8.41545295715332, 9.986129760742188, 11.556806564331055, 13.127483367919922, 14.698160171508789, 16.268836975097656, 17.839513778686523, 19.41019058227539, 20.980867385864258, 22.551544189453125, 24.122220993041992, 25.69289779663086, 27.263574600219727, 28.834251403808594, 30.40492820739746, 31.975605010986328, 33.54627990722656, 35.11695861816406, 36.68763732910156, 38.2583122253418, 39.82898712158203, 41.39966583251953, 42.97034454345703, 44.541019439697266, 46.1116943359375, 47.682373046875, 49.2530517578125, 50.823726654052734, 52.39440155029297, 53.96508026123047]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 2.0, 0.0, 7.0, 9.0, 13.0, 22.0, 34.0, 35.0, 55.0, 100.0, 102.0, 233.0, 366.0, 566.0, 926.0, 1650.0, 2944.0, 5763.0, 11578.0, 24762.0, 57560.0, 148383.0, 368619.0, 255669.0, 94931.0, 39032.0, 17239.0, 8284.0, 4204.0, 2244.0, 1198.0, 752.0, 459.0, 278.0, 169.0, 122.0, 74.0, 50.0, 38.0, 24.0, 16.0, 17.0, 14.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.125, -34.91162109375, -33.6982421875, -32.48486328125, -31.271484375, -30.05810546875, -28.8447265625, -27.63134765625, -26.41796875, -25.20458984375, -23.9912109375, -22.77783203125, -21.564453125, -20.35107421875, -19.1376953125, -17.92431640625, -16.7109375, -15.49755859375, -14.2841796875, -13.07080078125, -11.857421875, -10.64404296875, -9.4306640625, -8.21728515625, -7.00390625, -5.79052734375, -4.5771484375, -3.36376953125, -2.150390625, -0.93701171875, 0.2763671875, 1.48974609375, 2.703125, 3.91650390625, 5.1298828125, 6.34326171875, 7.556640625, 8.77001953125, 9.9833984375, 11.19677734375, 12.41015625, 13.62353515625, 14.8369140625, 16.05029296875, 17.263671875, 18.47705078125, 19.6904296875, 20.90380859375, 22.1171875, 23.33056640625, 24.5439453125, 25.75732421875, 26.970703125, 28.18408203125, 29.3974609375, 30.61083984375, 31.82421875, 33.03759765625, 34.2509765625, 35.46435546875, 36.677734375, 37.89111328125, 39.1044921875, 40.31787109375, 41.53125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 8.0, 10.0, 8.0, 13.0, 28.0, 38.0, 40.0, 40.0, 47.0, 70.0, 68.0, 59.0, 66.0, 72.0, 62.0, 54.0, 66.0, 50.0, 36.0, 29.0, 33.0, 23.0, 16.0, 14.0, 8.0, 15.0, 9.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.71875, -8.4537353515625, -8.188720703125, -7.9237060546875, -7.65869140625, -7.3936767578125, -7.128662109375, -6.8636474609375, -6.5986328125, -6.3336181640625, -6.068603515625, -5.8035888671875, -5.53857421875, -5.2735595703125, -5.008544921875, -4.7435302734375, -4.478515625, -4.2135009765625, -3.948486328125, -3.6834716796875, -3.41845703125, -3.1534423828125, -2.888427734375, -2.6234130859375, -2.3583984375, -2.0933837890625, -1.828369140625, -1.5633544921875, -1.29833984375, -1.0333251953125, -0.768310546875, -0.5032958984375, -0.23828125, 0.0267333984375, 0.291748046875, 0.5567626953125, 0.82177734375, 1.0867919921875, 1.351806640625, 1.6168212890625, 1.8818359375, 2.1468505859375, 2.411865234375, 2.6768798828125, 2.94189453125, 3.2069091796875, 3.471923828125, 3.7369384765625, 4.001953125, 4.2669677734375, 4.531982421875, 4.7969970703125, 5.06201171875, 5.3270263671875, 5.592041015625, 5.8570556640625, 6.1220703125, 6.3870849609375, 6.652099609375, 6.9171142578125, 7.18212890625, 7.4471435546875, 7.712158203125, 7.9771728515625, 8.2421875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 8.0, 7.0, 8.0, 16.0, 28.0, 34.0, 42.0, 67.0, 117.0, 194.0, 280.0, 458.0, 818.0, 1335.0, 2284.0, 4323.0, 8027.0, 16583.0, 36610.0, 96332.0, 310286.0, 372038.0, 117124.0, 42833.0, 18752.0, 8981.0, 4652.0, 2597.0, 1429.0, 819.0, 512.0, 349.0, 180.0, 133.0, 100.0, 58.0, 39.0, 27.0, 18.0, 17.0, 12.0, 13.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-44.75, -43.3974609375, -42.044921875, -40.6923828125, -39.33984375, -37.9873046875, -36.634765625, -35.2822265625, -33.9296875, -32.5771484375, -31.224609375, -29.8720703125, -28.51953125, -27.1669921875, -25.814453125, -24.4619140625, -23.109375, -21.7568359375, -20.404296875, -19.0517578125, -17.69921875, -16.3466796875, -14.994140625, -13.6416015625, -12.2890625, -10.9365234375, -9.583984375, -8.2314453125, -6.87890625, -5.5263671875, -4.173828125, -2.8212890625, -1.46875, -0.1162109375, 1.236328125, 2.5888671875, 3.94140625, 5.2939453125, 6.646484375, 7.9990234375, 9.3515625, 10.7041015625, 12.056640625, 13.4091796875, 14.76171875, 16.1142578125, 17.466796875, 18.8193359375, 20.171875, 21.5244140625, 22.876953125, 24.2294921875, 25.58203125, 26.9345703125, 28.287109375, 29.6396484375, 30.9921875, 32.3447265625, 33.697265625, 35.0498046875, 36.40234375, 37.7548828125, 39.107421875, 40.4599609375, 41.8125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 12.0, 6.0, 7.0, 9.0, 10.0, 13.0, 19.0, 16.0, 23.0, 39.0, 32.0, 37.0, 46.0, 51.0, 50.0, 52.0, 57.0, 42.0, 53.0, 54.0, 48.0, 38.0, 40.0, 36.0, 29.0, 26.0, 25.0, 22.0, 24.0, 16.0, 10.0, 14.0, 15.0, 10.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.78125, -42.5419921875, -41.302734375, -40.0634765625, -38.82421875, -37.5849609375, -36.345703125, -35.1064453125, -33.8671875, -32.6279296875, -31.388671875, -30.1494140625, -28.91015625, -27.6708984375, -26.431640625, -25.1923828125, -23.953125, -22.7138671875, -21.474609375, -20.2353515625, -18.99609375, -17.7568359375, -16.517578125, -15.2783203125, -14.0390625, -12.7998046875, -11.560546875, -10.3212890625, -9.08203125, -7.8427734375, -6.603515625, -5.3642578125, -4.125, -2.8857421875, -1.646484375, -0.4072265625, 0.83203125, 2.0712890625, 3.310546875, 4.5498046875, 5.7890625, 7.0283203125, 8.267578125, 9.5068359375, 10.74609375, 11.9853515625, 13.224609375, 14.4638671875, 15.703125, 16.9423828125, 18.181640625, 19.4208984375, 20.66015625, 21.8994140625, 23.138671875, 24.3779296875, 25.6171875, 26.8564453125, 28.095703125, 29.3349609375, 30.57421875, 31.8134765625, 33.052734375, 34.2919921875, 35.53125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 14.0, 17.0, 17.0, 22.0, 17.0, 40.0, 70.0, 109.0, 131.0, 145.0, 222.0, 365.0, 493.0, 721.0, 1161.0, 1887.0, 3991.0, 11952.0, 76858.0, 765024.0, 156605.0, 17371.0, 5159.0, 2313.0, 1262.0, 818.0, 557.0, 352.0, 263.0, 182.0, 111.0, 84.0, 52.0, 46.0, 40.0, 32.0, 9.0, 17.0, 4.0, 4.0, 3.0, 6.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.4375, -39.990234375, -38.54296875, -37.095703125, -35.6484375, -34.201171875, -32.75390625, -31.306640625, -29.859375, -28.412109375, -26.96484375, -25.517578125, -24.0703125, -22.623046875, -21.17578125, -19.728515625, -18.28125, -16.833984375, -15.38671875, -13.939453125, -12.4921875, -11.044921875, -9.59765625, -8.150390625, -6.703125, -5.255859375, -3.80859375, -2.361328125, -0.9140625, 0.533203125, 1.98046875, 3.427734375, 4.875, 6.322265625, 7.76953125, 9.216796875, 10.6640625, 12.111328125, 13.55859375, 15.005859375, 16.453125, 17.900390625, 19.34765625, 20.794921875, 22.2421875, 23.689453125, 25.13671875, 26.583984375, 28.03125, 29.478515625, 30.92578125, 32.373046875, 33.8203125, 35.267578125, 36.71484375, 38.162109375, 39.609375, 41.056640625, 42.50390625, 43.951171875, 45.3984375, 46.845703125, 48.29296875, 49.740234375, 51.1875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 3.0, 21.0, 30.0, 121.0, 446.0, 253.0, 72.0, 24.0, 16.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0269775390625, -0.0263746976852417, -0.0257718563079834, -0.025169014930725098, -0.024566173553466797, -0.023963332176208496, -0.023360490798950195, -0.022757649421691895, -0.022154808044433594, -0.021551966667175293, -0.020949125289916992, -0.02034628391265869, -0.01974344253540039, -0.01914060115814209, -0.01853775978088379, -0.01793491840362549, -0.017332077026367188, -0.016729235649108887, -0.016126394271850586, -0.015523552894592285, -0.014920711517333984, -0.014317870140075684, -0.013715028762817383, -0.013112187385559082, -0.012509346008300781, -0.01190650463104248, -0.01130366325378418, -0.010700821876525879, -0.010097980499267578, -0.009495139122009277, -0.008892297744750977, -0.008289456367492676, -0.007686614990234375, -0.007083773612976074, -0.0064809322357177734, -0.005878090858459473, -0.005275249481201172, -0.004672408103942871, -0.00406956672668457, -0.0034667253494262695, -0.0028638839721679688, -0.002261042594909668, -0.0016582012176513672, -0.0010553598403930664, -0.0004525184631347656, 0.00015032291412353516, 0.0007531642913818359, 0.0013560056686401367, 0.0019588470458984375, 0.0025616884231567383, 0.003164529800415039, 0.00376737117767334, 0.004370212554931641, 0.004973053932189941, 0.005575895309448242, 0.006178736686706543, 0.006781578063964844, 0.0073844194412231445, 0.007987260818481445, 0.008590102195739746, 0.009192943572998047, 0.009795784950256348, 0.010398626327514648, 0.01100146770477295, 0.01160430908203125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 11.0, 10.0, 32.0, 33.0, 35.0, 52.0, 69.0, 103.0, 164.0, 264.0, 379.0, 594.0, 934.0, 1616.0, 3179.0, 8660.0, 45211.0, 661392.0, 289432.0, 24171.0, 5950.0, 2449.0, 1415.0, 854.0, 493.0, 342.0, 209.0, 163.0, 106.0, 65.0, 52.0, 28.0, 24.0, 11.0, 16.0, 7.0, 6.0, 7.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-56.09375, -54.611328125, -53.12890625, -51.646484375, -50.1640625, -48.681640625, -47.19921875, -45.716796875, -44.234375, -42.751953125, -41.26953125, -39.787109375, -38.3046875, -36.822265625, -35.33984375, -33.857421875, -32.375, -30.892578125, -29.41015625, -27.927734375, -26.4453125, -24.962890625, -23.48046875, -21.998046875, -20.515625, -19.033203125, -17.55078125, -16.068359375, -14.5859375, -13.103515625, -11.62109375, -10.138671875, -8.65625, -7.173828125, -5.69140625, -4.208984375, -2.7265625, -1.244140625, 0.23828125, 1.720703125, 3.203125, 4.685546875, 6.16796875, 7.650390625, 9.1328125, 10.615234375, 12.09765625, 13.580078125, 15.0625, 16.544921875, 18.02734375, 19.509765625, 20.9921875, 22.474609375, 23.95703125, 25.439453125, 26.921875, 28.404296875, 29.88671875, 31.369140625, 32.8515625, 34.333984375, 35.81640625, 37.298828125, 38.78125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 8.0, 4.0, 11.0, 19.0, 27.0, 46.0, 66.0, 112.0, 168.0, 176.0, 132.0, 85.0, 54.0, 24.0, 22.0, 17.0, 8.0, 6.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-38.09375, -37.0986328125, -36.103515625, -35.1083984375, -34.11328125, -33.1181640625, -32.123046875, -31.1279296875, -30.1328125, -29.1376953125, -28.142578125, -27.1474609375, -26.15234375, -25.1572265625, -24.162109375, -23.1669921875, -22.171875, -21.1767578125, -20.181640625, -19.1865234375, -18.19140625, -17.1962890625, -16.201171875, -15.2060546875, -14.2109375, -13.2158203125, -12.220703125, -11.2255859375, -10.23046875, -9.2353515625, -8.240234375, -7.2451171875, -6.25, -5.2548828125, -4.259765625, -3.2646484375, -2.26953125, -1.2744140625, -0.279296875, 0.7158203125, 1.7109375, 2.7060546875, 3.701171875, 4.6962890625, 5.69140625, 6.6865234375, 7.681640625, 8.6767578125, 9.671875, 10.6669921875, 11.662109375, 12.6572265625, 13.65234375, 14.6474609375, 15.642578125, 16.6376953125, 17.6328125, 18.6279296875, 19.623046875, 20.6181640625, 21.61328125, 22.6083984375, 23.603515625, 24.5986328125, 25.59375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 7.0, 8.0, 9.0, 14.0, 18.0, 21.0, 38.0, 35.0, 48.0, 62.0, 87.0, 103.0, 91.0, 93.0, 76.0, 68.0, 56.0, 40.0, 25.0, 25.0, 25.0, 13.0, 9.0, 7.0, 2.0, 6.0, 3.0, 7.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-176.0668182373047, -168.53146362304688, -160.99612426757812, -153.4607696533203, -145.9254150390625, -138.39007568359375, -130.85472106933594, -123.31936645507812, -115.78401947021484, -108.24867248535156, -100.71331787109375, -93.17797088623047, -85.64262390136719, -78.10726928710938, -70.5719223022461, -63.03657150268555, -55.501220703125, -47.96586990356445, -40.430519104003906, -32.895172119140625, -25.359821319580078, -17.82447052001953, -10.28912353515625, -2.753772735595703, 4.781578063964844, 12.316927909851074, 19.852277755737305, 27.38762664794922, 34.922977447509766, 42.45832824707031, 49.993675231933594, 57.52902603149414, 65.06439208984375, 72.59973907470703, 80.13509368896484, 87.67044067382812, 95.20579528808594, 102.74114227294922, 110.2764892578125, 117.81184387207031, 125.3471908569336, 132.88253784179688, 140.4178924560547, 147.9532470703125, 155.48858642578125, 163.02394104003906, 170.55929565429688, 178.09463500976562, 185.62998962402344, 193.16534423828125, 200.70068359375, 208.2360382080078, 215.77139282226562, 223.30673217773438, 230.8420867919922, 238.37744140625, 245.91278076171875, 253.44813537597656, 260.9834899902344, 268.5188293457031, 276.0541687011719, 283.58953857421875, 291.1248779296875, 298.66021728515625, 306.1955871582031]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 4.0, 5.0, 5.0, 6.0, 8.0, 11.0, 18.0, 12.0, 22.0, 22.0, 21.0, 29.0, 31.0, 38.0, 46.0, 32.0, 36.0, 47.0, 39.0, 58.0, 45.0, 59.0, 31.0, 37.0, 32.0, 51.0, 32.0, 35.0, 30.0, 21.0, 30.0, 19.0, 17.0, 13.0, 13.0, 5.0, 5.0, 12.0, 9.0, 6.0, 1.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-201.77781677246094, -195.5265350341797, -189.27525329589844, -183.0239715576172, -176.77268981933594, -170.52142333984375, -164.2701416015625, -158.01885986328125, -151.767578125, -145.51629638671875, -139.2650146484375, -133.01373291015625, -126.76245880126953, -120.51117706298828, -114.25989532470703, -108.00862121582031, -101.75733184814453, -95.50605010986328, -89.25476837158203, -83.00349426269531, -76.75221252441406, -70.50093078613281, -64.24964904785156, -57.99837112426758, -51.74708938598633, -45.49580764770508, -39.244529724121094, -32.993247985839844, -26.741968154907227, -20.49068832397461, -14.23940658569336, -7.988128662109375, -1.736846923828125, 4.51443338394165, 10.765713691711426, 17.01699447631836, 23.268274307250977, 29.519554138183594, 35.770835876464844, 42.02211380004883, 48.27339553833008, 54.52467727661133, 60.77595520019531, 67.02723693847656, 73.27851867675781, 79.52980041503906, 85.78108215332031, 92.03235626220703, 98.28363800048828, 104.53491973876953, 110.78620147705078, 117.0374755859375, 123.28875732421875, 129.5400390625, 135.79132080078125, 142.0426025390625, 148.29388427734375, 154.545166015625, 160.79644775390625, 167.0477294921875, 173.29901123046875, 179.55029296875, 185.80157470703125, 192.05284118652344, 198.3041229248047]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 2.0, 8.0, 12.0, 11.0, 20.0, 34.0, 41.0, 77.0, 116.0, 178.0, 297.0, 564.0, 993.0, 2302.0, 5913.0, 20776.0, 162451.0, 3920404.0, 60440.0, 12126.0, 4065.0, 1609.0, 817.0, 401.0, 227.0, 134.0, 87.0, 68.0, 37.0, 23.0, 16.0, 11.0, 10.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-101.5, -98.541015625, -95.58203125, -92.623046875, -89.6640625, -86.705078125, -83.74609375, -80.787109375, -77.828125, -74.869140625, -71.91015625, -68.951171875, -65.9921875, -63.033203125, -60.07421875, -57.115234375, -54.15625, -51.197265625, -48.23828125, -45.279296875, -42.3203125, -39.361328125, -36.40234375, -33.443359375, -30.484375, -27.525390625, -24.56640625, -21.607421875, -18.6484375, -15.689453125, -12.73046875, -9.771484375, -6.8125, -3.853515625, -0.89453125, 2.064453125, 5.0234375, 7.982421875, 10.94140625, 13.900390625, 16.859375, 19.818359375, 22.77734375, 25.736328125, 28.6953125, 31.654296875, 34.61328125, 37.572265625, 40.53125, 43.490234375, 46.44921875, 49.408203125, 52.3671875, 55.326171875, 58.28515625, 61.244140625, 64.203125, 67.162109375, 70.12109375, 73.080078125, 76.0390625, 78.998046875, 81.95703125, 84.916015625, 87.875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 18.0, 22.0, 22.0, 23.0, 20.0, 36.0, 39.0, 44.0, 51.0, 55.0, 63.0, 52.0, 55.0, 67.0, 43.0, 58.0, 51.0, 39.0, 36.0, 42.0, 28.0, 20.0, 18.0, 16.0, 12.0, 18.0, 14.0, 7.0, 5.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.3671875, -8.11834716796875, -7.8695068359375, -7.62066650390625, -7.371826171875, -7.12298583984375, -6.8741455078125, -6.62530517578125, -6.37646484375, -6.12762451171875, -5.8787841796875, -5.62994384765625, -5.381103515625, -5.13226318359375, -4.8834228515625, -4.63458251953125, -4.3857421875, -4.13690185546875, -3.8880615234375, -3.63922119140625, -3.390380859375, -3.14154052734375, -2.8927001953125, -2.64385986328125, -2.39501953125, -2.14617919921875, -1.8973388671875, -1.64849853515625, -1.399658203125, -1.15081787109375, -0.9019775390625, -0.65313720703125, -0.404296875, -0.15545654296875, 0.0933837890625, 0.34222412109375, 0.591064453125, 0.83990478515625, 1.0887451171875, 1.33758544921875, 1.58642578125, 1.83526611328125, 2.0841064453125, 2.33294677734375, 2.581787109375, 2.83062744140625, 3.0794677734375, 3.32830810546875, 3.5771484375, 3.82598876953125, 4.0748291015625, 4.32366943359375, 4.572509765625, 4.82135009765625, 5.0701904296875, 5.31903076171875, 5.56787109375, 5.81671142578125, 6.0655517578125, 6.31439208984375, 6.563232421875, 6.81207275390625, 7.0609130859375, 7.30975341796875, 7.55859375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 4.0, 11.0, 12.0, 15.0, 18.0, 32.0, 50.0, 65.0, 104.0, 143.0, 264.0, 345.0, 683.0, 1351.0, 2935.0, 8085.0, 30215.0, 251723.0, 3780167.0, 91730.0, 17007.0, 5146.0, 2133.0, 929.0, 459.0, 270.0, 153.0, 93.0, 45.0, 31.0, 18.0, 18.0, 9.0, 11.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-112.625, -109.60546875, -106.5859375, -103.56640625, -100.546875, -97.52734375, -94.5078125, -91.48828125, -88.46875, -85.44921875, -82.4296875, -79.41015625, -76.390625, -73.37109375, -70.3515625, -67.33203125, -64.3125, -61.29296875, -58.2734375, -55.25390625, -52.234375, -49.21484375, -46.1953125, -43.17578125, -40.15625, -37.13671875, -34.1171875, -31.09765625, -28.078125, -25.05859375, -22.0390625, -19.01953125, -16.0, -12.98046875, -9.9609375, -6.94140625, -3.921875, -0.90234375, 2.1171875, 5.13671875, 8.15625, 11.17578125, 14.1953125, 17.21484375, 20.234375, 23.25390625, 26.2734375, 29.29296875, 32.3125, 35.33203125, 38.3515625, 41.37109375, 44.390625, 47.41015625, 50.4296875, 53.44921875, 56.46875, 59.48828125, 62.5078125, 65.52734375, 68.546875, 71.56640625, 74.5859375, 77.60546875, 80.625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 8.0, 9.0, 3.0, 15.0, 12.0, 24.0, 37.0, 64.0, 91.0, 179.0, 726.0, 2322.0, 237.0, 125.0, 63.0, 54.0, 37.0, 12.0, 13.0, 4.0, 5.0, 10.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-27.625, -26.953369140625, -26.28173828125, -25.610107421875, -24.9384765625, -24.266845703125, -23.59521484375, -22.923583984375, -22.251953125, -21.580322265625, -20.90869140625, -20.237060546875, -19.5654296875, -18.893798828125, -18.22216796875, -17.550537109375, -16.87890625, -16.207275390625, -15.53564453125, -14.864013671875, -14.1923828125, -13.520751953125, -12.84912109375, -12.177490234375, -11.505859375, -10.834228515625, -10.16259765625, -9.490966796875, -8.8193359375, -8.147705078125, -7.47607421875, -6.804443359375, -6.1328125, -5.461181640625, -4.78955078125, -4.117919921875, -3.4462890625, -2.774658203125, -2.10302734375, -1.431396484375, -0.759765625, -0.088134765625, 0.58349609375, 1.255126953125, 1.9267578125, 2.598388671875, 3.27001953125, 3.941650390625, 4.61328125, 5.284912109375, 5.95654296875, 6.628173828125, 7.2998046875, 7.971435546875, 8.64306640625, 9.314697265625, 9.986328125, 10.657958984375, 11.32958984375, 12.001220703125, 12.6728515625, 13.344482421875, 14.01611328125, 14.687744140625, 15.359375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 7.0, 11.0, 16.0, 43.0, 60.0, 77.0, 106.0, 162.0, 174.0, 128.0, 89.0, 52.0, 29.0, 14.0, 16.0, 7.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.265480041503906, -59.545352935791016, -55.82522201538086, -52.10509490966797, -48.38496398925781, -44.66483688354492, -40.94470977783203, -37.224578857421875, -33.504451751708984, -29.78432273864746, -26.064193725585938, -22.344066619873047, -18.623937606811523, -14.90380859375, -11.18368148803711, -7.463552474975586, -3.7434234619140625, -0.023294925689697266, 3.696833610534668, 7.416961669921875, 11.137090682983398, 14.857219696044922, 18.577346801757812, 22.297475814819336, 26.01760482788086, 29.737733840942383, 33.457862854003906, 37.1779899597168, 40.89811706542969, 44.618247985839844, 48.338375091552734, 52.058502197265625, 55.77862548828125, 59.49875259399414, 63.2188835144043, 66.93901062011719, 70.65914154052734, 74.3792724609375, 78.09939575195312, 81.81952667236328, 85.53965759277344, 89.2597885131836, 92.97991180419922, 96.70004272460938, 100.42017364501953, 104.14030456542969, 107.86042785644531, 111.58055877685547, 115.3006820678711, 119.02081298828125, 122.74093627929688, 126.46106719970703, 130.1811981201172, 133.9013214111328, 137.6214599609375, 141.34158325195312, 145.06170654296875, 148.78182983398438, 152.50196838378906, 156.2220916748047, 159.9422149658203, 163.662353515625, 167.38247680664062, 171.10260009765625, 174.82273864746094]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 12.0, 5.0, 11.0, 13.0, 15.0, 14.0, 19.0, 18.0, 28.0, 28.0, 32.0, 31.0, 28.0, 39.0, 42.0, 38.0, 35.0, 39.0, 41.0, 37.0, 30.0, 43.0, 41.0, 24.0, 44.0, 34.0, 28.0, 33.0, 23.0, 28.0, 26.0, 16.0, 15.0, 9.0, 13.0, 9.0, 14.0, 9.0, 4.0, 6.0, 5.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.437034606933594, -45.999656677246094, -44.562278747558594, -43.124900817871094, -41.687522888183594, -40.250144958496094, -38.812767028808594, -37.375389099121094, -35.938011169433594, -34.500633239746094, -33.063255310058594, -31.625877380371094, -30.188499450683594, -28.751121520996094, -27.313745498657227, -25.876367568969727, -24.43899154663086, -23.00161361694336, -21.56423568725586, -20.12685775756836, -18.68947982788086, -17.25210189819336, -15.814725875854492, -14.377347946166992, -12.939970016479492, -11.502592086791992, -10.065214157104492, -8.627837181091309, -7.190459251403809, -5.753081321716309, -4.315704345703125, -2.878326416015625, -1.440948486328125, -0.0035707950592041016, 1.4338068962097168, 2.8711843490600586, 4.308562278747559, 5.745940208435059, 7.183317184448242, 8.620695114135742, 10.058073043823242, 11.495450973510742, 12.932828903198242, 14.370205879211426, 15.807583808898926, 17.24496078491211, 18.68233871459961, 20.11971664428711, 21.55709457397461, 22.99447250366211, 24.43185043334961, 25.86922836303711, 27.30660629272461, 28.74398422241211, 30.181360244750977, 31.618738174438477, 33.056114196777344, 34.493492126464844, 35.930870056152344, 37.368247985839844, 38.805625915527344, 40.243003845214844, 41.680381774902344, 43.117759704589844, 44.555137634277344]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 15.0, 9.0, 17.0, 20.0, 31.0, 42.0, 60.0, 102.0, 126.0, 185.0, 319.0, 436.0, 694.0, 1026.0, 1598.0, 2609.0, 4432.0, 7734.0, 13947.0, 26872.0, 55572.0, 121814.0, 269241.0, 287012.0, 131082.0, 59679.0, 28649.0, 14827.0, 8101.0, 4649.0, 2795.0, 1693.0, 1090.0, 689.0, 401.0, 327.0, 204.0, 125.0, 104.0, 64.0, 51.0, 29.0, 24.0, 21.0, 12.0, 9.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-33.3125, -32.304443359375, -31.29638671875, -30.288330078125, -29.2802734375, -28.272216796875, -27.26416015625, -26.256103515625, -25.248046875, -24.239990234375, -23.23193359375, -22.223876953125, -21.2158203125, -20.207763671875, -19.19970703125, -18.191650390625, -17.18359375, -16.175537109375, -15.16748046875, -14.159423828125, -13.1513671875, -12.143310546875, -11.13525390625, -10.127197265625, -9.119140625, -8.111083984375, -7.10302734375, -6.094970703125, -5.0869140625, -4.078857421875, -3.07080078125, -2.062744140625, -1.0546875, -0.046630859375, 0.96142578125, 1.969482421875, 2.9775390625, 3.985595703125, 4.99365234375, 6.001708984375, 7.009765625, 8.017822265625, 9.02587890625, 10.033935546875, 11.0419921875, 12.050048828125, 13.05810546875, 14.066162109375, 15.07421875, 16.082275390625, 17.09033203125, 18.098388671875, 19.1064453125, 20.114501953125, 21.12255859375, 22.130615234375, 23.138671875, 24.146728515625, 25.15478515625, 26.162841796875, 27.1708984375, 28.178955078125, 29.18701171875, 30.195068359375, 31.203125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 0.0, 3.0, 6.0, 5.0, 7.0, 4.0, 12.0, 17.0, 14.0, 25.0, 22.0, 21.0, 28.0, 31.0, 39.0, 38.0, 37.0, 47.0, 38.0, 45.0, 43.0, 51.0, 42.0, 47.0, 41.0, 43.0, 33.0, 27.0, 23.0, 41.0, 37.0, 23.0, 27.0, 12.0, 9.0, 16.0, 3.0, 12.0, 10.0, 3.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.828125, -6.62347412109375, -6.4188232421875, -6.21417236328125, -6.009521484375, -5.80487060546875, -5.6002197265625, -5.39556884765625, -5.19091796875, -4.98626708984375, -4.7816162109375, -4.57696533203125, -4.372314453125, -4.16766357421875, -3.9630126953125, -3.75836181640625, -3.5537109375, -3.34906005859375, -3.1444091796875, -2.93975830078125, -2.735107421875, -2.53045654296875, -2.3258056640625, -2.12115478515625, -1.91650390625, -1.71185302734375, -1.5072021484375, -1.30255126953125, -1.097900390625, -0.89324951171875, -0.6885986328125, -0.48394775390625, -0.279296875, -0.07464599609375, 0.1300048828125, 0.33465576171875, 0.539306640625, 0.74395751953125, 0.9486083984375, 1.15325927734375, 1.35791015625, 1.56256103515625, 1.7672119140625, 1.97186279296875, 2.176513671875, 2.38116455078125, 2.5858154296875, 2.79046630859375, 2.9951171875, 3.19976806640625, 3.4044189453125, 3.60906982421875, 3.813720703125, 4.01837158203125, 4.2230224609375, 4.42767333984375, 4.63232421875, 4.83697509765625, 5.0416259765625, 5.24627685546875, 5.450927734375, 5.65557861328125, 5.8602294921875, 6.06488037109375, 6.26953125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 12.0, 13.0, 25.0, 19.0, 57.0, 71.0, 121.0, 206.0, 325.0, 723.0, 1420.0, 3420.0, 9279.0, 30119.0, 123839.0, 523893.0, 270807.0, 58135.0, 16382.0, 5491.0, 2176.0, 914.0, 496.0, 260.0, 127.0, 70.0, 58.0, 33.0, 22.0, 11.0, 8.0, 8.0, 4.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.625, -49.94580078125, -48.2666015625, -46.58740234375, -44.908203125, -43.22900390625, -41.5498046875, -39.87060546875, -38.19140625, -36.51220703125, -34.8330078125, -33.15380859375, -31.474609375, -29.79541015625, -28.1162109375, -26.43701171875, -24.7578125, -23.07861328125, -21.3994140625, -19.72021484375, -18.041015625, -16.36181640625, -14.6826171875, -13.00341796875, -11.32421875, -9.64501953125, -7.9658203125, -6.28662109375, -4.607421875, -2.92822265625, -1.2490234375, 0.43017578125, 2.109375, 3.78857421875, 5.4677734375, 7.14697265625, 8.826171875, 10.50537109375, 12.1845703125, 13.86376953125, 15.54296875, 17.22216796875, 18.9013671875, 20.58056640625, 22.259765625, 23.93896484375, 25.6181640625, 27.29736328125, 28.9765625, 30.65576171875, 32.3349609375, 34.01416015625, 35.693359375, 37.37255859375, 39.0517578125, 40.73095703125, 42.41015625, 44.08935546875, 45.7685546875, 47.44775390625, 49.126953125, 50.80615234375, 52.4853515625, 54.16455078125, 55.84375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 7.0, 5.0, 9.0, 12.0, 13.0, 19.0, 36.0, 20.0, 31.0, 43.0, 44.0, 53.0, 47.0, 58.0, 51.0, 72.0, 66.0, 63.0, 59.0, 54.0, 45.0, 45.0, 46.0, 23.0, 15.0, 10.0, 14.0, 12.0, 17.0, 8.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.6875, -41.357421875, -40.02734375, -38.697265625, -37.3671875, -36.037109375, -34.70703125, -33.376953125, -32.046875, -30.716796875, -29.38671875, -28.056640625, -26.7265625, -25.396484375, -24.06640625, -22.736328125, -21.40625, -20.076171875, -18.74609375, -17.416015625, -16.0859375, -14.755859375, -13.42578125, -12.095703125, -10.765625, -9.435546875, -8.10546875, -6.775390625, -5.4453125, -4.115234375, -2.78515625, -1.455078125, -0.125, 1.205078125, 2.53515625, 3.865234375, 5.1953125, 6.525390625, 7.85546875, 9.185546875, 10.515625, 11.845703125, 13.17578125, 14.505859375, 15.8359375, 17.166015625, 18.49609375, 19.826171875, 21.15625, 22.486328125, 23.81640625, 25.146484375, 26.4765625, 27.806640625, 29.13671875, 30.466796875, 31.796875, 33.126953125, 34.45703125, 35.787109375, 37.1171875, 38.447265625, 39.77734375, 41.107421875, 42.4375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 10.0, 16.0, 18.0, 23.0, 35.0, 53.0, 87.0, 119.0, 149.0, 222.0, 337.0, 545.0, 746.0, 1187.0, 1968.0, 3286.0, 5846.0, 12178.0, 29283.0, 95436.0, 437259.0, 338813.0, 73265.0, 24144.0, 10299.0, 5104.0, 2941.0, 1706.0, 1115.0, 711.0, 493.0, 329.0, 235.0, 180.0, 120.0, 63.0, 75.0, 40.0, 29.0, 23.0, 23.0, 18.0, 8.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-21.109375, -20.42626953125, -19.7431640625, -19.06005859375, -18.376953125, -17.69384765625, -17.0107421875, -16.32763671875, -15.64453125, -14.96142578125, -14.2783203125, -13.59521484375, -12.912109375, -12.22900390625, -11.5458984375, -10.86279296875, -10.1796875, -9.49658203125, -8.8134765625, -8.13037109375, -7.447265625, -6.76416015625, -6.0810546875, -5.39794921875, -4.71484375, -4.03173828125, -3.3486328125, -2.66552734375, -1.982421875, -1.29931640625, -0.6162109375, 0.06689453125, 0.75, 1.43310546875, 2.1162109375, 2.79931640625, 3.482421875, 4.16552734375, 4.8486328125, 5.53173828125, 6.21484375, 6.89794921875, 7.5810546875, 8.26416015625, 8.947265625, 9.63037109375, 10.3134765625, 10.99658203125, 11.6796875, 12.36279296875, 13.0458984375, 13.72900390625, 14.412109375, 15.09521484375, 15.7783203125, 16.46142578125, 17.14453125, 17.82763671875, 18.5107421875, 19.19384765625, 19.876953125, 20.56005859375, 21.2431640625, 21.92626953125, 22.609375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 8.0, 8.0, 11.0, 30.0, 41.0, 52.0, 98.0, 204.0, 197.0, 132.0, 94.0, 38.0, 25.0, 18.0, 12.0, 11.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0107421875, -0.010418534278869629, -0.010094881057739258, -0.009771227836608887, -0.009447574615478516, -0.009123921394348145, -0.008800268173217773, -0.008476614952087402, -0.008152961730957031, -0.00782930850982666, -0.007505655288696289, -0.007182002067565918, -0.006858348846435547, -0.006534695625305176, -0.006211042404174805, -0.005887389183044434, -0.0055637359619140625, -0.005240082740783691, -0.00491642951965332, -0.004592776298522949, -0.004269123077392578, -0.003945469856262207, -0.003621816635131836, -0.003298163414001465, -0.0029745101928710938, -0.0026508569717407227, -0.0023272037506103516, -0.0020035505294799805, -0.0016798973083496094, -0.0013562440872192383, -0.0010325908660888672, -0.0007089376449584961, -0.000385284423828125, -6.16312026977539e-05, 0.0002620220184326172, 0.0005856752395629883, 0.0009093284606933594, 0.0012329816818237305, 0.0015566349029541016, 0.0018802881240844727, 0.0022039413452148438, 0.002527594566345215, 0.002851247787475586, 0.003174901008605957, 0.003498554229736328, 0.0038222074508666992, 0.00414586067199707, 0.004469513893127441, 0.0047931671142578125, 0.005116820335388184, 0.005440473556518555, 0.005764126777648926, 0.006087779998779297, 0.006411433219909668, 0.006735086441040039, 0.00705873966217041, 0.007382392883300781, 0.007706046104431152, 0.008029699325561523, 0.008353352546691895, 0.008677005767822266, 0.009000658988952637, 0.009324312210083008, 0.009647965431213379, 0.00997161865234375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 7.0, 5.0, 7.0, 9.0, 11.0, 23.0, 27.0, 36.0, 73.0, 110.0, 139.0, 259.0, 445.0, 693.0, 1299.0, 2448.0, 5251.0, 13152.0, 43899.0, 331098.0, 551898.0, 67068.0, 17310.0, 6610.0, 3000.0, 1525.0, 867.0, 476.0, 301.0, 176.0, 103.0, 91.0, 47.0, 22.0, 26.0, 12.0, 13.0, 5.0, 11.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.0625, -36.007568359375, -34.95263671875, -33.897705078125, -32.8427734375, -31.787841796875, -30.73291015625, -29.677978515625, -28.623046875, -27.568115234375, -26.51318359375, -25.458251953125, -24.4033203125, -23.348388671875, -22.29345703125, -21.238525390625, -20.18359375, -19.128662109375, -18.07373046875, -17.018798828125, -15.9638671875, -14.908935546875, -13.85400390625, -12.799072265625, -11.744140625, -10.689208984375, -9.63427734375, -8.579345703125, -7.5244140625, -6.469482421875, -5.41455078125, -4.359619140625, -3.3046875, -2.249755859375, -1.19482421875, -0.139892578125, 0.9150390625, 1.969970703125, 3.02490234375, 4.079833984375, 5.134765625, 6.189697265625, 7.24462890625, 8.299560546875, 9.3544921875, 10.409423828125, 11.46435546875, 12.519287109375, 13.57421875, 14.629150390625, 15.68408203125, 16.739013671875, 17.7939453125, 18.848876953125, 19.90380859375, 20.958740234375, 22.013671875, 23.068603515625, 24.12353515625, 25.178466796875, 26.2333984375, 27.288330078125, 28.34326171875, 29.398193359375, 30.453125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 6.0, 6.0, 9.0, 16.0, 19.0, 22.0, 39.0, 66.0, 85.0, 111.0, 126.0, 142.0, 109.0, 79.0, 46.0, 31.0, 24.0, 18.0, 12.0, 6.0, 5.0, 5.0, 1.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.96875, -28.182373046875, -27.39599609375, -26.609619140625, -25.8232421875, -25.036865234375, -24.25048828125, -23.464111328125, -22.677734375, -21.891357421875, -21.10498046875, -20.318603515625, -19.5322265625, -18.745849609375, -17.95947265625, -17.173095703125, -16.38671875, -15.600341796875, -14.81396484375, -14.027587890625, -13.2412109375, -12.454833984375, -11.66845703125, -10.882080078125, -10.095703125, -9.309326171875, -8.52294921875, -7.736572265625, -6.9501953125, -6.163818359375, -5.37744140625, -4.591064453125, -3.8046875, -3.018310546875, -2.23193359375, -1.445556640625, -0.6591796875, 0.127197265625, 0.91357421875, 1.699951171875, 2.486328125, 3.272705078125, 4.05908203125, 4.845458984375, 5.6318359375, 6.418212890625, 7.20458984375, 7.990966796875, 8.77734375, 9.563720703125, 10.35009765625, 11.136474609375, 11.9228515625, 12.709228515625, 13.49560546875, 14.281982421875, 15.068359375, 15.854736328125, 16.64111328125, 17.427490234375, 18.2138671875, 19.000244140625, 19.78662109375, 20.572998046875, 21.359375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 10.0, 30.0, 55.0, 90.0, 123.0, 173.0, 175.0, 151.0, 92.0, 44.0, 31.0, 12.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-419.60833740234375, -406.0770568847656, -392.5458068847656, -379.0145263671875, -365.4832458496094, -351.95196533203125, -338.42071533203125, -324.8894348144531, -311.358154296875, -297.8268737792969, -284.2956237792969, -270.76434326171875, -257.2330627441406, -243.70179748535156, -230.1705322265625, -216.63925170898438, -203.10800170898438, -189.5767364501953, -176.0454559326172, -162.51419067382812, -148.98291015625, -135.45164489746094, -121.92037963867188, -108.38910675048828, -94.85783386230469, -81.3265609741211, -67.7952880859375, -54.26402282714844, -40.732749938964844, -27.20147705078125, -13.670211791992188, -0.13893890380859375, 13.392333984375, 26.92360496520996, 40.45487594604492, 53.98614501953125, 67.51741790771484, 81.04869079589844, 94.5799560546875, 108.1112289428711, 121.64250183105469, 135.17376708984375, 148.70504760742188, 162.23631286621094, 175.767578125, 189.29885864257812, 202.8301239013672, 216.36138916015625, 229.89266967773438, 243.42393493652344, 256.9552001953125, 270.4864807128906, 284.01776123046875, 297.54901123046875, 311.0802917480469, 324.611572265625, 338.142822265625, 351.6741027832031, 365.2053527832031, 378.73663330078125, 392.2679138183594, 405.7991943359375, 419.3304443359375, 432.8617248535156, 446.39300537109375]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 6.0, 7.0, 6.0, 8.0, 9.0, 7.0, 17.0, 17.0, 18.0, 25.0, 28.0, 38.0, 36.0, 32.0, 36.0, 46.0, 38.0, 39.0, 51.0, 29.0, 50.0, 39.0, 48.0, 40.0, 36.0, 36.0, 27.0, 31.0, 27.0, 19.0, 17.0, 27.0, 15.0, 18.0, 10.0, 15.0, 8.0, 8.0, 9.0, 3.0, 4.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-155.17877197265625, -149.85716247558594, -144.5355682373047, -139.21395874023438, -133.89234924316406, -128.57073974609375, -123.2491455078125, -117.92753601074219, -112.6059341430664, -107.28433227539062, -101.96272277832031, -96.64112091064453, -91.31951904296875, -85.99790954589844, -80.67630767822266, -75.35470581054688, -70.03309631347656, -64.71149444580078, -59.38988494873047, -54.06828308105469, -48.74667739868164, -43.425071716308594, -38.10346984863281, -32.781864166259766, -27.46025848388672, -22.138652801513672, -16.817049026489258, -11.495444297790527, -6.173839569091797, -0.85223388671875, 4.469369888305664, 9.790973663330078, 15.112564086914062, 20.43416976928711, 25.755773544311523, 31.077377319335938, 36.398983001708984, 41.72058868408203, 47.04219055175781, 52.36379623413086, 57.685401916503906, 63.00700759887695, 68.32861328125, 73.65021514892578, 78.97181701660156, 84.29342651367188, 89.61502838134766, 94.93663024902344, 100.25823974609375, 105.57984161376953, 110.90145111083984, 116.22305297851562, 121.54466247558594, 126.86626434326172, 132.1878662109375, 137.5094757080078, 142.83108520507812, 148.15269470214844, 153.4742889404297, 158.7958984375, 164.1175079345703, 169.43911743164062, 174.76071166992188, 180.0823211669922, 185.40391540527344]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 9.0, 10.0, 13.0, 11.0, 19.0, 28.0, 43.0, 45.0, 79.0, 109.0, 132.0, 177.0, 315.0, 436.0, 661.0, 1042.0, 1773.0, 2896.0, 5403.0, 11295.0, 26660.0, 84689.0, 2448620.0, 1475847.0, 84464.0, 26111.0, 10902.0, 5448.0, 2827.0, 1657.0, 932.0, 539.0, 364.0, 236.0, 130.0, 117.0, 78.0, 44.0, 29.0, 20.0, 23.0, 10.0, 8.0, 7.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-52.96875, -51.36328125, -49.7578125, -48.15234375, -46.546875, -44.94140625, -43.3359375, -41.73046875, -40.125, -38.51953125, -36.9140625, -35.30859375, -33.703125, -32.09765625, -30.4921875, -28.88671875, -27.28125, -25.67578125, -24.0703125, -22.46484375, -20.859375, -19.25390625, -17.6484375, -16.04296875, -14.4375, -12.83203125, -11.2265625, -9.62109375, -8.015625, -6.41015625, -4.8046875, -3.19921875, -1.59375, 0.01171875, 1.6171875, 3.22265625, 4.828125, 6.43359375, 8.0390625, 9.64453125, 11.25, 12.85546875, 14.4609375, 16.06640625, 17.671875, 19.27734375, 20.8828125, 22.48828125, 24.09375, 25.69921875, 27.3046875, 28.91015625, 30.515625, 32.12109375, 33.7265625, 35.33203125, 36.9375, 38.54296875, 40.1484375, 41.75390625, 43.359375, 44.96484375, 46.5703125, 48.17578125, 49.78125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 10.0, 8.0, 9.0, 18.0, 20.0, 11.0, 15.0, 25.0, 25.0, 30.0, 55.0, 44.0, 40.0, 52.0, 40.0, 57.0, 60.0, 44.0, 59.0, 48.0, 36.0, 43.0, 39.0, 35.0, 29.0, 26.0, 22.0, 18.0, 12.0, 19.0, 9.0, 10.0, 9.0, 7.0, 2.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.6875, -7.45819091796875, -7.2288818359375, -6.99957275390625, -6.770263671875, -6.54095458984375, -6.3116455078125, -6.08233642578125, -5.85302734375, -5.62371826171875, -5.3944091796875, -5.16510009765625, -4.935791015625, -4.70648193359375, -4.4771728515625, -4.24786376953125, -4.0185546875, -3.78924560546875, -3.5599365234375, -3.33062744140625, -3.101318359375, -2.87200927734375, -2.6427001953125, -2.41339111328125, -2.18408203125, -1.95477294921875, -1.7254638671875, -1.49615478515625, -1.266845703125, -1.03753662109375, -0.8082275390625, -0.57891845703125, -0.349609375, -0.12030029296875, 0.1090087890625, 0.33831787109375, 0.567626953125, 0.79693603515625, 1.0262451171875, 1.25555419921875, 1.48486328125, 1.71417236328125, 1.9434814453125, 2.17279052734375, 2.402099609375, 2.63140869140625, 2.8607177734375, 3.09002685546875, 3.3193359375, 3.54864501953125, 3.7779541015625, 4.00726318359375, 4.236572265625, 4.46588134765625, 4.6951904296875, 4.92449951171875, 5.15380859375, 5.38311767578125, 5.6124267578125, 5.84173583984375, 6.071044921875, 6.30035400390625, 6.5296630859375, 6.75897216796875, 6.98828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 11.0, 13.0, 23.0, 34.0, 72.0, 122.0, 188.0, 373.0, 634.0, 1372.0, 2958.0, 7501.0, 22356.0, 100530.0, 3363580.0, 607953.0, 60733.0, 15602.0, 5560.0, 2393.0, 1086.0, 535.0, 272.0, 146.0, 90.0, 71.0, 31.0, 17.0, 5.0, 11.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-72.125, -69.708984375, -67.29296875, -64.876953125, -62.4609375, -60.044921875, -57.62890625, -55.212890625, -52.796875, -50.380859375, -47.96484375, -45.548828125, -43.1328125, -40.716796875, -38.30078125, -35.884765625, -33.46875, -31.052734375, -28.63671875, -26.220703125, -23.8046875, -21.388671875, -18.97265625, -16.556640625, -14.140625, -11.724609375, -9.30859375, -6.892578125, -4.4765625, -2.060546875, 0.35546875, 2.771484375, 5.1875, 7.603515625, 10.01953125, 12.435546875, 14.8515625, 17.267578125, 19.68359375, 22.099609375, 24.515625, 26.931640625, 29.34765625, 31.763671875, 34.1796875, 36.595703125, 39.01171875, 41.427734375, 43.84375, 46.259765625, 48.67578125, 51.091796875, 53.5078125, 55.923828125, 58.33984375, 60.755859375, 63.171875, 65.587890625, 68.00390625, 70.419921875, 72.8359375, 75.251953125, 77.66796875, 80.083984375, 82.5]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 4.0, 5.0, 12.0, 11.0, 13.0, 14.0, 17.0, 26.0, 52.0, 58.0, 91.0, 122.0, 237.0, 716.0, 1842.0, 324.0, 168.0, 111.0, 66.0, 52.0, 21.0, 25.0, 13.0, 12.0, 14.0, 13.0, 7.0, 6.0, 4.0, 4.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.671875, -19.9384765625, -19.205078125, -18.4716796875, -17.73828125, -17.0048828125, -16.271484375, -15.5380859375, -14.8046875, -14.0712890625, -13.337890625, -12.6044921875, -11.87109375, -11.1376953125, -10.404296875, -9.6708984375, -8.9375, -8.2041015625, -7.470703125, -6.7373046875, -6.00390625, -5.2705078125, -4.537109375, -3.8037109375, -3.0703125, -2.3369140625, -1.603515625, -0.8701171875, -0.13671875, 0.5966796875, 1.330078125, 2.0634765625, 2.796875, 3.5302734375, 4.263671875, 4.9970703125, 5.73046875, 6.4638671875, 7.197265625, 7.9306640625, 8.6640625, 9.3974609375, 10.130859375, 10.8642578125, 11.59765625, 12.3310546875, 13.064453125, 13.7978515625, 14.53125, 15.2646484375, 15.998046875, 16.7314453125, 17.46484375, 18.1982421875, 18.931640625, 19.6650390625, 20.3984375, 21.1318359375, 21.865234375, 22.5986328125, 23.33203125, 24.0654296875, 24.798828125, 25.5322265625, 26.265625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 7.0, 4.0, 5.0, 15.0, 33.0, 62.0, 107.0, 171.0, 176.0, 144.0, 115.0, 74.0, 41.0, 22.0, 9.0, 8.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-252.1884002685547, -245.286865234375, -238.38534545898438, -231.4838104248047, -224.582275390625, -217.68075561523438, -210.7792205810547, -203.877685546875, -196.9761505126953, -190.07461547851562, -183.173095703125, -176.2715606689453, -169.37002563476562, -162.468505859375, -155.5669708251953, -148.66543579101562, -141.763916015625, -134.8623809814453, -127.96085357666016, -121.059326171875, -114.15779113769531, -107.25626373291016, -100.354736328125, -93.45320129394531, -86.55166625976562, -79.65013885498047, -72.74860382080078, -65.84707641601562, -58.94554138183594, -52.04401397705078, -45.14248275756836, -38.24095153808594, -31.33941650390625, -24.437885284423828, -17.536354064941406, -10.634824752807617, -3.7332935333251953, 3.1682357788085938, 10.069766998291016, 16.971298217773438, 23.87282943725586, 30.77436065673828, 37.6758918762207, 44.577423095703125, 51.47895050048828, 58.3804817199707, 65.28201293945312, 72.18354797363281, 79.08507537841797, 85.98660278320312, 92.88813781738281, 99.78966522216797, 106.69120025634766, 113.59272766113281, 120.4942626953125, 127.39579010009766, 134.2973175048828, 141.1988525390625, 148.10037231445312, 155.0019073486328, 161.9034423828125, 168.80496215820312, 175.7064971923828, 182.6080322265625, 189.5095672607422]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 4.0, 6.0, 10.0, 7.0, 14.0, 20.0, 18.0, 19.0, 34.0, 25.0, 30.0, 30.0, 33.0, 37.0, 41.0, 39.0, 40.0, 38.0, 37.0, 45.0, 51.0, 39.0, 36.0, 32.0, 31.0, 37.0, 33.0, 29.0, 23.0, 23.0, 18.0, 14.0, 22.0, 11.0, 10.0, 15.0, 20.0, 4.0, 3.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-81.61823272705078, -79.24981689453125, -76.88140106201172, -74.51298522949219, -72.14456939697266, -69.77615356445312, -67.4077377319336, -65.03932189941406, -62.670902252197266, -60.302486419677734, -57.9340705871582, -55.56565475463867, -53.197235107421875, -50.828819274902344, -48.46040344238281, -46.09198760986328, -43.72357177734375, -41.35515594482422, -38.98674011230469, -36.618324279785156, -34.249908447265625, -31.88149070739746, -29.513072967529297, -27.144657135009766, -24.776241302490234, -22.407825469970703, -20.039409637451172, -17.670991897583008, -15.302576065063477, -12.934160232543945, -10.565743446350098, -8.19732666015625, -5.828910827636719, -3.4604945182800293, -1.0920782089233398, 1.2763381004333496, 3.644754409790039, 6.01317024230957, 8.381587028503418, 10.750003814697266, 13.118419647216797, 15.486835479736328, 17.85525131225586, 20.223669052124023, 22.592084884643555, 24.960500717163086, 27.32891845703125, 29.69733428955078, 32.06575012207031, 34.434165954589844, 36.802581787109375, 39.170997619628906, 41.53941345214844, 43.90782928466797, 46.276248931884766, 48.6446647644043, 51.01308059692383, 53.38149642944336, 55.74991226196289, 58.11832809448242, 60.48674774169922, 62.85516357421875, 65.22357940673828, 67.59199523925781, 69.96041107177734]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 8.0, 11.0, 7.0, 7.0, 12.0, 17.0, 23.0, 25.0, 42.0, 59.0, 96.0, 158.0, 247.0, 390.0, 645.0, 1117.0, 2008.0, 3880.0, 7998.0, 18202.0, 47043.0, 135850.0, 436516.0, 259539.0, 80161.0, 30071.0, 12284.0, 5538.0, 2828.0, 1557.0, 821.0, 526.0, 303.0, 192.0, 109.0, 87.0, 67.0, 31.0, 30.0, 19.0, 14.0, 9.0, 7.0, 6.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-52.59375, -50.93798828125, -49.2822265625, -47.62646484375, -45.970703125, -44.31494140625, -42.6591796875, -41.00341796875, -39.34765625, -37.69189453125, -36.0361328125, -34.38037109375, -32.724609375, -31.06884765625, -29.4130859375, -27.75732421875, -26.1015625, -24.44580078125, -22.7900390625, -21.13427734375, -19.478515625, -17.82275390625, -16.1669921875, -14.51123046875, -12.85546875, -11.19970703125, -9.5439453125, -7.88818359375, -6.232421875, -4.57666015625, -2.9208984375, -1.26513671875, 0.390625, 2.04638671875, 3.7021484375, 5.35791015625, 7.013671875, 8.66943359375, 10.3251953125, 11.98095703125, 13.63671875, 15.29248046875, 16.9482421875, 18.60400390625, 20.259765625, 21.91552734375, 23.5712890625, 25.22705078125, 26.8828125, 28.53857421875, 30.1943359375, 31.85009765625, 33.505859375, 35.16162109375, 36.8173828125, 38.47314453125, 40.12890625, 41.78466796875, 43.4404296875, 45.09619140625, 46.751953125, 48.40771484375, 50.0634765625, 51.71923828125, 53.375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 3.0, 7.0, 8.0, 11.0, 12.0, 25.0, 21.0, 20.0, 28.0, 16.0, 34.0, 36.0, 33.0, 43.0, 55.0, 49.0, 55.0, 51.0, 51.0, 40.0, 57.0, 51.0, 31.0, 40.0, 33.0, 26.0, 25.0, 33.0, 21.0, 20.0, 19.0, 12.0, 5.0, 6.0, 5.0, 7.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.56640625, -7.34234619140625, -7.1182861328125, -6.89422607421875, -6.670166015625, -6.44610595703125, -6.2220458984375, -5.99798583984375, -5.77392578125, -5.54986572265625, -5.3258056640625, -5.10174560546875, -4.877685546875, -4.65362548828125, -4.4295654296875, -4.20550537109375, -3.9814453125, -3.75738525390625, -3.5333251953125, -3.30926513671875, -3.085205078125, -2.86114501953125, -2.6370849609375, -2.41302490234375, -2.18896484375, -1.96490478515625, -1.7408447265625, -1.51678466796875, -1.292724609375, -1.06866455078125, -0.8446044921875, -0.62054443359375, -0.396484375, -0.17242431640625, 0.0516357421875, 0.27569580078125, 0.499755859375, 0.72381591796875, 0.9478759765625, 1.17193603515625, 1.39599609375, 1.62005615234375, 1.8441162109375, 2.06817626953125, 2.292236328125, 2.51629638671875, 2.7403564453125, 2.96441650390625, 3.1884765625, 3.41253662109375, 3.6365966796875, 3.86065673828125, 4.084716796875, 4.30877685546875, 4.5328369140625, 4.75689697265625, 4.98095703125, 5.20501708984375, 5.4290771484375, 5.65313720703125, 5.877197265625, 6.10125732421875, 6.3253173828125, 6.54937744140625, 6.7734375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 7.0, 7.0, 11.0, 20.0, 19.0, 35.0, 44.0, 71.0, 108.0, 139.0, 238.0, 331.0, 560.0, 848.0, 1543.0, 2566.0, 4732.0, 9431.0, 22068.0, 58255.0, 184229.0, 462945.0, 194652.0, 61392.0, 22691.0, 9966.0, 4910.0, 2682.0, 1481.0, 912.0, 563.0, 364.0, 250.0, 157.0, 108.0, 59.0, 51.0, 30.0, 20.0, 15.0, 13.0, 6.0, 7.0, 4.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.34375, -39.943359375, -38.54296875, -37.142578125, -35.7421875, -34.341796875, -32.94140625, -31.541015625, -30.140625, -28.740234375, -27.33984375, -25.939453125, -24.5390625, -23.138671875, -21.73828125, -20.337890625, -18.9375, -17.537109375, -16.13671875, -14.736328125, -13.3359375, -11.935546875, -10.53515625, -9.134765625, -7.734375, -6.333984375, -4.93359375, -3.533203125, -2.1328125, -0.732421875, 0.66796875, 2.068359375, 3.46875, 4.869140625, 6.26953125, 7.669921875, 9.0703125, 10.470703125, 11.87109375, 13.271484375, 14.671875, 16.072265625, 17.47265625, 18.873046875, 20.2734375, 21.673828125, 23.07421875, 24.474609375, 25.875, 27.275390625, 28.67578125, 30.076171875, 31.4765625, 32.876953125, 34.27734375, 35.677734375, 37.078125, 38.478515625, 39.87890625, 41.279296875, 42.6796875, 44.080078125, 45.48046875, 46.880859375, 48.28125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 12.0, 8.0, 12.0, 8.0, 18.0, 10.0, 20.0, 26.0, 17.0, 25.0, 27.0, 35.0, 39.0, 44.0, 59.0, 44.0, 55.0, 52.0, 49.0, 44.0, 45.0, 45.0, 48.0, 34.0, 36.0, 27.0, 26.0, 28.0, 26.0, 15.0, 15.0, 10.0, 10.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-35.25, -34.06298828125, -32.8759765625, -31.68896484375, -30.501953125, -29.31494140625, -28.1279296875, -26.94091796875, -25.75390625, -24.56689453125, -23.3798828125, -22.19287109375, -21.005859375, -19.81884765625, -18.6318359375, -17.44482421875, -16.2578125, -15.07080078125, -13.8837890625, -12.69677734375, -11.509765625, -10.32275390625, -9.1357421875, -7.94873046875, -6.76171875, -5.57470703125, -4.3876953125, -3.20068359375, -2.013671875, -0.82666015625, 0.3603515625, 1.54736328125, 2.734375, 3.92138671875, 5.1083984375, 6.29541015625, 7.482421875, 8.66943359375, 9.8564453125, 11.04345703125, 12.23046875, 13.41748046875, 14.6044921875, 15.79150390625, 16.978515625, 18.16552734375, 19.3525390625, 20.53955078125, 21.7265625, 22.91357421875, 24.1005859375, 25.28759765625, 26.474609375, 27.66162109375, 28.8486328125, 30.03564453125, 31.22265625, 32.40966796875, 33.5966796875, 34.78369140625, 35.970703125, 37.15771484375, 38.3447265625, 39.53173828125, 40.71875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 9.0, 14.0, 21.0, 48.0, 68.0, 111.0, 210.0, 346.0, 650.0, 1109.0, 2253.0, 4577.0, 10473.0, 31340.0, 263216.0, 651300.0, 55709.0, 14897.0, 6100.0, 2768.0, 1522.0, 786.0, 461.0, 219.0, 133.0, 90.0, 39.0, 41.0, 17.0, 9.0, 6.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.3125, -50.634765625, -48.95703125, -47.279296875, -45.6015625, -43.923828125, -42.24609375, -40.568359375, -38.890625, -37.212890625, -35.53515625, -33.857421875, -32.1796875, -30.501953125, -28.82421875, -27.146484375, -25.46875, -23.791015625, -22.11328125, -20.435546875, -18.7578125, -17.080078125, -15.40234375, -13.724609375, -12.046875, -10.369140625, -8.69140625, -7.013671875, -5.3359375, -3.658203125, -1.98046875, -0.302734375, 1.375, 3.052734375, 4.73046875, 6.408203125, 8.0859375, 9.763671875, 11.44140625, 13.119140625, 14.796875, 16.474609375, 18.15234375, 19.830078125, 21.5078125, 23.185546875, 24.86328125, 26.541015625, 28.21875, 29.896484375, 31.57421875, 33.251953125, 34.9296875, 36.607421875, 38.28515625, 39.962890625, 41.640625, 43.318359375, 44.99609375, 46.673828125, 48.3515625, 50.029296875, 51.70703125, 53.384765625, 55.0625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 8.0, 2.0, 5.0, 11.0, 11.0, 25.0, 34.0, 80.0, 194.0, 326.0, 142.0, 60.0, 26.0, 21.0, 17.0, 8.0, 4.0, 6.0, 3.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.01534271240234375, -0.014820694923400879, -0.014298677444458008, -0.013776659965515137, -0.013254642486572266, -0.012732625007629395, -0.012210607528686523, -0.011688590049743652, -0.011166572570800781, -0.01064455509185791, -0.010122537612915039, -0.009600520133972168, -0.009078502655029297, -0.008556485176086426, -0.008034467697143555, -0.007512450218200684, -0.0069904327392578125, -0.006468415260314941, -0.00594639778137207, -0.005424380302429199, -0.004902362823486328, -0.004380345344543457, -0.003858327865600586, -0.003336310386657715, -0.0028142929077148438, -0.0022922754287719727, -0.0017702579498291016, -0.0012482404708862305, -0.0007262229919433594, -0.00020420551300048828, 0.0003178119659423828, 0.0008398294448852539, 0.001361846923828125, 0.001883864402770996, 0.002405881881713867, 0.0029278993606567383, 0.0034499168395996094, 0.0039719343185424805, 0.0044939517974853516, 0.005015969276428223, 0.005537986755371094, 0.006060004234313965, 0.006582021713256836, 0.007104039192199707, 0.007626056671142578, 0.00814807415008545, 0.00867009162902832, 0.009192109107971191, 0.009714126586914062, 0.010236144065856934, 0.010758161544799805, 0.011280179023742676, 0.011802196502685547, 0.012324213981628418, 0.012846231460571289, 0.01336824893951416, 0.013890266418457031, 0.014412283897399902, 0.014934301376342773, 0.015456318855285645, 0.015978336334228516, 0.016500353813171387, 0.017022371292114258, 0.01754438877105713, 0.01806640625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 5.0, 14.0, 24.0, 21.0, 42.0, 50.0, 80.0, 119.0, 184.0, 301.0, 432.0, 809.0, 1331.0, 2286.0, 4218.0, 8859.0, 21641.0, 76130.0, 531628.0, 316489.0, 51570.0, 16608.0, 7057.0, 3613.0, 2005.0, 1133.0, 674.0, 421.0, 246.0, 175.0, 114.0, 86.0, 52.0, 36.0, 33.0, 14.0, 9.0, 12.0, 9.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-41.90625, -40.73779296875, -39.5693359375, -38.40087890625, -37.232421875, -36.06396484375, -34.8955078125, -33.72705078125, -32.55859375, -31.39013671875, -30.2216796875, -29.05322265625, -27.884765625, -26.71630859375, -25.5478515625, -24.37939453125, -23.2109375, -22.04248046875, -20.8740234375, -19.70556640625, -18.537109375, -17.36865234375, -16.2001953125, -15.03173828125, -13.86328125, -12.69482421875, -11.5263671875, -10.35791015625, -9.189453125, -8.02099609375, -6.8525390625, -5.68408203125, -4.515625, -3.34716796875, -2.1787109375, -1.01025390625, 0.158203125, 1.32666015625, 2.4951171875, 3.66357421875, 4.83203125, 6.00048828125, 7.1689453125, 8.33740234375, 9.505859375, 10.67431640625, 11.8427734375, 13.01123046875, 14.1796875, 15.34814453125, 16.5166015625, 17.68505859375, 18.853515625, 20.02197265625, 21.1904296875, 22.35888671875, 23.52734375, 24.69580078125, 25.8642578125, 27.03271484375, 28.201171875, 29.36962890625, 30.5380859375, 31.70654296875, 32.875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 7.0, 8.0, 9.0, 19.0, 18.0, 21.0, 38.0, 43.0, 59.0, 84.0, 116.0, 125.0, 116.0, 95.0, 57.0, 39.0, 24.0, 32.0, 10.0, 13.0, 10.0, 13.0, 3.0, 7.0, 2.0, 3.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-32.71875, -31.846435546875, -30.97412109375, -30.101806640625, -29.2294921875, -28.357177734375, -27.48486328125, -26.612548828125, -25.740234375, -24.867919921875, -23.99560546875, -23.123291015625, -22.2509765625, -21.378662109375, -20.50634765625, -19.634033203125, -18.76171875, -17.889404296875, -17.01708984375, -16.144775390625, -15.2724609375, -14.400146484375, -13.52783203125, -12.655517578125, -11.783203125, -10.910888671875, -10.03857421875, -9.166259765625, -8.2939453125, -7.421630859375, -6.54931640625, -5.677001953125, -4.8046875, -3.932373046875, -3.06005859375, -2.187744140625, -1.3154296875, -0.443115234375, 0.42919921875, 1.301513671875, 2.173828125, 3.046142578125, 3.91845703125, 4.790771484375, 5.6630859375, 6.535400390625, 7.40771484375, 8.280029296875, 9.15234375, 10.024658203125, 10.89697265625, 11.769287109375, 12.6416015625, 13.513916015625, 14.38623046875, 15.258544921875, 16.130859375, 17.003173828125, 17.87548828125, 18.747802734375, 19.6201171875, 20.492431640625, 21.36474609375, 22.237060546875, 23.109375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 14.0, 30.0, 78.0, 168.0, 327.0, 228.0, 100.0, 47.0, 14.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1513.858642578125, -1484.44580078125, -1455.032958984375, -1425.6202392578125, -1396.2073974609375, -1366.7945556640625, -1337.3817138671875, -1307.968994140625, -1278.55615234375, -1249.143310546875, -1219.73046875, -1190.3177490234375, -1160.9049072265625, -1131.4920654296875, -1102.0792236328125, -1072.66650390625, -1043.253662109375, -1013.8408203125, -984.4280395507812, -955.0151977539062, -925.6024169921875, -896.1895751953125, -866.7767944335938, -837.3639526367188, -807.9511108398438, -778.5382690429688, -749.12548828125, -719.712646484375, -690.2998657226562, -660.8870239257812, -631.4742431640625, -602.0614013671875, -572.6485595703125, -543.2357177734375, -513.8229370117188, -484.4101257324219, -454.997314453125, -425.58447265625, -396.17169189453125, -366.75885009765625, -337.3460693359375, -307.9332580566406, -278.52044677734375, -249.10763549804688, -219.69482421875, -190.28199768066406, -160.8691864013672, -131.4563751220703, -102.0435791015625, -72.63076782226562, -43.217952728271484, -13.805137634277344, 15.607673645019531, 45.02049255371094, 74.43330383300781, 103.84611511230469, 133.25892639160156, 162.67173767089844, 192.0845489501953, 221.49737548828125, 250.91018676757812, 280.322998046875, 309.7358093261719, 339.14862060546875, 368.5614318847656]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 4.0, 14.0, 7.0, 12.0, 15.0, 18.0, 29.0, 30.0, 36.0, 26.0, 42.0, 46.0, 38.0, 38.0, 56.0, 50.0, 54.0, 51.0, 46.0, 37.0, 52.0, 44.0, 36.0, 39.0, 29.0, 26.0, 25.0, 21.0, 24.0, 13.0, 12.0, 7.0, 6.0, 5.0, 1.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-302.77764892578125, -294.8313293457031, -286.8850402832031, -278.938720703125, -270.9924011230469, -263.0461120605469, -255.09979248046875, -247.1534881591797, -239.20718383789062, -231.26087951660156, -223.31455993652344, -215.36825561523438, -207.4219512939453, -199.47564697265625, -191.52932739257812, -183.58302307128906, -175.63671875, -167.69041442871094, -159.7440948486328, -151.79779052734375, -143.8514862060547, -135.90518188476562, -127.9588623046875, -120.01255798339844, -112.06623840332031, -104.11992645263672, -96.17362213134766, -88.22731018066406, -80.281005859375, -72.3346939086914, -64.38838195800781, -56.44207763671875, -48.49577331542969, -40.54946517944336, -32.60315704345703, -24.65684700012207, -16.710538864135742, -8.764228820800781, -0.8179206848144531, 7.128387451171875, 15.074695587158203, 23.02100372314453, 30.96731185913086, 38.91361999511719, 46.85993194580078, 54.80624008178711, 62.75254821777344, 70.6988525390625, 78.6451644897461, 86.59147644042969, 94.53778076171875, 102.48409271240234, 110.4303970336914, 118.376708984375, 126.32301330566406, 134.26931762695312, 142.21563720703125, 150.1619415283203, 158.10826110839844, 166.0545654296875, 174.00086975097656, 181.94717407226562, 189.89349365234375, 197.8397979736328, 205.78610229492188]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 6.0, 21.0, 14.0, 16.0, 20.0, 43.0, 62.0, 85.0, 101.0, 199.0, 295.0, 482.0, 726.0, 1374.0, 2404.0, 5073.0, 12297.0, 41160.0, 669584.0, 3389823.0, 47142.0, 12729.0, 4977.0, 2478.0, 1304.0, 727.0, 409.0, 254.0, 155.0, 102.0, 76.0, 56.0, 26.0, 22.0, 19.0, 5.0, 5.0, 4.0, 9.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.125, -74.5576171875, -71.990234375, -69.4228515625, -66.85546875, -64.2880859375, -61.720703125, -59.1533203125, -56.5859375, -54.0185546875, -51.451171875, -48.8837890625, -46.31640625, -43.7490234375, -41.181640625, -38.6142578125, -36.046875, -33.4794921875, -30.912109375, -28.3447265625, -25.77734375, -23.2099609375, -20.642578125, -18.0751953125, -15.5078125, -12.9404296875, -10.373046875, -7.8056640625, -5.23828125, -2.6708984375, -0.103515625, 2.4638671875, 5.03125, 7.5986328125, 10.166015625, 12.7333984375, 15.30078125, 17.8681640625, 20.435546875, 23.0029296875, 25.5703125, 28.1376953125, 30.705078125, 33.2724609375, 35.83984375, 38.4072265625, 40.974609375, 43.5419921875, 46.109375, 48.6767578125, 51.244140625, 53.8115234375, 56.37890625, 58.9462890625, 61.513671875, 64.0810546875, 66.6484375, 69.2158203125, 71.783203125, 74.3505859375, 76.91796875, 79.4853515625, 82.052734375, 84.6201171875, 87.1875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 8.0, 9.0, 9.0, 10.0, 10.0, 12.0, 16.0, 14.0, 22.0, 27.0, 22.0, 40.0, 33.0, 29.0, 35.0, 46.0, 45.0, 36.0, 37.0, 41.0, 46.0, 52.0, 48.0, 41.0, 35.0, 39.0, 23.0, 16.0, 20.0, 29.0, 19.0, 27.0, 20.0, 22.0, 10.0, 9.0, 8.0, 7.0, 6.0, 4.0, 3.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.59765625, -7.376708984375, -7.15576171875, -6.934814453125, -6.7138671875, -6.492919921875, -6.27197265625, -6.051025390625, -5.830078125, -5.609130859375, -5.38818359375, -5.167236328125, -4.9462890625, -4.725341796875, -4.50439453125, -4.283447265625, -4.0625, -3.841552734375, -3.62060546875, -3.399658203125, -3.1787109375, -2.957763671875, -2.73681640625, -2.515869140625, -2.294921875, -2.073974609375, -1.85302734375, -1.632080078125, -1.4111328125, -1.190185546875, -0.96923828125, -0.748291015625, -0.52734375, -0.306396484375, -0.08544921875, 0.135498046875, 0.3564453125, 0.577392578125, 0.79833984375, 1.019287109375, 1.240234375, 1.461181640625, 1.68212890625, 1.903076171875, 2.1240234375, 2.344970703125, 2.56591796875, 2.786865234375, 3.0078125, 3.228759765625, 3.44970703125, 3.670654296875, 3.8916015625, 4.112548828125, 4.33349609375, 4.554443359375, 4.775390625, 4.996337890625, 5.21728515625, 5.438232421875, 5.6591796875, 5.880126953125, 6.10107421875, 6.322021484375, 6.54296875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 8.0, 2.0, 14.0, 15.0, 19.0, 32.0, 42.0, 54.0, 83.0, 130.0, 172.0, 257.0, 414.0, 664.0, 1109.0, 1867.0, 3218.0, 6208.0, 13354.0, 35289.0, 145323.0, 3687889.0, 222128.0, 43772.0, 15862.0, 7145.0, 3708.0, 2063.0, 1255.0, 785.0, 485.0, 299.0, 173.0, 141.0, 74.0, 69.0, 40.0, 28.0, 16.0, 24.0, 13.0, 6.0, 10.0, 5.0, 4.0, 3.0, 4.0, 0.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-73.125, -70.654296875, -68.18359375, -65.712890625, -63.2421875, -60.771484375, -58.30078125, -55.830078125, -53.359375, -50.888671875, -48.41796875, -45.947265625, -43.4765625, -41.005859375, -38.53515625, -36.064453125, -33.59375, -31.123046875, -28.65234375, -26.181640625, -23.7109375, -21.240234375, -18.76953125, -16.298828125, -13.828125, -11.357421875, -8.88671875, -6.416015625, -3.9453125, -1.474609375, 0.99609375, 3.466796875, 5.9375, 8.408203125, 10.87890625, 13.349609375, 15.8203125, 18.291015625, 20.76171875, 23.232421875, 25.703125, 28.173828125, 30.64453125, 33.115234375, 35.5859375, 38.056640625, 40.52734375, 42.998046875, 45.46875, 47.939453125, 50.41015625, 52.880859375, 55.3515625, 57.822265625, 60.29296875, 62.763671875, 65.234375, 67.705078125, 70.17578125, 72.646484375, 75.1171875, 77.587890625, 80.05859375, 82.529296875, 85.0]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 3.0, 5.0, 6.0, 12.0, 22.0, 18.0, 50.0, 67.0, 141.0, 446.0, 2714.0, 274.0, 123.0, 51.0, 41.0, 26.0, 19.0, 16.0, 7.0, 4.0, 3.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.296875, -28.092041015625, -26.88720703125, -25.682373046875, -24.4775390625, -23.272705078125, -22.06787109375, -20.863037109375, -19.658203125, -18.453369140625, -17.24853515625, -16.043701171875, -14.8388671875, -13.634033203125, -12.42919921875, -11.224365234375, -10.01953125, -8.814697265625, -7.60986328125, -6.405029296875, -5.2001953125, -3.995361328125, -2.79052734375, -1.585693359375, -0.380859375, 0.823974609375, 2.02880859375, 3.233642578125, 4.4384765625, 5.643310546875, 6.84814453125, 8.052978515625, 9.2578125, 10.462646484375, 11.66748046875, 12.872314453125, 14.0771484375, 15.281982421875, 16.48681640625, 17.691650390625, 18.896484375, 20.101318359375, 21.30615234375, 22.510986328125, 23.7158203125, 24.920654296875, 26.12548828125, 27.330322265625, 28.53515625, 29.739990234375, 30.94482421875, 32.149658203125, 33.3544921875, 34.559326171875, 35.76416015625, 36.968994140625, 38.173828125, 39.378662109375, 40.58349609375, 41.788330078125, 42.9931640625, 44.197998046875, 45.40283203125, 46.607666015625, 47.8125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 8.0, 25.0, 47.0, 102.0, 209.0, 278.0, 186.0, 82.0, 32.0, 23.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-204.7943572998047, -192.905517578125, -181.0166778564453, -169.12783813476562, -157.23899841308594, -145.35015869140625, -133.46133422851562, -121.5724868774414, -109.68364715576172, -97.79480743408203, -85.90596771240234, -74.01713562011719, -62.128292083740234, -50.23945236206055, -38.350616455078125, -26.461776733398438, -14.57293701171875, -2.684098243713379, 9.204740524291992, 21.093578338623047, 32.982418060302734, 44.87125778198242, 56.760093688964844, 68.64893341064453, 80.53777313232422, 92.4266128540039, 104.3154525756836, 116.20428466796875, 128.09312438964844, 139.98196411132812, 151.8708038330078, 163.7596435546875, 175.64846801757812, 187.5373077392578, 199.4261474609375, 211.3149871826172, 223.20382690429688, 235.09266662597656, 246.98150634765625, 258.8703308105469, 270.7591857910156, 282.64801025390625, 294.536865234375, 306.4256896972656, 318.3145446777344, 330.203369140625, 342.09222412109375, 353.9810485839844, 365.869873046875, 377.7586975097656, 389.6475524902344, 401.536376953125, 413.42523193359375, 425.3140563964844, 437.2029113769531, 449.09173583984375, 460.9805908203125, 472.8694152832031, 484.7582702636719, 496.6470947265625, 508.53594970703125, 520.4248046875, 532.3135986328125, 544.2024536132812, 556.09130859375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 4.0, 5.0, 3.0, 12.0, 3.0, 6.0, 10.0, 15.0, 20.0, 15.0, 11.0, 25.0, 24.0, 35.0, 34.0, 31.0, 33.0, 37.0, 47.0, 46.0, 43.0, 45.0, 50.0, 42.0, 35.0, 50.0, 35.0, 38.0, 24.0, 31.0, 36.0, 20.0, 33.0, 12.0, 20.0, 13.0, 10.0, 13.0, 6.0, 7.0, 5.0, 6.0, 2.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.41522216796875, -79.52839660644531, -76.64156341552734, -73.7547378540039, -70.86790466308594, -67.9810791015625, -65.09425354003906, -62.207420349121094, -59.32059097290039, -56.43376159667969, -53.546932220458984, -50.66010284423828, -47.773277282714844, -44.886444091796875, -41.99961853027344, -39.112789154052734, -36.22595977783203, -33.33913040161133, -30.452301025390625, -27.565473556518555, -24.67864418029785, -21.79181480407715, -18.904987335205078, -16.018157958984375, -13.131328582763672, -10.244499206542969, -7.357670783996582, -4.470842361450195, -1.5840129852294922, 1.302816390991211, 4.189643859863281, 7.076473236083984, 9.963294982910156, 12.85012435913086, 15.736952781677246, 18.623781204223633, 21.510610580444336, 24.39743995666504, 27.28426742553711, 30.171096801757812, 33.057926177978516, 35.94475555419922, 38.83158493041992, 41.718414306640625, 44.60523986816406, 47.49207305908203, 50.37889862060547, 53.26572799682617, 56.152557373046875, 59.03938674926758, 61.92621612548828, 64.81304168701172, 67.69987487792969, 70.58670043945312, 73.47352600097656, 76.36035919189453, 79.2471923828125, 82.13401794433594, 85.0208511352539, 87.90767669677734, 90.79450988769531, 93.68133544921875, 96.56816101074219, 99.45499420166016, 102.3418197631836]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 6.0, 4.0, 12.0, 27.0, 19.0, 33.0, 60.0, 71.0, 123.0, 155.0, 236.0, 341.0, 536.0, 793.0, 1213.0, 2009.0, 3267.0, 5289.0, 9001.0, 15877.0, 30032.0, 62521.0, 148231.0, 350947.0, 233010.0, 92307.0, 41932.0, 20894.0, 11551.0, 6700.0, 4075.0, 2484.0, 1638.0, 1054.0, 662.0, 447.0, 313.0, 230.0, 139.0, 94.0, 65.0, 29.0, 38.0, 16.0, 23.0, 14.0, 11.0, 8.0, 6.0, 1.0, 1.0, 2.0, 1.0, 5.0], "bins": [-47.96875, -46.546875, -45.125, -43.703125, -42.28125, -40.859375, -39.4375, -38.015625, -36.59375, -35.171875, -33.75, -32.328125, -30.90625, -29.484375, -28.0625, -26.640625, -25.21875, -23.796875, -22.375, -20.953125, -19.53125, -18.109375, -16.6875, -15.265625, -13.84375, -12.421875, -11.0, -9.578125, -8.15625, -6.734375, -5.3125, -3.890625, -2.46875, -1.046875, 0.375, 1.796875, 3.21875, 4.640625, 6.0625, 7.484375, 8.90625, 10.328125, 11.75, 13.171875, 14.59375, 16.015625, 17.4375, 18.859375, 20.28125, 21.703125, 23.125, 24.546875, 25.96875, 27.390625, 28.8125, 30.234375, 31.65625, 33.078125, 34.5, 35.921875, 37.34375, 38.765625, 40.1875, 41.609375, 43.03125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 10.0, 6.0, 5.0, 6.0, 11.0, 14.0, 15.0, 13.0, 10.0, 14.0, 26.0, 17.0, 19.0, 29.0, 37.0, 19.0, 40.0, 41.0, 46.0, 43.0, 40.0, 49.0, 47.0, 36.0, 40.0, 25.0, 56.0, 38.0, 39.0, 28.0, 22.0, 31.0, 24.0, 18.0, 18.0, 17.0, 9.0, 9.0, 11.0, 8.0, 6.0, 2.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.40625, -8.1561279296875, -7.906005859375, -7.6558837890625, -7.40576171875, -7.1556396484375, -6.905517578125, -6.6553955078125, -6.4052734375, -6.1551513671875, -5.905029296875, -5.6549072265625, -5.40478515625, -5.1546630859375, -4.904541015625, -4.6544189453125, -4.404296875, -4.1541748046875, -3.904052734375, -3.6539306640625, -3.40380859375, -3.1536865234375, -2.903564453125, -2.6534423828125, -2.4033203125, -2.1531982421875, -1.903076171875, -1.6529541015625, -1.40283203125, -1.1527099609375, -0.902587890625, -0.6524658203125, -0.40234375, -0.1522216796875, 0.097900390625, 0.3480224609375, 0.59814453125, 0.8482666015625, 1.098388671875, 1.3485107421875, 1.5986328125, 1.8487548828125, 2.098876953125, 2.3489990234375, 2.59912109375, 2.8492431640625, 3.099365234375, 3.3494873046875, 3.599609375, 3.8497314453125, 4.099853515625, 4.3499755859375, 4.60009765625, 4.8502197265625, 5.100341796875, 5.3504638671875, 5.6005859375, 5.8507080078125, 6.100830078125, 6.3509521484375, 6.60107421875, 6.8511962890625, 7.101318359375, 7.3514404296875, 7.6015625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 15.0, 17.0, 8.0, 7.0, 12.0, 19.0, 35.0, 53.0, 71.0, 124.0, 210.0, 349.0, 593.0, 1046.0, 1867.0, 3754.0, 7898.0, 18215.0, 47131.0, 152896.0, 489353.0, 219346.0, 62822.0, 23228.0, 9805.0, 4536.0, 2270.0, 1175.0, 649.0, 365.0, 238.0, 125.0, 94.0, 65.0, 39.0, 22.0, 24.0, 10.0, 13.0, 10.0, 16.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-59.59375, -57.873046875, -56.15234375, -54.431640625, -52.7109375, -50.990234375, -49.26953125, -47.548828125, -45.828125, -44.107421875, -42.38671875, -40.666015625, -38.9453125, -37.224609375, -35.50390625, -33.783203125, -32.0625, -30.341796875, -28.62109375, -26.900390625, -25.1796875, -23.458984375, -21.73828125, -20.017578125, -18.296875, -16.576171875, -14.85546875, -13.134765625, -11.4140625, -9.693359375, -7.97265625, -6.251953125, -4.53125, -2.810546875, -1.08984375, 0.630859375, 2.3515625, 4.072265625, 5.79296875, 7.513671875, 9.234375, 10.955078125, 12.67578125, 14.396484375, 16.1171875, 17.837890625, 19.55859375, 21.279296875, 23.0, 24.720703125, 26.44140625, 28.162109375, 29.8828125, 31.603515625, 33.32421875, 35.044921875, 36.765625, 38.486328125, 40.20703125, 41.927734375, 43.6484375, 45.369140625, 47.08984375, 48.810546875, 50.53125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 8.0, 13.0, 8.0, 15.0, 14.0, 12.0, 13.0, 19.0, 34.0, 38.0, 34.0, 33.0, 28.0, 41.0, 44.0, 42.0, 45.0, 50.0, 47.0, 37.0, 48.0, 47.0, 40.0, 42.0, 38.0, 31.0, 25.0, 23.0, 19.0, 15.0, 17.0, 12.0, 10.0, 12.0, 9.0, 7.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 5.0, 0.0, 0.0, 2.0], "bins": [-49.28125, -47.8896484375, -46.498046875, -45.1064453125, -43.71484375, -42.3232421875, -40.931640625, -39.5400390625, -38.1484375, -36.7568359375, -35.365234375, -33.9736328125, -32.58203125, -31.1904296875, -29.798828125, -28.4072265625, -27.015625, -25.6240234375, -24.232421875, -22.8408203125, -21.44921875, -20.0576171875, -18.666015625, -17.2744140625, -15.8828125, -14.4912109375, -13.099609375, -11.7080078125, -10.31640625, -8.9248046875, -7.533203125, -6.1416015625, -4.75, -3.3583984375, -1.966796875, -0.5751953125, 0.81640625, 2.2080078125, 3.599609375, 4.9912109375, 6.3828125, 7.7744140625, 9.166015625, 10.5576171875, 11.94921875, 13.3408203125, 14.732421875, 16.1240234375, 17.515625, 18.9072265625, 20.298828125, 21.6904296875, 23.08203125, 24.4736328125, 25.865234375, 27.2568359375, 28.6484375, 30.0400390625, 31.431640625, 32.8232421875, 34.21484375, 35.6064453125, 36.998046875, 38.3896484375, 39.78125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 5.0, 8.0, 10.0, 16.0, 25.0, 39.0, 47.0, 65.0, 97.0, 135.0, 187.0, 362.0, 587.0, 1115.0, 2112.0, 5004.0, 15196.0, 73578.0, 705039.0, 203583.0, 27125.0, 7722.0, 3077.0, 1431.0, 720.0, 411.0, 273.0, 203.0, 107.0, 73.0, 56.0, 29.0, 39.0, 23.0, 14.0, 10.0, 6.0, 6.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.5, -58.5302734375, -56.560546875, -54.5908203125, -52.62109375, -50.6513671875, -48.681640625, -46.7119140625, -44.7421875, -42.7724609375, -40.802734375, -38.8330078125, -36.86328125, -34.8935546875, -32.923828125, -30.9541015625, -28.984375, -27.0146484375, -25.044921875, -23.0751953125, -21.10546875, -19.1357421875, -17.166015625, -15.1962890625, -13.2265625, -11.2568359375, -9.287109375, -7.3173828125, -5.34765625, -3.3779296875, -1.408203125, 0.5615234375, 2.53125, 4.5009765625, 6.470703125, 8.4404296875, 10.41015625, 12.3798828125, 14.349609375, 16.3193359375, 18.2890625, 20.2587890625, 22.228515625, 24.1982421875, 26.16796875, 28.1376953125, 30.107421875, 32.0771484375, 34.046875, 36.0166015625, 37.986328125, 39.9560546875, 41.92578125, 43.8955078125, 45.865234375, 47.8349609375, 49.8046875, 51.7744140625, 53.744140625, 55.7138671875, 57.68359375, 59.6533203125, 61.623046875, 63.5927734375, 65.5625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 4.0, 9.0, 15.0, 18.0, 30.0, 42.0, 73.0, 103.0, 220.0, 175.0, 96.0, 65.0, 33.0, 27.0, 21.0, 11.0, 7.0, 6.0, 8.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0171966552734375, -0.016753792762756348, -0.016310930252075195, -0.015868067741394043, -0.01542520523071289, -0.014982342720031738, -0.014539480209350586, -0.014096617698669434, -0.013653755187988281, -0.013210892677307129, -0.012768030166625977, -0.012325167655944824, -0.011882305145263672, -0.01143944263458252, -0.010996580123901367, -0.010553717613220215, -0.010110855102539062, -0.00966799259185791, -0.009225130081176758, -0.008782267570495605, -0.008339405059814453, -0.0078965425491333, -0.0074536800384521484, -0.007010817527770996, -0.006567955017089844, -0.006125092506408691, -0.005682229995727539, -0.005239367485046387, -0.004796504974365234, -0.004353642463684082, -0.00391077995300293, -0.0034679174423217773, -0.003025054931640625, -0.0025821924209594727, -0.0021393299102783203, -0.001696467399597168, -0.0012536048889160156, -0.0008107423782348633, -0.00036787986755371094, 7.49826431274414e-05, 0.0005178451538085938, 0.0009607076644897461, 0.0014035701751708984, 0.0018464326858520508, 0.002289295196533203, 0.0027321577072143555, 0.003175020217895508, 0.00361788272857666, 0.0040607452392578125, 0.004503607749938965, 0.004946470260620117, 0.0053893327713012695, 0.005832195281982422, 0.006275057792663574, 0.0067179203033447266, 0.007160782814025879, 0.007603645324707031, 0.008046507835388184, 0.008489370346069336, 0.008932232856750488, 0.00937509536743164, 0.009817957878112793, 0.010260820388793945, 0.010703682899475098, 0.01114654541015625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 3.0, 4.0, 7.0, 10.0, 8.0, 17.0, 27.0, 25.0, 45.0, 60.0, 101.0, 126.0, 209.0, 365.0, 695.0, 1272.0, 3044.0, 9331.0, 47280.0, 604757.0, 337984.0, 31165.0, 6946.0, 2413.0, 1144.0, 591.0, 325.0, 194.0, 125.0, 83.0, 51.0, 40.0, 26.0, 17.0, 13.0, 7.0, 11.0, 7.0, 8.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-77.875, -75.705078125, -73.53515625, -71.365234375, -69.1953125, -67.025390625, -64.85546875, -62.685546875, -60.515625, -58.345703125, -56.17578125, -54.005859375, -51.8359375, -49.666015625, -47.49609375, -45.326171875, -43.15625, -40.986328125, -38.81640625, -36.646484375, -34.4765625, -32.306640625, -30.13671875, -27.966796875, -25.796875, -23.626953125, -21.45703125, -19.287109375, -17.1171875, -14.947265625, -12.77734375, -10.607421875, -8.4375, -6.267578125, -4.09765625, -1.927734375, 0.2421875, 2.412109375, 4.58203125, 6.751953125, 8.921875, 11.091796875, 13.26171875, 15.431640625, 17.6015625, 19.771484375, 21.94140625, 24.111328125, 26.28125, 28.451171875, 30.62109375, 32.791015625, 34.9609375, 37.130859375, 39.30078125, 41.470703125, 43.640625, 45.810546875, 47.98046875, 50.150390625, 52.3203125, 54.490234375, 56.66015625, 58.830078125, 61.0]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 9.0, 4.0, 10.0, 12.0, 15.0, 22.0, 39.0, 49.0, 66.0, 96.0, 137.0, 147.0, 116.0, 75.0, 56.0, 52.0, 19.0, 21.0, 15.0, 15.0, 6.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.46875, -38.11572265625, -36.7626953125, -35.40966796875, -34.056640625, -32.70361328125, -31.3505859375, -29.99755859375, -28.64453125, -27.29150390625, -25.9384765625, -24.58544921875, -23.232421875, -21.87939453125, -20.5263671875, -19.17333984375, -17.8203125, -16.46728515625, -15.1142578125, -13.76123046875, -12.408203125, -11.05517578125, -9.7021484375, -8.34912109375, -6.99609375, -5.64306640625, -4.2900390625, -2.93701171875, -1.583984375, -0.23095703125, 1.1220703125, 2.47509765625, 3.828125, 5.18115234375, 6.5341796875, 7.88720703125, 9.240234375, 10.59326171875, 11.9462890625, 13.29931640625, 14.65234375, 16.00537109375, 17.3583984375, 18.71142578125, 20.064453125, 21.41748046875, 22.7705078125, 24.12353515625, 25.4765625, 26.82958984375, 28.1826171875, 29.53564453125, 30.888671875, 32.24169921875, 33.5947265625, 34.94775390625, 36.30078125, 37.65380859375, 39.0068359375, 40.35986328125, 41.712890625, 43.06591796875, 44.4189453125, 45.77197265625, 47.125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 10.0, 15.0, 30.0, 42.0, 97.0, 125.0, 186.0, 166.0, 152.0, 83.0, 42.0, 33.0, 17.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-615.23486328125, -594.6429443359375, -574.051025390625, -553.4590454101562, -532.8671264648438, -512.2752075195312, -491.6832580566406, -471.09130859375, -450.4993896484375, -429.907470703125, -409.3155212402344, -388.72357177734375, -368.13165283203125, -347.53973388671875, -326.9477844238281, -306.3558349609375, -285.763916015625, -265.1719970703125, -244.58004760742188, -223.9881134033203, -203.39617919921875, -182.8042449951172, -162.21231079101562, -141.62037658691406, -121.0284423828125, -100.43650817871094, -79.84457397460938, -59.25263977050781, -38.66070556640625, -18.068771362304688, 2.523162841796875, 23.115097045898438, 43.70703125, 64.29896545410156, 84.89089965820312, 105.48283386230469, 126.07476806640625, 146.6667022705078, 167.25863647460938, 187.85057067871094, 208.4425048828125, 229.03443908691406, 249.62637329101562, 270.21832275390625, 290.81024169921875, 311.40216064453125, 331.9941101074219, 352.5860595703125, 373.177978515625, 393.7698974609375, 414.3618469238281, 434.95379638671875, 455.54571533203125, 476.13763427734375, 496.7295837402344, 517.321533203125, 537.9134521484375, 558.50537109375, 579.0972900390625, 599.6892700195312, 620.2811889648438, 640.8731079101562, 661.465087890625, 682.0570068359375, 702.64892578125]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 8.0, 7.0, 7.0, 14.0, 19.0, 14.0, 21.0, 26.0, 39.0, 39.0, 48.0, 42.0, 55.0, 46.0, 58.0, 47.0, 37.0, 53.0, 54.0, 49.0, 53.0, 37.0, 28.0, 36.0, 22.0, 22.0, 24.0, 17.0, 26.0, 19.0, 5.0, 8.0, 6.0, 4.0, 5.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-262.41778564453125, -253.11940002441406, -243.82102966308594, -234.52264404296875, -225.22427368164062, -215.92588806152344, -206.62750244140625, -197.32913208007812, -188.03076171875, -178.7323760986328, -169.4340057373047, -160.1356201171875, -150.83724975585938, -141.5388641357422, -132.240478515625, -122.94210815429688, -113.64372253417969, -104.34534454345703, -95.04696655273438, -85.74858093261719, -76.45021057128906, -67.15182495117188, -57.85344696044922, -48.55506896972656, -39.256690979003906, -29.95831298828125, -20.65993309020996, -11.361553192138672, -2.0631752014160156, 7.235202789306641, 16.533584594726562, 25.83196258544922, 35.130340576171875, 44.42871856689453, 53.72709655761719, 63.02547836303711, 72.3238525390625, 81.62223815917969, 90.92061614990234, 100.218994140625, 109.51737213134766, 118.81575012207031, 128.1141357421875, 137.41250610351562, 146.7108917236328, 156.00926208496094, 165.30764770507812, 174.60601806640625, 183.90440368652344, 193.20278930664062, 202.50115966796875, 211.79954528808594, 221.09791564941406, 230.39630126953125, 239.69467163085938, 248.99305725097656, 258.29144287109375, 267.5898132324219, 276.8882141113281, 286.18658447265625, 295.4849548339844, 304.7833251953125, 314.08172607421875, 323.3800964355469, 332.678466796875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 6.0, 9.0, 11.0, 8.0, 15.0, 26.0, 25.0, 29.0, 38.0, 76.0, 109.0, 138.0, 208.0, 289.0, 383.0, 662.0, 1040.0, 1643.0, 2888.0, 5753.0, 12699.0, 35250.0, 168500.0, 3749113.0, 155736.0, 34505.0, 12215.0, 5537.0, 3012.0, 1606.0, 968.0, 589.0, 393.0, 243.0, 183.0, 102.0, 80.0, 56.0, 42.0, 29.0, 22.0, 15.0, 7.0, 13.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-84.0, -81.697265625, -79.39453125, -77.091796875, -74.7890625, -72.486328125, -70.18359375, -67.880859375, -65.578125, -63.275390625, -60.97265625, -58.669921875, -56.3671875, -54.064453125, -51.76171875, -49.458984375, -47.15625, -44.853515625, -42.55078125, -40.248046875, -37.9453125, -35.642578125, -33.33984375, -31.037109375, -28.734375, -26.431640625, -24.12890625, -21.826171875, -19.5234375, -17.220703125, -14.91796875, -12.615234375, -10.3125, -8.009765625, -5.70703125, -3.404296875, -1.1015625, 1.201171875, 3.50390625, 5.806640625, 8.109375, 10.412109375, 12.71484375, 15.017578125, 17.3203125, 19.623046875, 21.92578125, 24.228515625, 26.53125, 28.833984375, 31.13671875, 33.439453125, 35.7421875, 38.044921875, 40.34765625, 42.650390625, 44.953125, 47.255859375, 49.55859375, 51.861328125, 54.1640625, 56.466796875, 58.76953125, 61.072265625, 63.375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 11.0, 12.0, 9.0, 17.0, 17.0, 19.0, 27.0, 38.0, 45.0, 52.0, 40.0, 61.0, 67.0, 55.0, 56.0, 49.0, 73.0, 53.0, 49.0, 42.0, 52.0, 38.0, 26.0, 26.0, 22.0, 14.0, 5.0, 12.0, 6.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.3515625, -10.9781494140625, -10.604736328125, -10.2313232421875, -9.85791015625, -9.4844970703125, -9.111083984375, -8.7376708984375, -8.3642578125, -7.9908447265625, -7.617431640625, -7.2440185546875, -6.87060546875, -6.4971923828125, -6.123779296875, -5.7503662109375, -5.376953125, -5.0035400390625, -4.630126953125, -4.2567138671875, -3.88330078125, -3.5098876953125, -3.136474609375, -2.7630615234375, -2.3896484375, -2.0162353515625, -1.642822265625, -1.2694091796875, -0.89599609375, -0.5225830078125, -0.149169921875, 0.2242431640625, 0.59765625, 0.9710693359375, 1.344482421875, 1.7178955078125, 2.09130859375, 2.4647216796875, 2.838134765625, 3.2115478515625, 3.5849609375, 3.9583740234375, 4.331787109375, 4.7052001953125, 5.07861328125, 5.4520263671875, 5.825439453125, 6.1988525390625, 6.572265625, 6.9456787109375, 7.319091796875, 7.6925048828125, 8.06591796875, 8.4393310546875, 8.812744140625, 9.1861572265625, 9.5595703125, 9.9329833984375, 10.306396484375, 10.6798095703125, 11.05322265625, 11.4266357421875, 11.800048828125, 12.1734619140625, 12.546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 7.0, 12.0, 13.0, 21.0, 12.0, 41.0, 47.0, 69.0, 95.0, 151.0, 259.0, 436.0, 778.0, 1341.0, 2937.0, 7484.0, 25647.0, 138519.0, 3726715.0, 237815.0, 34971.0, 9546.0, 3561.0, 1601.0, 862.0, 483.0, 287.0, 173.0, 122.0, 91.0, 55.0, 42.0, 24.0, 20.0, 13.0, 5.0, 8.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.1875, -111.6552734375, -108.123046875, -104.5908203125, -101.05859375, -97.5263671875, -93.994140625, -90.4619140625, -86.9296875, -83.3974609375, -79.865234375, -76.3330078125, -72.80078125, -69.2685546875, -65.736328125, -62.2041015625, -58.671875, -55.1396484375, -51.607421875, -48.0751953125, -44.54296875, -41.0107421875, -37.478515625, -33.9462890625, -30.4140625, -26.8818359375, -23.349609375, -19.8173828125, -16.28515625, -12.7529296875, -9.220703125, -5.6884765625, -2.15625, 1.3759765625, 4.908203125, 8.4404296875, 11.97265625, 15.5048828125, 19.037109375, 22.5693359375, 26.1015625, 29.6337890625, 33.166015625, 36.6982421875, 40.23046875, 43.7626953125, 47.294921875, 50.8271484375, 54.359375, 57.8916015625, 61.423828125, 64.9560546875, 68.48828125, 72.0205078125, 75.552734375, 79.0849609375, 82.6171875, 86.1494140625, 89.681640625, 93.2138671875, 96.74609375, 100.2783203125, 103.810546875, 107.3427734375, 110.875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 6.0, 11.0, 18.0, 28.0, 36.0, 72.0, 137.0, 374.0, 2595.0, 454.0, 139.0, 84.0, 50.0, 24.0, 8.0, 11.0, 7.0, 10.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.46875, -36.59814453125, -34.7275390625, -32.85693359375, -30.986328125, -29.11572265625, -27.2451171875, -25.37451171875, -23.50390625, -21.63330078125, -19.7626953125, -17.89208984375, -16.021484375, -14.15087890625, -12.2802734375, -10.40966796875, -8.5390625, -6.66845703125, -4.7978515625, -2.92724609375, -1.056640625, 0.81396484375, 2.6845703125, 4.55517578125, 6.42578125, 8.29638671875, 10.1669921875, 12.03759765625, 13.908203125, 15.77880859375, 17.6494140625, 19.52001953125, 21.390625, 23.26123046875, 25.1318359375, 27.00244140625, 28.873046875, 30.74365234375, 32.6142578125, 34.48486328125, 36.35546875, 38.22607421875, 40.0966796875, 41.96728515625, 43.837890625, 45.70849609375, 47.5791015625, 49.44970703125, 51.3203125, 53.19091796875, 55.0615234375, 56.93212890625, 58.802734375, 60.67333984375, 62.5439453125, 64.41455078125, 66.28515625, 68.15576171875, 70.0263671875, 71.89697265625, 73.767578125, 75.63818359375, 77.5087890625, 79.37939453125, 81.25]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 27.0, 181.0, 367.0, 298.0, 99.0, 24.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-877.7890625, -853.2758178710938, -828.7625122070312, -804.249267578125, -779.7360229492188, -755.2227172851562, -730.70947265625, -706.1961669921875, -681.6829223632812, -657.169677734375, -632.6563720703125, -608.1431274414062, -583.6298828125, -559.1165771484375, -534.6033325195312, -510.0900573730469, -485.5768127441406, -461.06353759765625, -436.55029296875, -412.0370178222656, -387.52374267578125, -363.010498046875, -338.4972229003906, -313.98394775390625, -289.470703125, -264.9574279785156, -240.4441680908203, -215.930908203125, -191.41763305664062, -166.9043731689453, -142.39111328125, -117.87783813476562, -93.36456298828125, -68.8512954711914, -44.33803176879883, -19.82476806640625, 4.688499450683594, 29.201766967773438, 53.71502685546875, 78.22830200195312, 102.74156188964844, 127.25482940673828, 151.76809692382812, 176.28135681152344, 200.79461669921875, 225.30789184570312, 249.82115173339844, 274.33441162109375, 298.8476867675781, 323.3609619140625, 347.87420654296875, 372.3874816894531, 396.9007568359375, 421.41400146484375, 445.9272766113281, 470.4405517578125, 494.95379638671875, 519.467041015625, 543.9803466796875, 568.4935913085938, 593.0068359375, 617.5201416015625, 642.0333862304688, 666.546630859375, 691.0599365234375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 4.0, 6.0, 7.0, 11.0, 14.0, 10.0, 18.0, 25.0, 19.0, 26.0, 32.0, 38.0, 34.0, 44.0, 61.0, 40.0, 51.0, 37.0, 54.0, 61.0, 56.0, 41.0, 47.0, 32.0, 41.0, 28.0, 23.0, 27.0, 27.0, 22.0, 17.0, 9.0, 10.0, 5.0, 6.0, 12.0, 3.0, 5.0, 2.0, 1.0, 5.0, 1.0], "bins": [-179.501708984375, -175.03573608398438, -170.56976318359375, -166.1038055419922, -161.63783264160156, -157.17185974121094, -152.7058868408203, -148.2399139404297, -143.77395629882812, -139.3079833984375, -134.84201049804688, -130.3760528564453, -125.91007995605469, -121.44410705566406, -116.97813415527344, -112.51216125488281, -108.04618835449219, -103.58021545410156, -99.11425018310547, -94.64827728271484, -90.18231201171875, -85.71633911132812, -81.2503662109375, -76.78439331054688, -72.31842803955078, -67.85245513916016, -63.38648986816406, -58.92051696777344, -54.45454788208008, -49.98857879638672, -45.522605895996094, -41.056636810302734, -36.590660095214844, -32.124691009521484, -27.658720016479492, -23.1927490234375, -18.72677993774414, -14.260810852050781, -9.794839859008789, -5.328868865966797, -0.8628997802734375, 3.6030702590942383, 8.069040298461914, 12.53501033782959, 17.000980377197266, 21.466949462890625, 25.932920455932617, 30.39889144897461, 34.86486053466797, 39.33082962036133, 43.79679870605469, 48.26277160644531, 52.72874069213867, 57.19470977783203, 61.660682678222656, 66.12664794921875, 70.59262084960938, 75.05859375, 79.5245590209961, 83.99053192138672, 88.45649719238281, 92.92247009277344, 97.38844299316406, 101.85441589355469, 106.32038116455078]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 9.0, 5.0, 6.0, 18.0, 24.0, 19.0, 38.0, 43.0, 64.0, 99.0, 121.0, 191.0, 268.0, 429.0, 580.0, 833.0, 1305.0, 1930.0, 3130.0, 5075.0, 8766.0, 16071.0, 32696.0, 73764.0, 210944.0, 438712.0, 139970.0, 55173.0, 25586.0, 13107.0, 7473.0, 4335.0, 2622.0, 1697.0, 1111.0, 750.0, 514.0, 339.0, 210.0, 152.0, 119.0, 79.0, 59.0, 37.0, 26.0, 20.0, 12.0, 18.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-51.8125, -50.30322265625, -48.7939453125, -47.28466796875, -45.775390625, -44.26611328125, -42.7568359375, -41.24755859375, -39.73828125, -38.22900390625, -36.7197265625, -35.21044921875, -33.701171875, -32.19189453125, -30.6826171875, -29.17333984375, -27.6640625, -26.15478515625, -24.6455078125, -23.13623046875, -21.626953125, -20.11767578125, -18.6083984375, -17.09912109375, -15.58984375, -14.08056640625, -12.5712890625, -11.06201171875, -9.552734375, -8.04345703125, -6.5341796875, -5.02490234375, -3.515625, -2.00634765625, -0.4970703125, 1.01220703125, 2.521484375, 4.03076171875, 5.5400390625, 7.04931640625, 8.55859375, 10.06787109375, 11.5771484375, 13.08642578125, 14.595703125, 16.10498046875, 17.6142578125, 19.12353515625, 20.6328125, 22.14208984375, 23.6513671875, 25.16064453125, 26.669921875, 28.17919921875, 29.6884765625, 31.19775390625, 32.70703125, 34.21630859375, 35.7255859375, 37.23486328125, 38.744140625, 40.25341796875, 41.7626953125, 43.27197265625, 44.78125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 8.0, 5.0, 5.0, 4.0, 8.0, 15.0, 7.0, 13.0, 13.0, 12.0, 19.0, 18.0, 23.0, 32.0, 34.0, 22.0, 24.0, 46.0, 46.0, 35.0, 39.0, 37.0, 51.0, 47.0, 43.0, 38.0, 42.0, 42.0, 37.0, 29.0, 24.0, 37.0, 22.0, 19.0, 18.0, 16.0, 9.0, 9.0, 11.0, 15.0, 5.0, 5.0, 5.0, 6.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-9.859375, -9.57177734375, -9.2841796875, -8.99658203125, -8.708984375, -8.42138671875, -8.1337890625, -7.84619140625, -7.55859375, -7.27099609375, -6.9833984375, -6.69580078125, -6.408203125, -6.12060546875, -5.8330078125, -5.54541015625, -5.2578125, -4.97021484375, -4.6826171875, -4.39501953125, -4.107421875, -3.81982421875, -3.5322265625, -3.24462890625, -2.95703125, -2.66943359375, -2.3818359375, -2.09423828125, -1.806640625, -1.51904296875, -1.2314453125, -0.94384765625, -0.65625, -0.36865234375, -0.0810546875, 0.20654296875, 0.494140625, 0.78173828125, 1.0693359375, 1.35693359375, 1.64453125, 1.93212890625, 2.2197265625, 2.50732421875, 2.794921875, 3.08251953125, 3.3701171875, 3.65771484375, 3.9453125, 4.23291015625, 4.5205078125, 4.80810546875, 5.095703125, 5.38330078125, 5.6708984375, 5.95849609375, 6.24609375, 6.53369140625, 6.8212890625, 7.10888671875, 7.396484375, 7.68408203125, 7.9716796875, 8.25927734375, 8.546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 3.0, 8.0, 6.0, 6.0, 9.0, 16.0, 18.0, 26.0, 27.0, 45.0, 73.0, 107.0, 146.0, 252.0, 330.0, 654.0, 1102.0, 2111.0, 4371.0, 10326.0, 30793.0, 137655.0, 655767.0, 151399.0, 32849.0, 10712.0, 4624.0, 2209.0, 1148.0, 643.0, 374.0, 246.0, 161.0, 97.0, 50.0, 43.0, 38.0, 32.0, 18.0, 21.0, 12.0, 5.0, 4.0, 10.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-76.875, -74.58203125, -72.2890625, -69.99609375, -67.703125, -65.41015625, -63.1171875, -60.82421875, -58.53125, -56.23828125, -53.9453125, -51.65234375, -49.359375, -47.06640625, -44.7734375, -42.48046875, -40.1875, -37.89453125, -35.6015625, -33.30859375, -31.015625, -28.72265625, -26.4296875, -24.13671875, -21.84375, -19.55078125, -17.2578125, -14.96484375, -12.671875, -10.37890625, -8.0859375, -5.79296875, -3.5, -1.20703125, 1.0859375, 3.37890625, 5.671875, 7.96484375, 10.2578125, 12.55078125, 14.84375, 17.13671875, 19.4296875, 21.72265625, 24.015625, 26.30859375, 28.6015625, 30.89453125, 33.1875, 35.48046875, 37.7734375, 40.06640625, 42.359375, 44.65234375, 46.9453125, 49.23828125, 51.53125, 53.82421875, 56.1171875, 58.41015625, 60.703125, 62.99609375, 65.2890625, 67.58203125, 69.875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 10.0, 9.0, 6.0, 9.0, 12.0, 14.0, 26.0, 34.0, 27.0, 35.0, 41.0, 60.0, 45.0, 71.0, 60.0, 71.0, 50.0, 69.0, 58.0, 57.0, 42.0, 45.0, 40.0, 22.0, 18.0, 18.0, 12.0, 6.0, 10.0, 7.0, 2.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-72.4375, -70.33984375, -68.2421875, -66.14453125, -64.046875, -61.94921875, -59.8515625, -57.75390625, -55.65625, -53.55859375, -51.4609375, -49.36328125, -47.265625, -45.16796875, -43.0703125, -40.97265625, -38.875, -36.77734375, -34.6796875, -32.58203125, -30.484375, -28.38671875, -26.2890625, -24.19140625, -22.09375, -19.99609375, -17.8984375, -15.80078125, -13.703125, -11.60546875, -9.5078125, -7.41015625, -5.3125, -3.21484375, -1.1171875, 0.98046875, 3.078125, 5.17578125, 7.2734375, 9.37109375, 11.46875, 13.56640625, 15.6640625, 17.76171875, 19.859375, 21.95703125, 24.0546875, 26.15234375, 28.25, 30.34765625, 32.4453125, 34.54296875, 36.640625, 38.73828125, 40.8359375, 42.93359375, 45.03125, 47.12890625, 49.2265625, 51.32421875, 53.421875, 55.51953125, 57.6171875, 59.71484375, 61.8125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 12.0, 24.0, 27.0, 35.0, 50.0, 63.0, 106.0, 162.0, 251.0, 449.0, 836.0, 1766.0, 4758.0, 17489.0, 175248.0, 797914.0, 36437.0, 7731.0, 2564.0, 1144.0, 572.0, 328.0, 194.0, 111.0, 73.0, 61.0, 46.0, 24.0, 14.0, 14.0, 14.0, 10.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.0625, -79.2529296875, -76.443359375, -73.6337890625, -70.82421875, -68.0146484375, -65.205078125, -62.3955078125, -59.5859375, -56.7763671875, -53.966796875, -51.1572265625, -48.34765625, -45.5380859375, -42.728515625, -39.9189453125, -37.109375, -34.2998046875, -31.490234375, -28.6806640625, -25.87109375, -23.0615234375, -20.251953125, -17.4423828125, -14.6328125, -11.8232421875, -9.013671875, -6.2041015625, -3.39453125, -0.5849609375, 2.224609375, 5.0341796875, 7.84375, 10.6533203125, 13.462890625, 16.2724609375, 19.08203125, 21.8916015625, 24.701171875, 27.5107421875, 30.3203125, 33.1298828125, 35.939453125, 38.7490234375, 41.55859375, 44.3681640625, 47.177734375, 49.9873046875, 52.796875, 55.6064453125, 58.416015625, 61.2255859375, 64.03515625, 66.8447265625, 69.654296875, 72.4638671875, 75.2734375, 78.0830078125, 80.892578125, 83.7021484375, 86.51171875, 89.3212890625, 92.130859375, 94.9404296875, 97.75]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 4.0, 5.0, 7.0, 9.0, 38.0, 42.0, 120.0, 472.0, 175.0, 55.0, 27.0, 20.0, 12.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019866943359375, -0.018901824951171875, -0.01793670654296875, -0.016971588134765625, -0.0160064697265625, -0.015041351318359375, -0.01407623291015625, -0.013111114501953125, -0.01214599609375, -0.011180877685546875, -0.01021575927734375, -0.009250640869140625, -0.0082855224609375, -0.007320404052734375, -0.00635528564453125, -0.005390167236328125, -0.004425048828125, -0.003459930419921875, -0.00249481201171875, -0.001529693603515625, -0.0005645751953125, 0.000400543212890625, 0.00136566162109375, 0.002330780029296875, 0.0032958984375, 0.004261016845703125, 0.00522613525390625, 0.006191253662109375, 0.0071563720703125, 0.008121490478515625, 0.00908660888671875, 0.010051727294921875, 0.011016845703125, 0.011981964111328125, 0.01294708251953125, 0.013912200927734375, 0.0148773193359375, 0.015842437744140625, 0.01680755615234375, 0.017772674560546875, 0.01873779296875, 0.019702911376953125, 0.02066802978515625, 0.021633148193359375, 0.0225982666015625, 0.023563385009765625, 0.02452850341796875, 0.025493621826171875, 0.026458740234375, 0.027423858642578125, 0.02838897705078125, 0.029354095458984375, 0.0303192138671875, 0.031284332275390625, 0.03224945068359375, 0.033214569091796875, 0.0341796875, 0.035144805908203125, 0.03610992431640625, 0.037075042724609375, 0.0380401611328125, 0.039005279541015625, 0.03997039794921875, 0.040935516357421875, 0.041900634765625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 4.0, 2.0, 8.0, 6.0, 9.0, 9.0, 13.0, 13.0, 27.0, 41.0, 67.0, 120.0, 168.0, 331.0, 676.0, 1490.0, 3596.0, 13201.0, 117970.0, 852035.0, 46419.0, 7606.0, 2488.0, 1106.0, 515.0, 232.0, 159.0, 92.0, 62.0, 26.0, 21.0, 14.0, 6.0, 5.0, 4.0, 6.0, 1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.0625, -78.2978515625, -75.533203125, -72.7685546875, -70.00390625, -67.2392578125, -64.474609375, -61.7099609375, -58.9453125, -56.1806640625, -53.416015625, -50.6513671875, -47.88671875, -45.1220703125, -42.357421875, -39.5927734375, -36.828125, -34.0634765625, -31.298828125, -28.5341796875, -25.76953125, -23.0048828125, -20.240234375, -17.4755859375, -14.7109375, -11.9462890625, -9.181640625, -6.4169921875, -3.65234375, -0.8876953125, 1.876953125, 4.6416015625, 7.40625, 10.1708984375, 12.935546875, 15.7001953125, 18.46484375, 21.2294921875, 23.994140625, 26.7587890625, 29.5234375, 32.2880859375, 35.052734375, 37.8173828125, 40.58203125, 43.3466796875, 46.111328125, 48.8759765625, 51.640625, 54.4052734375, 57.169921875, 59.9345703125, 62.69921875, 65.4638671875, 68.228515625, 70.9931640625, 73.7578125, 76.5224609375, 79.287109375, 82.0517578125, 84.81640625, 87.5810546875, 90.345703125, 93.1103515625, 95.875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 5.0, 10.0, 16.0, 25.0, 33.0, 52.0, 67.0, 181.0, 288.0, 135.0, 59.0, 36.0, 28.0, 23.0, 11.0, 9.0, 4.0, 4.0, 0.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.96875, -49.99560546875, -48.0224609375, -46.04931640625, -44.076171875, -42.10302734375, -40.1298828125, -38.15673828125, -36.18359375, -34.21044921875, -32.2373046875, -30.26416015625, -28.291015625, -26.31787109375, -24.3447265625, -22.37158203125, -20.3984375, -18.42529296875, -16.4521484375, -14.47900390625, -12.505859375, -10.53271484375, -8.5595703125, -6.58642578125, -4.61328125, -2.64013671875, -0.6669921875, 1.30615234375, 3.279296875, 5.25244140625, 7.2255859375, 9.19873046875, 11.171875, 13.14501953125, 15.1181640625, 17.09130859375, 19.064453125, 21.03759765625, 23.0107421875, 24.98388671875, 26.95703125, 28.93017578125, 30.9033203125, 32.87646484375, 34.849609375, 36.82275390625, 38.7958984375, 40.76904296875, 42.7421875, 44.71533203125, 46.6884765625, 48.66162109375, 50.634765625, 52.60791015625, 54.5810546875, 56.55419921875, 58.52734375, 60.50048828125, 62.4736328125, 64.44677734375, 66.419921875, 68.39306640625, 70.3662109375, 72.33935546875, 74.3125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 12.0, 25.0, 64.0, 100.0, 156.0, 216.0, 180.0, 101.0, 71.0, 33.0, 20.0, 13.0, 3.0, 7.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-337.5392150878906, -312.78826904296875, -288.03729248046875, -263.2863464355469, -238.53538513183594, -213.784423828125, -189.03347778320312, -164.2825164794922, -139.53155517578125, -114.78059387207031, -90.0296401977539, -65.2786865234375, -40.52772521972656, -15.776763916015625, 8.97418212890625, 33.72514343261719, 58.476104736328125, 83.22706604003906, 107.97801971435547, 132.72897338867188, 157.4799346923828, 182.23089599609375, 206.98184204101562, 231.73280334472656, 256.4837646484375, 281.2347106933594, 305.9856872558594, 330.73663330078125, 355.48760986328125, 380.2385559082031, 404.989501953125, 429.740478515625, 454.491455078125, 479.2424011230469, 503.9933776855469, 528.7443237304688, 553.4953002929688, 578.2462158203125, 602.9971923828125, 627.7481689453125, 652.4991455078125, 677.2501220703125, 702.0010375976562, 726.7520141601562, 751.5029907226562, 776.25390625, 801.0048828125, 825.755859375, 850.5067749023438, 875.2577514648438, 900.0086669921875, 924.7596435546875, 949.5106201171875, 974.2615966796875, 999.0125122070312, 1023.7634887695312, 1048.514404296875, 1073.265380859375, 1098.016357421875, 1122.767333984375, 1147.5181884765625, 1172.2691650390625, 1197.0201416015625, 1221.7711181640625, 1246.5220947265625]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 5.0, 3.0, 6.0, 3.0, 4.0, 8.0, 20.0, 10.0, 12.0, 19.0, 24.0, 30.0, 21.0, 35.0, 39.0, 39.0, 36.0, 49.0, 41.0, 36.0, 38.0, 31.0, 48.0, 48.0, 41.0, 34.0, 29.0, 41.0, 21.0, 33.0, 26.0, 27.0, 23.0, 13.0, 21.0, 22.0, 13.0, 16.0, 9.0, 4.0, 9.0, 3.0, 7.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-248.39794921875, -240.1319122314453, -231.86585998535156, -223.59982299804688, -215.33377075195312, -207.06773376464844, -198.80169677734375, -190.53564453125, -182.2696075439453, -174.00357055664062, -165.73751831054688, -157.4714813232422, -149.2054443359375, -140.93939208984375, -132.67335510253906, -124.40731048583984, -116.14126586914062, -107.8752212524414, -99.60917663574219, -91.3431396484375, -83.07709503173828, -74.81105041503906, -66.54501342773438, -58.278968811035156, -50.01292419433594, -41.74687957763672, -33.480838775634766, -25.21479606628418, -16.948753356933594, -8.682708740234375, -0.4166679382324219, 7.849372863769531, 16.11541748046875, 24.381460189819336, 32.64750289916992, 40.913543701171875, 49.179588317871094, 57.44563293457031, 65.711669921875, 73.97771453857422, 82.24375915527344, 90.50980377197266, 98.77584838867188, 107.04188537597656, 115.30792999267578, 123.573974609375, 131.8400115966797, 140.10604858398438, 148.37210083007812, 156.6381378173828, 164.90419006347656, 173.17022705078125, 181.436279296875, 189.7023162841797, 197.96835327148438, 206.23440551757812, 214.5004425048828, 222.7664794921875, 231.03253173828125, 239.29856872558594, 247.56460571289062, 255.83065795898438, 264.0967102050781, 272.36273193359375, 280.6287841796875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 7.0, 11.0, 12.0, 9.0, 25.0, 31.0, 32.0, 46.0, 66.0, 93.0, 145.0, 214.0, 310.0, 427.0, 722.0, 1266.0, 2296.0, 4295.0, 9354.0, 24143.0, 93548.0, 3796123.0, 198910.0, 36788.0, 12879.0, 5696.0, 2759.0, 1511.0, 880.0, 566.0, 363.0, 228.0, 152.0, 96.0, 80.0, 45.0, 40.0, 35.0, 27.0, 11.0, 15.0, 6.0, 8.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-78.5625, -76.08203125, -73.6015625, -71.12109375, -68.640625, -66.16015625, -63.6796875, -61.19921875, -58.71875, -56.23828125, -53.7578125, -51.27734375, -48.796875, -46.31640625, -43.8359375, -41.35546875, -38.875, -36.39453125, -33.9140625, -31.43359375, -28.953125, -26.47265625, -23.9921875, -21.51171875, -19.03125, -16.55078125, -14.0703125, -11.58984375, -9.109375, -6.62890625, -4.1484375, -1.66796875, 0.8125, 3.29296875, 5.7734375, 8.25390625, 10.734375, 13.21484375, 15.6953125, 18.17578125, 20.65625, 23.13671875, 25.6171875, 28.09765625, 30.578125, 33.05859375, 35.5390625, 38.01953125, 40.5, 42.98046875, 45.4609375, 47.94140625, 50.421875, 52.90234375, 55.3828125, 57.86328125, 60.34375, 62.82421875, 65.3046875, 67.78515625, 70.265625, 72.74609375, 75.2265625, 77.70703125, 80.1875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 8.0, 3.0, 11.0, 6.0, 11.0, 9.0, 19.0, 15.0, 17.0, 28.0, 30.0, 31.0, 41.0, 27.0, 32.0, 35.0, 50.0, 49.0, 53.0, 56.0, 53.0, 49.0, 48.0, 50.0, 38.0, 36.0, 28.0, 30.0, 37.0, 17.0, 21.0, 11.0, 13.0, 11.0, 8.0, 9.0, 6.0, 1.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.875, -12.4864501953125, -12.097900390625, -11.7093505859375, -11.32080078125, -10.9322509765625, -10.543701171875, -10.1551513671875, -9.7666015625, -9.3780517578125, -8.989501953125, -8.6009521484375, -8.21240234375, -7.8238525390625, -7.435302734375, -7.0467529296875, -6.658203125, -6.2696533203125, -5.881103515625, -5.4925537109375, -5.10400390625, -4.7154541015625, -4.326904296875, -3.9383544921875, -3.5498046875, -3.1612548828125, -2.772705078125, -2.3841552734375, -1.99560546875, -1.6070556640625, -1.218505859375, -0.8299560546875, -0.44140625, -0.0528564453125, 0.335693359375, 0.7242431640625, 1.11279296875, 1.5013427734375, 1.889892578125, 2.2784423828125, 2.6669921875, 3.0555419921875, 3.444091796875, 3.8326416015625, 4.22119140625, 4.6097412109375, 4.998291015625, 5.3868408203125, 5.775390625, 6.1639404296875, 6.552490234375, 6.9410400390625, 7.32958984375, 7.7181396484375, 8.106689453125, 8.4952392578125, 8.8837890625, 9.2723388671875, 9.660888671875, 10.0494384765625, 10.43798828125, 10.8265380859375, 11.215087890625, 11.6036376953125, 11.9921875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 8.0, 12.0, 8.0, 11.0, 8.0, 8.0, 16.0, 26.0, 23.0, 32.0, 50.0, 64.0, 98.0, 177.0, 289.0, 524.0, 1182.0, 2705.0, 7353.0, 25661.0, 168876.0, 3843375.0, 112526.0, 20486.0, 6191.0, 2341.0, 1077.0, 416.0, 292.0, 150.0, 94.0, 61.0, 34.0, 34.0, 18.0, 10.0, 8.0, 10.0, 7.0, 7.0, 3.0, 6.0, 4.0, 8.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-135.5, -131.4453125, -127.390625, -123.3359375, -119.28125, -115.2265625, -111.171875, -107.1171875, -103.0625, -99.0078125, -94.953125, -90.8984375, -86.84375, -82.7890625, -78.734375, -74.6796875, -70.625, -66.5703125, -62.515625, -58.4609375, -54.40625, -50.3515625, -46.296875, -42.2421875, -38.1875, -34.1328125, -30.078125, -26.0234375, -21.96875, -17.9140625, -13.859375, -9.8046875, -5.75, -1.6953125, 2.359375, 6.4140625, 10.46875, 14.5234375, 18.578125, 22.6328125, 26.6875, 30.7421875, 34.796875, 38.8515625, 42.90625, 46.9609375, 51.015625, 55.0703125, 59.125, 63.1796875, 67.234375, 71.2890625, 75.34375, 79.3984375, 83.453125, 87.5078125, 91.5625, 95.6171875, 99.671875, 103.7265625, 107.78125, 111.8359375, 115.890625, 119.9453125, 124.0]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 13.0, 10.0, 21.0, 25.0, 44.0, 102.0, 271.0, 2695.0, 558.0, 156.0, 64.0, 40.0, 21.0, 17.0, 12.0, 5.0, 7.0, 0.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-85.0, -83.1015625, -81.203125, -79.3046875, -77.40625, -75.5078125, -73.609375, -71.7109375, -69.8125, -67.9140625, -66.015625, -64.1171875, -62.21875, -60.3203125, -58.421875, -56.5234375, -54.625, -52.7265625, -50.828125, -48.9296875, -47.03125, -45.1328125, -43.234375, -41.3359375, -39.4375, -37.5390625, -35.640625, -33.7421875, -31.84375, -29.9453125, -28.046875, -26.1484375, -24.25, -22.3515625, -20.453125, -18.5546875, -16.65625, -14.7578125, -12.859375, -10.9609375, -9.0625, -7.1640625, -5.265625, -3.3671875, -1.46875, 0.4296875, 2.328125, 4.2265625, 6.125, 8.0234375, 9.921875, 11.8203125, 13.71875, 15.6171875, 17.515625, 19.4140625, 21.3125, 23.2109375, 25.109375, 27.0078125, 28.90625, 30.8046875, 32.703125, 34.6015625, 36.5]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 7.0, 7.0, 14.0, 15.0, 18.0, 39.0, 50.0, 93.0, 113.0, 135.0, 146.0, 125.0, 78.0, 67.0, 40.0, 21.0, 13.0, 10.0, 1.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-305.647216796875, -298.75439453125, -291.8615417480469, -284.9687194824219, -278.07586669921875, -271.18304443359375, -264.29022216796875, -257.3973693847656, -250.50453186035156, -243.6116943359375, -236.71885681152344, -229.82601928710938, -222.93319702148438, -216.0403594970703, -209.14752197265625, -202.2546844482422, -195.36184692382812, -188.46900939941406, -181.576171875, -174.683349609375, -167.79051208496094, -160.89767456054688, -154.0048370361328, -147.11199951171875, -140.21917724609375, -133.3263397216797, -126.43350982666016, -119.5406723022461, -112.64783477783203, -105.7550048828125, -98.86216735839844, -91.96932983398438, -85.07649230957031, -78.18365478515625, -71.29082489013672, -64.39798736572266, -57.505149841308594, -50.6123161315918, -43.719482421875, -36.82664489746094, -29.93381118774414, -23.04097557067871, -16.14813995361328, -9.255306243896484, -2.3624706268310547, 4.530364990234375, 11.423198699951172, 18.316036224365234, 25.20886993408203, 32.10170364379883, 38.99454116821289, 45.88737487792969, 52.78021240234375, 59.67304611206055, 66.56587982177734, 73.4587173461914, 80.35154724121094, 87.244384765625, 94.13721466064453, 101.0300521850586, 107.92288970947266, 114.81571960449219, 121.70855712890625, 128.6013946533203, 135.49423217773438]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 1.0, 7.0, 5.0, 11.0, 11.0, 8.0, 7.0, 23.0, 27.0, 17.0, 35.0, 24.0, 34.0, 32.0, 42.0, 37.0, 51.0, 39.0, 46.0, 44.0, 43.0, 58.0, 38.0, 47.0, 31.0, 41.0, 34.0, 31.0, 33.0, 26.0, 20.0, 22.0, 19.0, 13.0, 12.0, 7.0, 7.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.66360473632812, -123.73861694335938, -119.81362915039062, -115.88864135742188, -111.96365356445312, -108.03866577148438, -104.11367797851562, -100.18869018554688, -96.26370239257812, -92.33871459960938, -88.41372680664062, -84.48873901367188, -80.56375122070312, -76.63876342773438, -72.71377563476562, -68.78878784179688, -64.86380767822266, -60.938819885253906, -57.013832092285156, -53.088844299316406, -49.163856506347656, -45.238868713378906, -41.31388473510742, -37.38889694213867, -33.46390914916992, -29.538921356201172, -25.613933563232422, -21.688947677612305, -17.763959884643555, -13.838972091674805, -9.913986206054688, -5.9889984130859375, -2.0640106201171875, 1.8609766960144043, 5.785964012145996, 9.71095085144043, 13.63593864440918, 17.56092643737793, 21.485912322998047, 25.410900115966797, 29.335887908935547, 33.2608757019043, 37.18586349487305, 41.11084747314453, 45.03583526611328, 48.96082305908203, 52.88581085205078, 56.81079864501953, 60.73578643798828, 64.66077423095703, 68.58576202392578, 72.51074981689453, 76.43573760986328, 80.36072540283203, 84.28570556640625, 88.210693359375, 92.13568115234375, 96.0606689453125, 99.98565673828125, 103.91064453125, 107.83563232421875, 111.7606201171875, 115.68560791015625, 119.610595703125, 123.53558349609375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 2.0, 5.0, 8.0, 11.0, 14.0, 17.0, 24.0, 40.0, 55.0, 73.0, 92.0, 181.0, 281.0, 466.0, 743.0, 1386.0, 2496.0, 4436.0, 8255.0, 16363.0, 34279.0, 78570.0, 248041.0, 430775.0, 125094.0, 49333.0, 22821.0, 11211.0, 5899.0, 3245.0, 1731.0, 1022.0, 604.0, 348.0, 201.0, 119.0, 83.0, 63.0, 45.0, 36.0, 24.0, 13.0, 16.0, 15.0, 11.0, 3.0, 4.0, 6.0, 0.0, 1.0, 3.0], "bins": [-50.1875, -48.80224609375, -47.4169921875, -46.03173828125, -44.646484375, -43.26123046875, -41.8759765625, -40.49072265625, -39.10546875, -37.72021484375, -36.3349609375, -34.94970703125, -33.564453125, -32.17919921875, -30.7939453125, -29.40869140625, -28.0234375, -26.63818359375, -25.2529296875, -23.86767578125, -22.482421875, -21.09716796875, -19.7119140625, -18.32666015625, -16.94140625, -15.55615234375, -14.1708984375, -12.78564453125, -11.400390625, -10.01513671875, -8.6298828125, -7.24462890625, -5.859375, -4.47412109375, -3.0888671875, -1.70361328125, -0.318359375, 1.06689453125, 2.4521484375, 3.83740234375, 5.22265625, 6.60791015625, 7.9931640625, 9.37841796875, 10.763671875, 12.14892578125, 13.5341796875, 14.91943359375, 16.3046875, 17.68994140625, 19.0751953125, 20.46044921875, 21.845703125, 23.23095703125, 24.6162109375, 26.00146484375, 27.38671875, 28.77197265625, 30.1572265625, 31.54248046875, 32.927734375, 34.31298828125, 35.6982421875, 37.08349609375, 38.46875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 5.0, 4.0, 12.0, 12.0, 12.0, 12.0, 10.0, 15.0, 16.0, 19.0, 17.0, 22.0, 29.0, 30.0, 29.0, 41.0, 33.0, 37.0, 40.0, 52.0, 40.0, 34.0, 28.0, 40.0, 40.0, 38.0, 35.0, 41.0, 20.0, 29.0, 23.0, 26.0, 20.0, 26.0, 16.0, 17.0, 13.0, 13.0, 7.0, 8.0, 7.0, 8.0, 4.0, 3.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2421875, -10.894287109375, -10.54638671875, -10.198486328125, -9.8505859375, -9.502685546875, -9.15478515625, -8.806884765625, -8.458984375, -8.111083984375, -7.76318359375, -7.415283203125, -7.0673828125, -6.719482421875, -6.37158203125, -6.023681640625, -5.67578125, -5.327880859375, -4.97998046875, -4.632080078125, -4.2841796875, -3.936279296875, -3.58837890625, -3.240478515625, -2.892578125, -2.544677734375, -2.19677734375, -1.848876953125, -1.5009765625, -1.153076171875, -0.80517578125, -0.457275390625, -0.109375, 0.238525390625, 0.58642578125, 0.934326171875, 1.2822265625, 1.630126953125, 1.97802734375, 2.325927734375, 2.673828125, 3.021728515625, 3.36962890625, 3.717529296875, 4.0654296875, 4.413330078125, 4.76123046875, 5.109130859375, 5.45703125, 5.804931640625, 6.15283203125, 6.500732421875, 6.8486328125, 7.196533203125, 7.54443359375, 7.892333984375, 8.240234375, 8.588134765625, 8.93603515625, 9.283935546875, 9.6318359375, 9.979736328125, 10.32763671875, 10.675537109375, 11.0234375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 9.0, 7.0, 11.0, 25.0, 24.0, 32.0, 43.0, 62.0, 68.0, 119.0, 171.0, 249.0, 472.0, 744.0, 1391.0, 2567.0, 5490.0, 14168.0, 52247.0, 541378.0, 363523.0, 42848.0, 12414.0, 4881.0, 2323.0, 1256.0, 708.0, 434.0, 292.0, 170.0, 115.0, 78.0, 56.0, 39.0, 26.0, 21.0, 14.0, 20.0, 16.0, 9.0, 7.0, 9.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.1875, -78.3818359375, -75.576171875, -72.7705078125, -69.96484375, -67.1591796875, -64.353515625, -61.5478515625, -58.7421875, -55.9365234375, -53.130859375, -50.3251953125, -47.51953125, -44.7138671875, -41.908203125, -39.1025390625, -36.296875, -33.4912109375, -30.685546875, -27.8798828125, -25.07421875, -22.2685546875, -19.462890625, -16.6572265625, -13.8515625, -11.0458984375, -8.240234375, -5.4345703125, -2.62890625, 0.1767578125, 2.982421875, 5.7880859375, 8.59375, 11.3994140625, 14.205078125, 17.0107421875, 19.81640625, 22.6220703125, 25.427734375, 28.2333984375, 31.0390625, 33.8447265625, 36.650390625, 39.4560546875, 42.26171875, 45.0673828125, 47.873046875, 50.6787109375, 53.484375, 56.2900390625, 59.095703125, 61.9013671875, 64.70703125, 67.5126953125, 70.318359375, 73.1240234375, 75.9296875, 78.7353515625, 81.541015625, 84.3466796875, 87.15234375, 89.9580078125, 92.763671875, 95.5693359375, 98.375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 6.0, 6.0, 6.0, 8.0, 14.0, 13.0, 16.0, 24.0, 36.0, 38.0, 51.0, 67.0, 78.0, 75.0, 92.0, 57.0, 79.0, 73.0, 58.0, 49.0, 34.0, 26.0, 23.0, 16.0, 6.0, 11.0, 7.0, 2.0, 4.0, 2.0, 5.0, 0.0, 6.0, 0.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.6875, -88.693359375, -85.69921875, -82.705078125, -79.7109375, -76.716796875, -73.72265625, -70.728515625, -67.734375, -64.740234375, -61.74609375, -58.751953125, -55.7578125, -52.763671875, -49.76953125, -46.775390625, -43.78125, -40.787109375, -37.79296875, -34.798828125, -31.8046875, -28.810546875, -25.81640625, -22.822265625, -19.828125, -16.833984375, -13.83984375, -10.845703125, -7.8515625, -4.857421875, -1.86328125, 1.130859375, 4.125, 7.119140625, 10.11328125, 13.107421875, 16.1015625, 19.095703125, 22.08984375, 25.083984375, 28.078125, 31.072265625, 34.06640625, 37.060546875, 40.0546875, 43.048828125, 46.04296875, 49.037109375, 52.03125, 55.025390625, 58.01953125, 61.013671875, 64.0078125, 67.001953125, 69.99609375, 72.990234375, 75.984375, 78.978515625, 81.97265625, 84.966796875, 87.9609375, 90.955078125, 93.94921875, 96.943359375, 99.9375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 7.0, 3.0, 7.0, 10.0, 14.0, 18.0, 18.0, 32.0, 43.0, 65.0, 87.0, 126.0, 151.0, 253.0, 379.0, 516.0, 755.0, 1186.0, 2105.0, 4223.0, 11101.0, 54593.0, 860864.0, 86535.0, 14253.0, 4869.0, 2285.0, 1333.0, 882.0, 608.0, 370.0, 240.0, 156.0, 141.0, 93.0, 64.0, 49.0, 40.0, 21.0, 19.0, 12.0, 10.0, 11.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-67.25, -64.9775390625, -62.705078125, -60.4326171875, -58.16015625, -55.8876953125, -53.615234375, -51.3427734375, -49.0703125, -46.7978515625, -44.525390625, -42.2529296875, -39.98046875, -37.7080078125, -35.435546875, -33.1630859375, -30.890625, -28.6181640625, -26.345703125, -24.0732421875, -21.80078125, -19.5283203125, -17.255859375, -14.9833984375, -12.7109375, -10.4384765625, -8.166015625, -5.8935546875, -3.62109375, -1.3486328125, 0.923828125, 3.1962890625, 5.46875, 7.7412109375, 10.013671875, 12.2861328125, 14.55859375, 16.8310546875, 19.103515625, 21.3759765625, 23.6484375, 25.9208984375, 28.193359375, 30.4658203125, 32.73828125, 35.0107421875, 37.283203125, 39.5556640625, 41.828125, 44.1005859375, 46.373046875, 48.6455078125, 50.91796875, 53.1904296875, 55.462890625, 57.7353515625, 60.0078125, 62.2802734375, 64.552734375, 66.8251953125, 69.09765625, 71.3701171875, 73.642578125, 75.9150390625, 78.1875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 5.0, 8.0, 11.0, 16.0, 23.0, 37.0, 90.0, 365.0, 283.0, 71.0, 26.0, 20.0, 14.0, 11.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0207672119140625, -0.020022153854370117, -0.019277095794677734, -0.01853203773498535, -0.01778697967529297, -0.017041921615600586, -0.016296863555908203, -0.01555180549621582, -0.014806747436523438, -0.014061689376831055, -0.013316631317138672, -0.012571573257446289, -0.011826515197753906, -0.011081457138061523, -0.01033639907836914, -0.009591341018676758, -0.008846282958984375, -0.008101224899291992, -0.007356166839599609, -0.0066111087799072266, -0.005866050720214844, -0.005120992660522461, -0.004375934600830078, -0.0036308765411376953, -0.0028858184814453125, -0.0021407604217529297, -0.0013957023620605469, -0.0006506443023681641, 9.441375732421875e-05, 0.0008394718170166016, 0.0015845298767089844, 0.002329587936401367, 0.00307464599609375, 0.003819704055786133, 0.004564762115478516, 0.0053098201751708984, 0.006054878234863281, 0.006799936294555664, 0.007544994354248047, 0.00829005241394043, 0.009035110473632812, 0.009780168533325195, 0.010525226593017578, 0.011270284652709961, 0.012015342712402344, 0.012760400772094727, 0.01350545883178711, 0.014250516891479492, 0.014995574951171875, 0.015740633010864258, 0.01648569107055664, 0.017230749130249023, 0.017975807189941406, 0.01872086524963379, 0.019465923309326172, 0.020210981369018555, 0.020956039428710938, 0.02170109748840332, 0.022446155548095703, 0.023191213607788086, 0.02393627166748047, 0.02468132972717285, 0.025426387786865234, 0.026171445846557617, 0.02691650390625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 3.0, 10.0, 14.0, 14.0, 21.0, 36.0, 48.0, 88.0, 110.0, 179.0, 301.0, 593.0, 1039.0, 2298.0, 6538.0, 26083.0, 586647.0, 391077.0, 22932.0, 5878.0, 2262.0, 1022.0, 544.0, 307.0, 174.0, 115.0, 66.0, 42.0, 33.0, 25.0, 16.0, 5.0, 8.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.3125, -73.84765625, -71.3828125, -68.91796875, -66.453125, -63.98828125, -61.5234375, -59.05859375, -56.59375, -54.12890625, -51.6640625, -49.19921875, -46.734375, -44.26953125, -41.8046875, -39.33984375, -36.875, -34.41015625, -31.9453125, -29.48046875, -27.015625, -24.55078125, -22.0859375, -19.62109375, -17.15625, -14.69140625, -12.2265625, -9.76171875, -7.296875, -4.83203125, -2.3671875, 0.09765625, 2.5625, 5.02734375, 7.4921875, 9.95703125, 12.421875, 14.88671875, 17.3515625, 19.81640625, 22.28125, 24.74609375, 27.2109375, 29.67578125, 32.140625, 34.60546875, 37.0703125, 39.53515625, 42.0, 44.46484375, 46.9296875, 49.39453125, 51.859375, 54.32421875, 56.7890625, 59.25390625, 61.71875, 64.18359375, 66.6484375, 69.11328125, 71.578125, 74.04296875, 76.5078125, 78.97265625, 81.4375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 12.0, 7.0, 14.0, 19.0, 43.0, 98.0, 325.0, 257.0, 107.0, 31.0, 20.0, 17.0, 9.0, 7.0, 6.0, 7.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.125, -69.7880859375, -67.451171875, -65.1142578125, -62.77734375, -60.4404296875, -58.103515625, -55.7666015625, -53.4296875, -51.0927734375, -48.755859375, -46.4189453125, -44.08203125, -41.7451171875, -39.408203125, -37.0712890625, -34.734375, -32.3974609375, -30.060546875, -27.7236328125, -25.38671875, -23.0498046875, -20.712890625, -18.3759765625, -16.0390625, -13.7021484375, -11.365234375, -9.0283203125, -6.69140625, -4.3544921875, -2.017578125, 0.3193359375, 2.65625, 4.9931640625, 7.330078125, 9.6669921875, 12.00390625, 14.3408203125, 16.677734375, 19.0146484375, 21.3515625, 23.6884765625, 26.025390625, 28.3623046875, 30.69921875, 33.0361328125, 35.373046875, 37.7099609375, 40.046875, 42.3837890625, 44.720703125, 47.0576171875, 49.39453125, 51.7314453125, 54.068359375, 56.4052734375, 58.7421875, 61.0791015625, 63.416015625, 65.7529296875, 68.08984375, 70.4267578125, 72.763671875, 75.1005859375, 77.4375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 10.0, 10.0, 28.0, 60.0, 105.0, 190.0, 198.0, 182.0, 102.0, 47.0, 36.0, 21.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-445.5379943847656, -416.69622802734375, -387.8544921875, -359.0127258300781, -330.1709899902344, -301.3292236328125, -272.48748779296875, -243.64572143554688, -214.80397033691406, -185.96221923828125, -157.12046813964844, -128.27871704101562, -99.43695831298828, -70.59519958496094, -41.753448486328125, -12.911697387695312, 15.9300537109375, 44.77180480957031, 73.61355590820312, 102.45531463623047, 131.29705810546875, 160.13882446289062, 188.98057556152344, 217.82232666015625, 246.66407775878906, 275.5058288574219, 304.34759521484375, 333.1893310546875, 362.0310974121094, 390.87286376953125, 419.714599609375, 448.55633544921875, 477.39813232421875, 506.2398986816406, 535.0816650390625, 563.9234008789062, 592.76513671875, 621.60693359375, 650.4486694335938, 679.2904052734375, 708.1321411132812, 736.973876953125, 765.815673828125, 794.6574096679688, 823.4991455078125, 852.3409423828125, 881.1826782226562, 910.0244140625, 938.8662109375, 967.7079467773438, 996.5497436523438, 1025.3914794921875, 1054.2332763671875, 1083.074951171875, 1111.916748046875, 1140.758544921875, 1169.6002197265625, 1198.4420166015625, 1227.28369140625, 1256.12548828125, 1284.96728515625, 1313.8089599609375, 1342.6507568359375, 1371.492431640625, 1400.334228515625]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 2.0, 4.0, 10.0, 3.0, 11.0, 9.0, 9.0, 15.0, 14.0, 10.0, 23.0, 21.0, 22.0, 25.0, 15.0, 35.0, 37.0, 27.0, 30.0, 30.0, 39.0, 44.0, 41.0, 39.0, 43.0, 45.0, 47.0, 41.0, 37.0, 26.0, 31.0, 33.0, 17.0, 21.0, 21.0, 19.0, 24.0, 17.0, 10.0, 7.0, 10.0, 5.0, 10.0, 4.0, 3.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-278.5648193359375, -269.580322265625, -260.5958251953125, -251.611328125, -242.62681579589844, -233.64231872558594, -224.65782165527344, -215.67332458496094, -206.68881225585938, -197.70431518554688, -188.71981811523438, -179.73532104492188, -170.7508087158203, -161.7663116455078, -152.7818145751953, -143.7973175048828, -134.8128204345703, -125.82832336425781, -116.84381866455078, -107.85932159423828, -98.87481689453125, -89.89031982421875, -80.90582275390625, -71.92132568359375, -62.93682098388672, -53.95232009887695, -44.96781921386719, -35.98332214355469, -26.998821258544922, -18.014320373535156, -9.029823303222656, -0.045322418212890625, 8.939178466796875, 17.92367935180664, 26.908178329467773, 35.892677307128906, 44.87717819213867, 53.86167907714844, 62.84617614746094, 71.83067321777344, 80.81517791748047, 89.79967498779297, 98.7841796875, 107.7686767578125, 116.753173828125, 125.73767852783203, 134.72216796875, 143.70668029785156, 152.69117736816406, 161.67567443847656, 170.66017150878906, 179.64468383789062, 188.62918090820312, 197.61367797851562, 206.59817504882812, 215.58267211914062, 224.56716918945312, 233.55166625976562, 242.53616333007812, 251.52066040039062, 260.5051574707031, 269.48968505859375, 278.47418212890625, 287.45867919921875, 296.44317626953125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 3.0, 4.0, 5.0, 10.0, 12.0, 16.0, 13.0, 23.0, 28.0, 41.0, 75.0, 98.0, 153.0, 235.0, 346.0, 561.0, 951.0, 1585.0, 2881.0, 5353.0, 10922.0, 27774.0, 124063.0, 3846040.0, 120945.0, 28392.0, 11319.0, 5446.0, 2889.0, 1616.0, 958.0, 551.0, 338.0, 204.0, 134.0, 94.0, 63.0, 39.0, 19.0, 17.0, 13.0, 14.0, 12.0, 6.0, 6.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-125.0, -121.267578125, -117.53515625, -113.802734375, -110.0703125, -106.337890625, -102.60546875, -98.873046875, -95.140625, -91.408203125, -87.67578125, -83.943359375, -80.2109375, -76.478515625, -72.74609375, -69.013671875, -65.28125, -61.548828125, -57.81640625, -54.083984375, -50.3515625, -46.619140625, -42.88671875, -39.154296875, -35.421875, -31.689453125, -27.95703125, -24.224609375, -20.4921875, -16.759765625, -13.02734375, -9.294921875, -5.5625, -1.830078125, 1.90234375, 5.634765625, 9.3671875, 13.099609375, 16.83203125, 20.564453125, 24.296875, 28.029296875, 31.76171875, 35.494140625, 39.2265625, 42.958984375, 46.69140625, 50.423828125, 54.15625, 57.888671875, 61.62109375, 65.353515625, 69.0859375, 72.818359375, 76.55078125, 80.283203125, 84.015625, 87.748046875, 91.48046875, 95.212890625, 98.9453125, 102.677734375, 106.41015625, 110.142578125, 113.875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 8.0, 4.0, 4.0, 7.0, 17.0, 8.0, 19.0, 21.0, 29.0, 27.0, 37.0, 49.0, 28.0, 41.0, 52.0, 35.0, 50.0, 57.0, 54.0, 58.0, 46.0, 55.0, 34.0, 37.0, 38.0, 26.0, 26.0, 29.0, 30.0, 18.0, 16.0, 8.0, 9.0, 9.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3984375, -13.8973388671875, -13.396240234375, -12.8951416015625, -12.39404296875, -11.8929443359375, -11.391845703125, -10.8907470703125, -10.3896484375, -9.8885498046875, -9.387451171875, -8.8863525390625, -8.38525390625, -7.8841552734375, -7.383056640625, -6.8819580078125, -6.380859375, -5.8797607421875, -5.378662109375, -4.8775634765625, -4.37646484375, -3.8753662109375, -3.374267578125, -2.8731689453125, -2.3720703125, -1.8709716796875, -1.369873046875, -0.8687744140625, -0.36767578125, 0.1334228515625, 0.634521484375, 1.1356201171875, 1.63671875, 2.1378173828125, 2.638916015625, 3.1400146484375, 3.64111328125, 4.1422119140625, 4.643310546875, 5.1444091796875, 5.6455078125, 6.1466064453125, 6.647705078125, 7.1488037109375, 7.64990234375, 8.1510009765625, 8.652099609375, 9.1531982421875, 9.654296875, 10.1553955078125, 10.656494140625, 11.1575927734375, 11.65869140625, 12.1597900390625, 12.660888671875, 13.1619873046875, 13.6630859375, 14.1641845703125, 14.665283203125, 15.1663818359375, 15.66748046875, 16.1685791015625, 16.669677734375, 17.1707763671875, 17.671875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 2.0, 1.0, 4.0, 7.0, 7.0, 5.0, 6.0, 19.0, 11.0, 13.0, 30.0, 42.0, 57.0, 50.0, 95.0, 144.0, 252.0, 469.0, 1164.0, 3313.0, 11148.0, 56985.0, 3969535.0, 126579.0, 16778.0, 4539.0, 1569.0, 615.0, 311.0, 173.0, 104.0, 68.0, 46.0, 30.0, 18.0, 18.0, 18.0, 16.0, 2.0, 11.0, 11.0, 9.0, 6.0, 1.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-309.0, -300.08203125, -291.1640625, -282.24609375, -273.328125, -264.41015625, -255.4921875, -246.57421875, -237.65625, -228.73828125, -219.8203125, -210.90234375, -201.984375, -193.06640625, -184.1484375, -175.23046875, -166.3125, -157.39453125, -148.4765625, -139.55859375, -130.640625, -121.72265625, -112.8046875, -103.88671875, -94.96875, -86.05078125, -77.1328125, -68.21484375, -59.296875, -50.37890625, -41.4609375, -32.54296875, -23.625, -14.70703125, -5.7890625, 3.12890625, 12.046875, 20.96484375, 29.8828125, 38.80078125, 47.71875, 56.63671875, 65.5546875, 74.47265625, 83.390625, 92.30859375, 101.2265625, 110.14453125, 119.0625, 127.98046875, 136.8984375, 145.81640625, 154.734375, 163.65234375, 172.5703125, 181.48828125, 190.40625, 199.32421875, 208.2421875, 217.16015625, 226.078125, 234.99609375, 243.9140625, 252.83203125, 261.75]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 6.0, 9.0, 14.0, 31.0, 66.0, 222.0, 3269.0, 296.0, 63.0, 35.0, 18.0, 21.0, 10.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-178.875, -174.669921875, -170.46484375, -166.259765625, -162.0546875, -157.849609375, -153.64453125, -149.439453125, -145.234375, -141.029296875, -136.82421875, -132.619140625, -128.4140625, -124.208984375, -120.00390625, -115.798828125, -111.59375, -107.388671875, -103.18359375, -98.978515625, -94.7734375, -90.568359375, -86.36328125, -82.158203125, -77.953125, -73.748046875, -69.54296875, -65.337890625, -61.1328125, -56.927734375, -52.72265625, -48.517578125, -44.3125, -40.107421875, -35.90234375, -31.697265625, -27.4921875, -23.287109375, -19.08203125, -14.876953125, -10.671875, -6.466796875, -2.26171875, 1.943359375, 6.1484375, 10.353515625, 14.55859375, 18.763671875, 22.96875, 27.173828125, 31.37890625, 35.583984375, 39.7890625, 43.994140625, 48.19921875, 52.404296875, 56.609375, 60.814453125, 65.01953125, 69.224609375, 73.4296875, 77.634765625, 81.83984375, 86.044921875, 90.25]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 15.0, 19.0, 32.0, 66.0, 149.0, 245.0, 243.0, 116.0, 72.0, 27.0, 12.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-434.6964111328125, -414.8282470703125, -394.9600830078125, -375.0919189453125, -355.2237548828125, -335.3555908203125, -315.4874267578125, -295.6192626953125, -275.7510986328125, -255.8829345703125, -236.0147705078125, -216.1466064453125, -196.2784423828125, -176.4102783203125, -156.5421142578125, -136.6739501953125, -116.8057861328125, -96.9376220703125, -77.0694580078125, -57.2012939453125, -37.3331298828125, -17.4649658203125, 2.4031982421875, 22.2713623046875, 42.1395263671875, 62.0076904296875, 81.8758544921875, 101.7440185546875, 121.6121826171875, 141.4803466796875, 161.3485107421875, 181.2166748046875, 201.08489990234375, 220.95306396484375, 240.82122802734375, 260.68939208984375, 280.55755615234375, 300.42572021484375, 320.29388427734375, 340.16204833984375, 360.03021240234375, 379.89837646484375, 399.76654052734375, 419.63470458984375, 439.50286865234375, 459.37103271484375, 479.23919677734375, 499.10736083984375, 518.9755249023438, 538.8436889648438, 558.7118530273438, 578.5800170898438, 598.4481811523438, 618.3163452148438, 638.1845092773438, 658.0526733398438, 677.9208374023438, 697.7890014648438, 717.6571655273438, 737.5253295898438, 757.3934936523438, 777.2616577148438, 797.1298217773438, 816.9979858398438, 836.8661499023438]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 6.0, 5.0, 7.0, 5.0, 10.0, 15.0, 19.0, 31.0, 23.0, 17.0, 25.0, 38.0, 33.0, 28.0, 34.0, 40.0, 40.0, 39.0, 36.0, 47.0, 48.0, 41.0, 49.0, 33.0, 45.0, 24.0, 31.0, 36.0, 27.0, 21.0, 13.0, 24.0, 16.0, 7.0, 13.0, 9.0, 16.0, 13.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-171.8367919921875, -166.40737915039062, -160.9779510498047, -155.5485382080078, -150.11912536621094, -144.689697265625, -139.26028442382812, -133.83087158203125, -128.40145874023438, -122.97203826904297, -117.5426254272461, -112.11320495605469, -106.68379211425781, -101.2543716430664, -95.824951171875, -90.39553833007812, -84.96611022949219, -79.53668975830078, -74.1072769165039, -68.6778564453125, -63.24843978881836, -57.81902313232422, -52.38960266113281, -46.96018600463867, -41.53076934814453, -36.10135269165039, -30.671934127807617, -25.242515563964844, -19.813098907470703, -14.383682250976562, -8.954261779785156, -3.5248451232910156, 1.904571533203125, 7.333989143371582, 12.763406753540039, 18.192825317382812, 23.622241973876953, 29.051658630371094, 34.4810791015625, 39.91049575805664, 45.33991241455078, 50.76932907104492, 56.19874572753906, 61.62816619873047, 67.05758666992188, 72.48699951171875, 77.91641998291016, 83.34584045410156, 88.77525329589844, 94.20467376708984, 99.63408660888672, 105.06350708007812, 110.492919921875, 115.9223403930664, 121.35176086425781, 126.78117370605469, 132.21060180664062, 137.6400146484375, 143.06944274902344, 148.4988555908203, 153.9282684326172, 159.35769653320312, 164.787109375, 170.21652221679688, 175.64593505859375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 3.0, 9.0, 8.0, 15.0, 18.0, 37.0, 46.0, 66.0, 98.0, 127.0, 210.0, 275.0, 465.0, 730.0, 1109.0, 1716.0, 2797.0, 4905.0, 8768.0, 16878.0, 34589.0, 77865.0, 204060.0, 402828.0, 162832.0, 64729.0, 29602.0, 14679.0, 7768.0, 4411.0, 2613.0, 1569.0, 976.0, 560.0, 409.0, 254.0, 159.0, 126.0, 74.0, 52.0, 35.0, 24.0, 16.0, 15.0, 9.0, 5.0, 9.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.34375, -52.35986328125, -50.3759765625, -48.39208984375, -46.408203125, -44.42431640625, -42.4404296875, -40.45654296875, -38.47265625, -36.48876953125, -34.5048828125, -32.52099609375, -30.537109375, -28.55322265625, -26.5693359375, -24.58544921875, -22.6015625, -20.61767578125, -18.6337890625, -16.64990234375, -14.666015625, -12.68212890625, -10.6982421875, -8.71435546875, -6.73046875, -4.74658203125, -2.7626953125, -0.77880859375, 1.205078125, 3.18896484375, 5.1728515625, 7.15673828125, 9.140625, 11.12451171875, 13.1083984375, 15.09228515625, 17.076171875, 19.06005859375, 21.0439453125, 23.02783203125, 25.01171875, 26.99560546875, 28.9794921875, 30.96337890625, 32.947265625, 34.93115234375, 36.9150390625, 38.89892578125, 40.8828125, 42.86669921875, 44.8505859375, 46.83447265625, 48.818359375, 50.80224609375, 52.7861328125, 54.77001953125, 56.75390625, 58.73779296875, 60.7216796875, 62.70556640625, 64.689453125, 66.67333984375, 68.6572265625, 70.64111328125, 72.625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 3.0, 5.0, 5.0, 11.0, 7.0, 9.0, 20.0, 20.0, 23.0, 20.0, 25.0, 22.0, 38.0, 29.0, 27.0, 43.0, 46.0, 49.0, 44.0, 44.0, 36.0, 40.0, 46.0, 41.0, 29.0, 27.0, 27.0, 38.0, 24.0, 26.0, 29.0, 20.0, 20.0, 20.0, 18.0, 15.0, 9.0, 10.0, 6.0, 7.0, 2.0, 3.0, 0.0, 5.0, 1.0, 2.0, 3.0], "bins": [-19.515625, -18.988037109375, -18.46044921875, -17.932861328125, -17.4052734375, -16.877685546875, -16.35009765625, -15.822509765625, -15.294921875, -14.767333984375, -14.23974609375, -13.712158203125, -13.1845703125, -12.656982421875, -12.12939453125, -11.601806640625, -11.07421875, -10.546630859375, -10.01904296875, -9.491455078125, -8.9638671875, -8.436279296875, -7.90869140625, -7.381103515625, -6.853515625, -6.325927734375, -5.79833984375, -5.270751953125, -4.7431640625, -4.215576171875, -3.68798828125, -3.160400390625, -2.6328125, -2.105224609375, -1.57763671875, -1.050048828125, -0.5224609375, 0.005126953125, 0.53271484375, 1.060302734375, 1.587890625, 2.115478515625, 2.64306640625, 3.170654296875, 3.6982421875, 4.225830078125, 4.75341796875, 5.281005859375, 5.80859375, 6.336181640625, 6.86376953125, 7.391357421875, 7.9189453125, 8.446533203125, 8.97412109375, 9.501708984375, 10.029296875, 10.556884765625, 11.08447265625, 11.612060546875, 12.1396484375, 12.667236328125, 13.19482421875, 13.722412109375, 14.25]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 4.0, 6.0, 2.0, 13.0, 9.0, 11.0, 8.0, 18.0, 26.0, 33.0, 43.0, 57.0, 86.0, 116.0, 194.0, 294.0, 421.0, 805.0, 1466.0, 2733.0, 5793.0, 14011.0, 40264.0, 163782.0, 613386.0, 143840.0, 36502.0, 13107.0, 5488.0, 2628.0, 1303.0, 781.0, 456.0, 259.0, 187.0, 114.0, 92.0, 49.0, 43.0, 22.0, 22.0, 24.0, 17.0, 12.0, 11.0, 8.0, 4.0, 3.0, 1.0, 0.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-83.9375, -80.880859375, -77.82421875, -74.767578125, -71.7109375, -68.654296875, -65.59765625, -62.541015625, -59.484375, -56.427734375, -53.37109375, -50.314453125, -47.2578125, -44.201171875, -41.14453125, -38.087890625, -35.03125, -31.974609375, -28.91796875, -25.861328125, -22.8046875, -19.748046875, -16.69140625, -13.634765625, -10.578125, -7.521484375, -4.46484375, -1.408203125, 1.6484375, 4.705078125, 7.76171875, 10.818359375, 13.875, 16.931640625, 19.98828125, 23.044921875, 26.1015625, 29.158203125, 32.21484375, 35.271484375, 38.328125, 41.384765625, 44.44140625, 47.498046875, 50.5546875, 53.611328125, 56.66796875, 59.724609375, 62.78125, 65.837890625, 68.89453125, 71.951171875, 75.0078125, 78.064453125, 81.12109375, 84.177734375, 87.234375, 90.291015625, 93.34765625, 96.404296875, 99.4609375, 102.517578125, 105.57421875, 108.630859375, 111.6875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 4.0, 4.0, 2.0, 7.0, 7.0, 2.0, 5.0, 11.0, 9.0, 12.0, 19.0, 13.0, 20.0, 15.0, 20.0, 28.0, 28.0, 38.0, 36.0, 33.0, 33.0, 32.0, 39.0, 43.0, 59.0, 55.0, 44.0, 56.0, 41.0, 38.0, 34.0, 37.0, 38.0, 26.0, 12.0, 14.0, 16.0, 15.0, 16.0, 6.0, 9.0, 9.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-73.3125, -70.6162109375, -67.919921875, -65.2236328125, -62.52734375, -59.8310546875, -57.134765625, -54.4384765625, -51.7421875, -49.0458984375, -46.349609375, -43.6533203125, -40.95703125, -38.2607421875, -35.564453125, -32.8681640625, -30.171875, -27.4755859375, -24.779296875, -22.0830078125, -19.38671875, -16.6904296875, -13.994140625, -11.2978515625, -8.6015625, -5.9052734375, -3.208984375, -0.5126953125, 2.18359375, 4.8798828125, 7.576171875, 10.2724609375, 12.96875, 15.6650390625, 18.361328125, 21.0576171875, 23.75390625, 26.4501953125, 29.146484375, 31.8427734375, 34.5390625, 37.2353515625, 39.931640625, 42.6279296875, 45.32421875, 48.0205078125, 50.716796875, 53.4130859375, 56.109375, 58.8056640625, 61.501953125, 64.1982421875, 66.89453125, 69.5908203125, 72.287109375, 74.9833984375, 77.6796875, 80.3759765625, 83.072265625, 85.7685546875, 88.46484375, 91.1611328125, 93.857421875, 96.5537109375, 99.25]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 11.0, 7.0, 25.0, 19.0, 24.0, 45.0, 69.0, 118.0, 201.0, 313.0, 609.0, 1175.0, 2437.0, 5216.0, 14411.0, 51789.0, 415748.0, 474016.0, 56296.0, 15223.0, 5737.0, 2416.0, 1180.0, 588.0, 336.0, 228.0, 110.0, 56.0, 39.0, 30.0, 28.0, 17.0, 13.0, 6.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.0625, -46.2841796875, -44.505859375, -42.7275390625, -40.94921875, -39.1708984375, -37.392578125, -35.6142578125, -33.8359375, -32.0576171875, -30.279296875, -28.5009765625, -26.72265625, -24.9443359375, -23.166015625, -21.3876953125, -19.609375, -17.8310546875, -16.052734375, -14.2744140625, -12.49609375, -10.7177734375, -8.939453125, -7.1611328125, -5.3828125, -3.6044921875, -1.826171875, -0.0478515625, 1.73046875, 3.5087890625, 5.287109375, 7.0654296875, 8.84375, 10.6220703125, 12.400390625, 14.1787109375, 15.95703125, 17.7353515625, 19.513671875, 21.2919921875, 23.0703125, 24.8486328125, 26.626953125, 28.4052734375, 30.18359375, 31.9619140625, 33.740234375, 35.5185546875, 37.296875, 39.0751953125, 40.853515625, 42.6318359375, 44.41015625, 46.1884765625, 47.966796875, 49.7451171875, 51.5234375, 53.3017578125, 55.080078125, 56.8583984375, 58.63671875, 60.4150390625, 62.193359375, 63.9716796875, 65.75]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 7.0, 7.0, 9.0, 10.0, 9.0, 20.0, 20.0, 36.0, 48.0, 86.0, 141.0, 201.0, 141.0, 77.0, 55.0, 29.0, 27.0, 21.0, 9.0, 10.0, 13.0, 7.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0164337158203125, -0.01594412326812744, -0.015454530715942383, -0.014964938163757324, -0.014475345611572266, -0.013985753059387207, -0.013496160507202148, -0.01300656795501709, -0.012516975402832031, -0.012027382850646973, -0.011537790298461914, -0.011048197746276855, -0.010558605194091797, -0.010069012641906738, -0.00957942008972168, -0.009089827537536621, -0.008600234985351562, -0.008110642433166504, -0.007621049880981445, -0.007131457328796387, -0.006641864776611328, -0.0061522722244262695, -0.005662679672241211, -0.005173087120056152, -0.004683494567871094, -0.004193902015686035, -0.0037043094635009766, -0.003214716911315918, -0.0027251243591308594, -0.0022355318069458008, -0.0017459392547607422, -0.0012563467025756836, -0.000766754150390625, -0.0002771615982055664, 0.0002124309539794922, 0.0007020235061645508, 0.0011916160583496094, 0.001681208610534668, 0.0021708011627197266, 0.002660393714904785, 0.0031499862670898438, 0.0036395788192749023, 0.004129171371459961, 0.0046187639236450195, 0.005108356475830078, 0.005597949028015137, 0.006087541580200195, 0.006577134132385254, 0.0070667266845703125, 0.007556319236755371, 0.00804591178894043, 0.008535504341125488, 0.009025096893310547, 0.009514689445495605, 0.010004281997680664, 0.010493874549865723, 0.010983467102050781, 0.01147305965423584, 0.011962652206420898, 0.012452244758605957, 0.012941837310791016, 0.013431429862976074, 0.013921022415161133, 0.014410614967346191, 0.01490020751953125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 1.0, 5.0, 8.0, 11.0, 20.0, 25.0, 33.0, 47.0, 74.0, 101.0, 196.0, 315.0, 607.0, 1253.0, 2730.0, 7874.0, 28155.0, 176411.0, 680226.0, 117810.0, 21686.0, 6143.0, 2440.0, 1091.0, 542.0, 263.0, 176.0, 100.0, 67.0, 32.0, 32.0, 23.0, 8.0, 15.0, 7.0, 2.0, 10.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-53.3125, -51.3671875, -49.421875, -47.4765625, -45.53125, -43.5859375, -41.640625, -39.6953125, -37.75, -35.8046875, -33.859375, -31.9140625, -29.96875, -28.0234375, -26.078125, -24.1328125, -22.1875, -20.2421875, -18.296875, -16.3515625, -14.40625, -12.4609375, -10.515625, -8.5703125, -6.625, -4.6796875, -2.734375, -0.7890625, 1.15625, 3.1015625, 5.046875, 6.9921875, 8.9375, 10.8828125, 12.828125, 14.7734375, 16.71875, 18.6640625, 20.609375, 22.5546875, 24.5, 26.4453125, 28.390625, 30.3359375, 32.28125, 34.2265625, 36.171875, 38.1171875, 40.0625, 42.0078125, 43.953125, 45.8984375, 47.84375, 49.7890625, 51.734375, 53.6796875, 55.625, 57.5703125, 59.515625, 61.4609375, 63.40625, 65.3515625, 67.296875, 69.2421875, 71.1875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 14.0, 8.0, 12.0, 11.0, 12.0, 29.0, 33.0, 46.0, 52.0, 76.0, 127.0, 130.0, 133.0, 93.0, 59.0, 34.0, 36.0, 22.0, 20.0, 12.0, 7.0, 5.0, 9.0, 5.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.375, -39.61328125, -37.8515625, -36.08984375, -34.328125, -32.56640625, -30.8046875, -29.04296875, -27.28125, -25.51953125, -23.7578125, -21.99609375, -20.234375, -18.47265625, -16.7109375, -14.94921875, -13.1875, -11.42578125, -9.6640625, -7.90234375, -6.140625, -4.37890625, -2.6171875, -0.85546875, 0.90625, 2.66796875, 4.4296875, 6.19140625, 7.953125, 9.71484375, 11.4765625, 13.23828125, 15.0, 16.76171875, 18.5234375, 20.28515625, 22.046875, 23.80859375, 25.5703125, 27.33203125, 29.09375, 30.85546875, 32.6171875, 34.37890625, 36.140625, 37.90234375, 39.6640625, 41.42578125, 43.1875, 44.94921875, 46.7109375, 48.47265625, 50.234375, 51.99609375, 53.7578125, 55.51953125, 57.28125, 59.04296875, 60.8046875, 62.56640625, 64.328125, 66.08984375, 67.8515625, 69.61328125, 71.375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 10.0, 23.0, 49.0, 78.0, 149.0, 193.0, 220.0, 136.0, 74.0, 35.0, 24.0, 8.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1474.6683349609375, -1435.7587890625, -1396.84912109375, -1357.9395751953125, -1319.030029296875, -1280.120361328125, -1241.2108154296875, -1202.30126953125, -1163.3916015625, -1124.4820556640625, -1085.5723876953125, -1046.662841796875, -1007.7532348632812, -968.8436279296875, -929.93408203125, -891.0244750976562, -852.1148681640625, -813.2052612304688, -774.295654296875, -735.3861083984375, -696.4765014648438, -657.56689453125, -618.6573486328125, -579.7477416992188, -540.838134765625, -501.92852783203125, -463.0189514160156, -424.109375, -385.19976806640625, -346.2901611328125, -307.3805847167969, -268.47100830078125, -229.56134033203125, -190.65174865722656, -151.74215698242188, -112.83256530761719, -73.9229736328125, -35.01338195800781, 3.896209716796875, 42.8057861328125, 81.71539306640625, 120.62498474121094, 159.53457641601562, 198.4441680908203, 237.353759765625, 276.26336669921875, 315.1729431152344, 354.08251953125, 392.99212646484375, 431.9017333984375, 470.8113098144531, 509.72088623046875, 548.6304931640625, 587.5401000976562, 626.44970703125, 665.3592529296875, 704.2688598632812, 743.178466796875, 782.0880126953125, 820.9976196289062, 859.9072265625, 898.8168334960938, 937.7264404296875, 976.635986328125, 1015.5455932617188]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 0.0, 1.0, 3.0, 6.0, 3.0, 5.0, 9.0, 10.0, 9.0, 6.0, 9.0, 6.0, 15.0, 18.0, 21.0, 32.0, 26.0, 19.0, 25.0, 29.0, 32.0, 40.0, 44.0, 39.0, 35.0, 39.0, 34.0, 31.0, 39.0, 33.0, 43.0, 35.0, 24.0, 39.0, 35.0, 34.0, 19.0, 19.0, 23.0, 16.0, 15.0, 9.0, 11.0, 13.0, 6.0, 5.0, 11.0, 8.0, 10.0, 2.0, 1.0, 5.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-383.0623474121094, -371.3676452636719, -359.6729431152344, -347.9782409667969, -336.28350830078125, -324.58880615234375, -312.89410400390625, -301.19940185546875, -289.50469970703125, -277.80999755859375, -266.11529541015625, -254.4205780029297, -242.7258758544922, -231.0311737060547, -219.33645629882812, -207.64175415039062, -195.94705200195312, -184.25234985351562, -172.55764770507812, -160.86293029785156, -149.16822814941406, -137.47352600097656, -125.77881622314453, -114.0841064453125, -102.389404296875, -90.6947021484375, -78.99999237060547, -67.30528259277344, -55.61058044433594, -43.91587448120117, -32.221168518066406, -20.526458740234375, -8.831787109375, 2.8629188537597656, 14.557624816894531, 26.252330780029297, 37.94703674316406, 49.64174270629883, 61.336448669433594, 73.03115844726562, 84.72586059570312, 96.42056274414062, 108.11527252197266, 119.80998229980469, 131.5046844482422, 143.1993865966797, 154.89410400390625, 166.58880615234375, 178.28350830078125, 189.97821044921875, 201.67291259765625, 213.3676300048828, 225.0623321533203, 236.7570343017578, 248.45175170898438, 260.1464538574219, 271.8411560058594, 283.5358581542969, 295.2305603027344, 306.9252624511719, 318.6199951171875, 330.314697265625, 342.0093994140625, 353.7041015625, 365.3988037109375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 7.0, 5.0, 11.0, 10.0, 16.0, 12.0, 22.0, 32.0, 37.0, 72.0, 91.0, 98.0, 174.0, 218.0, 345.0, 484.0, 718.0, 1109.0, 1585.0, 2468.0, 4165.0, 7472.0, 15608.0, 37174.0, 127705.0, 3694992.0, 209546.0, 48352.0, 18838.0, 9207.0, 5053.0, 2972.0, 1926.0, 1229.0, 808.0, 543.0, 382.0, 260.0, 180.0, 123.0, 70.0, 56.0, 37.0, 26.0, 22.0, 10.0, 7.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-96.0625, -93.3662109375, -90.669921875, -87.9736328125, -85.27734375, -82.5810546875, -79.884765625, -77.1884765625, -74.4921875, -71.7958984375, -69.099609375, -66.4033203125, -63.70703125, -61.0107421875, -58.314453125, -55.6181640625, -52.921875, -50.2255859375, -47.529296875, -44.8330078125, -42.13671875, -39.4404296875, -36.744140625, -34.0478515625, -31.3515625, -28.6552734375, -25.958984375, -23.2626953125, -20.56640625, -17.8701171875, -15.173828125, -12.4775390625, -9.78125, -7.0849609375, -4.388671875, -1.6923828125, 1.00390625, 3.7001953125, 6.396484375, 9.0927734375, 11.7890625, 14.4853515625, 17.181640625, 19.8779296875, 22.57421875, 25.2705078125, 27.966796875, 30.6630859375, 33.359375, 36.0556640625, 38.751953125, 41.4482421875, 44.14453125, 46.8408203125, 49.537109375, 52.2333984375, 54.9296875, 57.6259765625, 60.322265625, 63.0185546875, 65.71484375, 68.4111328125, 71.107421875, 73.8037109375, 76.5]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 4.0, 4.0, 8.0, 7.0, 6.0, 11.0, 16.0, 17.0, 22.0, 26.0, 19.0, 27.0, 28.0, 34.0, 36.0, 41.0, 42.0, 52.0, 49.0, 46.0, 37.0, 59.0, 37.0, 46.0, 38.0, 37.0, 33.0, 33.0, 33.0, 26.0, 20.0, 18.0, 16.0, 16.0, 17.0, 11.0, 10.0, 5.0, 3.0, 7.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.171875, -19.6126708984375, -19.053466796875, -18.4942626953125, -17.93505859375, -17.3758544921875, -16.816650390625, -16.2574462890625, -15.6982421875, -15.1390380859375, -14.579833984375, -14.0206298828125, -13.46142578125, -12.9022216796875, -12.343017578125, -11.7838134765625, -11.224609375, -10.6654052734375, -10.106201171875, -9.5469970703125, -8.98779296875, -8.4285888671875, -7.869384765625, -7.3101806640625, -6.7509765625, -6.1917724609375, -5.632568359375, -5.0733642578125, -4.51416015625, -3.9549560546875, -3.395751953125, -2.8365478515625, -2.27734375, -1.7181396484375, -1.158935546875, -0.5997314453125, -0.04052734375, 0.5186767578125, 1.077880859375, 1.6370849609375, 2.1962890625, 2.7554931640625, 3.314697265625, 3.8739013671875, 4.43310546875, 4.9923095703125, 5.551513671875, 6.1107177734375, 6.669921875, 7.2291259765625, 7.788330078125, 8.3475341796875, 8.90673828125, 9.4659423828125, 10.025146484375, 10.5843505859375, 11.1435546875, 11.7027587890625, 12.261962890625, 12.8211669921875, 13.38037109375, 13.9395751953125, 14.498779296875, 15.0579833984375, 15.6171875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 8.0, 13.0, 13.0, 14.0, 26.0, 30.0, 30.0, 50.0, 55.0, 100.0, 157.0, 218.0, 441.0, 840.0, 1720.0, 3879.0, 10436.0, 35914.0, 285796.0, 3744019.0, 80746.0, 18296.0, 6266.0, 2525.0, 1163.0, 557.0, 310.0, 183.0, 134.0, 75.0, 57.0, 46.0, 33.0, 16.0, 22.0, 24.0, 11.0, 7.0, 11.0, 5.0, 4.0, 8.0, 3.0, 5.0, 2.0, 2.0], "bins": [-253.0, -246.20703125, -239.4140625, -232.62109375, -225.828125, -219.03515625, -212.2421875, -205.44921875, -198.65625, -191.86328125, -185.0703125, -178.27734375, -171.484375, -164.69140625, -157.8984375, -151.10546875, -144.3125, -137.51953125, -130.7265625, -123.93359375, -117.140625, -110.34765625, -103.5546875, -96.76171875, -89.96875, -83.17578125, -76.3828125, -69.58984375, -62.796875, -56.00390625, -49.2109375, -42.41796875, -35.625, -28.83203125, -22.0390625, -15.24609375, -8.453125, -1.66015625, 5.1328125, 11.92578125, 18.71875, 25.51171875, 32.3046875, 39.09765625, 45.890625, 52.68359375, 59.4765625, 66.26953125, 73.0625, 79.85546875, 86.6484375, 93.44140625, 100.234375, 107.02734375, 113.8203125, 120.61328125, 127.40625, 134.19921875, 140.9921875, 147.78515625, 154.578125, 161.37109375, 168.1640625, 174.95703125, 181.75]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 11.0, 9.0, 9.0, 21.0, 28.0, 28.0, 56.0, 131.0, 518.0, 2784.0, 233.0, 104.0, 46.0, 32.0, 20.0, 17.0, 7.0, 7.0, 6.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-166.25, -162.576171875, -158.90234375, -155.228515625, -151.5546875, -147.880859375, -144.20703125, -140.533203125, -136.859375, -133.185546875, -129.51171875, -125.837890625, -122.1640625, -118.490234375, -114.81640625, -111.142578125, -107.46875, -103.794921875, -100.12109375, -96.447265625, -92.7734375, -89.099609375, -85.42578125, -81.751953125, -78.078125, -74.404296875, -70.73046875, -67.056640625, -63.3828125, -59.708984375, -56.03515625, -52.361328125, -48.6875, -45.013671875, -41.33984375, -37.666015625, -33.9921875, -30.318359375, -26.64453125, -22.970703125, -19.296875, -15.623046875, -11.94921875, -8.275390625, -4.6015625, -0.927734375, 2.74609375, 6.419921875, 10.09375, 13.767578125, 17.44140625, 21.115234375, 24.7890625, 28.462890625, 32.13671875, 35.810546875, 39.484375, 43.158203125, 46.83203125, 50.505859375, 54.1796875, 57.853515625, 61.52734375, 65.201171875, 68.875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 8.0, 16.0, 41.0, 82.0, 202.0, 246.0, 243.0, 99.0, 41.0, 12.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-880.707275390625, -847.4222412109375, -814.13720703125, -780.8521118164062, -747.5670776367188, -714.2820434570312, -680.9969482421875, -647.7119140625, -614.4268798828125, -581.141845703125, -547.8568115234375, -514.5717163085938, -481.28668212890625, -448.00164794921875, -414.7165832519531, -381.4315185546875, -348.146484375, -314.8614501953125, -281.5763854980469, -248.2913360595703, -215.00628662109375, -181.7212371826172, -148.43618774414062, -115.15113830566406, -81.8660888671875, -48.58103942871094, -15.295989990234375, 17.989059448242188, 51.27410888671875, 84.55915832519531, 117.84420776367188, 151.12925720214844, 184.414306640625, 217.69935607910156, 250.98440551757812, 284.26947021484375, 317.55450439453125, 350.83953857421875, 384.1246032714844, 417.40966796875, 450.6947021484375, 483.979736328125, 517.2647705078125, 550.5498657226562, 583.8348999023438, 617.1199340820312, 650.405029296875, 683.6900634765625, 716.97509765625, 750.2601318359375, 783.545166015625, 816.8302612304688, 850.1152954101562, 883.4003295898438, 916.6854248046875, 949.970458984375, 983.2554931640625, 1016.54052734375, 1049.8255615234375, 1083.110595703125, 1116.395751953125, 1149.6807861328125, 1182.9658203125, 1216.2508544921875, 1249.535888671875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 8.0, 6.0, 12.0, 5.0, 12.0, 16.0, 15.0, 21.0, 15.0, 19.0, 29.0, 24.0, 22.0, 38.0, 42.0, 43.0, 39.0, 37.0, 44.0, 43.0, 41.0, 40.0, 49.0, 40.0, 50.0, 42.0, 35.0, 37.0, 20.0, 30.0, 25.0, 18.0, 14.0, 18.0, 8.0, 13.0, 6.0, 5.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-230.9420623779297, -223.25466918945312, -215.56727600097656, -207.8798828125, -200.19248962402344, -192.50509643554688, -184.81771850585938, -177.13031005859375, -169.44293212890625, -161.7555389404297, -154.06814575195312, -146.38075256347656, -138.693359375, -131.00596618652344, -123.3185806274414, -115.63118743896484, -107.94378662109375, -100.25639343261719, -92.56900024414062, -84.88160705566406, -77.1942138671875, -69.50682067871094, -61.819435119628906, -54.132041931152344, -46.44464874267578, -38.75725555419922, -31.06986427307129, -23.38247299194336, -15.695079803466797, -8.007686614990234, -0.3202972412109375, 7.367095947265625, 15.05450439453125, 22.741897583007812, 30.429288864135742, 38.11668014526367, 45.804073333740234, 53.4914665222168, 61.178855895996094, 68.86624908447266, 76.55364227294922, 84.24103546142578, 91.92842864990234, 99.61581420898438, 107.30320739746094, 114.9906005859375, 122.67799377441406, 130.36538696289062, 138.0527801513672, 145.74017333984375, 153.4275665283203, 161.11495971679688, 168.80235290527344, 176.48974609375, 184.1771240234375, 191.86453247070312, 199.55191040039062, 207.2393035888672, 214.92669677734375, 222.6140899658203, 230.30148315429688, 237.98887634277344, 245.67626953125, 253.3636474609375, 261.0510559082031]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 5.0, 1.0, 5.0, 11.0, 15.0, 21.0, 17.0, 31.0, 51.0, 62.0, 105.0, 127.0, 185.0, 280.0, 430.0, 670.0, 1106.0, 2085.0, 4254.0, 9491.0, 24525.0, 78861.0, 345640.0, 431039.0, 98292.0, 29675.0, 10991.0, 4834.0, 2421.0, 1212.0, 700.0, 429.0, 301.0, 224.0, 115.0, 81.0, 73.0, 52.0, 32.0, 28.0, 22.0, 24.0, 12.0, 7.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0], "bins": [-115.4375, -112.23828125, -109.0390625, -105.83984375, -102.640625, -99.44140625, -96.2421875, -93.04296875, -89.84375, -86.64453125, -83.4453125, -80.24609375, -77.046875, -73.84765625, -70.6484375, -67.44921875, -64.25, -61.05078125, -57.8515625, -54.65234375, -51.453125, -48.25390625, -45.0546875, -41.85546875, -38.65625, -35.45703125, -32.2578125, -29.05859375, -25.859375, -22.66015625, -19.4609375, -16.26171875, -13.0625, -9.86328125, -6.6640625, -3.46484375, -0.265625, 2.93359375, 6.1328125, 9.33203125, 12.53125, 15.73046875, 18.9296875, 22.12890625, 25.328125, 28.52734375, 31.7265625, 34.92578125, 38.125, 41.32421875, 44.5234375, 47.72265625, 50.921875, 54.12109375, 57.3203125, 60.51953125, 63.71875, 66.91796875, 70.1171875, 73.31640625, 76.515625, 79.71484375, 82.9140625, 86.11328125, 89.3125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 11.0, 6.0, 8.0, 15.0, 13.0, 9.0, 14.0, 22.0, 28.0, 24.0, 33.0, 38.0, 46.0, 40.0, 50.0, 49.0, 50.0, 38.0, 57.0, 54.0, 46.0, 39.0, 40.0, 50.0, 32.0, 25.0, 31.0, 28.0, 22.0, 9.0, 20.0, 14.0, 8.0, 7.0, 5.0, 9.0, 3.0, 4.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.140625, -24.349853515625, -23.55908203125, -22.768310546875, -21.9775390625, -21.186767578125, -20.39599609375, -19.605224609375, -18.814453125, -18.023681640625, -17.23291015625, -16.442138671875, -15.6513671875, -14.860595703125, -14.06982421875, -13.279052734375, -12.48828125, -11.697509765625, -10.90673828125, -10.115966796875, -9.3251953125, -8.534423828125, -7.74365234375, -6.952880859375, -6.162109375, -5.371337890625, -4.58056640625, -3.789794921875, -2.9990234375, -2.208251953125, -1.41748046875, -0.626708984375, 0.1640625, 0.954833984375, 1.74560546875, 2.536376953125, 3.3271484375, 4.117919921875, 4.90869140625, 5.699462890625, 6.490234375, 7.281005859375, 8.07177734375, 8.862548828125, 9.6533203125, 10.444091796875, 11.23486328125, 12.025634765625, 12.81640625, 13.607177734375, 14.39794921875, 15.188720703125, 15.9794921875, 16.770263671875, 17.56103515625, 18.351806640625, 19.142578125, 19.933349609375, 20.72412109375, 21.514892578125, 22.3056640625, 23.096435546875, 23.88720703125, 24.677978515625, 25.46875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 7.0, 5.0, 3.0, 12.0, 27.0, 32.0, 45.0, 86.0, 124.0, 199.0, 329.0, 594.0, 1040.0, 1925.0, 4242.0, 12956.0, 72892.0, 746505.0, 174035.0, 21908.0, 6038.0, 2467.0, 1304.0, 706.0, 418.0, 247.0, 170.0, 88.0, 60.0, 30.0, 23.0, 12.0, 9.0, 11.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.125, -172.87890625, -166.6328125, -160.38671875, -154.140625, -147.89453125, -141.6484375, -135.40234375, -129.15625, -122.91015625, -116.6640625, -110.41796875, -104.171875, -97.92578125, -91.6796875, -85.43359375, -79.1875, -72.94140625, -66.6953125, -60.44921875, -54.203125, -47.95703125, -41.7109375, -35.46484375, -29.21875, -22.97265625, -16.7265625, -10.48046875, -4.234375, 2.01171875, 8.2578125, 14.50390625, 20.75, 26.99609375, 33.2421875, 39.48828125, 45.734375, 51.98046875, 58.2265625, 64.47265625, 70.71875, 76.96484375, 83.2109375, 89.45703125, 95.703125, 101.94921875, 108.1953125, 114.44140625, 120.6875, 126.93359375, 133.1796875, 139.42578125, 145.671875, 151.91796875, 158.1640625, 164.41015625, 170.65625, 176.90234375, 183.1484375, 189.39453125, 195.640625, 201.88671875, 208.1328125, 214.37890625, 220.625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 5.0, 6.0, 12.0, 12.0, 14.0, 15.0, 15.0, 25.0, 17.0, 33.0, 43.0, 59.0, 46.0, 59.0, 55.0, 56.0, 41.0, 48.0, 49.0, 47.0, 61.0, 45.0, 28.0, 28.0, 27.0, 23.0, 26.0, 21.0, 19.0, 8.0, 14.0, 10.0, 8.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-124.9375, -120.4228515625, -115.908203125, -111.3935546875, -106.87890625, -102.3642578125, -97.849609375, -93.3349609375, -88.8203125, -84.3056640625, -79.791015625, -75.2763671875, -70.76171875, -66.2470703125, -61.732421875, -57.2177734375, -52.703125, -48.1884765625, -43.673828125, -39.1591796875, -34.64453125, -30.1298828125, -25.615234375, -21.1005859375, -16.5859375, -12.0712890625, -7.556640625, -3.0419921875, 1.47265625, 5.9873046875, 10.501953125, 15.0166015625, 19.53125, 24.0458984375, 28.560546875, 33.0751953125, 37.58984375, 42.1044921875, 46.619140625, 51.1337890625, 55.6484375, 60.1630859375, 64.677734375, 69.1923828125, 73.70703125, 78.2216796875, 82.736328125, 87.2509765625, 91.765625, 96.2802734375, 100.794921875, 105.3095703125, 109.82421875, 114.3388671875, 118.853515625, 123.3681640625, 127.8828125, 132.3974609375, 136.912109375, 141.4267578125, 145.94140625, 150.4560546875, 154.970703125, 159.4853515625, 164.0]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 8.0, 0.0, 11.0, 10.0, 9.0, 19.0, 15.0, 28.0, 24.0, 47.0, 56.0, 73.0, 108.0, 162.0, 245.0, 274.0, 400.0, 515.0, 751.0, 1032.0, 1562.0, 2398.0, 4408.0, 15316.0, 661375.0, 335975.0, 12283.0, 4126.0, 2248.0, 1456.0, 1012.0, 672.0, 535.0, 373.0, 274.0, 184.0, 159.0, 98.0, 95.0, 53.0, 51.0, 33.0, 24.0, 13.0, 16.0, 10.0, 9.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-213.0, -206.115234375, -199.23046875, -192.345703125, -185.4609375, -178.576171875, -171.69140625, -164.806640625, -157.921875, -151.037109375, -144.15234375, -137.267578125, -130.3828125, -123.498046875, -116.61328125, -109.728515625, -102.84375, -95.958984375, -89.07421875, -82.189453125, -75.3046875, -68.419921875, -61.53515625, -54.650390625, -47.765625, -40.880859375, -33.99609375, -27.111328125, -20.2265625, -13.341796875, -6.45703125, 0.427734375, 7.3125, 14.197265625, 21.08203125, 27.966796875, 34.8515625, 41.736328125, 48.62109375, 55.505859375, 62.390625, 69.275390625, 76.16015625, 83.044921875, 89.9296875, 96.814453125, 103.69921875, 110.583984375, 117.46875, 124.353515625, 131.23828125, 138.123046875, 145.0078125, 151.892578125, 158.77734375, 165.662109375, 172.546875, 179.431640625, 186.31640625, 193.201171875, 200.0859375, 206.970703125, 213.85546875, 220.740234375, 227.625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 12.0, 26.0, 113.0, 594.0, 165.0, 43.0, 20.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.097412109375, -0.09401321411132812, -0.09061431884765625, -0.08721542358398438, -0.0838165283203125, -0.08041763305664062, -0.07701873779296875, -0.07361984252929688, -0.070220947265625, -0.06682205200195312, -0.06342315673828125, -0.060024261474609375, -0.0566253662109375, -0.053226470947265625, -0.04982757568359375, -0.046428680419921875, -0.04302978515625, -0.039630889892578125, -0.03623199462890625, -0.032833099365234375, -0.0294342041015625, -0.026035308837890625, -0.02263641357421875, -0.019237518310546875, -0.015838623046875, -0.012439727783203125, -0.00904083251953125, -0.005641937255859375, -0.0022430419921875, 0.001155853271484375, 0.00455474853515625, 0.007953643798828125, 0.0113525390625, 0.014751434326171875, 0.01815032958984375, 0.021549224853515625, 0.0249481201171875, 0.028347015380859375, 0.03174591064453125, 0.035144805908203125, 0.038543701171875, 0.041942596435546875, 0.04534149169921875, 0.048740386962890625, 0.0521392822265625, 0.055538177490234375, 0.05893707275390625, 0.062335968017578125, 0.06573486328125, 0.06913375854492188, 0.07253265380859375, 0.07593154907226562, 0.0793304443359375, 0.08272933959960938, 0.08612823486328125, 0.08952713012695312, 0.092926025390625, 0.09632492065429688, 0.09972381591796875, 0.10312271118164062, 0.1065216064453125, 0.10992050170898438, 0.11331939697265625, 0.11671829223632812, 0.1201171875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 0.0, 0.0, 9.0, 11.0, 10.0, 17.0, 28.0, 49.0, 52.0, 96.0, 148.0, 264.0, 464.0, 916.0, 2024.0, 5040.0, 24008.0, 988400.0, 18538.0, 4589.0, 1902.0, 910.0, 428.0, 256.0, 149.0, 80.0, 44.0, 36.0, 22.0, 14.0, 12.0, 11.0, 9.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-346.5, -333.87890625, -321.2578125, -308.63671875, -296.015625, -283.39453125, -270.7734375, -258.15234375, -245.53125, -232.91015625, -220.2890625, -207.66796875, -195.046875, -182.42578125, -169.8046875, -157.18359375, -144.5625, -131.94140625, -119.3203125, -106.69921875, -94.078125, -81.45703125, -68.8359375, -56.21484375, -43.59375, -30.97265625, -18.3515625, -5.73046875, 6.890625, 19.51171875, 32.1328125, 44.75390625, 57.375, 69.99609375, 82.6171875, 95.23828125, 107.859375, 120.48046875, 133.1015625, 145.72265625, 158.34375, 170.96484375, 183.5859375, 196.20703125, 208.828125, 221.44921875, 234.0703125, 246.69140625, 259.3125, 271.93359375, 284.5546875, 297.17578125, 309.796875, 322.41796875, 335.0390625, 347.66015625, 360.28125, 372.90234375, 385.5234375, 398.14453125, 410.765625, 423.38671875, 436.0078125, 448.62890625, 461.25]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 14.0, 45.0, 295.0, 474.0, 101.0, 21.0, 9.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-298.5, -287.93359375, -277.3671875, -266.80078125, -256.234375, -245.66796875, -235.1015625, -224.53515625, -213.96875, -203.40234375, -192.8359375, -182.26953125, -171.703125, -161.13671875, -150.5703125, -140.00390625, -129.4375, -118.87109375, -108.3046875, -97.73828125, -87.171875, -76.60546875, -66.0390625, -55.47265625, -44.90625, -34.33984375, -23.7734375, -13.20703125, -2.640625, 7.92578125, 18.4921875, 29.05859375, 39.625, 50.19140625, 60.7578125, 71.32421875, 81.890625, 92.45703125, 103.0234375, 113.58984375, 124.15625, 134.72265625, 145.2890625, 155.85546875, 166.421875, 176.98828125, 187.5546875, 198.12109375, 208.6875, 219.25390625, 229.8203125, 240.38671875, 250.953125, 261.51953125, 272.0859375, 282.65234375, 293.21875, 303.78515625, 314.3515625, 324.91796875, 335.484375, 346.05078125, 356.6171875, 367.18359375, 377.75]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 13.0, 18.0, 16.0, 31.0, 25.0, 51.0, 54.0, 77.0, 86.0, 120.0, 106.0, 104.0, 82.0, 57.0, 48.0, 40.0, 19.0, 9.0, 9.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1795.10498046875, -1750.699462890625, -1706.2939453125, -1661.888427734375, -1617.48291015625, -1573.077392578125, -1528.671875, -1484.2662353515625, -1439.8607177734375, -1395.4552001953125, -1351.0496826171875, -1306.6441650390625, -1262.2386474609375, -1217.8330078125, -1173.427490234375, -1129.02197265625, -1084.616455078125, -1040.2109375, -995.805419921875, -951.39990234375, -906.9943237304688, -862.5888061523438, -818.1832885742188, -773.7777099609375, -729.372314453125, -684.966796875, -640.561279296875, -596.15576171875, -551.7501831054688, -507.34466552734375, -462.93914794921875, -418.5335998535156, -374.1280517578125, -329.7225341796875, -285.3169860839844, -240.91146850585938, -196.5059356689453, -152.10040283203125, -107.69488525390625, -63.289337158203125, -18.883819580078125, 25.521709442138672, 69.92723846435547, 114.332763671875, 158.73829650878906, 203.14382934570312, 247.54934692382812, 291.95489501953125, 336.36041259765625, 380.76593017578125, 425.1714782714844, 469.5769958496094, 513.9825439453125, 558.3880615234375, 602.7935791015625, 647.1990966796875, 691.6046142578125, 736.0101318359375, 780.4156494140625, 824.8211669921875, 869.2267456054688, 913.6322631835938, 958.0377807617188, 1002.443359375, 1046.848876953125]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 11.0, 11.0, 9.0, 7.0, 13.0, 14.0, 27.0, 23.0, 33.0, 25.0, 23.0, 29.0, 31.0, 46.0, 35.0, 45.0, 54.0, 43.0, 39.0, 38.0, 49.0, 38.0, 44.0, 44.0, 34.0, 26.0, 32.0, 28.0, 33.0, 18.0, 20.0, 19.0, 9.0, 13.0, 11.0, 5.0, 9.0, 6.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-966.2689208984375, -938.384521484375, -910.5001831054688, -882.6157836914062, -854.7314453125, -826.8470458984375, -798.9627075195312, -771.0783081054688, -743.1939697265625, -715.3095703125, -687.4252319335938, -659.5408325195312, -631.656494140625, -603.7720947265625, -575.8877563476562, -548.0033569335938, -520.1190185546875, -492.2346496582031, -464.35028076171875, -436.4659118652344, -408.58154296875, -380.6971435546875, -352.81280517578125, -324.92840576171875, -297.04400634765625, -269.1596374511719, -241.2752685546875, -213.39089965820312, -185.50653076171875, -157.6221466064453, -129.73777770996094, -101.85340881347656, -73.96905517578125, -46.084686279296875, -18.200313568115234, 9.684059143066406, 37.56842803955078, 65.45280456542969, 93.33717346191406, 121.22154235839844, 149.1059112548828, 176.9902801513672, 204.87464904785156, 232.759033203125, 260.6434020996094, 288.52777099609375, 316.4121398925781, 344.2965087890625, 372.1808776855469, 400.06524658203125, 427.9496154785156, 455.833984375, 483.7183532714844, 511.60272216796875, 539.4871215820312, 567.3714599609375, 595.255859375, 623.1402587890625, 651.0245971679688, 678.9089965820312, 706.7933349609375, 734.677734375, 762.5620727539062, 790.4464721679688, 818.330810546875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 10.0, 2.0, 4.0, 7.0, 8.0, 7.0, 20.0, 19.0, 33.0, 49.0, 42.0, 77.0, 115.0, 160.0, 261.0, 450.0, 707.0, 1330.0, 3114.0, 11585.0, 4154649.0, 14592.0, 3471.0, 1425.0, 743.0, 455.0, 319.0, 186.0, 130.0, 85.0, 51.0, 42.0, 36.0, 23.0, 20.0, 14.0, 13.0, 7.0, 10.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-318.0, -307.59375, -297.1875, -286.78125, -276.375, -265.96875, -255.5625, -245.15625, -234.75, -224.34375, -213.9375, -203.53125, -193.125, -182.71875, -172.3125, -161.90625, -151.5, -141.09375, -130.6875, -120.28125, -109.875, -99.46875, -89.0625, -78.65625, -68.25, -57.84375, -47.4375, -37.03125, -26.625, -16.21875, -5.8125, 4.59375, 15.0, 25.40625, 35.8125, 46.21875, 56.625, 67.03125, 77.4375, 87.84375, 98.25, 108.65625, 119.0625, 129.46875, 139.875, 150.28125, 160.6875, 171.09375, 181.5, 191.90625, 202.3125, 212.71875, 223.125, 233.53125, 243.9375, 254.34375, 264.75, 275.15625, 285.5625, 295.96875, 306.375, 316.78125, 327.1875, 337.59375, 348.0]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 5.0, 7.0, 6.0, 19.0, 14.0, 18.0, 24.0, 20.0, 31.0, 21.0, 37.0, 42.0, 43.0, 44.0, 54.0, 64.0, 52.0, 54.0, 46.0, 48.0, 35.0, 48.0, 33.0, 40.0, 29.0, 24.0, 23.0, 14.0, 12.0, 18.0, 17.0, 11.0, 10.0, 9.0, 4.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.015625, -29.906982421875, -28.79833984375, -27.689697265625, -26.5810546875, -25.472412109375, -24.36376953125, -23.255126953125, -22.146484375, -21.037841796875, -19.92919921875, -18.820556640625, -17.7119140625, -16.603271484375, -15.49462890625, -14.385986328125, -13.27734375, -12.168701171875, -11.06005859375, -9.951416015625, -8.8427734375, -7.734130859375, -6.62548828125, -5.516845703125, -4.408203125, -3.299560546875, -2.19091796875, -1.082275390625, 0.0263671875, 1.135009765625, 2.24365234375, 3.352294921875, 4.4609375, 5.569580078125, 6.67822265625, 7.786865234375, 8.8955078125, 10.004150390625, 11.11279296875, 12.221435546875, 13.330078125, 14.438720703125, 15.54736328125, 16.656005859375, 17.7646484375, 18.873291015625, 19.98193359375, 21.090576171875, 22.19921875, 23.307861328125, 24.41650390625, 25.525146484375, 26.6337890625, 27.742431640625, 28.85107421875, 29.959716796875, 31.068359375, 32.177001953125, 33.28564453125, 34.394287109375, 35.5029296875, 36.611572265625, 37.72021484375, 38.828857421875, 39.9375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 8.0, 4.0, 15.0, 19.0, 25.0, 39.0, 49.0, 79.0, 151.0, 205.0, 297.0, 481.0, 712.0, 1169.0, 1825.0, 3136.0, 6654.0, 38889.0, 4116437.0, 12889.0, 4443.0, 2423.0, 1473.0, 957.0, 645.0, 438.0, 271.0, 185.0, 115.0, 85.0, 54.0, 49.0, 15.0, 21.0, 9.0, 10.0, 7.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-227.375, -216.681640625, -205.98828125, -195.294921875, -184.6015625, -173.908203125, -163.21484375, -152.521484375, -141.828125, -131.134765625, -120.44140625, -109.748046875, -99.0546875, -88.361328125, -77.66796875, -66.974609375, -56.28125, -45.587890625, -34.89453125, -24.201171875, -13.5078125, -2.814453125, 7.87890625, 18.572265625, 29.265625, 39.958984375, 50.65234375, 61.345703125, 72.0390625, 82.732421875, 93.42578125, 104.119140625, 114.8125, 125.505859375, 136.19921875, 146.892578125, 157.5859375, 168.279296875, 178.97265625, 189.666015625, 200.359375, 211.052734375, 221.74609375, 232.439453125, 243.1328125, 253.826171875, 264.51953125, 275.212890625, 285.90625, 296.599609375, 307.29296875, 317.986328125, 328.6796875, 339.373046875, 350.06640625, 360.759765625, 371.453125, 382.146484375, 392.83984375, 403.533203125, 414.2265625, 424.919921875, 435.61328125, 446.306640625, 457.0]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 5.0, 9.0, 29.0, 69.0, 3852.0, 41.0, 20.0, 11.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.34375, -43.62939453125, -41.9150390625, -40.20068359375, -38.486328125, -36.77197265625, -35.0576171875, -33.34326171875, -31.62890625, -29.91455078125, -28.2001953125, -26.48583984375, -24.771484375, -23.05712890625, -21.3427734375, -19.62841796875, -17.9140625, -16.19970703125, -14.4853515625, -12.77099609375, -11.056640625, -9.34228515625, -7.6279296875, -5.91357421875, -4.19921875, -2.48486328125, -0.7705078125, 0.94384765625, 2.658203125, 4.37255859375, 6.0869140625, 7.80126953125, 9.515625, 11.22998046875, 12.9443359375, 14.65869140625, 16.373046875, 18.08740234375, 19.8017578125, 21.51611328125, 23.23046875, 24.94482421875, 26.6591796875, 28.37353515625, 30.087890625, 31.80224609375, 33.5166015625, 35.23095703125, 36.9453125, 38.65966796875, 40.3740234375, 42.08837890625, 43.802734375, 45.51708984375, 47.2314453125, 48.94580078125, 50.66015625, 52.37451171875, 54.0888671875, 55.80322265625, 57.517578125, 59.23193359375, 60.9462890625, 62.66064453125, 64.375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 10.0, 15.0, 26.0, 44.0, 65.0, 67.0, 116.0, 117.0, 108.0, 108.0, 87.0, 52.0, 45.0, 23.0, 31.0, 24.0, 12.0, 10.0, 9.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-150.50454711914062, -144.19775390625, -137.89096069335938, -131.5841827392578, -125.27738952636719, -118.97059631347656, -112.66381072998047, -106.35702514648438, -100.05023193359375, -93.74343872070312, -87.43665313720703, -81.12986755371094, -74.82307434082031, -68.51628112792969, -62.209495544433594, -55.902706146240234, -49.595916748046875, -43.289127349853516, -36.982337951660156, -30.675548553466797, -24.368759155273438, -18.061969757080078, -11.755180358886719, -5.448390960693359, 0.8583984375, 7.165187835693359, 13.471977233886719, 19.778766632080078, 26.085556030273438, 32.3923454284668, 38.699134826660156, 45.005924224853516, 51.31272888183594, 57.6195182800293, 63.926307678222656, 70.23309326171875, 76.53988647460938, 82.8466796875, 89.1534652709961, 95.46025085449219, 101.76704406738281, 108.07383728027344, 114.38062286376953, 120.68740844726562, 126.99420166015625, 133.30099487304688, 139.6077880859375, 145.91456604003906, 152.2213592529297, 158.5281524658203, 164.83493041992188, 171.1417236328125, 177.44851684570312, 183.75531005859375, 190.06210327148438, 196.36888122558594, 202.67567443847656, 208.9824676513672, 215.28924560546875, 221.59603881835938, 227.90283203125, 234.20962524414062, 240.51641845703125, 246.8231964111328, 253.12998962402344]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 2.0, 8.0, 7.0, 11.0, 11.0, 16.0, 24.0, 20.0, 26.0, 27.0, 20.0, 25.0, 28.0, 28.0, 40.0, 38.0, 40.0, 51.0, 34.0, 40.0, 49.0, 42.0, 38.0, 27.0, 33.0, 34.0, 41.0, 40.0, 26.0, 20.0, 25.0, 20.0, 23.0, 13.0, 11.0, 14.0, 9.0, 9.0, 11.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-100.87227630615234, -97.64218139648438, -94.41209411621094, -91.18199920654297, -87.951904296875, -84.72180938720703, -81.49171447753906, -78.26162719726562, -75.03153228759766, -71.80143737792969, -68.57135009765625, -65.34125518798828, -62.11116027832031, -58.881065368652344, -55.65097427368164, -52.42088317871094, -49.19078826904297, -45.960693359375, -42.7306022644043, -39.500511169433594, -36.270416259765625, -33.040321350097656, -29.810230255126953, -26.580137252807617, -23.35004425048828, -20.119951248168945, -16.88985824584961, -13.659765243530273, -10.429672241210938, -7.199579238891602, -3.9694862365722656, -0.7393932342529297, 2.490692138671875, 5.720785140991211, 8.950878143310547, 12.180971145629883, 15.411064147949219, 18.641157150268555, 21.87125015258789, 25.101343154907227, 28.331436157226562, 31.5615291595459, 34.791622161865234, 38.02171325683594, 41.251808166503906, 44.481903076171875, 47.71199417114258, 50.94208526611328, 54.17218017578125, 57.40227508544922, 60.63236618041992, 63.862457275390625, 67.0925521850586, 70.32264709472656, 73.552734375, 76.78282928466797, 80.01292419433594, 83.2430191040039, 86.47311401367188, 89.70320129394531, 92.93329620361328, 96.16339111328125, 99.39347839355469, 102.62357330322266, 105.85366821289062]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 4.0, 9.0, 10.0, 11.0, 23.0, 37.0, 53.0, 78.0, 116.0, 186.0, 275.0, 435.0, 647.0, 1011.0, 1502.0, 2555.0, 4066.0, 7461.0, 12906.0, 24162.0, 49217.0, 111254.0, 278614.0, 309605.0, 128408.0, 55104.0, 26688.0, 13985.0, 7844.0, 4664.0, 2861.0, 1760.0, 1121.0, 652.0, 399.0, 284.0, 172.0, 147.0, 71.0, 50.0, 35.0, 26.0, 16.0, 12.0, 7.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-80.125, -77.4609375, -74.796875, -72.1328125, -69.46875, -66.8046875, -64.140625, -61.4765625, -58.8125, -56.1484375, -53.484375, -50.8203125, -48.15625, -45.4921875, -42.828125, -40.1640625, -37.5, -34.8359375, -32.171875, -29.5078125, -26.84375, -24.1796875, -21.515625, -18.8515625, -16.1875, -13.5234375, -10.859375, -8.1953125, -5.53125, -2.8671875, -0.203125, 2.4609375, 5.125, 7.7890625, 10.453125, 13.1171875, 15.78125, 18.4453125, 21.109375, 23.7734375, 26.4375, 29.1015625, 31.765625, 34.4296875, 37.09375, 39.7578125, 42.421875, 45.0859375, 47.75, 50.4140625, 53.078125, 55.7421875, 58.40625, 61.0703125, 63.734375, 66.3984375, 69.0625, 71.7265625, 74.390625, 77.0546875, 79.71875, 82.3828125, 85.046875, 87.7109375, 90.375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 4.0, 4.0, 6.0, 6.0, 9.0, 8.0, 12.0, 12.0, 25.0, 15.0, 22.0, 23.0, 20.0, 29.0, 30.0, 35.0, 24.0, 39.0, 47.0, 54.0, 53.0, 39.0, 37.0, 41.0, 26.0, 40.0, 39.0, 54.0, 36.0, 22.0, 26.0, 17.0, 28.0, 17.0, 13.0, 17.0, 17.0, 8.0, 13.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-31.25, -30.19287109375, -29.1357421875, -28.07861328125, -27.021484375, -25.96435546875, -24.9072265625, -23.85009765625, -22.79296875, -21.73583984375, -20.6787109375, -19.62158203125, -18.564453125, -17.50732421875, -16.4501953125, -15.39306640625, -14.3359375, -13.27880859375, -12.2216796875, -11.16455078125, -10.107421875, -9.05029296875, -7.9931640625, -6.93603515625, -5.87890625, -4.82177734375, -3.7646484375, -2.70751953125, -1.650390625, -0.59326171875, 0.4638671875, 1.52099609375, 2.578125, 3.63525390625, 4.6923828125, 5.74951171875, 6.806640625, 7.86376953125, 8.9208984375, 9.97802734375, 11.03515625, 12.09228515625, 13.1494140625, 14.20654296875, 15.263671875, 16.32080078125, 17.3779296875, 18.43505859375, 19.4921875, 20.54931640625, 21.6064453125, 22.66357421875, 23.720703125, 24.77783203125, 25.8349609375, 26.89208984375, 27.94921875, 29.00634765625, 30.0634765625, 31.12060546875, 32.177734375, 33.23486328125, 34.2919921875, 35.34912109375, 36.40625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 6.0, 21.0, 20.0, 23.0, 30.0, 40.0, 59.0, 104.0, 140.0, 239.0, 429.0, 780.0, 1531.0, 3426.0, 8090.0, 22827.0, 79323.0, 453133.0, 374092.0, 69664.0, 20596.0, 7511.0, 3178.0, 1457.0, 775.0, 407.0, 228.0, 139.0, 85.0, 58.0, 38.0, 26.0, 18.0, 12.0, 15.0, 4.0, 9.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-168.625, -163.34765625, -158.0703125, -152.79296875, -147.515625, -142.23828125, -136.9609375, -131.68359375, -126.40625, -121.12890625, -115.8515625, -110.57421875, -105.296875, -100.01953125, -94.7421875, -89.46484375, -84.1875, -78.91015625, -73.6328125, -68.35546875, -63.078125, -57.80078125, -52.5234375, -47.24609375, -41.96875, -36.69140625, -31.4140625, -26.13671875, -20.859375, -15.58203125, -10.3046875, -5.02734375, 0.25, 5.52734375, 10.8046875, 16.08203125, 21.359375, 26.63671875, 31.9140625, 37.19140625, 42.46875, 47.74609375, 53.0234375, 58.30078125, 63.578125, 68.85546875, 74.1328125, 79.41015625, 84.6875, 89.96484375, 95.2421875, 100.51953125, 105.796875, 111.07421875, 116.3515625, 121.62890625, 126.90625, 132.18359375, 137.4609375, 142.73828125, 148.015625, 153.29296875, 158.5703125, 163.84765625, 169.125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 9.0, 14.0, 13.0, 22.0, 15.0, 19.0, 19.0, 27.0, 36.0, 32.0, 50.0, 33.0, 39.0, 50.0, 41.0, 48.0, 50.0, 50.0, 61.0, 53.0, 31.0, 51.0, 31.0, 33.0, 23.0, 27.0, 30.0, 14.0, 11.0, 9.0, 12.0, 11.0, 6.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-213.375, -206.7890625, -200.203125, -193.6171875, -187.03125, -180.4453125, -173.859375, -167.2734375, -160.6875, -154.1015625, -147.515625, -140.9296875, -134.34375, -127.7578125, -121.171875, -114.5859375, -108.0, -101.4140625, -94.828125, -88.2421875, -81.65625, -75.0703125, -68.484375, -61.8984375, -55.3125, -48.7265625, -42.140625, -35.5546875, -28.96875, -22.3828125, -15.796875, -9.2109375, -2.625, 3.9609375, 10.546875, 17.1328125, 23.71875, 30.3046875, 36.890625, 43.4765625, 50.0625, 56.6484375, 63.234375, 69.8203125, 76.40625, 82.9921875, 89.578125, 96.1640625, 102.75, 109.3359375, 115.921875, 122.5078125, 129.09375, 135.6796875, 142.265625, 148.8515625, 155.4375, 162.0234375, 168.609375, 175.1953125, 181.78125, 188.3671875, 194.953125, 201.5390625, 208.125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 1.0, 7.0, 10.0, 10.0, 15.0, 25.0, 25.0, 37.0, 55.0, 78.0, 99.0, 173.0, 223.0, 310.0, 531.0, 836.0, 1504.0, 2930.0, 6198.0, 16139.0, 54503.0, 285710.0, 538866.0, 97652.0, 24944.0, 8820.0, 3886.0, 1900.0, 1141.0, 631.0, 396.0, 258.0, 195.0, 136.0, 75.0, 65.0, 50.0, 30.0, 26.0, 18.0, 10.0, 4.0, 3.0, 9.0, 3.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-68.9375, -66.86083984375, -64.7841796875, -62.70751953125, -60.630859375, -58.55419921875, -56.4775390625, -54.40087890625, -52.32421875, -50.24755859375, -48.1708984375, -46.09423828125, -44.017578125, -41.94091796875, -39.8642578125, -37.78759765625, -35.7109375, -33.63427734375, -31.5576171875, -29.48095703125, -27.404296875, -25.32763671875, -23.2509765625, -21.17431640625, -19.09765625, -17.02099609375, -14.9443359375, -12.86767578125, -10.791015625, -8.71435546875, -6.6376953125, -4.56103515625, -2.484375, -0.40771484375, 1.6689453125, 3.74560546875, 5.822265625, 7.89892578125, 9.9755859375, 12.05224609375, 14.12890625, 16.20556640625, 18.2822265625, 20.35888671875, 22.435546875, 24.51220703125, 26.5888671875, 28.66552734375, 30.7421875, 32.81884765625, 34.8955078125, 36.97216796875, 39.048828125, 41.12548828125, 43.2021484375, 45.27880859375, 47.35546875, 49.43212890625, 51.5087890625, 53.58544921875, 55.662109375, 57.73876953125, 59.8154296875, 61.89208984375, 63.96875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 5.0, 6.0, 4.0, 11.0, 15.0, 16.0, 21.0, 37.0, 64.0, 106.0, 148.0, 155.0, 133.0, 84.0, 61.0, 43.0, 29.0, 21.0, 12.0, 9.0, 5.0, 8.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0347900390625, -0.0339512825012207, -0.033112525939941406, -0.03227376937866211, -0.03143501281738281, -0.030596256256103516, -0.02975749969482422, -0.028918743133544922, -0.028079986572265625, -0.027241230010986328, -0.02640247344970703, -0.025563716888427734, -0.024724960327148438, -0.02388620376586914, -0.023047447204589844, -0.022208690643310547, -0.02136993408203125, -0.020531177520751953, -0.019692420959472656, -0.01885366439819336, -0.018014907836914062, -0.017176151275634766, -0.01633739471435547, -0.015498638153076172, -0.014659881591796875, -0.013821125030517578, -0.012982368469238281, -0.012143611907958984, -0.011304855346679688, -0.01046609878540039, -0.009627342224121094, -0.008788585662841797, -0.0079498291015625, -0.007111072540283203, -0.006272315979003906, -0.005433559417724609, -0.0045948028564453125, -0.0037560462951660156, -0.0029172897338867188, -0.002078533172607422, -0.001239776611328125, -0.0004010200500488281, 0.00043773651123046875, 0.0012764930725097656, 0.0021152496337890625, 0.0029540061950683594, 0.0037927627563476562, 0.004631519317626953, 0.00547027587890625, 0.006309032440185547, 0.007147789001464844, 0.00798654556274414, 0.008825302124023438, 0.009664058685302734, 0.010502815246582031, 0.011341571807861328, 0.012180328369140625, 0.013019084930419922, 0.013857841491699219, 0.014696598052978516, 0.015535354614257812, 0.01637411117553711, 0.017212867736816406, 0.018051624298095703, 0.018890380859375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 5.0, 4.0, 8.0, 22.0, 15.0, 18.0, 39.0, 72.0, 87.0, 138.0, 234.0, 365.0, 758.0, 1400.0, 3233.0, 8347.0, 27587.0, 129008.0, 588806.0, 225319.0, 43034.0, 11940.0, 4170.0, 1848.0, 875.0, 486.0, 260.0, 157.0, 115.0, 65.0, 37.0, 22.0, 28.0, 13.0, 8.0, 8.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.5, -65.14453125, -62.7890625, -60.43359375, -58.078125, -55.72265625, -53.3671875, -51.01171875, -48.65625, -46.30078125, -43.9453125, -41.58984375, -39.234375, -36.87890625, -34.5234375, -32.16796875, -29.8125, -27.45703125, -25.1015625, -22.74609375, -20.390625, -18.03515625, -15.6796875, -13.32421875, -10.96875, -8.61328125, -6.2578125, -3.90234375, -1.546875, 0.80859375, 3.1640625, 5.51953125, 7.875, 10.23046875, 12.5859375, 14.94140625, 17.296875, 19.65234375, 22.0078125, 24.36328125, 26.71875, 29.07421875, 31.4296875, 33.78515625, 36.140625, 38.49609375, 40.8515625, 43.20703125, 45.5625, 47.91796875, 50.2734375, 52.62890625, 54.984375, 57.33984375, 59.6953125, 62.05078125, 64.40625, 66.76171875, 69.1171875, 71.47265625, 73.828125, 76.18359375, 78.5390625, 80.89453125, 83.25]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 3.0, 4.0, 5.0, 11.0, 12.0, 25.0, 40.0, 46.0, 49.0, 66.0, 77.0, 89.0, 114.0, 111.0, 78.0, 61.0, 48.0, 49.0, 24.0, 20.0, 18.0, 13.0, 10.0, 5.0, 2.0, 6.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.96875, -60.56494140625, -58.1611328125, -55.75732421875, -53.353515625, -50.94970703125, -48.5458984375, -46.14208984375, -43.73828125, -41.33447265625, -38.9306640625, -36.52685546875, -34.123046875, -31.71923828125, -29.3154296875, -26.91162109375, -24.5078125, -22.10400390625, -19.7001953125, -17.29638671875, -14.892578125, -12.48876953125, -10.0849609375, -7.68115234375, -5.27734375, -2.87353515625, -0.4697265625, 1.93408203125, 4.337890625, 6.74169921875, 9.1455078125, 11.54931640625, 13.953125, 16.35693359375, 18.7607421875, 21.16455078125, 23.568359375, 25.97216796875, 28.3759765625, 30.77978515625, 33.18359375, 35.58740234375, 37.9912109375, 40.39501953125, 42.798828125, 45.20263671875, 47.6064453125, 50.01025390625, 52.4140625, 54.81787109375, 57.2216796875, 59.62548828125, 62.029296875, 64.43310546875, 66.8369140625, 69.24072265625, 71.64453125, 74.04833984375, 76.4521484375, 78.85595703125, 81.259765625, 83.66357421875, 86.0673828125, 88.47119140625, 90.875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 6.0, 11.0, 12.0, 18.0, 56.0, 53.0, 90.0, 149.0, 169.0, 139.0, 112.0, 79.0, 42.0, 17.0, 18.0, 11.0, 12.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-801.0159912109375, -749.6306762695312, -698.245361328125, -646.8599853515625, -595.4747314453125, -544.08935546875, -492.70404052734375, -441.3187255859375, -389.93341064453125, -338.548095703125, -287.16278076171875, -235.77743530273438, -184.39212036132812, -133.00680541992188, -81.6214599609375, -30.23614501953125, 21.149169921875, 72.53449249267578, 123.91981506347656, 175.30514526367188, 226.69046020507812, 278.0757751464844, 329.46112060546875, 380.846435546875, 432.23175048828125, 483.6170654296875, 535.0023803710938, 586.3876953125, 637.7730712890625, 689.1583251953125, 740.543701171875, 791.9290161132812, 843.314453125, 894.6997680664062, 946.0850830078125, 997.470458984375, 1048.855712890625, 1100.2410888671875, 1151.62646484375, 1203.01171875, 1254.39697265625, 1305.7823486328125, 1357.1676025390625, 1408.552978515625, 1459.938232421875, 1511.3236083984375, 1562.708984375, 1614.09423828125, 1665.4796142578125, 1716.864990234375, 1768.250244140625, 1819.6356201171875, 1871.0208740234375, 1922.40625, 1973.79150390625, 2025.1768798828125, 2076.562255859375, 2127.947509765625, 2179.3330078125, 2230.71826171875, 2282.103515625, 2333.48876953125, 2384.874267578125, 2436.259521484375, 2487.644775390625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 7.0, 4.0, 6.0, 7.0, 4.0, 8.0, 12.0, 9.0, 6.0, 16.0, 26.0, 27.0, 23.0, 24.0, 31.0, 39.0, 52.0, 50.0, 50.0, 50.0, 59.0, 55.0, 63.0, 57.0, 58.0, 38.0, 33.0, 29.0, 30.0, 25.0, 23.0, 16.0, 12.0, 13.0, 13.0, 11.0, 4.0, 3.0, 3.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1346.954345703125, -1311.202880859375, -1275.451416015625, -1239.699951171875, -1203.948486328125, -1168.197021484375, -1132.445556640625, -1096.694091796875, -1060.942626953125, -1025.191162109375, -989.439697265625, -953.688232421875, -917.936767578125, -882.185302734375, -846.433837890625, -810.682373046875, -774.930908203125, -739.179443359375, -703.427978515625, -667.676513671875, -631.925048828125, -596.173583984375, -560.422119140625, -524.670654296875, -488.919189453125, -453.167724609375, -417.416259765625, -381.664794921875, -345.913330078125, -310.161865234375, -274.410400390625, -238.658935546875, -202.9073486328125, -167.1558837890625, -131.4044189453125, -95.6529541015625, -59.9014892578125, -24.1500244140625, 11.6014404296875, 47.3529052734375, 83.1043701171875, 118.8558349609375, 154.6072998046875, 190.3587646484375, 226.1102294921875, 261.8616943359375, 297.6131591796875, 333.3646240234375, 369.1160888671875, 404.8675537109375, 440.6190185546875, 476.3704833984375, 512.1219482421875, 547.8734130859375, 583.6248779296875, 619.3763427734375, 655.1278076171875, 690.8792724609375, 726.6307373046875, 762.3822021484375, 798.1336669921875, 833.8851318359375, 869.6365966796875, 905.3880615234375, 941.1395263671875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 1.0, 6.0, 3.0, 6.0, 4.0, 10.0, 8.0, 19.0, 22.0, 29.0, 45.0, 70.0, 98.0, 118.0, 191.0, 231.0, 328.0, 516.0, 757.0, 1114.0, 2186.0, 5519.0, 4043915.0, 128159.0, 5259.0, 2094.0, 1212.0, 698.0, 473.0, 317.0, 239.0, 192.0, 108.0, 96.0, 57.0, 49.0, 42.0, 26.0, 16.0, 14.0, 10.0, 7.0, 11.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-348.75, -338.17578125, -327.6015625, -317.02734375, -306.453125, -295.87890625, -285.3046875, -274.73046875, -264.15625, -253.58203125, -243.0078125, -232.43359375, -221.859375, -211.28515625, -200.7109375, -190.13671875, -179.5625, -168.98828125, -158.4140625, -147.83984375, -137.265625, -126.69140625, -116.1171875, -105.54296875, -94.96875, -84.39453125, -73.8203125, -63.24609375, -52.671875, -42.09765625, -31.5234375, -20.94921875, -10.375, 0.19921875, 10.7734375, 21.34765625, 31.921875, 42.49609375, 53.0703125, 63.64453125, 74.21875, 84.79296875, 95.3671875, 105.94140625, 116.515625, 127.08984375, 137.6640625, 148.23828125, 158.8125, 169.38671875, 179.9609375, 190.53515625, 201.109375, 211.68359375, 222.2578125, 232.83203125, 243.40625, 253.98046875, 264.5546875, 275.12890625, 285.703125, 296.27734375, 306.8515625, 317.42578125, 328.0]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 6.0, 6.0, 2.0, 3.0, 9.0, 4.0, 7.0, 12.0, 9.0, 12.0, 9.0, 15.0, 22.0, 21.0, 22.0, 30.0, 33.0, 22.0, 38.0, 28.0, 45.0, 41.0, 51.0, 47.0, 51.0, 54.0, 42.0, 36.0, 32.0, 39.0, 28.0, 25.0, 29.0, 28.0, 20.0, 26.0, 14.0, 15.0, 12.0, 7.0, 9.0, 9.0, 10.0, 5.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-31.421875, -30.412841796875, -29.40380859375, -28.394775390625, -27.3857421875, -26.376708984375, -25.36767578125, -24.358642578125, -23.349609375, -22.340576171875, -21.33154296875, -20.322509765625, -19.3134765625, -18.304443359375, -17.29541015625, -16.286376953125, -15.27734375, -14.268310546875, -13.25927734375, -12.250244140625, -11.2412109375, -10.232177734375, -9.22314453125, -8.214111328125, -7.205078125, -6.196044921875, -5.18701171875, -4.177978515625, -3.1689453125, -2.159912109375, -1.15087890625, -0.141845703125, 0.8671875, 1.876220703125, 2.88525390625, 3.894287109375, 4.9033203125, 5.912353515625, 6.92138671875, 7.930419921875, 8.939453125, 9.948486328125, 10.95751953125, 11.966552734375, 12.9755859375, 13.984619140625, 14.99365234375, 16.002685546875, 17.01171875, 18.020751953125, 19.02978515625, 20.038818359375, 21.0478515625, 22.056884765625, 23.06591796875, 24.074951171875, 25.083984375, 26.093017578125, 27.10205078125, 28.111083984375, 29.1201171875, 30.129150390625, 31.13818359375, 32.147216796875, 33.15625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 1.0, 4.0, 9.0, 2.0, 3.0, 7.0, 9.0, 6.0, 17.0, 13.0, 29.0, 31.0, 55.0, 86.0, 97.0, 165.0, 234.0, 398.0, 669.0, 1087.0, 2170.0, 8104.0, 4139805.0, 33759.0, 3664.0, 1510.0, 891.0, 527.0, 308.0, 172.0, 135.0, 87.0, 47.0, 50.0, 24.0, 23.0, 21.0, 24.0, 11.0, 9.0, 9.0, 4.0, 6.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-519.0, -502.125, -485.25, -468.375, -451.5, -434.625, -417.75, -400.875, -384.0, -367.125, -350.25, -333.375, -316.5, -299.625, -282.75, -265.875, -249.0, -232.125, -215.25, -198.375, -181.5, -164.625, -147.75, -130.875, -114.0, -97.125, -80.25, -63.375, -46.5, -29.625, -12.75, 4.125, 21.0, 37.875, 54.75, 71.625, 88.5, 105.375, 122.25, 139.125, 156.0, 172.875, 189.75, 206.625, 223.5, 240.375, 257.25, 274.125, 291.0, 307.875, 324.75, 341.625, 358.5, 375.375, 392.25, 409.125, 426.0, 442.875, 459.75, 476.625, 493.5, 510.375, 527.25, 544.125, 561.0]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 7.0, 21.0, 49.0, 3905.0, 70.0, 18.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.75, -167.5263671875, -163.302734375, -159.0791015625, -154.85546875, -150.6318359375, -146.408203125, -142.1845703125, -137.9609375, -133.7373046875, -129.513671875, -125.2900390625, -121.06640625, -116.8427734375, -112.619140625, -108.3955078125, -104.171875, -99.9482421875, -95.724609375, -91.5009765625, -87.27734375, -83.0537109375, -78.830078125, -74.6064453125, -70.3828125, -66.1591796875, -61.935546875, -57.7119140625, -53.48828125, -49.2646484375, -45.041015625, -40.8173828125, -36.59375, -32.3701171875, -28.146484375, -23.9228515625, -19.69921875, -15.4755859375, -11.251953125, -7.0283203125, -2.8046875, 1.4189453125, 5.642578125, 9.8662109375, 14.08984375, 18.3134765625, 22.537109375, 26.7607421875, 30.984375, 35.2080078125, 39.431640625, 43.6552734375, 47.87890625, 52.1025390625, 56.326171875, 60.5498046875, 64.7734375, 68.9970703125, 73.220703125, 77.4443359375, 81.66796875, 85.8916015625, 90.115234375, 94.3388671875, 98.5625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 7.0, 10.0, 11.0, 14.0, 11.0, 20.0, 18.0, 27.0, 35.0, 41.0, 45.0, 73.0, 87.0, 84.0, 80.0, 92.0, 73.0, 67.0, 44.0, 40.0, 30.0, 15.0, 10.0, 14.0, 9.0, 10.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-243.32638549804688, -237.09654235839844, -230.86669921875, -224.63685607910156, -218.40701293945312, -212.1771697998047, -205.94732666015625, -199.71746826171875, -193.48764038085938, -187.25779724121094, -181.0279541015625, -174.79811096191406, -168.56826782226562, -162.3384246826172, -156.10858154296875, -149.87872314453125, -143.6488800048828, -137.41903686523438, -131.18919372558594, -124.9593505859375, -118.72950744628906, -112.49966430664062, -106.26981353759766, -100.03997039794922, -93.81012725830078, -87.58028411865234, -81.3504409790039, -75.12059020996094, -68.8907470703125, -62.66090774536133, -56.431060791015625, -50.20121765136719, -43.97135925292969, -37.74151611328125, -31.51167106628418, -25.28182601928711, -19.051982879638672, -12.822139739990234, -6.592292785644531, -0.36244964599609375, 5.867393493652344, 12.097237586975098, 18.32708168029785, 24.556926727294922, 30.78676986694336, 37.0166130065918, 43.2464599609375, 49.47630310058594, 55.706146240234375, 61.93598937988281, 68.16583251953125, 74.39567565917969, 80.62551879882812, 86.85536193847656, 93.08521270751953, 99.31505584716797, 105.5448989868164, 111.77474212646484, 118.00458526611328, 124.23443603515625, 130.4642791748047, 136.69412231445312, 142.92396545410156, 149.15380859375, 155.38365173339844]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 7.0, 7.0, 8.0, 7.0, 13.0, 17.0, 17.0, 12.0, 25.0, 31.0, 31.0, 31.0, 30.0, 40.0, 30.0, 33.0, 52.0, 44.0, 50.0, 55.0, 34.0, 44.0, 48.0, 41.0, 35.0, 35.0, 31.0, 30.0, 25.0, 18.0, 19.0, 16.0, 14.0, 15.0, 4.0, 8.0, 6.0, 11.0, 7.0, 4.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.7794952392578, -164.78338623046875, -159.78729248046875, -154.7911834716797, -149.79507446289062, -144.79896545410156, -139.8028564453125, -134.8067626953125, -129.81065368652344, -124.81454467773438, -119.81844329833984, -114.82234191894531, -109.82623291015625, -104.83012390136719, -99.83402252197266, -94.83792114257812, -89.84181213378906, -84.845703125, -79.84960174560547, -74.85350036621094, -69.85739135742188, -64.86128234863281, -59.86518096923828, -54.869075775146484, -49.87297058105469, -44.87686538696289, -39.880760192871094, -34.8846549987793, -29.8885498046875, -24.892444610595703, -19.896339416503906, -14.90023422241211, -9.904144287109375, -4.908039093017578, 0.08806610107421875, 5.084171295166016, 10.080276489257812, 15.07638168334961, 20.072486877441406, 25.068592071533203, 30.064697265625, 35.0608024597168, 40.056907653808594, 45.05301284790039, 50.04911804199219, 55.045223236083984, 60.04132843017578, 65.03742980957031, 70.03353881835938, 75.02964782714844, 80.02574920654297, 85.0218505859375, 90.01795959472656, 95.01406860351562, 100.01016998291016, 105.00627136230469, 110.00238037109375, 114.99848937988281, 119.99459075927734, 124.99069213867188, 129.98680114746094, 134.98291015625, 139.97900390625, 144.97511291503906, 149.97122192382812]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 0.0, 5.0, 9.0, 19.0, 17.0, 36.0, 58.0, 64.0, 86.0, 152.0, 272.0, 437.0, 699.0, 1219.0, 2161.0, 3951.0, 7097.0, 14550.0, 30791.0, 70494.0, 181620.0, 378698.0, 207841.0, 79922.0, 34469.0, 15934.0, 8056.0, 4348.0, 2294.0, 1323.0, 763.0, 451.0, 267.0, 172.0, 80.0, 54.0, 44.0, 39.0, 24.0, 18.0, 12.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-106.0, -102.93359375, -99.8671875, -96.80078125, -93.734375, -90.66796875, -87.6015625, -84.53515625, -81.46875, -78.40234375, -75.3359375, -72.26953125, -69.203125, -66.13671875, -63.0703125, -60.00390625, -56.9375, -53.87109375, -50.8046875, -47.73828125, -44.671875, -41.60546875, -38.5390625, -35.47265625, -32.40625, -29.33984375, -26.2734375, -23.20703125, -20.140625, -17.07421875, -14.0078125, -10.94140625, -7.875, -4.80859375, -1.7421875, 1.32421875, 4.390625, 7.45703125, 10.5234375, 13.58984375, 16.65625, 19.72265625, 22.7890625, 25.85546875, 28.921875, 31.98828125, 35.0546875, 38.12109375, 41.1875, 44.25390625, 47.3203125, 50.38671875, 53.453125, 56.51953125, 59.5859375, 62.65234375, 65.71875, 68.78515625, 71.8515625, 74.91796875, 77.984375, 81.05078125, 84.1171875, 87.18359375, 90.25]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 6.0, 4.0, 4.0, 5.0, 5.0, 8.0, 10.0, 13.0, 14.0, 16.0, 17.0, 18.0, 28.0, 22.0, 24.0, 31.0, 34.0, 28.0, 29.0, 37.0, 43.0, 44.0, 40.0, 47.0, 48.0, 36.0, 47.0, 35.0, 33.0, 25.0, 30.0, 28.0, 25.0, 28.0, 21.0, 17.0, 16.0, 16.0, 14.0, 11.0, 5.0, 14.0, 9.0, 5.0, 3.0, 2.0, 3.0, 5.0, 1.0, 1.0], "bins": [-41.9375, -40.8017578125, -39.666015625, -38.5302734375, -37.39453125, -36.2587890625, -35.123046875, -33.9873046875, -32.8515625, -31.7158203125, -30.580078125, -29.4443359375, -28.30859375, -27.1728515625, -26.037109375, -24.9013671875, -23.765625, -22.6298828125, -21.494140625, -20.3583984375, -19.22265625, -18.0869140625, -16.951171875, -15.8154296875, -14.6796875, -13.5439453125, -12.408203125, -11.2724609375, -10.13671875, -9.0009765625, -7.865234375, -6.7294921875, -5.59375, -4.4580078125, -3.322265625, -2.1865234375, -1.05078125, 0.0849609375, 1.220703125, 2.3564453125, 3.4921875, 4.6279296875, 5.763671875, 6.8994140625, 8.03515625, 9.1708984375, 10.306640625, 11.4423828125, 12.578125, 13.7138671875, 14.849609375, 15.9853515625, 17.12109375, 18.2568359375, 19.392578125, 20.5283203125, 21.6640625, 22.7998046875, 23.935546875, 25.0712890625, 26.20703125, 27.3427734375, 28.478515625, 29.6142578125, 30.75]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 5.0, 7.0, 7.0, 10.0, 18.0, 20.0, 45.0, 74.0, 86.0, 166.0, 278.0, 526.0, 1009.0, 2288.0, 6385.0, 21885.0, 124794.0, 718002.0, 137959.0, 23607.0, 6683.0, 2404.0, 1086.0, 496.0, 274.0, 151.0, 102.0, 55.0, 40.0, 23.0, 15.0, 13.0, 9.0, 12.0, 6.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-181.75, -175.146484375, -168.54296875, -161.939453125, -155.3359375, -148.732421875, -142.12890625, -135.525390625, -128.921875, -122.318359375, -115.71484375, -109.111328125, -102.5078125, -95.904296875, -89.30078125, -82.697265625, -76.09375, -69.490234375, -62.88671875, -56.283203125, -49.6796875, -43.076171875, -36.47265625, -29.869140625, -23.265625, -16.662109375, -10.05859375, -3.455078125, 3.1484375, 9.751953125, 16.35546875, 22.958984375, 29.5625, 36.166015625, 42.76953125, 49.373046875, 55.9765625, 62.580078125, 69.18359375, 75.787109375, 82.390625, 88.994140625, 95.59765625, 102.201171875, 108.8046875, 115.408203125, 122.01171875, 128.615234375, 135.21875, 141.822265625, 148.42578125, 155.029296875, 161.6328125, 168.236328125, 174.83984375, 181.443359375, 188.046875, 194.650390625, 201.25390625, 207.857421875, 214.4609375, 221.064453125, 227.66796875, 234.271484375, 240.875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 10.0, 11.0, 8.0, 12.0, 18.0, 27.0, 17.0, 24.0, 26.0, 32.0, 40.0, 36.0, 34.0, 52.0, 43.0, 46.0, 41.0, 50.0, 54.0, 45.0, 38.0, 50.0, 33.0, 29.0, 36.0, 28.0, 27.0, 19.0, 18.0, 13.0, 6.0, 15.0, 13.0, 3.0, 5.0, 10.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-195.875, -190.046875, -184.21875, -178.390625, -172.5625, -166.734375, -160.90625, -155.078125, -149.25, -143.421875, -137.59375, -131.765625, -125.9375, -120.109375, -114.28125, -108.453125, -102.625, -96.796875, -90.96875, -85.140625, -79.3125, -73.484375, -67.65625, -61.828125, -56.0, -50.171875, -44.34375, -38.515625, -32.6875, -26.859375, -21.03125, -15.203125, -9.375, -3.546875, 2.28125, 8.109375, 13.9375, 19.765625, 25.59375, 31.421875, 37.25, 43.078125, 48.90625, 54.734375, 60.5625, 66.390625, 72.21875, 78.046875, 83.875, 89.703125, 95.53125, 101.359375, 107.1875, 113.015625, 118.84375, 124.671875, 130.5, 136.328125, 142.15625, 147.984375, 153.8125, 159.640625, 165.46875, 171.296875, 177.125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 7.0, 9.0, 11.0, 24.0, 28.0, 39.0, 72.0, 89.0, 189.0, 335.0, 675.0, 1368.0, 3252.0, 8967.0, 36706.0, 463821.0, 480612.0, 37553.0, 8658.0, 3123.0, 1340.0, 702.0, 389.0, 246.0, 126.0, 71.0, 56.0, 23.0, 18.0, 16.0, 8.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-103.625, -100.4853515625, -97.345703125, -94.2060546875, -91.06640625, -87.9267578125, -84.787109375, -81.6474609375, -78.5078125, -75.3681640625, -72.228515625, -69.0888671875, -65.94921875, -62.8095703125, -59.669921875, -56.5302734375, -53.390625, -50.2509765625, -47.111328125, -43.9716796875, -40.83203125, -37.6923828125, -34.552734375, -31.4130859375, -28.2734375, -25.1337890625, -21.994140625, -18.8544921875, -15.71484375, -12.5751953125, -9.435546875, -6.2958984375, -3.15625, -0.0166015625, 3.123046875, 6.2626953125, 9.40234375, 12.5419921875, 15.681640625, 18.8212890625, 21.9609375, 25.1005859375, 28.240234375, 31.3798828125, 34.51953125, 37.6591796875, 40.798828125, 43.9384765625, 47.078125, 50.2177734375, 53.357421875, 56.4970703125, 59.63671875, 62.7763671875, 65.916015625, 69.0556640625, 72.1953125, 75.3349609375, 78.474609375, 81.6142578125, 84.75390625, 87.8935546875, 91.033203125, 94.1728515625, 97.3125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 13.0, 21.0, 28.0, 48.0, 82.0, 156.0, 228.0, 182.0, 114.0, 60.0, 30.0, 9.0, 7.0, 9.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022216796875, -0.020956993103027344, -0.019697189331054688, -0.01843738555908203, -0.017177581787109375, -0.01591777801513672, -0.014657974243164062, -0.013398170471191406, -0.01213836669921875, -0.010878562927246094, -0.009618759155273438, -0.008358955383300781, -0.007099151611328125, -0.005839347839355469, -0.0045795440673828125, -0.0033197402954101562, -0.0020599365234375, -0.0008001327514648438, 0.0004596710205078125, 0.0017194747924804688, 0.002979278564453125, 0.004239082336425781, 0.0054988861083984375, 0.006758689880371094, 0.00801849365234375, 0.009278297424316406, 0.010538101196289062, 0.011797904968261719, 0.013057708740234375, 0.014317512512207031, 0.015577316284179688, 0.016837120056152344, 0.018096923828125, 0.019356727600097656, 0.020616531372070312, 0.02187633514404297, 0.023136138916015625, 0.02439594268798828, 0.025655746459960938, 0.026915550231933594, 0.02817535400390625, 0.029435157775878906, 0.030694961547851562, 0.03195476531982422, 0.033214569091796875, 0.03447437286376953, 0.03573417663574219, 0.036993980407714844, 0.0382537841796875, 0.039513587951660156, 0.04077339172363281, 0.04203319549560547, 0.043292999267578125, 0.04455280303955078, 0.04581260681152344, 0.047072410583496094, 0.04833221435546875, 0.049592018127441406, 0.05085182189941406, 0.05211162567138672, 0.053371429443359375, 0.05463123321533203, 0.05589103698730469, 0.057150840759277344, 0.05841064453125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 5.0, 6.0, 13.0, 17.0, 27.0, 34.0, 70.0, 109.0, 154.0, 361.0, 752.0, 1953.0, 6387.0, 41782.0, 778075.0, 198024.0, 15166.0, 3355.0, 1092.0, 503.0, 295.0, 127.0, 87.0, 47.0, 24.0, 20.0, 14.0, 19.0, 6.0, 10.0, 6.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-134.5, -129.98046875, -125.4609375, -120.94140625, -116.421875, -111.90234375, -107.3828125, -102.86328125, -98.34375, -93.82421875, -89.3046875, -84.78515625, -80.265625, -75.74609375, -71.2265625, -66.70703125, -62.1875, -57.66796875, -53.1484375, -48.62890625, -44.109375, -39.58984375, -35.0703125, -30.55078125, -26.03125, -21.51171875, -16.9921875, -12.47265625, -7.953125, -3.43359375, 1.0859375, 5.60546875, 10.125, 14.64453125, 19.1640625, 23.68359375, 28.203125, 32.72265625, 37.2421875, 41.76171875, 46.28125, 50.80078125, 55.3203125, 59.83984375, 64.359375, 68.87890625, 73.3984375, 77.91796875, 82.4375, 86.95703125, 91.4765625, 95.99609375, 100.515625, 105.03515625, 109.5546875, 114.07421875, 118.59375, 123.11328125, 127.6328125, 132.15234375, 136.671875, 141.19140625, 145.7109375, 150.23046875, 154.75]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 5.0, 8.0, 15.0, 8.0, 23.0, 34.0, 60.0, 63.0, 120.0, 118.0, 128.0, 135.0, 92.0, 63.0, 33.0, 33.0, 16.0, 11.0, 8.0, 9.0, 7.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.28125, -52.42529296875, -49.5693359375, -46.71337890625, -43.857421875, -41.00146484375, -38.1455078125, -35.28955078125, -32.43359375, -29.57763671875, -26.7216796875, -23.86572265625, -21.009765625, -18.15380859375, -15.2978515625, -12.44189453125, -9.5859375, -6.72998046875, -3.8740234375, -1.01806640625, 1.837890625, 4.69384765625, 7.5498046875, 10.40576171875, 13.26171875, 16.11767578125, 18.9736328125, 21.82958984375, 24.685546875, 27.54150390625, 30.3974609375, 33.25341796875, 36.109375, 38.96533203125, 41.8212890625, 44.67724609375, 47.533203125, 50.38916015625, 53.2451171875, 56.10107421875, 58.95703125, 61.81298828125, 64.6689453125, 67.52490234375, 70.380859375, 73.23681640625, 76.0927734375, 78.94873046875, 81.8046875, 84.66064453125, 87.5166015625, 90.37255859375, 93.228515625, 96.08447265625, 98.9404296875, 101.79638671875, 104.65234375, 107.50830078125, 110.3642578125, 113.22021484375, 116.076171875, 118.93212890625, 121.7880859375, 124.64404296875, 127.5]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 5.0, 5.0, 12.0, 22.0, 59.0, 108.0, 207.0, 242.0, 176.0, 78.0, 47.0, 23.0, 17.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3731.10546875, -3645.3759765625, -3559.646484375, -3473.9169921875, -3388.1875, -3302.458251953125, -3216.728759765625, -3130.999267578125, -3045.269775390625, -2959.540283203125, -2873.810791015625, -2788.081298828125, -2702.35205078125, -2616.62255859375, -2530.89306640625, -2445.16357421875, -2359.43408203125, -2273.70458984375, -2187.97509765625, -2102.24560546875, -2016.5162353515625, -1930.7867431640625, -1845.057373046875, -1759.327880859375, -1673.598388671875, -1587.868896484375, -1502.139404296875, -1416.4100341796875, -1330.6805419921875, -1244.9510498046875, -1159.2216796875, -1073.4921875, -987.7628173828125, -902.0333251953125, -816.3038940429688, -730.574462890625, -644.844970703125, -559.115478515625, -473.38604736328125, -387.6566162109375, -301.9271240234375, -216.19766235351562, -130.46820068359375, -44.738739013671875, 40.99072265625, 126.72018432617188, 212.44964599609375, 298.1790771484375, 383.9085693359375, 469.6380310058594, 555.3674926757812, 641.096923828125, 726.826416015625, 812.555908203125, 898.2853393554688, 984.0147705078125, 1069.7442626953125, 1155.4737548828125, 1241.203125, 1326.9326171875, 1412.662109375, 1498.3916015625, 1584.12109375, 1669.8504638671875, 1755.5799560546875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 7.0, 10.0, 8.0, 13.0, 19.0, 17.0, 21.0, 15.0, 19.0, 31.0, 37.0, 38.0, 46.0, 54.0, 69.0, 54.0, 58.0, 59.0, 47.0, 50.0, 59.0, 37.0, 42.0, 35.0, 34.0, 34.0, 18.0, 20.0, 13.0, 13.0, 4.0, 6.0, 7.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1028.7578125, -993.9733276367188, -959.1888427734375, -924.4044189453125, -889.6199340820312, -854.83544921875, -820.051025390625, -785.2665405273438, -750.4820556640625, -715.6975708007812, -680.9130859375, -646.128662109375, -611.3441772460938, -576.5596923828125, -541.7752685546875, -506.99078369140625, -472.206298828125, -437.42181396484375, -402.6373596191406, -367.8529052734375, -333.06842041015625, -298.283935546875, -263.4994812011719, -228.7150115966797, -193.9305419921875, -159.1460723876953, -124.36160278320312, -89.57713317871094, -54.79266357421875, -20.008193969726562, 14.776275634765625, 49.56074523925781, 84.3453369140625, 119.12980651855469, 153.91427612304688, 188.69874572753906, 223.48321533203125, 258.2677001953125, 293.0521545410156, 327.83660888671875, 362.62109375, 397.40557861328125, 432.1900329589844, 466.9744873046875, 501.75897216796875, 536.54345703125, 571.327880859375, 606.1123657226562, 640.8968505859375, 675.6813354492188, 710.4658203125, 745.250244140625, 780.0347290039062, 814.8192138671875, 849.6036376953125, 884.3881225585938, 919.172607421875, 953.9570922851562, 988.7415771484375, 1023.5260009765625, 1058.310546875, 1093.094970703125, 1127.87939453125, 1162.6639404296875, 1197.4483642578125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 6.0, 5.0, 9.0, 5.0, 12.0, 19.0, 16.0, 27.0, 24.0, 35.0, 42.0, 76.0, 64.0, 112.0, 128.0, 181.0, 209.0, 283.0, 393.0, 600.0, 915.0, 1767.0, 5137.0, 4165384.0, 12410.0, 2703.0, 1206.0, 662.0, 416.0, 348.0, 249.0, 173.0, 161.0, 112.0, 91.0, 65.0, 64.0, 41.0, 26.0, 27.0, 18.0, 18.0, 15.0, 7.0, 3.0, 7.0, 5.0, 3.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-291.5, -282.58984375, -273.6796875, -264.76953125, -255.859375, -246.94921875, -238.0390625, -229.12890625, -220.21875, -211.30859375, -202.3984375, -193.48828125, -184.578125, -175.66796875, -166.7578125, -157.84765625, -148.9375, -140.02734375, -131.1171875, -122.20703125, -113.296875, -104.38671875, -95.4765625, -86.56640625, -77.65625, -68.74609375, -59.8359375, -50.92578125, -42.015625, -33.10546875, -24.1953125, -15.28515625, -6.375, 2.53515625, 11.4453125, 20.35546875, 29.265625, 38.17578125, 47.0859375, 55.99609375, 64.90625, 73.81640625, 82.7265625, 91.63671875, 100.546875, 109.45703125, 118.3671875, 127.27734375, 136.1875, 145.09765625, 154.0078125, 162.91796875, 171.828125, 180.73828125, 189.6484375, 198.55859375, 207.46875, 216.37890625, 225.2890625, 234.19921875, 243.109375, 252.01953125, 260.9296875, 269.83984375, 278.75]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 12.0, 9.0, 17.0, 12.0, 13.0, 27.0, 19.0, 28.0, 35.0, 38.0, 39.0, 46.0, 36.0, 52.0, 54.0, 57.0, 53.0, 46.0, 51.0, 54.0, 42.0, 48.0, 37.0, 32.0, 18.0, 15.0, 14.0, 18.0, 18.0, 11.0, 11.0, 6.0, 8.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.75, -44.26318359375, -42.7763671875, -41.28955078125, -39.802734375, -38.31591796875, -36.8291015625, -35.34228515625, -33.85546875, -32.36865234375, -30.8818359375, -29.39501953125, -27.908203125, -26.42138671875, -24.9345703125, -23.44775390625, -21.9609375, -20.47412109375, -18.9873046875, -17.50048828125, -16.013671875, -14.52685546875, -13.0400390625, -11.55322265625, -10.06640625, -8.57958984375, -7.0927734375, -5.60595703125, -4.119140625, -2.63232421875, -1.1455078125, 0.34130859375, 1.828125, 3.31494140625, 4.8017578125, 6.28857421875, 7.775390625, 9.26220703125, 10.7490234375, 12.23583984375, 13.72265625, 15.20947265625, 16.6962890625, 18.18310546875, 19.669921875, 21.15673828125, 22.6435546875, 24.13037109375, 25.6171875, 27.10400390625, 28.5908203125, 30.07763671875, 31.564453125, 33.05126953125, 34.5380859375, 36.02490234375, 37.51171875, 38.99853515625, 40.4853515625, 41.97216796875, 43.458984375, 44.94580078125, 46.4326171875, 47.91943359375, 49.40625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 6.0, 4.0, 14.0, 20.0, 17.0, 26.0, 38.0, 40.0, 51.0, 72.0, 103.0, 120.0, 204.0, 260.0, 427.0, 655.0, 1186.0, 2632.0, 10167.0, 4155381.0, 15990.0, 3249.0, 1374.0, 731.0, 435.0, 306.0, 217.0, 144.0, 107.0, 92.0, 50.0, 39.0, 20.0, 24.0, 18.0, 22.0, 9.0, 12.0, 5.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-380.75, -368.69921875, -356.6484375, -344.59765625, -332.546875, -320.49609375, -308.4453125, -296.39453125, -284.34375, -272.29296875, -260.2421875, -248.19140625, -236.140625, -224.08984375, -212.0390625, -199.98828125, -187.9375, -175.88671875, -163.8359375, -151.78515625, -139.734375, -127.68359375, -115.6328125, -103.58203125, -91.53125, -79.48046875, -67.4296875, -55.37890625, -43.328125, -31.27734375, -19.2265625, -7.17578125, 4.875, 16.92578125, 28.9765625, 41.02734375, 53.078125, 65.12890625, 77.1796875, 89.23046875, 101.28125, 113.33203125, 125.3828125, 137.43359375, 149.484375, 161.53515625, 173.5859375, 185.63671875, 197.6875, 209.73828125, 221.7890625, 233.83984375, 245.890625, 257.94140625, 269.9921875, 282.04296875, 294.09375, 306.14453125, 318.1953125, 330.24609375, 342.296875, 354.34765625, 366.3984375, 378.44921875, 390.5]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 7.0, 16.0, 3904.0, 102.0, 19.0, 9.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.3125, -79.7314453125, -77.150390625, -74.5693359375, -71.98828125, -69.4072265625, -66.826171875, -64.2451171875, -61.6640625, -59.0830078125, -56.501953125, -53.9208984375, -51.33984375, -48.7587890625, -46.177734375, -43.5966796875, -41.015625, -38.4345703125, -35.853515625, -33.2724609375, -30.69140625, -28.1103515625, -25.529296875, -22.9482421875, -20.3671875, -17.7861328125, -15.205078125, -12.6240234375, -10.04296875, -7.4619140625, -4.880859375, -2.2998046875, 0.28125, 2.8623046875, 5.443359375, 8.0244140625, 10.60546875, 13.1865234375, 15.767578125, 18.3486328125, 20.9296875, 23.5107421875, 26.091796875, 28.6728515625, 31.25390625, 33.8349609375, 36.416015625, 38.9970703125, 41.578125, 44.1591796875, 46.740234375, 49.3212890625, 51.90234375, 54.4833984375, 57.064453125, 59.6455078125, 62.2265625, 64.8076171875, 67.388671875, 69.9697265625, 72.55078125, 75.1318359375, 77.712890625, 80.2939453125, 82.875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 5.0, 5.0, 8.0, 10.0, 19.0, 11.0, 22.0, 41.0, 63.0, 76.0, 78.0, 85.0, 115.0, 94.0, 100.0, 76.0, 47.0, 43.0, 26.0, 21.0, 15.0, 8.0, 8.0, 8.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.56581115722656, -161.5968017578125, -156.6278076171875, -151.6588134765625, -146.68980407714844, -141.72079467773438, -136.75180053710938, -131.78280639648438, -126.81379699707031, -121.84479522705078, -116.87579345703125, -111.90679168701172, -106.93778991699219, -101.96878814697266, -96.99978637695312, -92.0307846069336, -87.06178283691406, -82.09278106689453, -77.123779296875, -72.15477752685547, -67.18577575683594, -62.216773986816406, -57.247772216796875, -52.278770446777344, -47.30976867675781, -42.34076690673828, -37.37176513671875, -32.40276336669922, -27.433761596679688, -22.464759826660156, -17.495758056640625, -12.526756286621094, -7.5577392578125, -2.5887374877929688, 2.3802642822265625, 7.349266052246094, 12.318267822265625, 17.287269592285156, 22.256271362304688, 27.22527313232422, 32.19427490234375, 37.16327667236328, 42.13227844238281, 47.101280212402344, 52.070281982421875, 57.039283752441406, 62.00828552246094, 66.97728729248047, 71.9462890625, 76.91529083251953, 81.88429260253906, 86.8532943725586, 91.82229614257812, 96.79129791259766, 101.76029968261719, 106.72930145263672, 111.69830322265625, 116.66730499267578, 121.63630676269531, 126.60530853271484, 131.57431030273438, 136.54330444335938, 141.51231384277344, 146.4813232421875, 151.4503173828125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 11.0, 17.0, 9.0, 16.0, 13.0, 22.0, 16.0, 22.0, 28.0, 37.0, 25.0, 40.0, 29.0, 35.0, 49.0, 44.0, 47.0, 40.0, 47.0, 31.0, 34.0, 42.0, 37.0, 29.0, 37.0, 20.0, 33.0, 25.0, 26.0, 23.0, 13.0, 14.0, 19.0, 7.0, 9.0, 7.0, 8.0, 4.0, 6.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-76.51296997070312, -74.08256530761719, -71.65216064453125, -69.22174835205078, -66.79134368896484, -64.3609390258789, -61.93053436279297, -59.500125885009766, -57.06971740722656, -54.639312744140625, -52.20890426635742, -49.778499603271484, -47.34809112548828, -44.917686462402344, -42.487281799316406, -40.0568733215332, -37.626468658447266, -35.19606399536133, -32.765655517578125, -30.335250854492188, -27.904842376708984, -25.474437713623047, -23.044031143188477, -20.613624572753906, -18.183218002319336, -15.752811431884766, -13.322404861450195, -10.891999244689941, -8.461592674255371, -6.031186103820801, -3.600780487060547, -1.1703739166259766, 1.2600326538085938, 3.690438985824585, 6.120845317840576, 8.551251411437988, 10.981657981872559, 13.412064552307129, 15.842470169067383, 18.272876739501953, 20.703283309936523, 23.133689880371094, 25.564096450805664, 27.994503021240234, 30.424907684326172, 32.855316162109375, 35.28572082519531, 37.71612548828125, 40.14653396606445, 42.57693862915039, 45.007347106933594, 47.43775177001953, 49.868160247802734, 52.29856491088867, 54.728973388671875, 57.15937805175781, 59.58978271484375, 62.02018737792969, 64.45059204101562, 66.8810043334961, 69.31140899658203, 71.74181365966797, 74.1722183227539, 76.60263061523438, 79.03303527832031]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 8.0, 9.0, 13.0, 17.0, 18.0, 28.0, 50.0, 63.0, 93.0, 145.0, 226.0, 292.0, 510.0, 727.0, 1228.0, 2205.0, 4259.0, 9036.0, 22181.0, 63455.0, 233213.0, 496910.0, 140574.0, 42745.0, 15744.0, 6734.0, 3303.0, 1810.0, 1061.0, 655.0, 411.0, 250.0, 203.0, 113.0, 83.0, 50.0, 46.0, 22.0, 19.0, 18.0, 13.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-132.5, -128.400390625, -124.30078125, -120.201171875, -116.1015625, -112.001953125, -107.90234375, -103.802734375, -99.703125, -95.603515625, -91.50390625, -87.404296875, -83.3046875, -79.205078125, -75.10546875, -71.005859375, -66.90625, -62.806640625, -58.70703125, -54.607421875, -50.5078125, -46.408203125, -42.30859375, -38.208984375, -34.109375, -30.009765625, -25.91015625, -21.810546875, -17.7109375, -13.611328125, -9.51171875, -5.412109375, -1.3125, 2.787109375, 6.88671875, 10.986328125, 15.0859375, 19.185546875, 23.28515625, 27.384765625, 31.484375, 35.583984375, 39.68359375, 43.783203125, 47.8828125, 51.982421875, 56.08203125, 60.181640625, 64.28125, 68.380859375, 72.48046875, 76.580078125, 80.6796875, 84.779296875, 88.87890625, 92.978515625, 97.078125, 101.177734375, 105.27734375, 109.376953125, 113.4765625, 117.576171875, 121.67578125, 125.775390625, 129.875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 10.0, 7.0, 6.0, 19.0, 8.0, 15.0, 22.0, 16.0, 32.0, 36.0, 38.0, 43.0, 36.0, 49.0, 53.0, 53.0, 51.0, 39.0, 54.0, 42.0, 47.0, 31.0, 48.0, 51.0, 34.0, 25.0, 23.0, 18.0, 17.0, 14.0, 10.0, 11.0, 6.0, 7.0, 1.0, 9.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-49.78125, -48.2314453125, -46.681640625, -45.1318359375, -43.58203125, -42.0322265625, -40.482421875, -38.9326171875, -37.3828125, -35.8330078125, -34.283203125, -32.7333984375, -31.18359375, -29.6337890625, -28.083984375, -26.5341796875, -24.984375, -23.4345703125, -21.884765625, -20.3349609375, -18.78515625, -17.2353515625, -15.685546875, -14.1357421875, -12.5859375, -11.0361328125, -9.486328125, -7.9365234375, -6.38671875, -4.8369140625, -3.287109375, -1.7373046875, -0.1875, 1.3623046875, 2.912109375, 4.4619140625, 6.01171875, 7.5615234375, 9.111328125, 10.6611328125, 12.2109375, 13.7607421875, 15.310546875, 16.8603515625, 18.41015625, 19.9599609375, 21.509765625, 23.0595703125, 24.609375, 26.1591796875, 27.708984375, 29.2587890625, 30.80859375, 32.3583984375, 33.908203125, 35.4580078125, 37.0078125, 38.5576171875, 40.107421875, 41.6572265625, 43.20703125, 44.7568359375, 46.306640625, 47.8564453125, 49.40625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 7.0, 9.0, 7.0, 15.0, 22.0, 23.0, 43.0, 61.0, 77.0, 145.0, 219.0, 350.0, 622.0, 1250.0, 2873.0, 7816.0, 27196.0, 148564.0, 689299.0, 132217.0, 25100.0, 7295.0, 2611.0, 1165.0, 610.0, 336.0, 199.0, 125.0, 90.0, 41.0, 41.0, 26.0, 22.0, 19.0, 19.0, 7.0, 6.0, 5.0, 1.0, 3.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-176.125, -171.015625, -165.90625, -160.796875, -155.6875, -150.578125, -145.46875, -140.359375, -135.25, -130.140625, -125.03125, -119.921875, -114.8125, -109.703125, -104.59375, -99.484375, -94.375, -89.265625, -84.15625, -79.046875, -73.9375, -68.828125, -63.71875, -58.609375, -53.5, -48.390625, -43.28125, -38.171875, -33.0625, -27.953125, -22.84375, -17.734375, -12.625, -7.515625, -2.40625, 2.703125, 7.8125, 12.921875, 18.03125, 23.140625, 28.25, 33.359375, 38.46875, 43.578125, 48.6875, 53.796875, 58.90625, 64.015625, 69.125, 74.234375, 79.34375, 84.453125, 89.5625, 94.671875, 99.78125, 104.890625, 110.0, 115.109375, 120.21875, 125.328125, 130.4375, 135.546875, 140.65625, 145.765625, 150.875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 10.0, 5.0, 17.0, 13.0, 21.0, 17.0, 34.0, 29.0, 29.0, 33.0, 43.0, 39.0, 35.0, 50.0, 62.0, 52.0, 56.0, 57.0, 55.0, 54.0, 46.0, 30.0, 32.0, 34.0, 28.0, 27.0, 16.0, 15.0, 12.0, 10.0, 13.0, 7.0, 4.0, 6.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-190.375, -183.169921875, -175.96484375, -168.759765625, -161.5546875, -154.349609375, -147.14453125, -139.939453125, -132.734375, -125.529296875, -118.32421875, -111.119140625, -103.9140625, -96.708984375, -89.50390625, -82.298828125, -75.09375, -67.888671875, -60.68359375, -53.478515625, -46.2734375, -39.068359375, -31.86328125, -24.658203125, -17.453125, -10.248046875, -3.04296875, 4.162109375, 11.3671875, 18.572265625, 25.77734375, 32.982421875, 40.1875, 47.392578125, 54.59765625, 61.802734375, 69.0078125, 76.212890625, 83.41796875, 90.623046875, 97.828125, 105.033203125, 112.23828125, 119.443359375, 126.6484375, 133.853515625, 141.05859375, 148.263671875, 155.46875, 162.673828125, 169.87890625, 177.083984375, 184.2890625, 191.494140625, 198.69921875, 205.904296875, 213.109375, 220.314453125, 227.51953125, 234.724609375, 241.9296875, 249.134765625, 256.33984375, 263.544921875, 270.75]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 11.0, 14.0, 16.0, 36.0, 64.0, 163.0, 449.0, 1240.0, 4621.0, 36494.0, 915505.0, 80618.0, 6809.0, 1616.0, 525.0, 184.0, 84.0, 41.0, 24.0, 15.0, 4.0, 9.0, 1.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-209.25, -203.83203125, -198.4140625, -192.99609375, -187.578125, -182.16015625, -176.7421875, -171.32421875, -165.90625, -160.48828125, -155.0703125, -149.65234375, -144.234375, -138.81640625, -133.3984375, -127.98046875, -122.5625, -117.14453125, -111.7265625, -106.30859375, -100.890625, -95.47265625, -90.0546875, -84.63671875, -79.21875, -73.80078125, -68.3828125, -62.96484375, -57.546875, -52.12890625, -46.7109375, -41.29296875, -35.875, -30.45703125, -25.0390625, -19.62109375, -14.203125, -8.78515625, -3.3671875, 2.05078125, 7.46875, 12.88671875, 18.3046875, 23.72265625, 29.140625, 34.55859375, 39.9765625, 45.39453125, 50.8125, 56.23046875, 61.6484375, 67.06640625, 72.484375, 77.90234375, 83.3203125, 88.73828125, 94.15625, 99.57421875, 104.9921875, 110.41015625, 115.828125, 121.24609375, 126.6640625, 132.08203125, 137.5]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 9.0, 3.0, 11.0, 8.0, 9.0, 18.0, 26.0, 24.0, 36.0, 52.0, 81.0, 153.0, 151.0, 126.0, 83.0, 60.0, 39.0, 28.0, 21.0, 18.0, 10.0, 10.0, 9.0, 8.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01995849609375, -0.019141197204589844, -0.018323898315429688, -0.01750659942626953, -0.016689300537109375, -0.01587200164794922, -0.015054702758789062, -0.014237403869628906, -0.01342010498046875, -0.012602806091308594, -0.011785507202148438, -0.010968208312988281, -0.010150909423828125, -0.009333610534667969, -0.008516311645507812, -0.007699012756347656, -0.0068817138671875, -0.006064414978027344, -0.0052471160888671875, -0.004429817199707031, -0.003612518310546875, -0.0027952194213867188, -0.0019779205322265625, -0.0011606216430664062, -0.00034332275390625, 0.00047397613525390625, 0.0012912750244140625, 0.0021085739135742188, 0.002925872802734375, 0.0037431716918945312, 0.0045604705810546875, 0.005377769470214844, 0.006195068359375, 0.007012367248535156, 0.007829666137695312, 0.008646965026855469, 0.009464263916015625, 0.010281562805175781, 0.011098861694335938, 0.011916160583496094, 0.01273345947265625, 0.013550758361816406, 0.014368057250976562, 0.015185356140136719, 0.016002655029296875, 0.01681995391845703, 0.017637252807617188, 0.018454551696777344, 0.0192718505859375, 0.020089149475097656, 0.020906448364257812, 0.02172374725341797, 0.022541046142578125, 0.02335834503173828, 0.024175643920898438, 0.024992942810058594, 0.02581024169921875, 0.026627540588378906, 0.027444839477539062, 0.02826213836669922, 0.029079437255859375, 0.02989673614501953, 0.030714035034179688, 0.031531333923339844, 0.0323486328125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 7.0, 15.0, 7.0, 10.0, 23.0, 40.0, 87.0, 106.0, 255.0, 658.0, 3243.0, 46045.0, 951014.0, 42775.0, 3096.0, 648.0, 248.0, 111.0, 62.0, 38.0, 26.0, 15.0, 12.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-178.375, -171.376953125, -164.37890625, -157.380859375, -150.3828125, -143.384765625, -136.38671875, -129.388671875, -122.390625, -115.392578125, -108.39453125, -101.396484375, -94.3984375, -87.400390625, -80.40234375, -73.404296875, -66.40625, -59.408203125, -52.41015625, -45.412109375, -38.4140625, -31.416015625, -24.41796875, -17.419921875, -10.421875, -3.423828125, 3.57421875, 10.572265625, 17.5703125, 24.568359375, 31.56640625, 38.564453125, 45.5625, 52.560546875, 59.55859375, 66.556640625, 73.5546875, 80.552734375, 87.55078125, 94.548828125, 101.546875, 108.544921875, 115.54296875, 122.541015625, 129.5390625, 136.537109375, 143.53515625, 150.533203125, 157.53125, 164.529296875, 171.52734375, 178.525390625, 185.5234375, 192.521484375, 199.51953125, 206.517578125, 213.515625, 220.513671875, 227.51171875, 234.509765625, 241.5078125, 248.505859375, 255.50390625, 262.501953125, 269.5]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 9.0, 9.0, 25.0, 43.0, 110.0, 216.0, 314.0, 154.0, 59.0, 33.0, 21.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.25, -102.11328125, -94.9765625, -87.83984375, -80.703125, -73.56640625, -66.4296875, -59.29296875, -52.15625, -45.01953125, -37.8828125, -30.74609375, -23.609375, -16.47265625, -9.3359375, -2.19921875, 4.9375, 12.07421875, 19.2109375, 26.34765625, 33.484375, 40.62109375, 47.7578125, 54.89453125, 62.03125, 69.16796875, 76.3046875, 83.44140625, 90.578125, 97.71484375, 104.8515625, 111.98828125, 119.125, 126.26171875, 133.3984375, 140.53515625, 147.671875, 154.80859375, 161.9453125, 169.08203125, 176.21875, 183.35546875, 190.4921875, 197.62890625, 204.765625, 211.90234375, 219.0390625, 226.17578125, 233.3125, 240.44921875, 247.5859375, 254.72265625, 261.859375, 268.99609375, 276.1328125, 283.26953125, 290.40625, 297.54296875, 304.6796875, 311.81640625, 318.953125, 326.08984375, 333.2265625, 340.36328125, 347.5]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 26.0, 77.0, 188.0, 304.0, 244.0, 104.0, 35.0, 10.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2995.394287109375, -2897.577392578125, -2799.760498046875, -2701.943359375, -2604.12646484375, -2506.3095703125, -2408.49267578125, -2310.67578125, -2212.85888671875, -2115.0419921875, -2017.2249755859375, -1919.4080810546875, -1821.591064453125, -1723.774169921875, -1625.957275390625, -1528.140380859375, -1430.3232421875, -1332.50634765625, -1234.6893310546875, -1136.8724365234375, -1039.055419921875, -941.238525390625, -843.421630859375, -745.6046752929688, -647.7877197265625, -549.9707641601562, -452.1538391113281, -354.3369140625, -256.51995849609375, -158.7030029296875, -60.8861083984375, 36.93084716796875, 134.747802734375, 232.5647430419922, 330.3816833496094, 428.1986083984375, 526.0155639648438, 623.83251953125, 721.6494140625, 819.4663696289062, 917.2833251953125, 1015.1002807617188, 1112.917236328125, 1210.734130859375, 1308.551025390625, 1406.3680419921875, 1504.1849365234375, 1602.001953125, 1699.81884765625, 1797.6357421875, 1895.4527587890625, 1993.2696533203125, 2091.086669921875, 2188.903564453125, 2286.720458984375, 2384.537353515625, 2482.3544921875, 2580.17138671875, 2677.98828125, 2775.80517578125, 2873.622314453125, 2971.439208984375, 3069.256103515625, 3167.072998046875, 3264.889892578125]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 4.0, 8.0, 7.0, 7.0, 12.0, 9.0, 12.0, 14.0, 14.0, 15.0, 17.0, 19.0, 23.0, 26.0, 29.0, 33.0, 30.0, 39.0, 45.0, 50.0, 50.0, 39.0, 47.0, 56.0, 50.0, 47.0, 37.0, 25.0, 32.0, 25.0, 23.0, 23.0, 21.0, 14.0, 19.0, 10.0, 16.0, 9.0, 7.0, 4.0, 3.0, 1.0, 8.0, 5.0, 4.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-890.6057739257812, -863.0966796875, -835.587646484375, -808.0785522460938, -780.5695190429688, -753.0604248046875, -725.5513916015625, -698.0422973632812, -670.533203125, -643.0241088867188, -615.5150756835938, -588.0059814453125, -560.4969482421875, -532.9878540039062, -505.4787902832031, -477.9697265625, -450.460693359375, -422.9516296386719, -395.44256591796875, -367.9334716796875, -340.4244384765625, -312.91534423828125, -285.4062805175781, -257.897216796875, -230.38815307617188, -202.87908935546875, -175.37002563476562, -147.86094665527344, -120.35188293457031, -92.84281921386719, -65.333740234375, -37.824676513671875, -10.3155517578125, 17.19351577758789, 44.70258331298828, 72.21165466308594, 99.72071838378906, 127.22978210449219, 154.73886108398438, 182.2479248046875, 209.75698852539062, 237.26605224609375, 264.7751159667969, 292.2841796875, 319.79327392578125, 347.30230712890625, 374.8114013671875, 402.3204650878906, 429.82952880859375, 457.3385925292969, 484.84765625, 512.3567504882812, 539.8657836914062, 567.3748779296875, 594.8839111328125, 622.3930053710938, 649.902099609375, 677.4111938476562, 704.9202270507812, 732.4293212890625, 759.9383544921875, 787.4474487304688, 814.95654296875, 842.465576171875, 869.974609375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 8.0, 8.0, 17.0, 15.0, 15.0, 36.0, 36.0, 46.0, 55.0, 74.0, 95.0, 116.0, 218.0, 281.0, 435.0, 709.0, 1223.0, 2188.0, 4830.0, 15213.0, 4094330.0, 58181.0, 8412.0, 3318.0, 1690.0, 883.0, 569.0, 378.0, 229.0, 170.0, 115.0, 89.0, 52.0, 61.0, 43.0, 32.0, 25.0, 17.0, 15.0, 13.0, 14.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0], "bins": [-258.5, -250.3671875, -242.234375, -234.1015625, -225.96875, -217.8359375, -209.703125, -201.5703125, -193.4375, -185.3046875, -177.171875, -169.0390625, -160.90625, -152.7734375, -144.640625, -136.5078125, -128.375, -120.2421875, -112.109375, -103.9765625, -95.84375, -87.7109375, -79.578125, -71.4453125, -63.3125, -55.1796875, -47.046875, -38.9140625, -30.78125, -22.6484375, -14.515625, -6.3828125, 1.75, 9.8828125, 18.015625, 26.1484375, 34.28125, 42.4140625, 50.546875, 58.6796875, 66.8125, 74.9453125, 83.078125, 91.2109375, 99.34375, 107.4765625, 115.609375, 123.7421875, 131.875, 140.0078125, 148.140625, 156.2734375, 164.40625, 172.5390625, 180.671875, 188.8046875, 196.9375, 205.0703125, 213.203125, 221.3359375, 229.46875, 237.6015625, 245.734375, 253.8671875, 262.0]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 11.0, 5.0, 11.0, 6.0, 12.0, 14.0, 18.0, 24.0, 23.0, 37.0, 33.0, 33.0, 36.0, 44.0, 56.0, 43.0, 46.0, 50.0, 57.0, 49.0, 43.0, 32.0, 51.0, 39.0, 33.0, 43.0, 17.0, 19.0, 15.0, 18.0, 12.0, 7.0, 13.0, 9.0, 8.0, 8.0, 5.0, 3.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-47.0, -45.47607421875, -43.9521484375, -42.42822265625, -40.904296875, -39.38037109375, -37.8564453125, -36.33251953125, -34.80859375, -33.28466796875, -31.7607421875, -30.23681640625, -28.712890625, -27.18896484375, -25.6650390625, -24.14111328125, -22.6171875, -21.09326171875, -19.5693359375, -18.04541015625, -16.521484375, -14.99755859375, -13.4736328125, -11.94970703125, -10.42578125, -8.90185546875, -7.3779296875, -5.85400390625, -4.330078125, -2.80615234375, -1.2822265625, 0.24169921875, 1.765625, 3.28955078125, 4.8134765625, 6.33740234375, 7.861328125, 9.38525390625, 10.9091796875, 12.43310546875, 13.95703125, 15.48095703125, 17.0048828125, 18.52880859375, 20.052734375, 21.57666015625, 23.1005859375, 24.62451171875, 26.1484375, 27.67236328125, 29.1962890625, 30.72021484375, 32.244140625, 33.76806640625, 35.2919921875, 36.81591796875, 38.33984375, 39.86376953125, 41.3876953125, 42.91162109375, 44.435546875, 45.95947265625, 47.4833984375, 49.00732421875, 50.53125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 8.0, 11.0, 20.0, 22.0, 48.0, 49.0, 85.0, 159.0, 222.0, 423.0, 696.0, 1305.0, 2630.0, 5881.0, 19027.0, 3952864.0, 185909.0, 14756.0, 5080.0, 2264.0, 1215.0, 626.0, 370.0, 202.0, 151.0, 86.0, 62.0, 29.0, 21.0, 17.0, 10.0, 15.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-318.75, -308.76171875, -298.7734375, -288.78515625, -278.796875, -268.80859375, -258.8203125, -248.83203125, -238.84375, -228.85546875, -218.8671875, -208.87890625, -198.890625, -188.90234375, -178.9140625, -168.92578125, -158.9375, -148.94921875, -138.9609375, -128.97265625, -118.984375, -108.99609375, -99.0078125, -89.01953125, -79.03125, -69.04296875, -59.0546875, -49.06640625, -39.078125, -29.08984375, -19.1015625, -9.11328125, 0.875, 10.86328125, 20.8515625, 30.83984375, 40.828125, 50.81640625, 60.8046875, 70.79296875, 80.78125, 90.76953125, 100.7578125, 110.74609375, 120.734375, 130.72265625, 140.7109375, 150.69921875, 160.6875, 170.67578125, 180.6640625, 190.65234375, 200.640625, 210.62890625, 220.6171875, 230.60546875, 240.59375, 250.58203125, 260.5703125, 270.55859375, 280.546875, 290.53515625, 300.5234375, 310.51171875, 320.5]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 7.0, 7.0, 13.0, 23.0, 43.0, 125.0, 3644.0, 98.0, 46.0, 12.0, 12.0, 12.0, 6.0, 7.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.25, -106.37890625, -102.5078125, -98.63671875, -94.765625, -90.89453125, -87.0234375, -83.15234375, -79.28125, -75.41015625, -71.5390625, -67.66796875, -63.796875, -59.92578125, -56.0546875, -52.18359375, -48.3125, -44.44140625, -40.5703125, -36.69921875, -32.828125, -28.95703125, -25.0859375, -21.21484375, -17.34375, -13.47265625, -9.6015625, -5.73046875, -1.859375, 2.01171875, 5.8828125, 9.75390625, 13.625, 17.49609375, 21.3671875, 25.23828125, 29.109375, 32.98046875, 36.8515625, 40.72265625, 44.59375, 48.46484375, 52.3359375, 56.20703125, 60.078125, 63.94921875, 67.8203125, 71.69140625, 75.5625, 79.43359375, 83.3046875, 87.17578125, 91.046875, 94.91796875, 98.7890625, 102.66015625, 106.53125, 110.40234375, 114.2734375, 118.14453125, 122.015625, 125.88671875, 129.7578125, 133.62890625, 137.5]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 2.0, 2.0, 8.0, 4.0, 10.0, 15.0, 30.0, 42.0, 58.0, 86.0, 117.0, 136.0, 144.0, 104.0, 76.0, 46.0, 43.0, 28.0, 18.0, 5.0, 6.0, 4.0, 12.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-458.49542236328125, -444.99444580078125, -431.4934387207031, -417.9924621582031, -404.491455078125, -390.990478515625, -377.489501953125, -363.988525390625, -350.4875183105469, -336.9865417480469, -323.48553466796875, -309.98455810546875, -296.48358154296875, -282.9825744628906, -269.4815979003906, -255.98060607910156, -242.4796142578125, -228.97862243652344, -215.47763061523438, -201.97665405273438, -188.4756622314453, -174.97467041015625, -161.47369384765625, -147.9727020263672, -134.47171020507812, -120.97071838378906, -107.46973419189453, -93.96875, -80.46775817871094, -66.96676635742188, -53.465782165527344, -39.96479797363281, -26.463775634765625, -12.962787628173828, 0.5382003784179688, 14.039188385009766, 27.540176391601562, 41.041168212890625, 54.542152404785156, 68.04313659667969, 81.54412841796875, 95.04512023925781, 108.54610443115234, 122.04708862304688, 135.54808044433594, 149.049072265625, 162.550048828125, 176.05104064941406, 189.55203247070312, 203.0530242919922, 216.55401611328125, 230.05499267578125, 243.5559844970703, 257.0569763183594, 270.5579528808594, 284.0589599609375, 297.5599365234375, 311.0609130859375, 324.5619201660156, 338.0628967285156, 351.56390380859375, 365.06488037109375, 378.56585693359375, 392.06683349609375, 405.5678405761719]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 1.0, 1.0, 4.0, 6.0, 4.0, 7.0, 9.0, 9.0, 22.0, 10.0, 17.0, 20.0, 20.0, 30.0, 32.0, 28.0, 41.0, 42.0, 43.0, 47.0, 51.0, 45.0, 60.0, 55.0, 38.0, 44.0, 39.0, 33.0, 29.0, 36.0, 20.0, 22.0, 19.0, 23.0, 16.0, 16.0, 16.0, 10.0, 6.0, 6.0, 4.0, 7.0, 4.0, 4.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-227.385498046875, -220.46206665039062, -213.5386505126953, -206.61521911621094, -199.69180297851562, -192.76837158203125, -185.84494018554688, -178.9215087890625, -171.9980926513672, -165.0746612548828, -158.1512451171875, -151.22781372070312, -144.30438232421875, -137.38096618652344, -130.45753479003906, -123.53411102294922, -116.61068725585938, -109.68726348876953, -102.76383972167969, -95.84040832519531, -88.91698455810547, -81.99356079101562, -75.07012939453125, -68.1467056274414, -61.22328186035156, -54.29985809326172, -47.37643051147461, -40.4530029296875, -33.529579162597656, -26.606155395507812, -19.682727813720703, -12.759300231933594, -5.8358917236328125, 1.087533950805664, 8.01095962524414, 14.934385299682617, 21.857810974121094, 28.781234741210938, 35.70466232299805, 42.628089904785156, 49.551513671875, 56.474937438964844, 63.39836502075195, 70.32179260253906, 77.2452163696289, 84.16864013671875, 91.09207153320312, 98.01549530029297, 104.93891906738281, 111.86234283447266, 118.7857666015625, 125.70919799804688, 132.63262939453125, 139.55604553222656, 146.47947692871094, 153.40289306640625, 160.32632446289062, 167.249755859375, 174.1731719970703, 181.0966033935547, 188.02001953125, 194.94345092773438, 201.86688232421875, 208.79031372070312, 215.71372985839844]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 10.0, 11.0, 21.0, 43.0, 41.0, 73.0, 112.0, 165.0, 319.0, 468.0, 897.0, 1678.0, 3198.0, 6688.0, 14824.0, 36220.0, 98647.0, 334594.0, 372618.0, 108152.0, 39625.0, 15820.0, 7106.0, 3462.0, 1634.0, 810.0, 512.0, 275.0, 177.0, 104.0, 59.0, 52.0, 43.0, 35.0, 16.0, 13.0, 5.0, 2.0, 4.0, 8.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.125, -128.541015625, -123.95703125, -119.373046875, -114.7890625, -110.205078125, -105.62109375, -101.037109375, -96.453125, -91.869140625, -87.28515625, -82.701171875, -78.1171875, -73.533203125, -68.94921875, -64.365234375, -59.78125, -55.197265625, -50.61328125, -46.029296875, -41.4453125, -36.861328125, -32.27734375, -27.693359375, -23.109375, -18.525390625, -13.94140625, -9.357421875, -4.7734375, -0.189453125, 4.39453125, 8.978515625, 13.5625, 18.146484375, 22.73046875, 27.314453125, 31.8984375, 36.482421875, 41.06640625, 45.650390625, 50.234375, 54.818359375, 59.40234375, 63.986328125, 68.5703125, 73.154296875, 77.73828125, 82.322265625, 86.90625, 91.490234375, 96.07421875, 100.658203125, 105.2421875, 109.826171875, 114.41015625, 118.994140625, 123.578125, 128.162109375, 132.74609375, 137.330078125, 141.9140625, 146.498046875, 151.08203125, 155.666015625, 160.25]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 4.0, 4.0, 10.0, 12.0, 10.0, 14.0, 22.0, 21.0, 36.0, 31.0, 44.0, 45.0, 48.0, 47.0, 67.0, 75.0, 65.0, 55.0, 48.0, 47.0, 55.0, 38.0, 41.0, 32.0, 28.0, 14.0, 11.0, 20.0, 11.0, 11.0, 9.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.25, -63.27880859375, -61.3076171875, -59.33642578125, -57.365234375, -55.39404296875, -53.4228515625, -51.45166015625, -49.48046875, -47.50927734375, -45.5380859375, -43.56689453125, -41.595703125, -39.62451171875, -37.6533203125, -35.68212890625, -33.7109375, -31.73974609375, -29.7685546875, -27.79736328125, -25.826171875, -23.85498046875, -21.8837890625, -19.91259765625, -17.94140625, -15.97021484375, -13.9990234375, -12.02783203125, -10.056640625, -8.08544921875, -6.1142578125, -4.14306640625, -2.171875, -0.20068359375, 1.7705078125, 3.74169921875, 5.712890625, 7.68408203125, 9.6552734375, 11.62646484375, 13.59765625, 15.56884765625, 17.5400390625, 19.51123046875, 21.482421875, 23.45361328125, 25.4248046875, 27.39599609375, 29.3671875, 31.33837890625, 33.3095703125, 35.28076171875, 37.251953125, 39.22314453125, 41.1943359375, 43.16552734375, 45.13671875, 47.10791015625, 49.0791015625, 51.05029296875, 53.021484375, 54.99267578125, 56.9638671875, 58.93505859375, 60.90625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 7.0, 4.0, 3.0, 11.0, 20.0, 21.0, 40.0, 41.0, 59.0, 99.0, 110.0, 173.0, 264.0, 390.0, 590.0, 1028.0, 1847.0, 3608.0, 8797.0, 25701.0, 101468.0, 577890.0, 249482.0, 50221.0, 14922.0, 5637.0, 2519.0, 1347.0, 813.0, 460.0, 270.0, 200.0, 152.0, 92.0, 71.0, 55.0, 35.0, 30.0, 14.0, 12.0, 15.0, 11.0, 6.0, 5.0, 0.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-160.875, -155.46875, -150.0625, -144.65625, -139.25, -133.84375, -128.4375, -123.03125, -117.625, -112.21875, -106.8125, -101.40625, -96.0, -90.59375, -85.1875, -79.78125, -74.375, -68.96875, -63.5625, -58.15625, -52.75, -47.34375, -41.9375, -36.53125, -31.125, -25.71875, -20.3125, -14.90625, -9.5, -4.09375, 1.3125, 6.71875, 12.125, 17.53125, 22.9375, 28.34375, 33.75, 39.15625, 44.5625, 49.96875, 55.375, 60.78125, 66.1875, 71.59375, 77.0, 82.40625, 87.8125, 93.21875, 98.625, 104.03125, 109.4375, 114.84375, 120.25, 125.65625, 131.0625, 136.46875, 141.875, 147.28125, 152.6875, 158.09375, 163.5, 168.90625, 174.3125, 179.71875, 185.125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 2.0, 3.0, 7.0, 10.0, 13.0, 13.0, 22.0, 27.0, 28.0, 29.0, 39.0, 40.0, 48.0, 50.0, 52.0, 40.0, 45.0, 58.0, 64.0, 45.0, 52.0, 39.0, 41.0, 40.0, 38.0, 29.0, 22.0, 25.0, 16.0, 13.0, 11.0, 7.0, 9.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-198.625, -191.095703125, -183.56640625, -176.037109375, -168.5078125, -160.978515625, -153.44921875, -145.919921875, -138.390625, -130.861328125, -123.33203125, -115.802734375, -108.2734375, -100.744140625, -93.21484375, -85.685546875, -78.15625, -70.626953125, -63.09765625, -55.568359375, -48.0390625, -40.509765625, -32.98046875, -25.451171875, -17.921875, -10.392578125, -2.86328125, 4.666015625, 12.1953125, 19.724609375, 27.25390625, 34.783203125, 42.3125, 49.841796875, 57.37109375, 64.900390625, 72.4296875, 79.958984375, 87.48828125, 95.017578125, 102.546875, 110.076171875, 117.60546875, 125.134765625, 132.6640625, 140.193359375, 147.72265625, 155.251953125, 162.78125, 170.310546875, 177.83984375, 185.369140625, 192.8984375, 200.427734375, 207.95703125, 215.486328125, 223.015625, 230.544921875, 238.07421875, 245.603515625, 253.1328125, 260.662109375, 268.19140625, 275.720703125, 283.25]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 8.0, 17.0, 14.0, 23.0, 39.0, 79.0, 150.0, 380.0, 953.0, 2970.0, 11800.0, 88416.0, 769582.0, 151107.0, 17012.0, 3863.0, 1206.0, 468.0, 230.0, 91.0, 52.0, 30.0, 21.0, 11.0, 9.0, 10.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.125, -95.369140625, -92.61328125, -89.857421875, -87.1015625, -84.345703125, -81.58984375, -78.833984375, -76.078125, -73.322265625, -70.56640625, -67.810546875, -65.0546875, -62.298828125, -59.54296875, -56.787109375, -54.03125, -51.275390625, -48.51953125, -45.763671875, -43.0078125, -40.251953125, -37.49609375, -34.740234375, -31.984375, -29.228515625, -26.47265625, -23.716796875, -20.9609375, -18.205078125, -15.44921875, -12.693359375, -9.9375, -7.181640625, -4.42578125, -1.669921875, 1.0859375, 3.841796875, 6.59765625, 9.353515625, 12.109375, 14.865234375, 17.62109375, 20.376953125, 23.1328125, 25.888671875, 28.64453125, 31.400390625, 34.15625, 36.912109375, 39.66796875, 42.423828125, 45.1796875, 47.935546875, 50.69140625, 53.447265625, 56.203125, 58.958984375, 61.71484375, 64.470703125, 67.2265625, 69.982421875, 72.73828125, 75.494140625, 78.25]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 4.0, 3.0, 8.0, 13.0, 12.0, 18.0, 19.0, 34.0, 34.0, 36.0, 29.0, 45.0, 54.0, 73.0, 115.0, 81.0, 86.0, 72.0, 44.0, 40.0, 26.0, 27.0, 20.0, 14.0, 14.0, 8.0, 11.0, 14.0, 4.0, 9.0, 3.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01447296142578125, -0.01399219036102295, -0.013511419296264648, -0.013030648231506348, -0.012549877166748047, -0.012069106101989746, -0.011588335037231445, -0.011107563972473145, -0.010626792907714844, -0.010146021842956543, -0.009665250778198242, -0.009184479713439941, -0.00870370864868164, -0.00822293758392334, -0.007742166519165039, -0.007261395454406738, -0.0067806243896484375, -0.006299853324890137, -0.005819082260131836, -0.005338311195373535, -0.004857540130615234, -0.004376769065856934, -0.003895998001098633, -0.003415226936340332, -0.0029344558715820312, -0.0024536848068237305, -0.0019729137420654297, -0.001492142677307129, -0.0010113716125488281, -0.0005306005477905273, -4.982948303222656e-05, 0.0004309415817260742, 0.000911712646484375, 0.0013924837112426758, 0.0018732547760009766, 0.0023540258407592773, 0.002834796905517578, 0.003315567970275879, 0.0037963390350341797, 0.0042771100997924805, 0.004757881164550781, 0.005238652229309082, 0.005719423294067383, 0.006200194358825684, 0.006680965423583984, 0.007161736488342285, 0.007642507553100586, 0.008123278617858887, 0.008604049682617188, 0.009084820747375488, 0.009565591812133789, 0.01004636287689209, 0.01052713394165039, 0.011007905006408691, 0.011488676071166992, 0.011969447135925293, 0.012450218200683594, 0.012930989265441895, 0.013411760330200195, 0.013892531394958496, 0.014373302459716797, 0.014854073524475098, 0.015334844589233398, 0.0158156156539917, 0.01629638671875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 1.0, 9.0, 9.0, 13.0, 19.0, 24.0, 32.0, 50.0, 77.0, 131.0, 160.0, 314.0, 511.0, 932.0, 1806.0, 4027.0, 10690.0, 39369.0, 221504.0, 606561.0, 122940.0, 25362.0, 7612.0, 2988.0, 1479.0, 755.0, 410.0, 252.0, 159.0, 92.0, 71.0, 57.0, 33.0, 25.0, 20.0, 13.0, 15.0, 5.0, 4.0, 8.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-69.875, -67.84033203125, -65.8056640625, -63.77099609375, -61.736328125, -59.70166015625, -57.6669921875, -55.63232421875, -53.59765625, -51.56298828125, -49.5283203125, -47.49365234375, -45.458984375, -43.42431640625, -41.3896484375, -39.35498046875, -37.3203125, -35.28564453125, -33.2509765625, -31.21630859375, -29.181640625, -27.14697265625, -25.1123046875, -23.07763671875, -21.04296875, -19.00830078125, -16.9736328125, -14.93896484375, -12.904296875, -10.86962890625, -8.8349609375, -6.80029296875, -4.765625, -2.73095703125, -0.6962890625, 1.33837890625, 3.373046875, 5.40771484375, 7.4423828125, 9.47705078125, 11.51171875, 13.54638671875, 15.5810546875, 17.61572265625, 19.650390625, 21.68505859375, 23.7197265625, 25.75439453125, 27.7890625, 29.82373046875, 31.8583984375, 33.89306640625, 35.927734375, 37.96240234375, 39.9970703125, 42.03173828125, 44.06640625, 46.10107421875, 48.1357421875, 50.17041015625, 52.205078125, 54.23974609375, 56.2744140625, 58.30908203125, 60.34375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 8.0, 9.0, 20.0, 31.0, 42.0, 86.0, 93.0, 129.0, 178.0, 113.0, 103.0, 79.0, 34.0, 24.0, 15.0, 8.0, 3.0, 11.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.75, -114.3232421875, -110.896484375, -107.4697265625, -104.04296875, -100.6162109375, -97.189453125, -93.7626953125, -90.3359375, -86.9091796875, -83.482421875, -80.0556640625, -76.62890625, -73.2021484375, -69.775390625, -66.3486328125, -62.921875, -59.4951171875, -56.068359375, -52.6416015625, -49.21484375, -45.7880859375, -42.361328125, -38.9345703125, -35.5078125, -32.0810546875, -28.654296875, -25.2275390625, -21.80078125, -18.3740234375, -14.947265625, -11.5205078125, -8.09375, -4.6669921875, -1.240234375, 2.1865234375, 5.61328125, 9.0400390625, 12.466796875, 15.8935546875, 19.3203125, 22.7470703125, 26.173828125, 29.6005859375, 33.02734375, 36.4541015625, 39.880859375, 43.3076171875, 46.734375, 50.1611328125, 53.587890625, 57.0146484375, 60.44140625, 63.8681640625, 67.294921875, 70.7216796875, 74.1484375, 77.5751953125, 81.001953125, 84.4287109375, 87.85546875, 91.2822265625, 94.708984375, 98.1357421875, 101.5625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 5.0, 13.0, 13.0, 29.0, 49.0, 66.0, 113.0, 124.0, 161.0, 136.0, 105.0, 62.0, 37.0, 25.0, 16.0, 14.0, 8.0, 5.0, 3.0, 0.0, 4.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1657.6605224609375, -1606.6939697265625, -1555.727294921875, -1504.7607421875, -1453.794189453125, -1402.8275146484375, -1351.8609619140625, -1300.894287109375, -1249.927734375, -1198.961181640625, -1147.9945068359375, -1097.0279541015625, -1046.061279296875, -995.0947265625, -944.128173828125, -893.1615600585938, -842.1949462890625, -791.2283325195312, -740.26171875, -689.295166015625, -638.3285522460938, -587.3619384765625, -536.3953857421875, -485.42877197265625, -434.462158203125, -383.49554443359375, -332.5289611816406, -281.5623779296875, -230.59576416015625, -179.62916564941406, -128.66256713867188, -77.69598388671875, -26.7294921875, 24.237106323242188, 75.20370483398438, 126.17030334472656, 177.13690185546875, 228.10350036621094, 279.0700988769531, 330.03668212890625, 381.0032958984375, 431.96990966796875, 482.9364929199219, 533.903076171875, 584.8696899414062, 635.8363037109375, 686.8028564453125, 737.7694702148438, 788.736083984375, 839.7026977539062, 890.6693115234375, 941.6358642578125, 992.6024780273438, 1043.569091796875, 1094.53564453125, 1145.502197265625, 1196.4688720703125, 1247.4354248046875, 1298.402099609375, 1349.36865234375, 1400.335205078125, 1451.3018798828125, 1502.2684326171875, 1553.235107421875, 1604.20166015625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 4.0, 4.0, 6.0, 9.0, 12.0, 10.0, 16.0, 20.0, 25.0, 28.0, 20.0, 33.0, 34.0, 39.0, 53.0, 41.0, 47.0, 49.0, 41.0, 49.0, 39.0, 38.0, 48.0, 47.0, 28.0, 44.0, 27.0, 37.0, 20.0, 28.0, 20.0, 15.0, 13.0, 13.0, 9.0, 13.0, 9.0, 3.0, 3.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1066.38671875, -1032.3743896484375, -998.3619995117188, -964.349609375, -930.3372802734375, -896.3248901367188, -862.3125, -828.3001708984375, -794.2877807617188, -760.275390625, -726.2630615234375, -692.2506713867188, -658.23828125, -624.2259521484375, -590.2135620117188, -556.201171875, -522.1888427734375, -488.1764831542969, -454.16412353515625, -420.1517333984375, -386.1393737792969, -352.12701416015625, -318.1146240234375, -284.1022644042969, -250.08990478515625, -216.07754516601562, -182.06517028808594, -148.05279541015625, -114.04043579101562, -80.028076171875, -46.01570129394531, -12.003326416015625, 22.0089111328125, 56.021278381347656, 90.03364562988281, 124.04601287841797, 158.05838012695312, 192.07073974609375, 226.08311462402344, 260.0954895019531, 294.10784912109375, 328.1202087402344, 362.132568359375, 396.14495849609375, 430.1573181152344, 464.169677734375, 498.18206787109375, 532.1944580078125, 566.206787109375, 600.2191772460938, 634.2315063476562, 668.243896484375, 702.2562255859375, 736.2686157226562, 770.281005859375, 804.2933349609375, 838.3057250976562, 872.318115234375, 906.3304443359375, 940.3428344726562, 974.355224609375, 1008.3675537109375, 1042.3798828125, 1076.392333984375, 1110.4046630859375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 8.0, 7.0, 6.0, 18.0, 14.0, 36.0, 20.0, 38.0, 56.0, 81.0, 112.0, 190.0, 344.0, 505.0, 802.0, 1448.0, 2357.0, 4321.0, 8306.0, 18402.0, 53158.0, 451295.0, 3372747.0, 210470.0, 39314.0, 14818.0, 6843.0, 3548.0, 1950.0, 1148.0, 707.0, 408.0, 256.0, 162.0, 129.0, 72.0, 46.0, 39.0, 25.0, 22.0, 15.0, 11.0, 12.0, 10.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.0, -120.744140625, -116.48828125, -112.232421875, -107.9765625, -103.720703125, -99.46484375, -95.208984375, -90.953125, -86.697265625, -82.44140625, -78.185546875, -73.9296875, -69.673828125, -65.41796875, -61.162109375, -56.90625, -52.650390625, -48.39453125, -44.138671875, -39.8828125, -35.626953125, -31.37109375, -27.115234375, -22.859375, -18.603515625, -14.34765625, -10.091796875, -5.8359375, -1.580078125, 2.67578125, 6.931640625, 11.1875, 15.443359375, 19.69921875, 23.955078125, 28.2109375, 32.466796875, 36.72265625, 40.978515625, 45.234375, 49.490234375, 53.74609375, 58.001953125, 62.2578125, 66.513671875, 70.76953125, 75.025390625, 79.28125, 83.537109375, 87.79296875, 92.048828125, 96.3046875, 100.560546875, 104.81640625, 109.072265625, 113.328125, 117.583984375, 121.83984375, 126.095703125, 130.3515625, 134.607421875, 138.86328125, 143.119140625, 147.375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 7.0, 10.0, 9.0, 15.0, 14.0, 16.0, 22.0, 33.0, 24.0, 36.0, 24.0, 27.0, 42.0, 44.0, 54.0, 55.0, 52.0, 50.0, 44.0, 50.0, 32.0, 33.0, 41.0, 50.0, 31.0, 32.0, 24.0, 17.0, 20.0, 13.0, 19.0, 16.0, 4.0, 7.0, 9.0, 7.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.21875, -47.68359375, -46.1484375, -44.61328125, -43.078125, -41.54296875, -40.0078125, -38.47265625, -36.9375, -35.40234375, -33.8671875, -32.33203125, -30.796875, -29.26171875, -27.7265625, -26.19140625, -24.65625, -23.12109375, -21.5859375, -20.05078125, -18.515625, -16.98046875, -15.4453125, -13.91015625, -12.375, -10.83984375, -9.3046875, -7.76953125, -6.234375, -4.69921875, -3.1640625, -1.62890625, -0.09375, 1.44140625, 2.9765625, 4.51171875, 6.046875, 7.58203125, 9.1171875, 10.65234375, 12.1875, 13.72265625, 15.2578125, 16.79296875, 18.328125, 19.86328125, 21.3984375, 22.93359375, 24.46875, 26.00390625, 27.5390625, 29.07421875, 30.609375, 32.14453125, 33.6796875, 35.21484375, 36.75, 38.28515625, 39.8203125, 41.35546875, 42.890625, 44.42578125, 45.9609375, 47.49609375, 49.03125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 16.0, 11.0, 21.0, 28.0, 38.0, 55.0, 73.0, 118.0, 206.0, 356.0, 710.0, 1394.0, 3027.0, 6668.0, 16900.0, 52043.0, 277419.0, 3492503.0, 263150.0, 50845.0, 16558.0, 6534.0, 2712.0, 1365.0, 625.0, 348.0, 216.0, 111.0, 65.0, 50.0, 34.0, 21.0, 17.0, 14.0, 9.0, 8.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-174.375, -169.0078125, -163.640625, -158.2734375, -152.90625, -147.5390625, -142.171875, -136.8046875, -131.4375, -126.0703125, -120.703125, -115.3359375, -109.96875, -104.6015625, -99.234375, -93.8671875, -88.5, -83.1328125, -77.765625, -72.3984375, -67.03125, -61.6640625, -56.296875, -50.9296875, -45.5625, -40.1953125, -34.828125, -29.4609375, -24.09375, -18.7265625, -13.359375, -7.9921875, -2.625, 2.7421875, 8.109375, 13.4765625, 18.84375, 24.2109375, 29.578125, 34.9453125, 40.3125, 45.6796875, 51.046875, 56.4140625, 61.78125, 67.1484375, 72.515625, 77.8828125, 83.25, 88.6171875, 93.984375, 99.3515625, 104.71875, 110.0859375, 115.453125, 120.8203125, 126.1875, 131.5546875, 136.921875, 142.2890625, 147.65625, 153.0234375, 158.390625, 163.7578125, 169.125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 11.0, 4.0, 4.0, 9.0, 11.0, 9.0, 16.0, 18.0, 18.0, 19.0, 30.0, 58.0, 67.0, 83.0, 171.0, 370.0, 953.0, 1060.0, 478.0, 236.0, 134.0, 74.0, 54.0, 48.0, 25.0, 25.0, 25.0, 14.0, 7.0, 5.0, 5.0, 4.0, 7.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-194.5, -189.1328125, -183.765625, -178.3984375, -173.03125, -167.6640625, -162.296875, -156.9296875, -151.5625, -146.1953125, -140.828125, -135.4609375, -130.09375, -124.7265625, -119.359375, -113.9921875, -108.625, -103.2578125, -97.890625, -92.5234375, -87.15625, -81.7890625, -76.421875, -71.0546875, -65.6875, -60.3203125, -54.953125, -49.5859375, -44.21875, -38.8515625, -33.484375, -28.1171875, -22.75, -17.3828125, -12.015625, -6.6484375, -1.28125, 4.0859375, 9.453125, 14.8203125, 20.1875, 25.5546875, 30.921875, 36.2890625, 41.65625, 47.0234375, 52.390625, 57.7578125, 63.125, 68.4921875, 73.859375, 79.2265625, 84.59375, 89.9609375, 95.328125, 100.6953125, 106.0625, 111.4296875, 116.796875, 122.1640625, 127.53125, 132.8984375, 138.265625, 143.6328125, 149.0]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 9.0, 14.0, 30.0, 78.0, 190.0, 284.0, 237.0, 84.0, 37.0, 21.0, 4.0, 3.0, 3.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2384.1220703125, -2290.970458984375, -2197.818603515625, -2104.6669921875, -2011.51513671875, -1918.363525390625, -1825.2117919921875, -1732.06005859375, -1638.9083251953125, -1545.756591796875, -1452.6048583984375, -1359.453125, -1266.301513671875, -1173.149658203125, -1079.998046875, -986.8463134765625, -893.694580078125, -800.5428466796875, -707.39111328125, -614.2394409179688, -521.0877075195312, -427.93597412109375, -334.7843017578125, -241.632568359375, -148.4808349609375, -55.32911682128906, 37.822601318359375, 130.97430419921875, 224.12603759765625, 317.27777099609375, 410.429443359375, 503.5811767578125, 596.73291015625, 689.8846435546875, 783.036376953125, 876.1880493164062, 969.3397827148438, 1062.491455078125, 1155.6431884765625, 1248.794921875, 1341.9466552734375, 1435.098388671875, 1528.2501220703125, 1621.40185546875, 1714.553466796875, 1807.705322265625, 1900.85693359375, 1994.0086669921875, 2087.160400390625, 2180.31201171875, 2273.4638671875, 2366.615478515625, 2459.767333984375, 2552.9189453125, 2646.07080078125, 2739.222412109375, 2832.3740234375, 2925.525634765625, 3018.677490234375, 3111.8291015625, 3204.98095703125, 3298.132568359375, 3391.2841796875, 3484.43603515625, 3577.587890625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 6.0, 10.0, 9.0, 8.0, 12.0, 13.0, 15.0, 12.0, 16.0, 26.0, 23.0, 28.0, 28.0, 38.0, 30.0, 27.0, 37.0, 43.0, 44.0, 49.0, 31.0, 42.0, 30.0, 36.0, 36.0, 46.0, 35.0, 39.0, 29.0, 23.0, 12.0, 21.0, 17.0, 17.0, 16.0, 17.0, 7.0, 7.0, 11.0, 4.0, 7.0, 5.0, 9.0, 9.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-557.974853515625, -538.8375854492188, -519.7003784179688, -500.5631103515625, -481.4258728027344, -462.28863525390625, -443.1513671875, -424.0141296386719, -404.87689208984375, -385.7396545410156, -366.6024169921875, -347.46514892578125, -328.3279113769531, -309.190673828125, -290.05340576171875, -270.9161682128906, -251.7789306640625, -232.64169311523438, -213.5044403076172, -194.3671875, -175.22994995117188, -156.09271240234375, -136.95545959472656, -117.81820678710938, -98.68096923828125, -79.5437240600586, -60.40647888183594, -41.26923370361328, -22.131988525390625, -2.9947433471679688, 16.142501831054688, 35.279754638671875, 54.4169921875, 73.55423736572266, 92.69148254394531, 111.82872772216797, 130.96597290039062, 150.10321044921875, 169.24046325683594, 188.37771606445312, 207.51495361328125, 226.65219116210938, 245.78944396972656, 264.92669677734375, 284.0639343261719, 303.201171875, 322.33843994140625, 341.4756774902344, 360.6129150390625, 379.7501525878906, 398.88739013671875, 418.024658203125, 437.1618957519531, 456.29913330078125, 475.4364013671875, 494.5736389160156, 513.7108764648438, 532.84814453125, 551.9853515625, 571.1226196289062, 590.2598876953125, 609.3970947265625, 628.5343627929688, 647.671630859375, 666.808837890625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 5.0, 17.0, 18.0, 30.0, 28.0, 59.0, 84.0, 110.0, 159.0, 221.0, 360.0, 564.0, 839.0, 1230.0, 1988.0, 3156.0, 5460.0, 9110.0, 16596.0, 32566.0, 68115.0, 161287.0, 357832.0, 214596.0, 86745.0, 39651.0, 20294.0, 10987.0, 6175.0, 3746.0, 2263.0, 1456.0, 944.0, 613.0, 405.0, 301.0, 183.0, 132.0, 74.0, 44.0, 39.0, 23.0, 16.0, 11.0, 7.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.3125, -101.0166015625, -97.720703125, -94.4248046875, -91.12890625, -87.8330078125, -84.537109375, -81.2412109375, -77.9453125, -74.6494140625, -71.353515625, -68.0576171875, -64.76171875, -61.4658203125, -58.169921875, -54.8740234375, -51.578125, -48.2822265625, -44.986328125, -41.6904296875, -38.39453125, -35.0986328125, -31.802734375, -28.5068359375, -25.2109375, -21.9150390625, -18.619140625, -15.3232421875, -12.02734375, -8.7314453125, -5.435546875, -2.1396484375, 1.15625, 4.4521484375, 7.748046875, 11.0439453125, 14.33984375, 17.6357421875, 20.931640625, 24.2275390625, 27.5234375, 30.8193359375, 34.115234375, 37.4111328125, 40.70703125, 44.0029296875, 47.298828125, 50.5947265625, 53.890625, 57.1865234375, 60.482421875, 63.7783203125, 67.07421875, 70.3701171875, 73.666015625, 76.9619140625, 80.2578125, 83.5537109375, 86.849609375, 90.1455078125, 93.44140625, 96.7373046875, 100.033203125, 103.3291015625, 106.625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 4.0, 6.0, 6.0, 6.0, 9.0, 9.0, 11.0, 14.0, 16.0, 12.0, 18.0, 24.0, 25.0, 28.0, 33.0, 27.0, 36.0, 40.0, 45.0, 34.0, 34.0, 53.0, 62.0, 37.0, 43.0, 36.0, 36.0, 44.0, 27.0, 32.0, 28.0, 26.0, 17.0, 20.0, 16.0, 19.0, 10.0, 16.0, 6.0, 7.0, 3.0, 6.0, 1.0, 4.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-42.03125, -40.61279296875, -39.1943359375, -37.77587890625, -36.357421875, -34.93896484375, -33.5205078125, -32.10205078125, -30.68359375, -29.26513671875, -27.8466796875, -26.42822265625, -25.009765625, -23.59130859375, -22.1728515625, -20.75439453125, -19.3359375, -17.91748046875, -16.4990234375, -15.08056640625, -13.662109375, -12.24365234375, -10.8251953125, -9.40673828125, -7.98828125, -6.56982421875, -5.1513671875, -3.73291015625, -2.314453125, -0.89599609375, 0.5224609375, 1.94091796875, 3.359375, 4.77783203125, 6.1962890625, 7.61474609375, 9.033203125, 10.45166015625, 11.8701171875, 13.28857421875, 14.70703125, 16.12548828125, 17.5439453125, 18.96240234375, 20.380859375, 21.79931640625, 23.2177734375, 24.63623046875, 26.0546875, 27.47314453125, 28.8916015625, 30.31005859375, 31.728515625, 33.14697265625, 34.5654296875, 35.98388671875, 37.40234375, 38.82080078125, 40.2392578125, 41.65771484375, 43.076171875, 44.49462890625, 45.9130859375, 47.33154296875, 48.75]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 11.0, 17.0, 24.0, 20.0, 44.0, 56.0, 90.0, 110.0, 219.0, 320.0, 569.0, 1005.0, 2190.0, 5506.0, 19753.0, 132081.0, 765317.0, 96064.0, 16237.0, 4687.0, 1963.0, 915.0, 495.0, 299.0, 171.0, 124.0, 83.0, 56.0, 35.0, 26.0, 19.0, 12.0, 8.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-270.25, -262.166015625, -254.08203125, -245.998046875, -237.9140625, -229.830078125, -221.74609375, -213.662109375, -205.578125, -197.494140625, -189.41015625, -181.326171875, -173.2421875, -165.158203125, -157.07421875, -148.990234375, -140.90625, -132.822265625, -124.73828125, -116.654296875, -108.5703125, -100.486328125, -92.40234375, -84.318359375, -76.234375, -68.150390625, -60.06640625, -51.982421875, -43.8984375, -35.814453125, -27.73046875, -19.646484375, -11.5625, -3.478515625, 4.60546875, 12.689453125, 20.7734375, 28.857421875, 36.94140625, 45.025390625, 53.109375, 61.193359375, 69.27734375, 77.361328125, 85.4453125, 93.529296875, 101.61328125, 109.697265625, 117.78125, 125.865234375, 133.94921875, 142.033203125, 150.1171875, 158.201171875, 166.28515625, 174.369140625, 182.453125, 190.537109375, 198.62109375, 206.705078125, 214.7890625, 222.873046875, 230.95703125, 239.041015625, 247.125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 5.0, 13.0, 6.0, 13.0, 14.0, 25.0, 25.0, 34.0, 39.0, 30.0, 46.0, 62.0, 44.0, 46.0, 49.0, 64.0, 69.0, 59.0, 58.0, 49.0, 40.0, 40.0, 23.0, 31.0, 28.0, 20.0, 17.0, 20.0, 5.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.5, -227.9921875, -219.484375, -210.9765625, -202.46875, -193.9609375, -185.453125, -176.9453125, -168.4375, -159.9296875, -151.421875, -142.9140625, -134.40625, -125.8984375, -117.390625, -108.8828125, -100.375, -91.8671875, -83.359375, -74.8515625, -66.34375, -57.8359375, -49.328125, -40.8203125, -32.3125, -23.8046875, -15.296875, -6.7890625, 1.71875, 10.2265625, 18.734375, 27.2421875, 35.75, 44.2578125, 52.765625, 61.2734375, 69.78125, 78.2890625, 86.796875, 95.3046875, 103.8125, 112.3203125, 120.828125, 129.3359375, 137.84375, 146.3515625, 154.859375, 163.3671875, 171.875, 180.3828125, 188.890625, 197.3984375, 205.90625, 214.4140625, 222.921875, 231.4296875, 239.9375, 248.4453125, 256.953125, 265.4609375, 273.96875, 282.4765625, 290.984375, 299.4921875, 308.0]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 8.0, 7.0, 10.0, 19.0, 18.0, 31.0, 40.0, 87.0, 141.0, 284.0, 609.0, 1572.0, 4842.0, 23406.0, 442921.0, 541631.0, 24884.0, 5148.0, 1632.0, 605.0, 295.0, 157.0, 76.0, 37.0, 32.0, 23.0, 12.0, 8.0, 9.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.125, -132.556640625, -127.98828125, -123.419921875, -118.8515625, -114.283203125, -109.71484375, -105.146484375, -100.578125, -96.009765625, -91.44140625, -86.873046875, -82.3046875, -77.736328125, -73.16796875, -68.599609375, -64.03125, -59.462890625, -54.89453125, -50.326171875, -45.7578125, -41.189453125, -36.62109375, -32.052734375, -27.484375, -22.916015625, -18.34765625, -13.779296875, -9.2109375, -4.642578125, -0.07421875, 4.494140625, 9.0625, 13.630859375, 18.19921875, 22.767578125, 27.3359375, 31.904296875, 36.47265625, 41.041015625, 45.609375, 50.177734375, 54.74609375, 59.314453125, 63.8828125, 68.451171875, 73.01953125, 77.587890625, 82.15625, 86.724609375, 91.29296875, 95.861328125, 100.4296875, 104.998046875, 109.56640625, 114.134765625, 118.703125, 123.271484375, 127.83984375, 132.408203125, 136.9765625, 141.544921875, 146.11328125, 150.681640625, 155.25]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 3.0, 6.0, 5.0, 21.0, 25.0, 46.0, 68.0, 105.0, 182.0, 191.0, 132.0, 85.0, 39.0, 30.0, 20.0, 10.0, 7.0, 4.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0301513671875, -0.028729915618896484, -0.02730846405029297, -0.025887012481689453, -0.024465560913085938, -0.023044109344482422, -0.021622657775878906, -0.02020120620727539, -0.018779754638671875, -0.01735830307006836, -0.015936851501464844, -0.014515399932861328, -0.013093948364257812, -0.011672496795654297, -0.010251045227050781, -0.008829593658447266, -0.00740814208984375, -0.005986690521240234, -0.004565238952636719, -0.003143787384033203, -0.0017223358154296875, -0.0003008842468261719, 0.0011205673217773438, 0.0025420188903808594, 0.003963470458984375, 0.005384922027587891, 0.006806373596191406, 0.008227825164794922, 0.009649276733398438, 0.011070728302001953, 0.012492179870605469, 0.013913631439208984, 0.0153350830078125, 0.016756534576416016, 0.01817798614501953, 0.019599437713623047, 0.021020889282226562, 0.022442340850830078, 0.023863792419433594, 0.02528524398803711, 0.026706695556640625, 0.02812814712524414, 0.029549598693847656, 0.030971050262451172, 0.03239250183105469, 0.0338139533996582, 0.03523540496826172, 0.036656856536865234, 0.03807830810546875, 0.039499759674072266, 0.04092121124267578, 0.0423426628112793, 0.04376411437988281, 0.04518556594848633, 0.046607017517089844, 0.04802846908569336, 0.049449920654296875, 0.05087137222290039, 0.052292823791503906, 0.05371427536010742, 0.05513572692871094, 0.05655717849731445, 0.05797863006591797, 0.059400081634521484, 0.060821533203125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 10.0, 21.0, 19.0, 29.0, 50.0, 70.0, 109.0, 179.0, 323.0, 643.0, 1464.0, 3709.0, 13035.0, 79852.0, 758144.0, 161857.0, 20291.0, 5145.0, 1840.0, 824.0, 383.0, 208.0, 123.0, 77.0, 47.0, 23.0, 13.0, 16.0, 14.0, 13.0, 9.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-103.8125, -100.4248046875, -97.037109375, -93.6494140625, -90.26171875, -86.8740234375, -83.486328125, -80.0986328125, -76.7109375, -73.3232421875, -69.935546875, -66.5478515625, -63.16015625, -59.7724609375, -56.384765625, -52.9970703125, -49.609375, -46.2216796875, -42.833984375, -39.4462890625, -36.05859375, -32.6708984375, -29.283203125, -25.8955078125, -22.5078125, -19.1201171875, -15.732421875, -12.3447265625, -8.95703125, -5.5693359375, -2.181640625, 1.2060546875, 4.59375, 7.9814453125, 11.369140625, 14.7568359375, 18.14453125, 21.5322265625, 24.919921875, 28.3076171875, 31.6953125, 35.0830078125, 38.470703125, 41.8583984375, 45.24609375, 48.6337890625, 52.021484375, 55.4091796875, 58.796875, 62.1845703125, 65.572265625, 68.9599609375, 72.34765625, 75.7353515625, 79.123046875, 82.5107421875, 85.8984375, 89.2861328125, 92.673828125, 96.0615234375, 99.44921875, 102.8369140625, 106.224609375, 109.6123046875, 113.0]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 7.0, 6.0, 11.0, 10.0, 15.0, 18.0, 21.0, 53.0, 54.0, 80.0, 71.0, 128.0, 99.0, 101.0, 82.0, 62.0, 38.0, 35.0, 24.0, 17.0, 10.0, 17.0, 7.0, 7.0, 10.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-105.3125, -102.490234375, -99.66796875, -96.845703125, -94.0234375, -91.201171875, -88.37890625, -85.556640625, -82.734375, -79.912109375, -77.08984375, -74.267578125, -71.4453125, -68.623046875, -65.80078125, -62.978515625, -60.15625, -57.333984375, -54.51171875, -51.689453125, -48.8671875, -46.044921875, -43.22265625, -40.400390625, -37.578125, -34.755859375, -31.93359375, -29.111328125, -26.2890625, -23.466796875, -20.64453125, -17.822265625, -15.0, -12.177734375, -9.35546875, -6.533203125, -3.7109375, -0.888671875, 1.93359375, 4.755859375, 7.578125, 10.400390625, 13.22265625, 16.044921875, 18.8671875, 21.689453125, 24.51171875, 27.333984375, 30.15625, 32.978515625, 35.80078125, 38.623046875, 41.4453125, 44.267578125, 47.08984375, 49.912109375, 52.734375, 55.556640625, 58.37890625, 61.201171875, 64.0234375, 66.845703125, 69.66796875, 72.490234375, 75.3125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 6.0, 7.0, 11.0, 19.0, 32.0, 52.0, 98.0, 144.0, 179.0, 137.0, 102.0, 73.0, 62.0, 28.0, 15.0, 6.0, 10.0, 3.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-938.35693359375, -884.2062377929688, -830.0555419921875, -775.9049072265625, -721.754150390625, -667.603515625, -613.4528198242188, -559.3021240234375, -505.15142822265625, -451.000732421875, -396.85003662109375, -342.6993713378906, -288.5486755371094, -234.39797973632812, -180.247314453125, -126.09661865234375, -71.9459228515625, -17.79523468017578, 36.35545349121094, 90.50613403320312, 144.65682983398438, 198.80752563476562, 252.95819091796875, 307.10888671875, 361.25958251953125, 415.4102783203125, 469.56097412109375, 523.711669921875, 577.8623046875, 632.0130615234375, 686.1636962890625, 740.3143920898438, 794.465087890625, 848.6157836914062, 902.7664794921875, 956.9171142578125, 1011.06787109375, 1065.218505859375, 1119.369140625, 1173.5198974609375, 1227.670654296875, 1281.8212890625, 1335.9720458984375, 1390.1226806640625, 1444.2734375, 1498.424072265625, 1552.57470703125, 1606.7254638671875, 1660.8760986328125, 1715.0267333984375, 1769.177490234375, 1823.328125, 1877.4788818359375, 1931.6295166015625, 1985.7802734375, 2039.930908203125, 2094.08154296875, 2148.232177734375, 2202.3828125, 2256.53369140625, 2310.684326171875, 2364.8349609375, 2418.985595703125, 2473.13623046875, 2527.287109375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 11.0, 7.0, 14.0, 11.0, 24.0, 27.0, 31.0, 29.0, 32.0, 28.0, 34.0, 44.0, 39.0, 49.0, 55.0, 35.0, 52.0, 41.0, 51.0, 45.0, 56.0, 36.0, 31.0, 20.0, 28.0, 29.0, 21.0, 16.0, 11.0, 9.0, 9.0, 13.0, 1.0, 8.0, 5.0, 7.0, 5.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-763.8731689453125, -736.0970458984375, -708.3209228515625, -680.5447998046875, -652.7686767578125, -624.9925537109375, -597.2164306640625, -569.4403076171875, -541.6641845703125, -513.8880615234375, -486.1119384765625, -458.3358154296875, -430.5596923828125, -402.7835693359375, -375.0074768066406, -347.2313537597656, -319.45526123046875, -291.67913818359375, -263.90301513671875, -236.1269073486328, -208.3507843017578, -180.5746612548828, -152.79855346679688, -125.02243041992188, -97.24630737304688, -69.47018432617188, -41.694068908691406, -13.917953491210938, 13.858169555664062, 41.63429260253906, 69.410400390625, 97.1865234375, 124.96258544921875, 152.73870849609375, 180.51483154296875, 208.2909393310547, 236.0670623779297, 263.84320068359375, 291.6192932128906, 319.3954162597656, 347.1715393066406, 374.9476623535156, 402.7237854003906, 430.4998779296875, 458.2760009765625, 486.0521240234375, 513.8282470703125, 541.6043701171875, 569.3804931640625, 597.1566162109375, 624.9327392578125, 652.7088623046875, 680.4849853515625, 708.2611083984375, 736.0372314453125, 763.8133544921875, 791.5894775390625, 819.3656005859375, 847.1417236328125, 874.9178466796875, 902.6939697265625, 930.4700927734375, 958.2462158203125, 986.0223388671875, 1013.7984008789062]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 6.0, 7.0, 9.0, 18.0, 21.0, 36.0, 52.0, 88.0, 174.0, 524.0, 3412.0, 61314.0, 4090829.0, 34984.0, 2101.0, 380.0, 133.0, 58.0, 40.0, 22.0, 27.0, 10.0, 13.0, 5.0, 5.0, 11.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-277.25, -263.67578125, -250.1015625, -236.52734375, -222.953125, -209.37890625, -195.8046875, -182.23046875, -168.65625, -155.08203125, -141.5078125, -127.93359375, -114.359375, -100.78515625, -87.2109375, -73.63671875, -60.0625, -46.48828125, -32.9140625, -19.33984375, -5.765625, 7.80859375, 21.3828125, 34.95703125, 48.53125, 62.10546875, 75.6796875, 89.25390625, 102.828125, 116.40234375, 129.9765625, 143.55078125, 157.125, 170.69921875, 184.2734375, 197.84765625, 211.421875, 224.99609375, 238.5703125, 252.14453125, 265.71875, 279.29296875, 292.8671875, 306.44140625, 320.015625, 333.58984375, 347.1640625, 360.73828125, 374.3125, 387.88671875, 401.4609375, 415.03515625, 428.609375, 442.18359375, 455.7578125, 469.33203125, 482.90625, 496.48046875, 510.0546875, 523.62890625, 537.203125, 550.77734375, 564.3515625, 577.92578125, 591.5]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 4.0, 10.0, 6.0, 9.0, 7.0, 6.0, 13.0, 16.0, 9.0, 16.0, 20.0, 26.0, 21.0, 23.0, 32.0, 39.0, 31.0, 25.0, 37.0, 36.0, 39.0, 54.0, 43.0, 40.0, 36.0, 37.0, 53.0, 42.0, 35.0, 33.0, 22.0, 27.0, 26.0, 28.0, 11.0, 21.0, 11.0, 5.0, 10.0, 5.0, 7.0, 4.0, 5.0, 3.0, 5.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-42.71875, -41.41943359375, -40.1201171875, -38.82080078125, -37.521484375, -36.22216796875, -34.9228515625, -33.62353515625, -32.32421875, -31.02490234375, -29.7255859375, -28.42626953125, -27.126953125, -25.82763671875, -24.5283203125, -23.22900390625, -21.9296875, -20.63037109375, -19.3310546875, -18.03173828125, -16.732421875, -15.43310546875, -14.1337890625, -12.83447265625, -11.53515625, -10.23583984375, -8.9365234375, -7.63720703125, -6.337890625, -5.03857421875, -3.7392578125, -2.43994140625, -1.140625, 0.15869140625, 1.4580078125, 2.75732421875, 4.056640625, 5.35595703125, 6.6552734375, 7.95458984375, 9.25390625, 10.55322265625, 11.8525390625, 13.15185546875, 14.451171875, 15.75048828125, 17.0498046875, 18.34912109375, 19.6484375, 20.94775390625, 22.2470703125, 23.54638671875, 24.845703125, 26.14501953125, 27.4443359375, 28.74365234375, 30.04296875, 31.34228515625, 32.6416015625, 33.94091796875, 35.240234375, 36.53955078125, 37.8388671875, 39.13818359375, 40.4375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 0.0, 6.0, 8.0, 10.0, 27.0, 20.0, 33.0, 39.0, 63.0, 102.0, 147.0, 245.0, 376.0, 665.0, 1166.0, 2217.0, 4285.0, 9233.0, 21702.0, 60860.0, 299699.0, 3234669.0, 438710.0, 74071.0, 25149.0, 10453.0, 4735.0, 2472.0, 1295.0, 699.0, 420.0, 236.0, 160.0, 101.0, 57.0, 52.0, 22.0, 22.0, 19.0, 9.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-149.375, -144.7890625, -140.203125, -135.6171875, -131.03125, -126.4453125, -121.859375, -117.2734375, -112.6875, -108.1015625, -103.515625, -98.9296875, -94.34375, -89.7578125, -85.171875, -80.5859375, -76.0, -71.4140625, -66.828125, -62.2421875, -57.65625, -53.0703125, -48.484375, -43.8984375, -39.3125, -34.7265625, -30.140625, -25.5546875, -20.96875, -16.3828125, -11.796875, -7.2109375, -2.625, 1.9609375, 6.546875, 11.1328125, 15.71875, 20.3046875, 24.890625, 29.4765625, 34.0625, 38.6484375, 43.234375, 47.8203125, 52.40625, 56.9921875, 61.578125, 66.1640625, 70.75, 75.3359375, 79.921875, 84.5078125, 89.09375, 93.6796875, 98.265625, 102.8515625, 107.4375, 112.0234375, 116.609375, 121.1953125, 125.78125, 130.3671875, 134.953125, 139.5390625, 144.125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 4.0, 6.0, 5.0, 11.0, 18.0, 22.0, 22.0, 41.0, 32.0, 54.0, 83.0, 167.0, 363.0, 768.0, 1135.0, 614.0, 249.0, 154.0, 80.0, 53.0, 44.0, 32.0, 21.0, 24.0, 11.0, 9.0, 12.0, 9.0, 5.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-208.0, -202.26953125, -196.5390625, -190.80859375, -185.078125, -179.34765625, -173.6171875, -167.88671875, -162.15625, -156.42578125, -150.6953125, -144.96484375, -139.234375, -133.50390625, -127.7734375, -122.04296875, -116.3125, -110.58203125, -104.8515625, -99.12109375, -93.390625, -87.66015625, -81.9296875, -76.19921875, -70.46875, -64.73828125, -59.0078125, -53.27734375, -47.546875, -41.81640625, -36.0859375, -30.35546875, -24.625, -18.89453125, -13.1640625, -7.43359375, -1.703125, 4.02734375, 9.7578125, 15.48828125, 21.21875, 26.94921875, 32.6796875, 38.41015625, 44.140625, 49.87109375, 55.6015625, 61.33203125, 67.0625, 72.79296875, 78.5234375, 84.25390625, 89.984375, 95.71484375, 101.4453125, 107.17578125, 112.90625, 118.63671875, 124.3671875, 130.09765625, 135.828125, 141.55859375, 147.2890625, 153.01953125, 158.75]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 7.0, 9.0, 19.0, 46.0, 82.0, 167.0, 199.0, 205.0, 106.0, 66.0, 28.0, 20.0, 13.0, 7.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1288.7979736328125, -1225.997802734375, -1163.1976318359375, -1100.3974609375, -1037.597412109375, -974.7972412109375, -911.9970703125, -849.1968994140625, -786.3967895507812, -723.5966186523438, -660.7965087890625, -597.996337890625, -535.1961669921875, -472.39605712890625, -409.59588623046875, -346.7957458496094, -283.99560546875, -221.19546508789062, -158.3953094482422, -95.59515380859375, -32.795013427734375, 30.005126953125, 92.8052978515625, 155.60543823242188, 218.40557861328125, 281.2057189941406, 344.005859375, 406.8060302734375, 469.6061706542969, 532.4063110351562, 595.2064819335938, 658.006591796875, 720.806640625, 783.6068115234375, 846.4069213867188, 909.2070922851562, 972.0072021484375, 1034.807373046875, 1097.6075439453125, 1160.40771484375, 1223.207763671875, 1286.0079345703125, 1348.80810546875, 1411.608154296875, 1474.4083251953125, 1537.20849609375, 1600.0086669921875, 1662.808837890625, 1725.6090087890625, 1788.4091796875, 1851.2093505859375, 1914.009521484375, 1976.8095703125, 2039.6097412109375, 2102.409912109375, 2165.2099609375, 2228.01025390625, 2290.810302734375, 2353.610595703125, 2416.41064453125, 2479.2109375, 2542.010986328125, 2604.81103515625, 2667.611328125, 2730.411376953125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 3.0, 4.0, 4.0, 7.0, 4.0, 8.0, 15.0, 12.0, 21.0, 17.0, 25.0, 33.0, 25.0, 39.0, 38.0, 41.0, 32.0, 44.0, 51.0, 44.0, 55.0, 60.0, 55.0, 40.0, 46.0, 23.0, 34.0, 34.0, 29.0, 24.0, 34.0, 15.0, 21.0, 18.0, 9.0, 8.0, 7.0, 7.0, 9.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-759.8634033203125, -734.7206420898438, -709.577880859375, -684.4351196289062, -659.2923583984375, -634.1495971679688, -609.0068359375, -583.8640747070312, -558.7213134765625, -533.5785522460938, -508.435791015625, -483.29302978515625, -458.1502685546875, -433.00750732421875, -407.86474609375, -382.72198486328125, -357.5792236328125, -332.43646240234375, -307.293701171875, -282.15093994140625, -257.0081787109375, -231.86541748046875, -206.72265625, -181.57989501953125, -156.4371337890625, -131.29437255859375, -106.151611328125, -81.00885009765625, -55.8660888671875, -30.72332763671875, -5.58056640625, 19.56219482421875, 44.7049560546875, 69.84771728515625, 94.990478515625, 120.13323974609375, 145.2760009765625, 170.41876220703125, 195.5615234375, 220.70428466796875, 245.8470458984375, 270.98980712890625, 296.132568359375, 321.27532958984375, 346.4180908203125, 371.56085205078125, 396.70361328125, 421.84637451171875, 446.9891357421875, 472.13189697265625, 497.274658203125, 522.4174194335938, 547.5601806640625, 572.7029418945312, 597.845703125, 622.9884643554688, 648.1312255859375, 673.2739868164062, 698.416748046875, 723.5595092773438, 748.7022705078125, 773.8450317382812, 798.98779296875, 824.1305541992188, 849.2733154296875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 2.0, 5.0, 5.0, 7.0, 14.0, 19.0, 30.0, 32.0, 44.0, 62.0, 114.0, 158.0, 221.0, 314.0, 475.0, 790.0, 1214.0, 1994.0, 3372.0, 5948.0, 11091.0, 21933.0, 46881.0, 111505.0, 296807.0, 320822.0, 122825.0, 50899.0, 23572.0, 11875.0, 6234.0, 3548.0, 2083.0, 1289.0, 756.0, 532.0, 367.0, 204.0, 142.0, 98.0, 84.0, 62.0, 37.0, 32.0, 22.0, 17.0, 6.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-102.0625, -98.775390625, -95.48828125, -92.201171875, -88.9140625, -85.626953125, -82.33984375, -79.052734375, -75.765625, -72.478515625, -69.19140625, -65.904296875, -62.6171875, -59.330078125, -56.04296875, -52.755859375, -49.46875, -46.181640625, -42.89453125, -39.607421875, -36.3203125, -33.033203125, -29.74609375, -26.458984375, -23.171875, -19.884765625, -16.59765625, -13.310546875, -10.0234375, -6.736328125, -3.44921875, -0.162109375, 3.125, 6.412109375, 9.69921875, 12.986328125, 16.2734375, 19.560546875, 22.84765625, 26.134765625, 29.421875, 32.708984375, 35.99609375, 39.283203125, 42.5703125, 45.857421875, 49.14453125, 52.431640625, 55.71875, 59.005859375, 62.29296875, 65.580078125, 68.8671875, 72.154296875, 75.44140625, 78.728515625, 82.015625, 85.302734375, 88.58984375, 91.876953125, 95.1640625, 98.451171875, 101.73828125, 105.025390625, 108.3125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 3.0, 8.0, 6.0, 9.0, 16.0, 15.0, 24.0, 18.0, 28.0, 21.0, 36.0, 38.0, 49.0, 43.0, 54.0, 61.0, 63.0, 59.0, 64.0, 53.0, 39.0, 52.0, 31.0, 32.0, 25.0, 27.0, 22.0, 27.0, 16.0, 19.0, 12.0, 9.0, 8.0, 6.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.6875, -57.646484375, -55.60546875, -53.564453125, -51.5234375, -49.482421875, -47.44140625, -45.400390625, -43.359375, -41.318359375, -39.27734375, -37.236328125, -35.1953125, -33.154296875, -31.11328125, -29.072265625, -27.03125, -24.990234375, -22.94921875, -20.908203125, -18.8671875, -16.826171875, -14.78515625, -12.744140625, -10.703125, -8.662109375, -6.62109375, -4.580078125, -2.5390625, -0.498046875, 1.54296875, 3.583984375, 5.625, 7.666015625, 9.70703125, 11.748046875, 13.7890625, 15.830078125, 17.87109375, 19.912109375, 21.953125, 23.994140625, 26.03515625, 28.076171875, 30.1171875, 32.158203125, 34.19921875, 36.240234375, 38.28125, 40.322265625, 42.36328125, 44.404296875, 46.4453125, 48.486328125, 50.52734375, 52.568359375, 54.609375, 56.650390625, 58.69140625, 60.732421875, 62.7734375, 64.814453125, 66.85546875, 68.896484375, 70.9375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 10.0, 10.0, 9.0, 9.0, 19.0, 26.0, 53.0, 76.0, 116.0, 227.0, 459.0, 925.0, 2273.0, 7239.0, 36011.0, 421492.0, 528496.0, 38892.0, 7834.0, 2331.0, 983.0, 455.0, 236.0, 141.0, 73.0, 45.0, 31.0, 30.0, 16.0, 9.0, 5.0, 9.0, 5.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-352.0, -341.94921875, -331.8984375, -321.84765625, -311.796875, -301.74609375, -291.6953125, -281.64453125, -271.59375, -261.54296875, -251.4921875, -241.44140625, -231.390625, -221.33984375, -211.2890625, -201.23828125, -191.1875, -181.13671875, -171.0859375, -161.03515625, -150.984375, -140.93359375, -130.8828125, -120.83203125, -110.78125, -100.73046875, -90.6796875, -80.62890625, -70.578125, -60.52734375, -50.4765625, -40.42578125, -30.375, -20.32421875, -10.2734375, -0.22265625, 9.828125, 19.87890625, 29.9296875, 39.98046875, 50.03125, 60.08203125, 70.1328125, 80.18359375, 90.234375, 100.28515625, 110.3359375, 120.38671875, 130.4375, 140.48828125, 150.5390625, 160.58984375, 170.640625, 180.69140625, 190.7421875, 200.79296875, 210.84375, 220.89453125, 230.9453125, 240.99609375, 251.046875, 261.09765625, 271.1484375, 281.19921875, 291.25]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 13.0, 6.0, 9.0, 26.0, 26.0, 31.0, 40.0, 46.0, 55.0, 67.0, 63.0, 84.0, 65.0, 69.0, 61.0, 64.0, 44.0, 48.0, 35.0, 33.0, 25.0, 23.0, 19.0, 14.0, 9.0, 9.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-371.25, -359.87109375, -348.4921875, -337.11328125, -325.734375, -314.35546875, -302.9765625, -291.59765625, -280.21875, -268.83984375, -257.4609375, -246.08203125, -234.703125, -223.32421875, -211.9453125, -200.56640625, -189.1875, -177.80859375, -166.4296875, -155.05078125, -143.671875, -132.29296875, -120.9140625, -109.53515625, -98.15625, -86.77734375, -75.3984375, -64.01953125, -52.640625, -41.26171875, -29.8828125, -18.50390625, -7.125, 4.25390625, 15.6328125, 27.01171875, 38.390625, 49.76953125, 61.1484375, 72.52734375, 83.90625, 95.28515625, 106.6640625, 118.04296875, 129.421875, 140.80078125, 152.1796875, 163.55859375, 174.9375, 186.31640625, 197.6953125, 209.07421875, 220.453125, 231.83203125, 243.2109375, 254.58984375, 265.96875, 277.34765625, 288.7265625, 300.10546875, 311.484375, 322.86328125, 334.2421875, 345.62109375, 357.0]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 5.0, 4.0, 10.0, 17.0, 22.0, 43.0, 86.0, 217.0, 572.0, 1817.0, 9337.0, 98324.0, 860616.0, 67617.0, 7392.0, 1578.0, 503.0, 186.0, 85.0, 41.0, 21.0, 10.0, 14.0, 10.0, 6.0, 3.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-208.375, -202.80859375, -197.2421875, -191.67578125, -186.109375, -180.54296875, -174.9765625, -169.41015625, -163.84375, -158.27734375, -152.7109375, -147.14453125, -141.578125, -136.01171875, -130.4453125, -124.87890625, -119.3125, -113.74609375, -108.1796875, -102.61328125, -97.046875, -91.48046875, -85.9140625, -80.34765625, -74.78125, -69.21484375, -63.6484375, -58.08203125, -52.515625, -46.94921875, -41.3828125, -35.81640625, -30.25, -24.68359375, -19.1171875, -13.55078125, -7.984375, -2.41796875, 3.1484375, 8.71484375, 14.28125, 19.84765625, 25.4140625, 30.98046875, 36.546875, 42.11328125, 47.6796875, 53.24609375, 58.8125, 64.37890625, 69.9453125, 75.51171875, 81.078125, 86.64453125, 92.2109375, 97.77734375, 103.34375, 108.91015625, 114.4765625, 120.04296875, 125.609375, 131.17578125, 136.7421875, 142.30859375, 147.875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 7.0, 5.0, 14.0, 8.0, 20.0, 30.0, 47.0, 75.0, 94.0, 171.0, 184.0, 127.0, 66.0, 48.0, 29.0, 29.0, 16.0, 10.0, 9.0, 4.0, 7.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032684326171875, -0.03133201599121094, -0.029979705810546875, -0.028627395629882812, -0.02727508544921875, -0.025922775268554688, -0.024570465087890625, -0.023218154907226562, -0.0218658447265625, -0.020513534545898438, -0.019161224365234375, -0.017808914184570312, -0.01645660400390625, -0.015104293823242188, -0.013751983642578125, -0.012399673461914062, -0.01104736328125, -0.009695053100585938, -0.008342742919921875, -0.0069904327392578125, -0.00563812255859375, -0.0042858123779296875, -0.002933502197265625, -0.0015811920166015625, -0.0002288818359375, 0.0011234283447265625, 0.002475738525390625, 0.0038280487060546875, 0.00518035888671875, 0.0065326690673828125, 0.007884979248046875, 0.009237289428710938, 0.010589599609375, 0.011941909790039062, 0.013294219970703125, 0.014646530151367188, 0.01599884033203125, 0.017351150512695312, 0.018703460693359375, 0.020055770874023438, 0.0214080810546875, 0.022760391235351562, 0.024112701416015625, 0.025465011596679688, 0.02681732177734375, 0.028169631958007812, 0.029521942138671875, 0.030874252319335938, 0.0322265625, 0.03357887268066406, 0.034931182861328125, 0.03628349304199219, 0.03763580322265625, 0.03898811340332031, 0.040340423583984375, 0.04169273376464844, 0.0430450439453125, 0.04439735412597656, 0.045749664306640625, 0.04710197448730469, 0.04845428466796875, 0.04980659484863281, 0.051158905029296875, 0.05251121520996094, 0.053863525390625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 11.0, 14.0, 28.0, 18.0, 46.0, 88.0, 142.0, 279.0, 700.0, 2174.0, 8455.0, 53260.0, 747428.0, 209796.0, 19820.0, 4053.0, 1282.0, 473.0, 213.0, 101.0, 62.0, 42.0, 16.0, 13.0, 8.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-142.0, -137.529296875, -133.05859375, -128.587890625, -124.1171875, -119.646484375, -115.17578125, -110.705078125, -106.234375, -101.763671875, -97.29296875, -92.822265625, -88.3515625, -83.880859375, -79.41015625, -74.939453125, -70.46875, -65.998046875, -61.52734375, -57.056640625, -52.5859375, -48.115234375, -43.64453125, -39.173828125, -34.703125, -30.232421875, -25.76171875, -21.291015625, -16.8203125, -12.349609375, -7.87890625, -3.408203125, 1.0625, 5.533203125, 10.00390625, 14.474609375, 18.9453125, 23.416015625, 27.88671875, 32.357421875, 36.828125, 41.298828125, 45.76953125, 50.240234375, 54.7109375, 59.181640625, 63.65234375, 68.123046875, 72.59375, 77.064453125, 81.53515625, 86.005859375, 90.4765625, 94.947265625, 99.41796875, 103.888671875, 108.359375, 112.830078125, 117.30078125, 121.771484375, 126.2421875, 130.712890625, 135.18359375, 139.654296875, 144.125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 6.0, 7.0, 9.0, 17.0, 16.0, 17.0, 22.0, 46.0, 37.0, 59.0, 56.0, 100.0, 105.0, 88.0, 94.0, 61.0, 57.0, 47.0, 25.0, 23.0, 22.0, 23.0, 12.0, 9.0, 7.0, 11.0, 5.0, 5.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.9375, -84.0390625, -81.140625, -78.2421875, -75.34375, -72.4453125, -69.546875, -66.6484375, -63.75, -60.8515625, -57.953125, -55.0546875, -52.15625, -49.2578125, -46.359375, -43.4609375, -40.5625, -37.6640625, -34.765625, -31.8671875, -28.96875, -26.0703125, -23.171875, -20.2734375, -17.375, -14.4765625, -11.578125, -8.6796875, -5.78125, -2.8828125, 0.015625, 2.9140625, 5.8125, 8.7109375, 11.609375, 14.5078125, 17.40625, 20.3046875, 23.203125, 26.1015625, 29.0, 31.8984375, 34.796875, 37.6953125, 40.59375, 43.4921875, 46.390625, 49.2890625, 52.1875, 55.0859375, 57.984375, 60.8828125, 63.78125, 66.6796875, 69.578125, 72.4765625, 75.375, 78.2734375, 81.171875, 84.0703125, 86.96875, 89.8671875, 92.765625, 95.6640625, 98.5625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 11.0, 10.0, 26.0, 67.0, 134.0, 229.0, 255.0, 145.0, 69.0, 23.0, 16.0, 6.0, 8.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1734.6851806640625, -1652.6103515625, -1570.53564453125, -1488.4609375, -1406.3861083984375, -1324.311279296875, -1242.236572265625, -1160.161865234375, -1078.0870361328125, -996.0122680664062, -913.9375, -831.8627319335938, -749.7879638671875, -667.7131958007812, -585.638427734375, -503.56365966796875, -421.4888916015625, -339.41412353515625, -257.33935546875, -175.26458740234375, -93.1898193359375, -11.11505126953125, 70.959716796875, 153.03448486328125, 235.1092529296875, 317.18402099609375, 399.2587890625, 481.33355712890625, 563.4083251953125, 645.4830932617188, 727.557861328125, 809.6326293945312, 891.70751953125, 973.7822875976562, 1055.8570556640625, 1137.931884765625, 1220.006591796875, 1302.081298828125, 1384.1561279296875, 1466.23095703125, 1548.3056640625, 1630.38037109375, 1712.4552001953125, 1794.530029296875, 1876.604736328125, 1958.679443359375, 2040.7542724609375, 2122.8291015625, 2204.90380859375, 2286.978515625, 2369.05322265625, 2451.128173828125, 2533.202880859375, 2615.277587890625, 2697.3525390625, 2779.42724609375, 2861.501953125, 2943.57666015625, 3025.6513671875, 3107.726318359375, 3189.801025390625, 3271.875732421875, 3353.95068359375, 3436.025390625, 3518.10009765625]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 8.0, 8.0, 8.0, 11.0, 14.0, 11.0, 15.0, 11.0, 14.0, 16.0, 28.0, 26.0, 34.0, 45.0, 49.0, 50.0, 56.0, 64.0, 66.0, 60.0, 55.0, 43.0, 43.0, 40.0, 35.0, 32.0, 35.0, 18.0, 11.0, 17.0, 16.0, 12.0, 11.0, 11.0, 4.0, 9.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1078.020751953125, -1043.714599609375, -1009.4083251953125, -975.1021118164062, -940.7958984375, -906.4896850585938, -872.1834716796875, -837.8772583007812, -803.571044921875, -769.2648315429688, -734.9586181640625, -700.6524047851562, -666.34619140625, -632.0399780273438, -597.7337646484375, -563.4275512695312, -529.121337890625, -494.81512451171875, -460.5089111328125, -426.20269775390625, -391.896484375, -357.59027099609375, -323.2840576171875, -288.97784423828125, -254.671630859375, -220.36541748046875, -186.0592041015625, -151.75299072265625, -117.44677734375, -83.14056396484375, -48.8343505859375, -14.52813720703125, 19.778076171875, 54.08428955078125, 88.3905029296875, 122.69671630859375, 157.0029296875, 191.30914306640625, 225.6153564453125, 259.92156982421875, 294.227783203125, 328.53399658203125, 362.8402099609375, 397.14642333984375, 431.45263671875, 465.75885009765625, 500.0650634765625, 534.3712768554688, 568.677490234375, 602.9837036132812, 637.2899169921875, 671.5961303710938, 705.90234375, 740.2085571289062, 774.5147705078125, 808.8209838867188, 843.127197265625, 877.4334106445312, 911.7396240234375, 946.0458374023438, 980.35205078125, 1014.6582641601562, 1048.9644775390625, 1083.270751953125, 1117.576904296875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 9.0, 9.0, 12.0, 19.0, 21.0, 35.0, 51.0, 65.0, 115.0, 179.0, 219.0, 394.0, 615.0, 951.0, 1672.0, 2748.0, 4701.0, 8298.0, 15384.0, 32885.0, 85752.0, 320626.0, 1339522.0, 1729423.0, 455544.0, 113433.0, 40213.0, 18555.0, 9664.0, 5367.0, 3000.0, 1786.0, 1106.0, 650.0, 420.0, 274.0, 174.0, 118.0, 100.0, 46.0, 33.0, 25.0, 22.0, 13.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-70.9375, -68.7958984375, -66.654296875, -64.5126953125, -62.37109375, -60.2294921875, -58.087890625, -55.9462890625, -53.8046875, -51.6630859375, -49.521484375, -47.3798828125, -45.23828125, -43.0966796875, -40.955078125, -38.8134765625, -36.671875, -34.5302734375, -32.388671875, -30.2470703125, -28.10546875, -25.9638671875, -23.822265625, -21.6806640625, -19.5390625, -17.3974609375, -15.255859375, -13.1142578125, -10.97265625, -8.8310546875, -6.689453125, -4.5478515625, -2.40625, -0.2646484375, 1.876953125, 4.0185546875, 6.16015625, 8.3017578125, 10.443359375, 12.5849609375, 14.7265625, 16.8681640625, 19.009765625, 21.1513671875, 23.29296875, 25.4345703125, 27.576171875, 29.7177734375, 31.859375, 34.0009765625, 36.142578125, 38.2841796875, 40.42578125, 42.5673828125, 44.708984375, 46.8505859375, 48.9921875, 51.1337890625, 53.275390625, 55.4169921875, 57.55859375, 59.7001953125, 61.841796875, 63.9833984375, 66.125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 5.0, 9.0, 1.0, 6.0, 11.0, 15.0, 10.0, 21.0, 23.0, 32.0, 34.0, 30.0, 33.0, 32.0, 42.0, 47.0, 41.0, 48.0, 45.0, 66.0, 52.0, 43.0, 51.0, 26.0, 36.0, 44.0, 31.0, 29.0, 24.0, 19.0, 18.0, 8.0, 11.0, 8.0, 6.0, 12.0, 9.0, 7.0, 2.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.25, -48.56640625, -46.8828125, -45.19921875, -43.515625, -41.83203125, -40.1484375, -38.46484375, -36.78125, -35.09765625, -33.4140625, -31.73046875, -30.046875, -28.36328125, -26.6796875, -24.99609375, -23.3125, -21.62890625, -19.9453125, -18.26171875, -16.578125, -14.89453125, -13.2109375, -11.52734375, -9.84375, -8.16015625, -6.4765625, -4.79296875, -3.109375, -1.42578125, 0.2578125, 1.94140625, 3.625, 5.30859375, 6.9921875, 8.67578125, 10.359375, 12.04296875, 13.7265625, 15.41015625, 17.09375, 18.77734375, 20.4609375, 22.14453125, 23.828125, 25.51171875, 27.1953125, 28.87890625, 30.5625, 32.24609375, 33.9296875, 35.61328125, 37.296875, 38.98046875, 40.6640625, 42.34765625, 44.03125, 45.71484375, 47.3984375, 49.08203125, 50.765625, 52.44921875, 54.1328125, 55.81640625, 57.5]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 7.0, 5.0, 11.0, 17.0, 25.0, 32.0, 73.0, 100.0, 204.0, 477.0, 1070.0, 3308.0, 12926.0, 75528.0, 1882966.0, 2122861.0, 76770.0, 12793.0, 3282.0, 1038.0, 459.0, 164.0, 78.0, 40.0, 20.0, 17.0, 7.0, 6.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-267.25, -258.6328125, -250.015625, -241.3984375, -232.78125, -224.1640625, -215.546875, -206.9296875, -198.3125, -189.6953125, -181.078125, -172.4609375, -163.84375, -155.2265625, -146.609375, -137.9921875, -129.375, -120.7578125, -112.140625, -103.5234375, -94.90625, -86.2890625, -77.671875, -69.0546875, -60.4375, -51.8203125, -43.203125, -34.5859375, -25.96875, -17.3515625, -8.734375, -0.1171875, 8.5, 17.1171875, 25.734375, 34.3515625, 42.96875, 51.5859375, 60.203125, 68.8203125, 77.4375, 86.0546875, 94.671875, 103.2890625, 111.90625, 120.5234375, 129.140625, 137.7578125, 146.375, 154.9921875, 163.609375, 172.2265625, 180.84375, 189.4609375, 198.078125, 206.6953125, 215.3125, 223.9296875, 232.546875, 241.1640625, 249.78125, 258.3984375, 267.015625, 275.6328125, 284.25]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 9.0, 9.0, 9.0, 16.0, 24.0, 27.0, 42.0, 77.0, 88.0, 142.0, 218.0, 436.0, 781.0, 920.0, 522.0, 279.0, 143.0, 108.0, 65.0, 50.0, 36.0, 20.0, 9.0, 15.0, 12.0, 10.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-338.0, -329.99609375, -321.9921875, -313.98828125, -305.984375, -297.98046875, -289.9765625, -281.97265625, -273.96875, -265.96484375, -257.9609375, -249.95703125, -241.953125, -233.94921875, -225.9453125, -217.94140625, -209.9375, -201.93359375, -193.9296875, -185.92578125, -177.921875, -169.91796875, -161.9140625, -153.91015625, -145.90625, -137.90234375, -129.8984375, -121.89453125, -113.890625, -105.88671875, -97.8828125, -89.87890625, -81.875, -73.87109375, -65.8671875, -57.86328125, -49.859375, -41.85546875, -33.8515625, -25.84765625, -17.84375, -9.83984375, -1.8359375, 6.16796875, 14.171875, 22.17578125, 30.1796875, 38.18359375, 46.1875, 54.19140625, 62.1953125, 70.19921875, 78.203125, 86.20703125, 94.2109375, 102.21484375, 110.21875, 118.22265625, 126.2265625, 134.23046875, 142.234375, 150.23828125, 158.2421875, 166.24609375, 174.25]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 8.0, 17.0, 51.0, 276.0, 473.0, 137.0, 29.0, 8.0, 3.0, 2.0, 3.0], "bins": [-11731.53515625, -11526.765625, -11321.99609375, -11117.2265625, -10912.45703125, -10707.6875, -10502.91796875, -10298.1494140625, -10093.3798828125, -9888.6103515625, -9683.8408203125, -9479.0712890625, -9274.3017578125, -9069.533203125, -8864.763671875, -8659.994140625, -8455.224609375, -8250.455078125, -8045.685546875, -7840.916015625, -7636.14697265625, -7431.37744140625, -7226.60791015625, -7021.83837890625, -6817.068359375, -6612.298828125, -6407.529296875, -6202.759765625, -5997.99072265625, -5793.22119140625, -5588.45166015625, -5383.68212890625, -5178.91259765625, -4974.14306640625, -4769.37353515625, -4564.6044921875, -4359.8349609375, -4155.0654296875, -3950.2958984375, -3745.5263671875, -3540.75732421875, -3335.98779296875, -3131.218505859375, -2926.448974609375, -2721.6796875, -2516.91015625, -2312.140625, -2107.37109375, -1902.6016845703125, -1697.832275390625, -1493.062744140625, -1288.2933349609375, -1083.52392578125, -878.7545166015625, -673.9849853515625, -469.215576171875, -264.4461669921875, -59.676727294921875, 145.09271240234375, 349.8621826171875, 554.631591796875, 759.4010009765625, 964.1705322265625, 1168.93994140625, 1373.7093505859375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 5.0, 7.0, 11.0, 16.0, 21.0, 21.0, 26.0, 22.0, 30.0, 32.0, 43.0, 35.0, 36.0, 33.0, 40.0, 48.0, 53.0, 51.0, 52.0, 58.0, 42.0, 38.0, 38.0, 33.0, 29.0, 32.0, 24.0, 20.0, 21.0, 17.0, 7.0, 12.0, 8.0, 7.0, 7.0, 7.0, 2.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-930.379638671875, -898.8958740234375, -867.4120483398438, -835.9282836914062, -804.4445190429688, -772.960693359375, -741.4769287109375, -709.9931640625, -678.5093383789062, -647.0255737304688, -615.541748046875, -584.0579833984375, -552.57421875, -521.0903930664062, -489.60662841796875, -458.1228332519531, -426.6390686035156, -395.1552734375, -363.6715087890625, -332.1877136230469, -300.70391845703125, -269.22015380859375, -237.73635864257812, -206.2525634765625, -174.76878356933594, -143.28500366210938, -111.80120849609375, -80.31742858886719, -48.833641052246094, -17.349853515625, 14.133926391601562, 45.61772155761719, 77.10150146484375, 108.58528900146484, 140.06907653808594, 171.5528564453125, 203.03665161132812, 234.5204315185547, 266.00421142578125, 297.4880065917969, 328.9718017578125, 360.4555969238281, 391.9393615722656, 423.42315673828125, 454.9069519042969, 486.3907470703125, 517.87451171875, 549.3582763671875, 580.842041015625, 612.3258056640625, 643.8096313476562, 675.2933959960938, 706.7771606445312, 738.260986328125, 769.7447509765625, 801.228515625, 832.7123413085938, 864.1961059570312, 895.679931640625, 927.1636962890625, 958.6474609375, 990.1312866210938, 1021.6150512695312, 1053.098876953125, 1084.5826416015625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 13.0, 9.0, 25.0, 26.0, 49.0, 57.0, 117.0, 156.0, 227.0, 403.0, 634.0, 1181.0, 2114.0, 3798.0, 7205.0, 14470.0, 29633.0, 63901.0, 144496.0, 337707.0, 246964.0, 103539.0, 46764.0, 21883.0, 10621.0, 5540.0, 3043.0, 1624.0, 889.0, 536.0, 330.0, 207.0, 124.0, 92.0, 55.0, 30.0, 32.0, 13.0, 9.0, 10.0, 4.0, 10.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-131.125, -127.4619140625, -123.798828125, -120.1357421875, -116.47265625, -112.8095703125, -109.146484375, -105.4833984375, -101.8203125, -98.1572265625, -94.494140625, -90.8310546875, -87.16796875, -83.5048828125, -79.841796875, -76.1787109375, -72.515625, -68.8525390625, -65.189453125, -61.5263671875, -57.86328125, -54.2001953125, -50.537109375, -46.8740234375, -43.2109375, -39.5478515625, -35.884765625, -32.2216796875, -28.55859375, -24.8955078125, -21.232421875, -17.5693359375, -13.90625, -10.2431640625, -6.580078125, -2.9169921875, 0.74609375, 4.4091796875, 8.072265625, 11.7353515625, 15.3984375, 19.0615234375, 22.724609375, 26.3876953125, 30.05078125, 33.7138671875, 37.376953125, 41.0400390625, 44.703125, 48.3662109375, 52.029296875, 55.6923828125, 59.35546875, 63.0185546875, 66.681640625, 70.3447265625, 74.0078125, 77.6708984375, 81.333984375, 84.9970703125, 88.66015625, 92.3232421875, 95.986328125, 99.6494140625, 103.3125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 6.0, 9.0, 3.0, 5.0, 9.0, 5.0, 8.0, 10.0, 16.0, 20.0, 21.0, 17.0, 29.0, 31.0, 33.0, 28.0, 30.0, 50.0, 42.0, 35.0, 43.0, 43.0, 31.0, 51.0, 44.0, 33.0, 36.0, 27.0, 30.0, 33.0, 26.0, 25.0, 21.0, 21.0, 16.0, 17.0, 16.0, 12.0, 10.0, 9.0, 8.0, 9.0, 9.0, 3.0, 4.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-48.96875, -47.32470703125, -45.6806640625, -44.03662109375, -42.392578125, -40.74853515625, -39.1044921875, -37.46044921875, -35.81640625, -34.17236328125, -32.5283203125, -30.88427734375, -29.240234375, -27.59619140625, -25.9521484375, -24.30810546875, -22.6640625, -21.02001953125, -19.3759765625, -17.73193359375, -16.087890625, -14.44384765625, -12.7998046875, -11.15576171875, -9.51171875, -7.86767578125, -6.2236328125, -4.57958984375, -2.935546875, -1.29150390625, 0.3525390625, 1.99658203125, 3.640625, 5.28466796875, 6.9287109375, 8.57275390625, 10.216796875, 11.86083984375, 13.5048828125, 15.14892578125, 16.79296875, 18.43701171875, 20.0810546875, 21.72509765625, 23.369140625, 25.01318359375, 26.6572265625, 28.30126953125, 29.9453125, 31.58935546875, 33.2333984375, 34.87744140625, 36.521484375, 38.16552734375, 39.8095703125, 41.45361328125, 43.09765625, 44.74169921875, 46.3857421875, 48.02978515625, 49.673828125, 51.31787109375, 52.9619140625, 54.60595703125, 56.25]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 10.0, 10.0, 13.0, 9.0, 17.0, 28.0, 38.0, 50.0, 63.0, 103.0, 135.0, 191.0, 245.0, 453.0, 674.0, 1134.0, 2150.0, 4855.0, 14821.0, 71937.0, 674960.0, 227161.0, 33499.0, 8629.0, 3092.0, 1638.0, 897.0, 536.0, 379.0, 241.0, 142.0, 119.0, 86.0, 53.0, 51.0, 31.0, 23.0, 19.0, 19.0, 11.0, 5.0, 7.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 4.0], "bins": [-322.5, -313.486328125, -304.47265625, -295.458984375, -286.4453125, -277.431640625, -268.41796875, -259.404296875, -250.390625, -241.376953125, -232.36328125, -223.349609375, -214.3359375, -205.322265625, -196.30859375, -187.294921875, -178.28125, -169.267578125, -160.25390625, -151.240234375, -142.2265625, -133.212890625, -124.19921875, -115.185546875, -106.171875, -97.158203125, -88.14453125, -79.130859375, -70.1171875, -61.103515625, -52.08984375, -43.076171875, -34.0625, -25.048828125, -16.03515625, -7.021484375, 1.9921875, 11.005859375, 20.01953125, 29.033203125, 38.046875, 47.060546875, 56.07421875, 65.087890625, 74.1015625, 83.115234375, 92.12890625, 101.142578125, 110.15625, 119.169921875, 128.18359375, 137.197265625, 146.2109375, 155.224609375, 164.23828125, 173.251953125, 182.265625, 191.279296875, 200.29296875, 209.306640625, 218.3203125, 227.333984375, 236.34765625, 245.361328125, 254.375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 10.0, 11.0, 13.0, 15.0, 18.0, 19.0, 19.0, 33.0, 33.0, 43.0, 48.0, 54.0, 56.0, 59.0, 72.0, 54.0, 55.0, 81.0, 60.0, 41.0, 31.0, 45.0, 23.0, 29.0, 13.0, 11.0, 17.0, 14.0, 7.0, 5.0, 2.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-451.0, -438.36328125, -425.7265625, -413.08984375, -400.453125, -387.81640625, -375.1796875, -362.54296875, -349.90625, -337.26953125, -324.6328125, -311.99609375, -299.359375, -286.72265625, -274.0859375, -261.44921875, -248.8125, -236.17578125, -223.5390625, -210.90234375, -198.265625, -185.62890625, -172.9921875, -160.35546875, -147.71875, -135.08203125, -122.4453125, -109.80859375, -97.171875, -84.53515625, -71.8984375, -59.26171875, -46.625, -33.98828125, -21.3515625, -8.71484375, 3.921875, 16.55859375, 29.1953125, 41.83203125, 54.46875, 67.10546875, 79.7421875, 92.37890625, 105.015625, 117.65234375, 130.2890625, 142.92578125, 155.5625, 168.19921875, 180.8359375, 193.47265625, 206.109375, 218.74609375, 231.3828125, 244.01953125, 256.65625, 269.29296875, 281.9296875, 294.56640625, 307.203125, 319.83984375, 332.4765625, 345.11328125, 357.75]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 2.0, 15.0, 12.0, 18.0, 27.0, 53.0, 98.0, 202.0, 358.0, 854.0, 2220.0, 8217.0, 50764.0, 676035.0, 274764.0, 26792.0, 5227.0, 1638.0, 633.0, 280.0, 159.0, 74.0, 39.0, 21.0, 20.0, 13.0, 6.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.4375, -101.0517578125, -97.666015625, -94.2802734375, -90.89453125, -87.5087890625, -84.123046875, -80.7373046875, -77.3515625, -73.9658203125, -70.580078125, -67.1943359375, -63.80859375, -60.4228515625, -57.037109375, -53.6513671875, -50.265625, -46.8798828125, -43.494140625, -40.1083984375, -36.72265625, -33.3369140625, -29.951171875, -26.5654296875, -23.1796875, -19.7939453125, -16.408203125, -13.0224609375, -9.63671875, -6.2509765625, -2.865234375, 0.5205078125, 3.90625, 7.2919921875, 10.677734375, 14.0634765625, 17.44921875, 20.8349609375, 24.220703125, 27.6064453125, 30.9921875, 34.3779296875, 37.763671875, 41.1494140625, 44.53515625, 47.9208984375, 51.306640625, 54.6923828125, 58.078125, 61.4638671875, 64.849609375, 68.2353515625, 71.62109375, 75.0068359375, 78.392578125, 81.7783203125, 85.1640625, 88.5498046875, 91.935546875, 95.3212890625, 98.70703125, 102.0927734375, 105.478515625, 108.8642578125, 112.25]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 5.0, 8.0, 14.0, 7.0, 16.0, 17.0, 23.0, 22.0, 29.0, 35.0, 19.0, 39.0, 48.0, 58.0, 80.0, 87.0, 82.0, 65.0, 55.0, 33.0, 34.0, 43.0, 35.0, 22.0, 24.0, 16.0, 14.0, 18.0, 11.0, 5.0, 6.0, 6.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0222320556640625, -0.021589994430541992, -0.020947933197021484, -0.020305871963500977, -0.01966381072998047, -0.01902174949645996, -0.018379688262939453, -0.017737627029418945, -0.017095565795898438, -0.01645350456237793, -0.015811443328857422, -0.015169382095336914, -0.014527320861816406, -0.013885259628295898, -0.01324319839477539, -0.012601137161254883, -0.011959075927734375, -0.011317014694213867, -0.01067495346069336, -0.010032892227172852, -0.009390830993652344, -0.008748769760131836, -0.008106708526611328, -0.00746464729309082, -0.0068225860595703125, -0.006180524826049805, -0.005538463592529297, -0.004896402359008789, -0.004254341125488281, -0.0036122798919677734, -0.0029702186584472656, -0.002328157424926758, -0.00168609619140625, -0.0010440349578857422, -0.0004019737243652344, 0.00024008750915527344, 0.0008821487426757812, 0.001524209976196289, 0.002166271209716797, 0.0028083324432373047, 0.0034503936767578125, 0.00409245491027832, 0.004734516143798828, 0.005376577377319336, 0.006018638610839844, 0.0066606998443603516, 0.007302761077880859, 0.007944822311401367, 0.008586883544921875, 0.009228944778442383, 0.00987100601196289, 0.010513067245483398, 0.011155128479003906, 0.011797189712524414, 0.012439250946044922, 0.01308131217956543, 0.013723373413085938, 0.014365434646606445, 0.015007495880126953, 0.01564955711364746, 0.01629161834716797, 0.016933679580688477, 0.017575740814208984, 0.018217802047729492, 0.01885986328125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 9.0, 8.0, 6.0, 23.0, 26.0, 59.0, 72.0, 164.0, 322.0, 683.0, 1599.0, 5201.0, 28431.0, 427687.0, 545665.0, 30232.0, 5266.0, 1653.0, 681.0, 347.0, 192.0, 90.0, 59.0, 42.0, 20.0, 12.0, 11.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-161.75, -158.0751953125, -154.400390625, -150.7255859375, -147.05078125, -143.3759765625, -139.701171875, -136.0263671875, -132.3515625, -128.6767578125, -125.001953125, -121.3271484375, -117.65234375, -113.9775390625, -110.302734375, -106.6279296875, -102.953125, -99.2783203125, -95.603515625, -91.9287109375, -88.25390625, -84.5791015625, -80.904296875, -77.2294921875, -73.5546875, -69.8798828125, -66.205078125, -62.5302734375, -58.85546875, -55.1806640625, -51.505859375, -47.8310546875, -44.15625, -40.4814453125, -36.806640625, -33.1318359375, -29.45703125, -25.7822265625, -22.107421875, -18.4326171875, -14.7578125, -11.0830078125, -7.408203125, -3.7333984375, -0.05859375, 3.6162109375, 7.291015625, 10.9658203125, 14.640625, 18.3154296875, 21.990234375, 25.6650390625, 29.33984375, 33.0146484375, 36.689453125, 40.3642578125, 44.0390625, 47.7138671875, 51.388671875, 55.0634765625, 58.73828125, 62.4130859375, 66.087890625, 69.7626953125, 73.4375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 2.0, 5.0, 6.0, 3.0, 3.0, 11.0, 7.0, 18.0, 12.0, 11.0, 18.0, 20.0, 25.0, 32.0, 34.0, 36.0, 39.0, 44.0, 43.0, 45.0, 45.0, 50.0, 50.0, 55.0, 56.0, 38.0, 51.0, 33.0, 34.0, 21.0, 24.0, 24.0, 14.0, 20.0, 10.0, 12.0, 9.0, 9.0, 6.0, 6.0, 4.0, 5.0, 3.0, 6.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-53.875, -52.10791015625, -50.3408203125, -48.57373046875, -46.806640625, -45.03955078125, -43.2724609375, -41.50537109375, -39.73828125, -37.97119140625, -36.2041015625, -34.43701171875, -32.669921875, -30.90283203125, -29.1357421875, -27.36865234375, -25.6015625, -23.83447265625, -22.0673828125, -20.30029296875, -18.533203125, -16.76611328125, -14.9990234375, -13.23193359375, -11.46484375, -9.69775390625, -7.9306640625, -6.16357421875, -4.396484375, -2.62939453125, -0.8623046875, 0.90478515625, 2.671875, 4.43896484375, 6.2060546875, 7.97314453125, 9.740234375, 11.50732421875, 13.2744140625, 15.04150390625, 16.80859375, 18.57568359375, 20.3427734375, 22.10986328125, 23.876953125, 25.64404296875, 27.4111328125, 29.17822265625, 30.9453125, 32.71240234375, 34.4794921875, 36.24658203125, 38.013671875, 39.78076171875, 41.5478515625, 43.31494140625, 45.08203125, 46.84912109375, 48.6162109375, 50.38330078125, 52.150390625, 53.91748046875, 55.6845703125, 57.45166015625, 59.21875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 6.0, 7.0, 8.0, 18.0, 21.0, 77.0, 160.0, 278.0, 203.0, 114.0, 62.0, 26.0, 13.0, 9.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2113.28076171875, -2031.3466796875, -1949.4127197265625, -1867.478759765625, -1785.544677734375, -1703.610595703125, -1621.6766357421875, -1539.74267578125, -1457.80859375, -1375.87451171875, -1293.9405517578125, -1212.006591796875, -1130.072509765625, -1048.138427734375, -966.2044677734375, -884.2704467773438, -802.33642578125, -720.4024047851562, -638.4683837890625, -556.5343627929688, -474.600341796875, -392.66632080078125, -310.7322998046875, -228.79827880859375, -146.8642578125, -64.93023681640625, 17.0037841796875, 98.93780517578125, 180.871826171875, 262.80584716796875, 344.7398681640625, 426.67388916015625, 508.60791015625, 590.5419311523438, 672.4759521484375, 754.4099731445312, 836.343994140625, 918.2780151367188, 1000.2120361328125, 1082.14599609375, 1164.080078125, 1246.01416015625, 1327.9481201171875, 1409.882080078125, 1491.816162109375, 1573.750244140625, 1655.6842041015625, 1737.6181640625, 1819.55224609375, 1901.486328125, 1983.4202880859375, 2065.354248046875, 2147.288330078125, 2229.222412109375, 2311.15625, 2393.09033203125, 2475.0244140625, 2556.95849609375, 2638.892578125, 2720.826416015625, 2802.760498046875, 2884.694580078125, 2966.62841796875, 3048.5625, 3130.49658203125]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 4.0, 9.0, 8.0, 11.0, 14.0, 11.0, 22.0, 18.0, 22.0, 24.0, 22.0, 36.0, 30.0, 43.0, 37.0, 55.0, 76.0, 68.0, 76.0, 61.0, 52.0, 36.0, 38.0, 43.0, 33.0, 25.0, 25.0, 13.0, 16.0, 15.0, 11.0, 9.0, 5.0, 8.0, 5.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1455.0361328125, -1411.7655029296875, -1368.4949951171875, -1325.224365234375, -1281.953857421875, -1238.6832275390625, -1195.41259765625, -1152.14208984375, -1108.8714599609375, -1065.600830078125, -1022.330322265625, -979.0596923828125, -935.7891235351562, -892.5185546875, -849.2479248046875, -805.9773559570312, -762.706787109375, -719.4362182617188, -676.1656494140625, -632.89501953125, -589.6244506835938, -546.3538818359375, -503.0832824707031, -459.81268310546875, -416.5421142578125, -373.27154541015625, -330.0009460449219, -286.7303466796875, -243.45977783203125, -200.18919372558594, -156.91860961914062, -113.64801025390625, -70.3773193359375, -27.106735229492188, 16.163848876953125, 59.43443298339844, 102.70501708984375, 145.97560119628906, 189.24618530273438, 232.51678466796875, 275.787353515625, 319.05792236328125, 362.3285217285156, 405.59912109375, 448.86968994140625, 492.1402587890625, 535.410888671875, 578.6814575195312, 621.9520263671875, 665.2225952148438, 708.4931640625, 751.7637939453125, 795.0343627929688, 838.304931640625, 881.5755615234375, 924.8461303710938, 968.11669921875, 1011.3872680664062, 1054.6578369140625, 1097.928466796875, 1141.198974609375, 1184.4696044921875, 1227.740234375, 1271.0107421875, 1314.2813720703125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 10.0, 15.0, 34.0, 40.0, 57.0, 86.0, 150.0, 240.0, 436.0, 701.0, 1196.0, 2104.0, 3890.0, 7216.0, 14909.0, 36036.0, 116678.0, 493805.0, 1742292.0, 1326649.0, 319126.0, 77136.0, 26521.0, 11622.0, 5715.0, 3136.0, 1821.0, 991.0, 614.0, 362.0, 243.0, 139.0, 99.0, 57.0, 48.0, 35.0, 21.0, 19.0, 13.0, 2.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.40625, -52.21728515625, -50.0283203125, -47.83935546875, -45.650390625, -43.46142578125, -41.2724609375, -39.08349609375, -36.89453125, -34.70556640625, -32.5166015625, -30.32763671875, -28.138671875, -25.94970703125, -23.7607421875, -21.57177734375, -19.3828125, -17.19384765625, -15.0048828125, -12.81591796875, -10.626953125, -8.43798828125, -6.2490234375, -4.06005859375, -1.87109375, 0.31787109375, 2.5068359375, 4.69580078125, 6.884765625, 9.07373046875, 11.2626953125, 13.45166015625, 15.640625, 17.82958984375, 20.0185546875, 22.20751953125, 24.396484375, 26.58544921875, 28.7744140625, 30.96337890625, 33.15234375, 35.34130859375, 37.5302734375, 39.71923828125, 41.908203125, 44.09716796875, 46.2861328125, 48.47509765625, 50.6640625, 52.85302734375, 55.0419921875, 57.23095703125, 59.419921875, 61.60888671875, 63.7978515625, 65.98681640625, 68.17578125, 70.36474609375, 72.5537109375, 74.74267578125, 76.931640625, 79.12060546875, 81.3095703125, 83.49853515625, 85.6875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 10.0, 7.0, 5.0, 14.0, 12.0, 19.0, 26.0, 22.0, 48.0, 42.0, 44.0, 67.0, 51.0, 70.0, 66.0, 60.0, 60.0, 57.0, 51.0, 51.0, 46.0, 34.0, 41.0, 26.0, 17.0, 18.0, 12.0, 14.0, 1.0, 8.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.8125, -74.1767578125, -71.541015625, -68.9052734375, -66.26953125, -63.6337890625, -60.998046875, -58.3623046875, -55.7265625, -53.0908203125, -50.455078125, -47.8193359375, -45.18359375, -42.5478515625, -39.912109375, -37.2763671875, -34.640625, -32.0048828125, -29.369140625, -26.7333984375, -24.09765625, -21.4619140625, -18.826171875, -16.1904296875, -13.5546875, -10.9189453125, -8.283203125, -5.6474609375, -3.01171875, -0.3759765625, 2.259765625, 4.8955078125, 7.53125, 10.1669921875, 12.802734375, 15.4384765625, 18.07421875, 20.7099609375, 23.345703125, 25.9814453125, 28.6171875, 31.2529296875, 33.888671875, 36.5244140625, 39.16015625, 41.7958984375, 44.431640625, 47.0673828125, 49.703125, 52.3388671875, 54.974609375, 57.6103515625, 60.24609375, 62.8818359375, 65.517578125, 68.1533203125, 70.7890625, 73.4248046875, 76.060546875, 78.6962890625, 81.33203125, 83.9677734375, 86.603515625, 89.2392578125, 91.875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 5.0, 8.0, 12.0, 12.0, 14.0, 27.0, 27.0, 62.0, 107.0, 144.0, 262.0, 524.0, 1083.0, 2562.0, 6578.0, 19987.0, 73282.0, 457305.0, 3117858.0, 413408.0, 69165.0, 19935.0, 6817.0, 2677.0, 1129.0, 559.0, 269.0, 146.0, 103.0, 59.0, 46.0, 34.0, 16.0, 26.0, 10.0, 4.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-136.875, -132.232421875, -127.58984375, -122.947265625, -118.3046875, -113.662109375, -109.01953125, -104.376953125, -99.734375, -95.091796875, -90.44921875, -85.806640625, -81.1640625, -76.521484375, -71.87890625, -67.236328125, -62.59375, -57.951171875, -53.30859375, -48.666015625, -44.0234375, -39.380859375, -34.73828125, -30.095703125, -25.453125, -20.810546875, -16.16796875, -11.525390625, -6.8828125, -2.240234375, 2.40234375, 7.044921875, 11.6875, 16.330078125, 20.97265625, 25.615234375, 30.2578125, 34.900390625, 39.54296875, 44.185546875, 48.828125, 53.470703125, 58.11328125, 62.755859375, 67.3984375, 72.041015625, 76.68359375, 81.326171875, 85.96875, 90.611328125, 95.25390625, 99.896484375, 104.5390625, 109.181640625, 113.82421875, 118.466796875, 123.109375, 127.751953125, 132.39453125, 137.037109375, 141.6796875, 146.322265625, 150.96484375, 155.607421875, 160.25]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 5.0, 5.0, 8.0, 10.0, 5.0, 8.0, 15.0, 12.0, 15.0, 33.0, 35.0, 35.0, 57.0, 70.0, 87.0, 118.0, 151.0, 226.0, 359.0, 443.0, 531.0, 515.0, 357.0, 261.0, 175.0, 127.0, 83.0, 67.0, 45.0, 42.0, 29.0, 27.0, 19.0, 20.0, 16.0, 10.0, 9.0, 7.0, 10.0, 4.0, 3.0, 9.0, 1.0, 7.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-131.875, -127.5703125, -123.265625, -118.9609375, -114.65625, -110.3515625, -106.046875, -101.7421875, -97.4375, -93.1328125, -88.828125, -84.5234375, -80.21875, -75.9140625, -71.609375, -67.3046875, -63.0, -58.6953125, -54.390625, -50.0859375, -45.78125, -41.4765625, -37.171875, -32.8671875, -28.5625, -24.2578125, -19.953125, -15.6484375, -11.34375, -7.0390625, -2.734375, 1.5703125, 5.875, 10.1796875, 14.484375, 18.7890625, 23.09375, 27.3984375, 31.703125, 36.0078125, 40.3125, 44.6171875, 48.921875, 53.2265625, 57.53125, 61.8359375, 66.140625, 70.4453125, 74.75, 79.0546875, 83.359375, 87.6640625, 91.96875, 96.2734375, 100.578125, 104.8828125, 109.1875, 113.4921875, 117.796875, 122.1015625, 126.40625, 130.7109375, 135.015625, 139.3203125, 143.625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 10.0, 56.0, 349.0, 439.0, 113.0, 20.0, 10.0, 4.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1325.0260009765625, -1164.0267333984375, -1003.027587890625, -842.0283203125, -681.0291137695312, -520.0299072265625, -359.0306396484375, -198.031494140625, -37.0322265625, 123.96699523925781, 284.9662170410156, 445.9654541015625, 606.9646606445312, 767.9638671875, 928.963134765625, 1089.9622802734375, 1250.9615478515625, 1411.9608154296875, 1572.9599609375, 1733.959228515625, 1894.95849609375, 2055.95751953125, 2216.95703125, 2377.9560546875, 2538.955322265625, 2699.95458984375, 2860.953857421875, 3021.953125, 3182.9521484375, 3343.951416015625, 3504.95068359375, 3665.94970703125, 3826.94873046875, 3987.947998046875, 4148.947265625, 4309.9462890625, 4470.94580078125, 4631.94482421875, 4792.9443359375, 4953.943359375, 5114.9423828125, 5275.94140625, 5436.94091796875, 5597.93994140625, 5758.939453125, 5919.9384765625, 6080.9375, 6241.93701171875, 6402.9365234375, 6563.935546875, 6724.93505859375, 6885.93408203125, 7046.93359375, 7207.9326171875, 7368.931640625, 7529.93115234375, 7690.93017578125, 7851.92919921875, 8012.9287109375, 8173.927734375, 8334.9267578125, 8495.92578125, 8656.92578125, 8817.9248046875, 8978.923828125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 11.0, 4.0, 5.0, 4.0, 7.0, 9.0, 17.0, 8.0, 18.0, 19.0, 19.0, 25.0, 25.0, 32.0, 24.0, 27.0, 34.0, 39.0, 50.0, 34.0, 57.0, 52.0, 50.0, 51.0, 41.0, 44.0, 40.0, 24.0, 38.0, 25.0, 35.0, 23.0, 13.0, 24.0, 16.0, 8.0, 9.0, 7.0, 7.0, 9.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-795.8304443359375, -770.4745483398438, -745.1187133789062, -719.7628173828125, -694.406982421875, -669.0510864257812, -643.6952514648438, -618.33935546875, -592.9835205078125, -567.6276245117188, -542.2717895507812, -516.9158935546875, -491.56005859375, -466.2041931152344, -440.84832763671875, -415.492431640625, -390.1365661621094, -364.78070068359375, -339.4248352050781, -314.0689697265625, -288.7131042480469, -263.35723876953125, -238.00135803222656, -212.64549255371094, -187.2896270751953, -161.9337615966797, -136.57789611816406, -111.2220230102539, -85.86615753173828, -60.510292053222656, -35.1544189453125, -9.798553466796875, 15.55731201171875, 40.913177490234375, 66.26904296875, 91.62491607666016, 116.98078155517578, 142.33663940429688, 167.69252014160156, 193.0483856201172, 218.4042510986328, 243.76011657714844, 269.1159973144531, 294.47186279296875, 319.8277282714844, 345.18359375, 370.5394592285156, 395.89532470703125, 421.2511901855469, 446.6070556640625, 471.9629211425781, 497.31878662109375, 522.6746826171875, 548.030517578125, 573.3864135742188, 598.7422485351562, 624.09814453125, 649.4540405273438, 674.8098754882812, 700.165771484375, 725.5216064453125, 750.8775024414062, 776.2333374023438, 801.5892333984375, 826.945068359375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 9.0, 18.0, 19.0, 33.0, 37.0, 61.0, 109.0, 145.0, 217.0, 345.0, 543.0, 887.0, 1516.0, 2699.0, 5034.0, 9780.0, 19612.0, 41800.0, 93534.0, 237262.0, 357681.0, 152782.0, 64383.0, 29486.0, 14233.0, 7151.0, 3899.0, 2121.0, 1202.0, 706.0, 441.0, 258.0, 182.0, 124.0, 77.0, 69.0, 31.0, 19.0, 19.0, 9.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-104.8125, -101.4609375, -98.109375, -94.7578125, -91.40625, -88.0546875, -84.703125, -81.3515625, -78.0, -74.6484375, -71.296875, -67.9453125, -64.59375, -61.2421875, -57.890625, -54.5390625, -51.1875, -47.8359375, -44.484375, -41.1328125, -37.78125, -34.4296875, -31.078125, -27.7265625, -24.375, -21.0234375, -17.671875, -14.3203125, -10.96875, -7.6171875, -4.265625, -0.9140625, 2.4375, 5.7890625, 9.140625, 12.4921875, 15.84375, 19.1953125, 22.546875, 25.8984375, 29.25, 32.6015625, 35.953125, 39.3046875, 42.65625, 46.0078125, 49.359375, 52.7109375, 56.0625, 59.4140625, 62.765625, 66.1171875, 69.46875, 72.8203125, 76.171875, 79.5234375, 82.875, 86.2265625, 89.578125, 92.9296875, 96.28125, 99.6328125, 102.984375, 106.3359375, 109.6875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 9.0, 3.0, 15.0, 13.0, 21.0, 20.0, 23.0, 28.0, 46.0, 31.0, 48.0, 50.0, 54.0, 52.0, 57.0, 53.0, 54.0, 49.0, 49.0, 46.0, 47.0, 44.0, 39.0, 24.0, 23.0, 24.0, 17.0, 9.0, 13.0, 10.0, 10.0, 5.0, 9.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.25, -65.7763671875, -63.302734375, -60.8291015625, -58.35546875, -55.8818359375, -53.408203125, -50.9345703125, -48.4609375, -45.9873046875, -43.513671875, -41.0400390625, -38.56640625, -36.0927734375, -33.619140625, -31.1455078125, -28.671875, -26.1982421875, -23.724609375, -21.2509765625, -18.77734375, -16.3037109375, -13.830078125, -11.3564453125, -8.8828125, -6.4091796875, -3.935546875, -1.4619140625, 1.01171875, 3.4853515625, 5.958984375, 8.4326171875, 10.90625, 13.3798828125, 15.853515625, 18.3271484375, 20.80078125, 23.2744140625, 25.748046875, 28.2216796875, 30.6953125, 33.1689453125, 35.642578125, 38.1162109375, 40.58984375, 43.0634765625, 45.537109375, 48.0107421875, 50.484375, 52.9580078125, 55.431640625, 57.9052734375, 60.37890625, 62.8525390625, 65.326171875, 67.7998046875, 70.2734375, 72.7470703125, 75.220703125, 77.6943359375, 80.16796875, 82.6416015625, 85.115234375, 87.5888671875, 90.0625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 6.0, 13.0, 11.0, 28.0, 32.0, 40.0, 70.0, 109.0, 185.0, 284.0, 445.0, 871.0, 1825.0, 5308.0, 24887.0, 236698.0, 708712.0, 54884.0, 8888.0, 2598.0, 1095.0, 601.0, 344.0, 208.0, 134.0, 97.0, 64.0, 38.0, 20.0, 18.0, 11.0, 8.0, 5.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-331.0, -321.3203125, -311.640625, -301.9609375, -292.28125, -282.6015625, -272.921875, -263.2421875, -253.5625, -243.8828125, -234.203125, -224.5234375, -214.84375, -205.1640625, -195.484375, -185.8046875, -176.125, -166.4453125, -156.765625, -147.0859375, -137.40625, -127.7265625, -118.046875, -108.3671875, -98.6875, -89.0078125, -79.328125, -69.6484375, -59.96875, -50.2890625, -40.609375, -30.9296875, -21.25, -11.5703125, -1.890625, 7.7890625, 17.46875, 27.1484375, 36.828125, 46.5078125, 56.1875, 65.8671875, 75.546875, 85.2265625, 94.90625, 104.5859375, 114.265625, 123.9453125, 133.625, 143.3046875, 152.984375, 162.6640625, 172.34375, 182.0234375, 191.703125, 201.3828125, 211.0625, 220.7421875, 230.421875, 240.1015625, 249.78125, 259.4609375, 269.140625, 278.8203125, 288.5]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 9.0, 19.0, 25.0, 21.0, 37.0, 46.0, 45.0, 47.0, 68.0, 48.0, 68.0, 64.0, 60.0, 60.0, 69.0, 55.0, 41.0, 44.0, 39.0, 21.0, 24.0, 28.0, 17.0, 16.0, 10.0, 4.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-299.75, -287.78125, -275.8125, -263.84375, -251.875, -239.90625, -227.9375, -215.96875, -204.0, -192.03125, -180.0625, -168.09375, -156.125, -144.15625, -132.1875, -120.21875, -108.25, -96.28125, -84.3125, -72.34375, -60.375, -48.40625, -36.4375, -24.46875, -12.5, -0.53125, 11.4375, 23.40625, 35.375, 47.34375, 59.3125, 71.28125, 83.25, 95.21875, 107.1875, 119.15625, 131.125, 143.09375, 155.0625, 167.03125, 179.0, 190.96875, 202.9375, 214.90625, 226.875, 238.84375, 250.8125, 262.78125, 274.75, 286.71875, 298.6875, 310.65625, 322.625, 334.59375, 346.5625, 358.53125, 370.5, 382.46875, 394.4375, 406.40625, 418.375, 430.34375, 442.3125, 454.28125, 466.25]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 8.0, 6.0, 4.0, 8.0, 12.0, 21.0, 19.0, 29.0, 42.0, 73.0, 117.0, 181.0, 307.0, 489.0, 1037.0, 2349.0, 5822.0, 18135.0, 82304.0, 583264.0, 283092.0, 50661.0, 12485.0, 4330.0, 1777.0, 820.0, 444.0, 257.0, 148.0, 96.0, 59.0, 38.0, 23.0, 24.0, 21.0, 10.0, 8.0, 5.0, 10.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-63.3125, -61.38525390625, -59.4580078125, -57.53076171875, -55.603515625, -53.67626953125, -51.7490234375, -49.82177734375, -47.89453125, -45.96728515625, -44.0400390625, -42.11279296875, -40.185546875, -38.25830078125, -36.3310546875, -34.40380859375, -32.4765625, -30.54931640625, -28.6220703125, -26.69482421875, -24.767578125, -22.84033203125, -20.9130859375, -18.98583984375, -17.05859375, -15.13134765625, -13.2041015625, -11.27685546875, -9.349609375, -7.42236328125, -5.4951171875, -3.56787109375, -1.640625, 0.28662109375, 2.2138671875, 4.14111328125, 6.068359375, 7.99560546875, 9.9228515625, 11.85009765625, 13.77734375, 15.70458984375, 17.6318359375, 19.55908203125, 21.486328125, 23.41357421875, 25.3408203125, 27.26806640625, 29.1953125, 31.12255859375, 33.0498046875, 34.97705078125, 36.904296875, 38.83154296875, 40.7587890625, 42.68603515625, 44.61328125, 46.54052734375, 48.4677734375, 50.39501953125, 52.322265625, 54.24951171875, 56.1767578125, 58.10400390625, 60.03125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 3.0, 6.0, 8.0, 8.0, 9.0, 17.0, 34.0, 37.0, 52.0, 74.0, 96.0, 116.0, 142.0, 109.0, 72.0, 66.0, 54.0, 24.0, 19.0, 12.0, 9.0, 5.0, 9.0, 4.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.0390625, -0.038178443908691406, -0.03729438781738281, -0.03641033172607422, -0.035526275634765625, -0.03464221954345703, -0.03375816345214844, -0.032874107360839844, -0.03199005126953125, -0.031105995178222656, -0.030221939086914062, -0.02933788299560547, -0.028453826904296875, -0.02756977081298828, -0.026685714721679688, -0.025801658630371094, -0.0249176025390625, -0.024033546447753906, -0.023149490356445312, -0.02226543426513672, -0.021381378173828125, -0.02049732208251953, -0.019613265991210938, -0.018729209899902344, -0.01784515380859375, -0.016961097717285156, -0.016077041625976562, -0.015192985534667969, -0.014308929443359375, -0.013424873352050781, -0.012540817260742188, -0.011656761169433594, -0.010772705078125, -0.009888648986816406, -0.009004592895507812, -0.008120536804199219, -0.007236480712890625, -0.006352424621582031, -0.0054683685302734375, -0.004584312438964844, -0.00370025634765625, -0.0028162002563476562, -0.0019321441650390625, -0.0010480880737304688, -0.000164031982421875, 0.0007200241088867188, 0.0016040802001953125, 0.0024881362915039062, 0.0033721923828125, 0.004256248474121094, 0.0051403045654296875, 0.006024360656738281, 0.006908416748046875, 0.007792472839355469, 0.008676528930664062, 0.009560585021972656, 0.01044464111328125, 0.011328697204589844, 0.012212753295898438, 0.013096809387207031, 0.013980865478515625, 0.014864921569824219, 0.015748977661132812, 0.016633033752441406, 0.01751708984375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 6.0, 12.0, 16.0, 16.0, 41.0, 76.0, 188.0, 471.0, 1364.0, 6576.0, 119533.0, 881243.0, 34024.0, 3517.0, 890.0, 294.0, 148.0, 59.0, 26.0, 20.0, 14.0, 14.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.625, -96.48828125, -92.3515625, -88.21484375, -84.078125, -79.94140625, -75.8046875, -71.66796875, -67.53125, -63.39453125, -59.2578125, -55.12109375, -50.984375, -46.84765625, -42.7109375, -38.57421875, -34.4375, -30.30078125, -26.1640625, -22.02734375, -17.890625, -13.75390625, -9.6171875, -5.48046875, -1.34375, 2.79296875, 6.9296875, 11.06640625, 15.203125, 19.33984375, 23.4765625, 27.61328125, 31.75, 35.88671875, 40.0234375, 44.16015625, 48.296875, 52.43359375, 56.5703125, 60.70703125, 64.84375, 68.98046875, 73.1171875, 77.25390625, 81.390625, 85.52734375, 89.6640625, 93.80078125, 97.9375, 102.07421875, 106.2109375, 110.34765625, 114.484375, 118.62109375, 122.7578125, 126.89453125, 131.03125, 135.16796875, 139.3046875, 143.44140625, 147.578125, 151.71484375, 155.8515625, 159.98828125, 164.125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 8.0, 14.0, 17.0, 22.0, 31.0, 27.0, 46.0, 45.0, 52.0, 48.0, 66.0, 77.0, 75.0, 74.0, 64.0, 57.0, 57.0, 40.0, 42.0, 41.0, 28.0, 15.0, 15.0, 9.0, 7.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.1875, -58.33935546875, -56.4912109375, -54.64306640625, -52.794921875, -50.94677734375, -49.0986328125, -47.25048828125, -45.40234375, -43.55419921875, -41.7060546875, -39.85791015625, -38.009765625, -36.16162109375, -34.3134765625, -32.46533203125, -30.6171875, -28.76904296875, -26.9208984375, -25.07275390625, -23.224609375, -21.37646484375, -19.5283203125, -17.68017578125, -15.83203125, -13.98388671875, -12.1357421875, -10.28759765625, -8.439453125, -6.59130859375, -4.7431640625, -2.89501953125, -1.046875, 0.80126953125, 2.6494140625, 4.49755859375, 6.345703125, 8.19384765625, 10.0419921875, 11.89013671875, 13.73828125, 15.58642578125, 17.4345703125, 19.28271484375, 21.130859375, 22.97900390625, 24.8271484375, 26.67529296875, 28.5234375, 30.37158203125, 32.2197265625, 34.06787109375, 35.916015625, 37.76416015625, 39.6123046875, 41.46044921875, 43.30859375, 45.15673828125, 47.0048828125, 48.85302734375, 50.701171875, 52.54931640625, 54.3974609375, 56.24560546875, 58.09375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 8.0, 29.0, 58.0, 157.0, 324.0, 244.0, 95.0, 50.0, 14.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2960.052978515625, -2874.81982421875, -2789.586669921875, -2704.353515625, -2619.120361328125, -2533.88720703125, -2448.654052734375, -2363.4208984375, -2278.187744140625, -2192.95458984375, -2107.721435546875, -2022.48828125, -1937.255126953125, -1852.02197265625, -1766.788818359375, -1681.5556640625, -1596.322509765625, -1511.08935546875, -1425.856201171875, -1340.623046875, -1255.389892578125, -1170.15673828125, -1084.923583984375, -999.6904296875, -914.457275390625, -829.22412109375, -743.990966796875, -658.7578125, -573.524658203125, -488.29150390625, -403.058349609375, -317.8251953125, -232.592041015625, -147.35888671875, -62.125732421875, 23.107421875, 108.340576171875, 193.57373046875, 278.806884765625, 364.0400390625, 449.273193359375, 534.50634765625, 619.739501953125, 704.97265625, 790.205810546875, 875.43896484375, 960.672119140625, 1045.9052734375, 1131.138427734375, 1216.37158203125, 1301.604736328125, 1386.837890625, 1472.071044921875, 1557.30419921875, 1642.537353515625, 1727.7705078125, 1813.003662109375, 1898.23681640625, 1983.469970703125, 2068.703125, 2153.936279296875, 2239.16943359375, 2324.402587890625, 2409.6357421875, 2494.868896484375]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 5.0, 6.0, 12.0, 9.0, 13.0, 12.0, 14.0, 12.0, 14.0, 14.0, 26.0, 32.0, 32.0, 38.0, 30.0, 33.0, 47.0, 51.0, 57.0, 82.0, 61.0, 47.0, 39.0, 29.0, 30.0, 23.0, 33.0, 22.0, 35.0, 21.0, 21.0, 15.0, 9.0, 13.0, 14.0, 9.0, 7.0, 5.0, 5.0, 7.0, 1.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1181.378662109375, -1148.8143310546875, -1116.25, -1083.685791015625, -1051.1214599609375, -1018.55712890625, -985.9927978515625, -953.428466796875, -920.8641967773438, -888.2998657226562, -855.735595703125, -823.1712646484375, -790.60693359375, -758.0426635742188, -725.4783325195312, -692.9140625, -660.3497314453125, -627.785400390625, -595.2211303710938, -562.6567993164062, -530.092529296875, -497.5281982421875, -464.9638671875, -432.3995666503906, -399.83526611328125, -367.2709655761719, -334.7066650390625, -302.142333984375, -269.5780334472656, -237.01373291015625, -204.4494171142578, -171.88510131835938, -139.32086181640625, -106.75655364990234, -74.19224548339844, -41.62793731689453, -9.063629150390625, 23.50067138671875, 56.06498718261719, 88.62930297851562, 121.193603515625, 153.75790405273438, 186.3222198486328, 218.88653564453125, 251.45083618164062, 284.01513671875, 316.5794677734375, 349.1437683105469, 381.70806884765625, 414.2723693847656, 446.836669921875, 479.4010009765625, 511.9653015136719, 544.5296020507812, 577.0939331054688, 609.658203125, 642.2225341796875, 674.786865234375, 707.3511352539062, 739.9154663085938, 772.479736328125, 805.0440673828125, 837.6083984375, 870.1727294921875, 902.7369995117188]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 11.0, 9.0, 22.0, 33.0, 46.0, 60.0, 78.0, 146.0, 228.0, 406.0, 697.0, 1339.0, 2702.0, 6160.0, 16755.0, 69253.0, 536323.0, 2578308.0, 847198.0, 98720.0, 21584.0, 7502.0, 3215.0, 1529.0, 789.0, 438.0, 244.0, 149.0, 83.0, 77.0, 44.0, 32.0, 25.0, 18.0, 15.0, 7.0, 5.0, 6.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.5625, -97.380859375, -94.19921875, -91.017578125, -87.8359375, -84.654296875, -81.47265625, -78.291015625, -75.109375, -71.927734375, -68.74609375, -65.564453125, -62.3828125, -59.201171875, -56.01953125, -52.837890625, -49.65625, -46.474609375, -43.29296875, -40.111328125, -36.9296875, -33.748046875, -30.56640625, -27.384765625, -24.203125, -21.021484375, -17.83984375, -14.658203125, -11.4765625, -8.294921875, -5.11328125, -1.931640625, 1.25, 4.431640625, 7.61328125, 10.794921875, 13.9765625, 17.158203125, 20.33984375, 23.521484375, 26.703125, 29.884765625, 33.06640625, 36.248046875, 39.4296875, 42.611328125, 45.79296875, 48.974609375, 52.15625, 55.337890625, 58.51953125, 61.701171875, 64.8828125, 68.064453125, 71.24609375, 74.427734375, 77.609375, 80.791015625, 83.97265625, 87.154296875, 90.3359375, 93.517578125, 96.69921875, 99.880859375, 103.0625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 7.0, 6.0, 8.0, 14.0, 16.0, 18.0, 26.0, 29.0, 35.0, 28.0, 30.0, 40.0, 30.0, 35.0, 44.0, 50.0, 42.0, 57.0, 52.0, 36.0, 46.0, 41.0, 35.0, 35.0, 29.0, 32.0, 34.0, 23.0, 21.0, 21.0, 12.0, 16.0, 10.0, 7.0, 4.0, 11.0, 9.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.90625, -61.87841796875, -59.8505859375, -57.82275390625, -55.794921875, -53.76708984375, -51.7392578125, -49.71142578125, -47.68359375, -45.65576171875, -43.6279296875, -41.60009765625, -39.572265625, -37.54443359375, -35.5166015625, -33.48876953125, -31.4609375, -29.43310546875, -27.4052734375, -25.37744140625, -23.349609375, -21.32177734375, -19.2939453125, -17.26611328125, -15.23828125, -13.21044921875, -11.1826171875, -9.15478515625, -7.126953125, -5.09912109375, -3.0712890625, -1.04345703125, 0.984375, 3.01220703125, 5.0400390625, 7.06787109375, 9.095703125, 11.12353515625, 13.1513671875, 15.17919921875, 17.20703125, 19.23486328125, 21.2626953125, 23.29052734375, 25.318359375, 27.34619140625, 29.3740234375, 31.40185546875, 33.4296875, 35.45751953125, 37.4853515625, 39.51318359375, 41.541015625, 43.56884765625, 45.5966796875, 47.62451171875, 49.65234375, 51.68017578125, 53.7080078125, 55.73583984375, 57.763671875, 59.79150390625, 61.8193359375, 63.84716796875, 65.875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 7.0, 17.0, 24.0, 27.0, 53.0, 78.0, 114.0, 220.0, 532.0, 1393.0, 4674.0, 22882.0, 278022.0, 3724162.0, 140391.0, 16005.0, 3623.0, 1148.0, 460.0, 181.0, 108.0, 47.0, 37.0, 18.0, 13.0, 7.0, 9.0, 6.0, 7.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-275.0, -267.23046875, -259.4609375, -251.69140625, -243.921875, -236.15234375, -228.3828125, -220.61328125, -212.84375, -205.07421875, -197.3046875, -189.53515625, -181.765625, -173.99609375, -166.2265625, -158.45703125, -150.6875, -142.91796875, -135.1484375, -127.37890625, -119.609375, -111.83984375, -104.0703125, -96.30078125, -88.53125, -80.76171875, -72.9921875, -65.22265625, -57.453125, -49.68359375, -41.9140625, -34.14453125, -26.375, -18.60546875, -10.8359375, -3.06640625, 4.703125, 12.47265625, 20.2421875, 28.01171875, 35.78125, 43.55078125, 51.3203125, 59.08984375, 66.859375, 74.62890625, 82.3984375, 90.16796875, 97.9375, 105.70703125, 113.4765625, 121.24609375, 129.015625, 136.78515625, 144.5546875, 152.32421875, 160.09375, 167.86328125, 175.6328125, 183.40234375, 191.171875, 198.94140625, 206.7109375, 214.48046875, 222.25]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 7.0, 13.0, 16.0, 13.0, 17.0, 28.0, 36.0, 49.0, 82.0, 136.0, 217.0, 428.0, 651.0, 800.0, 598.0, 369.0, 189.0, 129.0, 70.0, 60.0, 35.0, 22.0, 22.0, 13.0, 12.0, 11.0, 11.0, 14.0, 3.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-208.625, -203.05078125, -197.4765625, -191.90234375, -186.328125, -180.75390625, -175.1796875, -169.60546875, -164.03125, -158.45703125, -152.8828125, -147.30859375, -141.734375, -136.16015625, -130.5859375, -125.01171875, -119.4375, -113.86328125, -108.2890625, -102.71484375, -97.140625, -91.56640625, -85.9921875, -80.41796875, -74.84375, -69.26953125, -63.6953125, -58.12109375, -52.546875, -46.97265625, -41.3984375, -35.82421875, -30.25, -24.67578125, -19.1015625, -13.52734375, -7.953125, -2.37890625, 3.1953125, 8.76953125, 14.34375, 19.91796875, 25.4921875, 31.06640625, 36.640625, 42.21484375, 47.7890625, 53.36328125, 58.9375, 64.51171875, 70.0859375, 75.66015625, 81.234375, 86.80859375, 92.3828125, 97.95703125, 103.53125, 109.10546875, 114.6796875, 120.25390625, 125.828125, 131.40234375, 136.9765625, 142.55078125, 148.125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 6.0, 4.0, 5.0, 14.0, 33.0, 62.0, 166.0, 259.0, 198.0, 133.0, 55.0, 26.0, 20.0, 8.0, 1.0, 1.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1606.7406005859375, -1539.2440185546875, -1471.74755859375, -1404.2509765625, -1336.75439453125, -1269.2578125, -1201.7613525390625, -1134.2647705078125, -1066.768310546875, -999.2717895507812, -931.7752075195312, -864.2786865234375, -796.7821044921875, -729.2855834960938, -661.7890625, -594.29248046875, -526.7958984375, -459.2993469238281, -391.80279541015625, -324.3062744140625, -256.8097229003906, -189.31317138671875, -121.816650390625, -54.320098876953125, 13.17645263671875, 80.6729965209961, 148.16954040527344, 215.66607666015625, 283.1626281738281, 350.6591796875, 418.15570068359375, 485.6522521972656, 553.148681640625, 620.6452026367188, 688.1417846679688, 755.6383056640625, 823.1348876953125, 890.6314086914062, 958.1279296875, 1025.62451171875, 1093.12109375, 1160.61767578125, 1228.1141357421875, 1295.6107177734375, 1363.1072998046875, 1430.603759765625, 1498.100341796875, 1565.596923828125, 1633.0933837890625, 1700.5899658203125, 1768.08642578125, 1835.5830078125, 1903.07958984375, 1970.576171875, 2038.0726318359375, 2105.569091796875, 2173.065673828125, 2240.562255859375, 2308.058837890625, 2375.55517578125, 2443.0517578125, 2510.54833984375, 2578.044921875, 2645.54150390625, 2713.0380859375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 14.0, 10.0, 16.0, 15.0, 18.0, 23.0, 23.0, 26.0, 35.0, 33.0, 29.0, 50.0, 36.0, 50.0, 46.0, 44.0, 55.0, 51.0, 52.0, 47.0, 49.0, 35.0, 39.0, 29.0, 33.0, 21.0, 23.0, 16.0, 18.0, 12.0, 13.0, 11.0, 5.0, 3.0, 8.0, 1.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-986.668701171875, -959.8295288085938, -932.9903564453125, -906.1511840820312, -879.31201171875, -852.472900390625, -825.6337280273438, -798.7945556640625, -771.9553833007812, -745.1162109375, -718.2770385742188, -691.4378662109375, -664.5987548828125, -637.759521484375, -610.92041015625, -584.0812377929688, -557.2420654296875, -530.4028930664062, -503.563720703125, -476.7245788574219, -449.8854064941406, -423.0462341308594, -396.20709228515625, -369.367919921875, -342.52874755859375, -315.6895751953125, -288.85040283203125, -262.0112609863281, -235.17208862304688, -208.33291625976562, -181.49375915527344, -154.65460205078125, -127.81549072265625, -100.97632598876953, -74.13716125488281, -47.297996520996094, -20.458831787109375, 6.380340576171875, 33.21949768066406, 60.05865478515625, 86.8978271484375, 113.73699188232422, 140.57615661621094, 167.41531372070312, 194.25448608398438, 221.09365844726562, 247.9328155517578, 274.77197265625, 301.61114501953125, 328.4503173828125, 355.28948974609375, 382.1286315917969, 408.9678039550781, 435.8069763183594, 462.6461181640625, 489.48529052734375, 516.324462890625, 543.1636352539062, 570.0028076171875, 596.8419799804688, 623.68115234375, 650.520263671875, 677.3594360351562, 704.1986083984375, 731.0377807617188]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 11.0, 15.0, 23.0, 39.0, 36.0, 92.0, 131.0, 232.0, 414.0, 704.0, 1363.0, 2469.0, 5103.0, 10753.0, 24717.0, 61592.0, 163224.0, 352961.0, 256356.0, 99008.0, 38369.0, 16187.0, 7175.0, 3538.0, 1733.0, 981.0, 539.0, 314.0, 170.0, 112.0, 83.0, 47.0, 23.0, 10.0, 14.0, 7.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-68.4375, -65.779296875, -63.12109375, -60.462890625, -57.8046875, -55.146484375, -52.48828125, -49.830078125, -47.171875, -44.513671875, -41.85546875, -39.197265625, -36.5390625, -33.880859375, -31.22265625, -28.564453125, -25.90625, -23.248046875, -20.58984375, -17.931640625, -15.2734375, -12.615234375, -9.95703125, -7.298828125, -4.640625, -1.982421875, 0.67578125, 3.333984375, 5.9921875, 8.650390625, 11.30859375, 13.966796875, 16.625, 19.283203125, 21.94140625, 24.599609375, 27.2578125, 29.916015625, 32.57421875, 35.232421875, 37.890625, 40.548828125, 43.20703125, 45.865234375, 48.5234375, 51.181640625, 53.83984375, 56.498046875, 59.15625, 61.814453125, 64.47265625, 67.130859375, 69.7890625, 72.447265625, 75.10546875, 77.763671875, 80.421875, 83.080078125, 85.73828125, 88.396484375, 91.0546875, 93.712890625, 96.37109375, 99.029296875, 101.6875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 5.0, 7.0, 7.0, 10.0, 17.0, 19.0, 27.0, 17.0, 27.0, 31.0, 30.0, 35.0, 35.0, 43.0, 46.0, 53.0, 43.0, 62.0, 47.0, 47.0, 49.0, 44.0, 38.0, 30.0, 38.0, 23.0, 27.0, 19.0, 25.0, 16.0, 14.0, 18.0, 12.0, 11.0, 7.0, 5.0, 6.0, 2.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.125, -71.9541015625, -69.783203125, -67.6123046875, -65.44140625, -63.2705078125, -61.099609375, -58.9287109375, -56.7578125, -54.5869140625, -52.416015625, -50.2451171875, -48.07421875, -45.9033203125, -43.732421875, -41.5615234375, -39.390625, -37.2197265625, -35.048828125, -32.8779296875, -30.70703125, -28.5361328125, -26.365234375, -24.1943359375, -22.0234375, -19.8525390625, -17.681640625, -15.5107421875, -13.33984375, -11.1689453125, -8.998046875, -6.8271484375, -4.65625, -2.4853515625, -0.314453125, 1.8564453125, 4.02734375, 6.1982421875, 8.369140625, 10.5400390625, 12.7109375, 14.8818359375, 17.052734375, 19.2236328125, 21.39453125, 23.5654296875, 25.736328125, 27.9072265625, 30.078125, 32.2490234375, 34.419921875, 36.5908203125, 38.76171875, 40.9326171875, 43.103515625, 45.2744140625, 47.4453125, 49.6162109375, 51.787109375, 53.9580078125, 56.12890625, 58.2998046875, 60.470703125, 62.6416015625, 64.8125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 3.0, 8.0, 12.0, 24.0, 38.0, 65.0, 155.0, 481.0, 1544.0, 9270.0, 166689.0, 834431.0, 31023.0, 3473.0, 835.0, 281.0, 94.0, 64.0, 27.0, 13.0, 14.0, 8.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-267.25, -256.2265625, -245.203125, -234.1796875, -223.15625, -212.1328125, -201.109375, -190.0859375, -179.0625, -168.0390625, -157.015625, -145.9921875, -134.96875, -123.9453125, -112.921875, -101.8984375, -90.875, -79.8515625, -68.828125, -57.8046875, -46.78125, -35.7578125, -24.734375, -13.7109375, -2.6875, 8.3359375, 19.359375, 30.3828125, 41.40625, 52.4296875, 63.453125, 74.4765625, 85.5, 96.5234375, 107.546875, 118.5703125, 129.59375, 140.6171875, 151.640625, 162.6640625, 173.6875, 184.7109375, 195.734375, 206.7578125, 217.78125, 228.8046875, 239.828125, 250.8515625, 261.875, 272.8984375, 283.921875, 294.9453125, 305.96875, 316.9921875, 328.015625, 339.0390625, 350.0625, 361.0859375, 372.109375, 383.1328125, 394.15625, 405.1796875, 416.203125, 427.2265625, 438.25]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 11.0, 9.0, 23.0, 21.0, 44.0, 59.0, 72.0, 73.0, 80.0, 88.0, 80.0, 87.0, 60.0, 60.0, 48.0, 42.0, 40.0, 41.0, 17.0, 14.0, 6.0, 11.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-467.0, -454.046875, -441.09375, -428.140625, -415.1875, -402.234375, -389.28125, -376.328125, -363.375, -350.421875, -337.46875, -324.515625, -311.5625, -298.609375, -285.65625, -272.703125, -259.75, -246.796875, -233.84375, -220.890625, -207.9375, -194.984375, -182.03125, -169.078125, -156.125, -143.171875, -130.21875, -117.265625, -104.3125, -91.359375, -78.40625, -65.453125, -52.5, -39.546875, -26.59375, -13.640625, -0.6875, 12.265625, 25.21875, 38.171875, 51.125, 64.078125, 77.03125, 89.984375, 102.9375, 115.890625, 128.84375, 141.796875, 154.75, 167.703125, 180.65625, 193.609375, 206.5625, 219.515625, 232.46875, 245.421875, 258.375, 271.328125, 284.28125, 297.234375, 310.1875, 323.140625, 336.09375, 349.046875, 362.0]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 8.0, 17.0, 18.0, 35.0, 70.0, 106.0, 229.0, 414.0, 907.0, 2309.0, 6156.0, 21591.0, 96446.0, 596482.0, 253661.0, 50463.0, 12662.0, 4040.0, 1513.0, 692.0, 326.0, 173.0, 77.0, 54.0, 25.0, 27.0, 18.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.125, -45.5947265625, -44.064453125, -42.5341796875, -41.00390625, -39.4736328125, -37.943359375, -36.4130859375, -34.8828125, -33.3525390625, -31.822265625, -30.2919921875, -28.76171875, -27.2314453125, -25.701171875, -24.1708984375, -22.640625, -21.1103515625, -19.580078125, -18.0498046875, -16.51953125, -14.9892578125, -13.458984375, -11.9287109375, -10.3984375, -8.8681640625, -7.337890625, -5.8076171875, -4.27734375, -2.7470703125, -1.216796875, 0.3134765625, 1.84375, 3.3740234375, 4.904296875, 6.4345703125, 7.96484375, 9.4951171875, 11.025390625, 12.5556640625, 14.0859375, 15.6162109375, 17.146484375, 18.6767578125, 20.20703125, 21.7373046875, 23.267578125, 24.7978515625, 26.328125, 27.8583984375, 29.388671875, 30.9189453125, 32.44921875, 33.9794921875, 35.509765625, 37.0400390625, 38.5703125, 40.1005859375, 41.630859375, 43.1611328125, 44.69140625, 46.2216796875, 47.751953125, 49.2822265625, 50.8125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 3.0, 8.0, 11.0, 10.0, 17.0, 36.0, 29.0, 46.0, 67.0, 90.0, 115.0, 109.0, 92.0, 81.0, 75.0, 59.0, 36.0, 30.0, 23.0, 19.0, 12.0, 12.0, 7.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0142059326171875, -0.013648748397827148, -0.013091564178466797, -0.012534379959106445, -0.011977195739746094, -0.011420011520385742, -0.01086282730102539, -0.010305643081665039, -0.009748458862304688, -0.009191274642944336, -0.008634090423583984, -0.008076906204223633, -0.007519721984863281, -0.00696253776550293, -0.006405353546142578, -0.0058481693267822266, -0.005290985107421875, -0.0047338008880615234, -0.004176616668701172, -0.0036194324493408203, -0.0030622482299804688, -0.002505064010620117, -0.0019478797912597656, -0.001390695571899414, -0.0008335113525390625, -0.00027632713317871094, 0.0002808570861816406, 0.0008380413055419922, 0.0013952255249023438, 0.0019524097442626953, 0.002509593963623047, 0.0030667781829833984, 0.00362396240234375, 0.0041811466217041016, 0.004738330841064453, 0.005295515060424805, 0.005852699279785156, 0.006409883499145508, 0.006967067718505859, 0.007524251937866211, 0.008081436157226562, 0.008638620376586914, 0.009195804595947266, 0.009752988815307617, 0.010310173034667969, 0.01086735725402832, 0.011424541473388672, 0.011981725692749023, 0.012538909912109375, 0.013096094131469727, 0.013653278350830078, 0.01421046257019043, 0.014767646789550781, 0.015324831008911133, 0.015882015228271484, 0.016439199447631836, 0.016996383666992188, 0.01755356788635254, 0.01811075210571289, 0.018667936325073242, 0.019225120544433594, 0.019782304763793945, 0.020339488983154297, 0.02089667320251465, 0.021453857421875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 6.0, 4.0, 3.0, 7.0, 19.0, 13.0, 25.0, 30.0, 50.0, 96.0, 172.0, 307.0, 710.0, 1808.0, 5350.0, 18402.0, 85722.0, 576002.0, 285429.0, 55109.0, 12882.0, 3807.0, 1420.0, 584.0, 253.0, 117.0, 64.0, 48.0, 39.0, 29.0, 10.0, 9.0, 9.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-54.0, -52.4052734375, -50.810546875, -49.2158203125, -47.62109375, -46.0263671875, -44.431640625, -42.8369140625, -41.2421875, -39.6474609375, -38.052734375, -36.4580078125, -34.86328125, -33.2685546875, -31.673828125, -30.0791015625, -28.484375, -26.8896484375, -25.294921875, -23.7001953125, -22.10546875, -20.5107421875, -18.916015625, -17.3212890625, -15.7265625, -14.1318359375, -12.537109375, -10.9423828125, -9.34765625, -7.7529296875, -6.158203125, -4.5634765625, -2.96875, -1.3740234375, 0.220703125, 1.8154296875, 3.41015625, 5.0048828125, 6.599609375, 8.1943359375, 9.7890625, 11.3837890625, 12.978515625, 14.5732421875, 16.16796875, 17.7626953125, 19.357421875, 20.9521484375, 22.546875, 24.1416015625, 25.736328125, 27.3310546875, 28.92578125, 30.5205078125, 32.115234375, 33.7099609375, 35.3046875, 36.8994140625, 38.494140625, 40.0888671875, 41.68359375, 43.2783203125, 44.873046875, 46.4677734375, 48.0625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 9.0, 12.0, 11.0, 19.0, 13.0, 29.0, 33.0, 43.0, 44.0, 43.0, 51.0, 73.0, 89.0, 67.0, 58.0, 67.0, 61.0, 58.0, 42.0, 40.0, 28.0, 29.0, 11.0, 15.0, 11.0, 8.0, 7.0, 8.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-47.625, -46.1416015625, -44.658203125, -43.1748046875, -41.69140625, -40.2080078125, -38.724609375, -37.2412109375, -35.7578125, -34.2744140625, -32.791015625, -31.3076171875, -29.82421875, -28.3408203125, -26.857421875, -25.3740234375, -23.890625, -22.4072265625, -20.923828125, -19.4404296875, -17.95703125, -16.4736328125, -14.990234375, -13.5068359375, -12.0234375, -10.5400390625, -9.056640625, -7.5732421875, -6.08984375, -4.6064453125, -3.123046875, -1.6396484375, -0.15625, 1.3271484375, 2.810546875, 4.2939453125, 5.77734375, 7.2607421875, 8.744140625, 10.2275390625, 11.7109375, 13.1943359375, 14.677734375, 16.1611328125, 17.64453125, 19.1279296875, 20.611328125, 22.0947265625, 23.578125, 25.0615234375, 26.544921875, 28.0283203125, 29.51171875, 30.9951171875, 32.478515625, 33.9619140625, 35.4453125, 36.9287109375, 38.412109375, 39.8955078125, 41.37890625, 42.8623046875, 44.345703125, 45.8291015625, 47.3125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 9.0, 19.0, 43.0, 70.0, 113.0, 199.0, 238.0, 120.0, 82.0, 40.0, 20.0, 15.0, 11.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1245.5618896484375, -1204.123779296875, -1162.6856689453125, -1121.24755859375, -1079.8094482421875, -1038.371337890625, -996.9331665039062, -955.4950561523438, -914.0569458007812, -872.6188354492188, -831.1807250976562, -789.7426147460938, -748.304443359375, -706.8663330078125, -665.42822265625, -623.9901123046875, -582.552001953125, -541.1138916015625, -499.67578125, -458.2376403808594, -416.7995300292969, -375.3614196777344, -333.92327880859375, -292.48516845703125, -251.04705810546875, -209.60894775390625, -168.1708221435547, -126.73270416259766, -85.29458618164062, -43.856475830078125, -2.4183502197265625, 39.019775390625, 80.457763671875, 121.89588165283203, 163.33399963378906, 204.77212524414062, 246.21023559570312, 287.6483459472656, 329.08648681640625, 370.52459716796875, 411.96270751953125, 453.40081787109375, 494.83892822265625, 536.2770385742188, 577.7152099609375, 619.1533203125, 660.5914306640625, 702.029541015625, 743.4676513671875, 784.90576171875, 826.3438720703125, 867.781982421875, 909.2200927734375, 950.658203125, 992.0963745117188, 1033.534423828125, 1074.97265625, 1116.4107666015625, 1157.848876953125, 1199.2869873046875, 1240.72509765625, 1282.1632080078125, 1323.601318359375, 1365.03955078125, 1406.4775390625]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 7.0, 15.0, 9.0, 8.0, 6.0, 16.0, 22.0, 15.0, 29.0, 27.0, 28.0, 33.0, 32.0, 32.0, 52.0, 66.0, 94.0, 76.0, 69.0, 56.0, 41.0, 35.0, 31.0, 16.0, 26.0, 26.0, 27.0, 23.0, 12.0, 9.0, 19.0, 7.0, 11.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1107.3682861328125, -1075.04150390625, -1042.7147216796875, -1010.3878784179688, -978.0610961914062, -945.7343139648438, -913.407470703125, -881.0806884765625, -848.75390625, -816.4271240234375, -784.100341796875, -751.7734985351562, -719.4467163085938, -687.1199340820312, -654.7930908203125, -622.46630859375, -590.1395263671875, -557.812744140625, -525.4859619140625, -493.15911865234375, -460.83233642578125, -428.50555419921875, -396.1787414550781, -363.8519287109375, -331.525146484375, -299.1983642578125, -266.8715515136719, -234.5447540283203, -202.21795654296875, -169.8911590576172, -137.56436157226562, -105.23756408691406, -72.9107666015625, -40.58396911621094, -8.257171630859375, 24.069625854492188, 56.39642333984375, 88.72322082519531, 121.05001831054688, 153.37681579589844, 185.70361328125, 218.03041076660156, 250.35720825195312, 282.68402099609375, 315.01080322265625, 347.33758544921875, 379.6643981933594, 411.9912109375, 444.3179931640625, 476.644775390625, 508.9715881347656, 541.2984008789062, 573.6251831054688, 605.9519653320312, 638.27880859375, 670.6055908203125, 702.932373046875, 735.2591552734375, 767.5859375, 799.9127807617188, 832.2395629882812, 864.5663452148438, 896.8931884765625, 929.219970703125, 961.5467529296875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 3.0, 8.0, 16.0, 13.0, 23.0, 24.0, 27.0, 34.0, 51.0, 83.0, 243.0, 818.0, 3523.0, 28514.0, 1314904.0, 2782705.0, 55767.0, 5619.0, 1155.0, 365.0, 123.0, 81.0, 35.0, 35.0, 28.0, 18.0, 16.0, 6.0, 14.0, 5.0, 7.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-243.0, -236.625, -230.25, -223.875, -217.5, -211.125, -204.75, -198.375, -192.0, -185.625, -179.25, -172.875, -166.5, -160.125, -153.75, -147.375, -141.0, -134.625, -128.25, -121.875, -115.5, -109.125, -102.75, -96.375, -90.0, -83.625, -77.25, -70.875, -64.5, -58.125, -51.75, -45.375, -39.0, -32.625, -26.25, -19.875, -13.5, -7.125, -0.75, 5.625, 12.0, 18.375, 24.75, 31.125, 37.5, 43.875, 50.25, 56.625, 63.0, 69.375, 75.75, 82.125, 88.5, 94.875, 101.25, 107.625, 114.0, 120.375, 126.75, 133.125, 139.5, 145.875, 152.25, 158.625, 165.0]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 11.0, 4.0, 9.0, 12.0, 18.0, 13.0, 25.0, 29.0, 29.0, 29.0, 44.0, 39.0, 44.0, 55.0, 59.0, 61.0, 48.0, 44.0, 61.0, 45.0, 40.0, 47.0, 38.0, 43.0, 37.0, 24.0, 20.0, 19.0, 15.0, 8.0, 9.0, 7.0, 5.0, 5.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-90.875, -88.3798828125, -85.884765625, -83.3896484375, -80.89453125, -78.3994140625, -75.904296875, -73.4091796875, -70.9140625, -68.4189453125, -65.923828125, -63.4287109375, -60.93359375, -58.4384765625, -55.943359375, -53.4482421875, -50.953125, -48.4580078125, -45.962890625, -43.4677734375, -40.97265625, -38.4775390625, -35.982421875, -33.4873046875, -30.9921875, -28.4970703125, -26.001953125, -23.5068359375, -21.01171875, -18.5166015625, -16.021484375, -13.5263671875, -11.03125, -8.5361328125, -6.041015625, -3.5458984375, -1.05078125, 1.4443359375, 3.939453125, 6.4345703125, 8.9296875, 11.4248046875, 13.919921875, 16.4150390625, 18.91015625, 21.4052734375, 23.900390625, 26.3955078125, 28.890625, 31.3857421875, 33.880859375, 36.3759765625, 38.87109375, 41.3662109375, 43.861328125, 46.3564453125, 48.8515625, 51.3466796875, 53.841796875, 56.3369140625, 58.83203125, 61.3271484375, 63.822265625, 66.3173828125, 68.8125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 6.0, 4.0, 13.0, 16.0, 33.0, 58.0, 111.0, 298.0, 1074.0, 8215.0, 318352.0, 3833625.0, 29207.0, 2361.0, 525.0, 198.0, 84.0, 30.0, 20.0, 20.0, 7.0, 5.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-207.875, -196.470703125, -185.06640625, -173.662109375, -162.2578125, -150.853515625, -139.44921875, -128.044921875, -116.640625, -105.236328125, -93.83203125, -82.427734375, -71.0234375, -59.619140625, -48.21484375, -36.810546875, -25.40625, -14.001953125, -2.59765625, 8.806640625, 20.2109375, 31.615234375, 43.01953125, 54.423828125, 65.828125, 77.232421875, 88.63671875, 100.041015625, 111.4453125, 122.849609375, 134.25390625, 145.658203125, 157.0625, 168.466796875, 179.87109375, 191.275390625, 202.6796875, 214.083984375, 225.48828125, 236.892578125, 248.296875, 259.701171875, 271.10546875, 282.509765625, 293.9140625, 305.318359375, 316.72265625, 328.126953125, 339.53125, 350.935546875, 362.33984375, 373.744140625, 385.1484375, 396.552734375, 407.95703125, 419.361328125, 430.765625, 442.169921875, 453.57421875, 464.978515625, 476.3828125, 487.787109375, 499.19140625, 510.595703125, 522.0]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 1.0, 3.0, 12.0, 5.0, 11.0, 18.0, 20.0, 32.0, 60.0, 75.0, 152.0, 258.0, 529.0, 867.0, 861.0, 524.0, 273.0, 147.0, 69.0, 56.0, 27.0, 21.0, 16.0, 16.0, 7.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.5, -155.294921875, -149.08984375, -142.884765625, -136.6796875, -130.474609375, -124.26953125, -118.064453125, -111.859375, -105.654296875, -99.44921875, -93.244140625, -87.0390625, -80.833984375, -74.62890625, -68.423828125, -62.21875, -56.013671875, -49.80859375, -43.603515625, -37.3984375, -31.193359375, -24.98828125, -18.783203125, -12.578125, -6.373046875, -0.16796875, 6.037109375, 12.2421875, 18.447265625, 24.65234375, 30.857421875, 37.0625, 43.267578125, 49.47265625, 55.677734375, 61.8828125, 68.087890625, 74.29296875, 80.498046875, 86.703125, 92.908203125, 99.11328125, 105.318359375, 111.5234375, 117.728515625, 123.93359375, 130.138671875, 136.34375, 142.548828125, 148.75390625, 154.958984375, 161.1640625, 167.369140625, 173.57421875, 179.779296875, 185.984375, 192.189453125, 198.39453125, 204.599609375, 210.8046875, 217.009765625, 223.21484375, 229.419921875, 235.625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 13.0, 62.0, 173.0, 349.0, 258.0, 95.0, 35.0, 12.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4054.216064453125, -3972.801513671875, -3891.38671875, -3809.97216796875, -3728.5576171875, -3647.14306640625, -3565.728271484375, -3484.313720703125, -3402.89892578125, -3321.484375, -3240.069580078125, -3158.655029296875, -3077.240478515625, -2995.82568359375, -2914.4111328125, -2832.99658203125, -2751.58203125, -2670.16748046875, -2588.752685546875, -2507.338134765625, -2425.923583984375, -2344.5087890625, -2263.09423828125, -2181.6796875, -2100.26513671875, -2018.8504638671875, -1937.4359130859375, -1856.021240234375, -1774.606689453125, -1693.1920166015625, -1611.77734375, -1530.36279296875, -1448.947998046875, -1367.5333251953125, -1286.1187744140625, -1204.7041015625, -1123.28955078125, -1041.8748779296875, -960.460205078125, -879.0455932617188, -797.6309814453125, -716.2163696289062, -634.8017578125, -553.3870849609375, -471.97247314453125, -390.557861328125, -309.1432189941406, -227.72857666015625, -146.31396484375, -64.89933776855469, 16.515289306640625, 97.92991638183594, 179.34454345703125, 260.7591552734375, 342.1737976074219, 423.58843994140625, 505.0030517578125, 586.4176635742188, 667.832275390625, 749.2469482421875, 830.6615600585938, 912.076171875, 993.4908447265625, 1074.905517578125, 1156.320068359375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 5.0, 6.0, 4.0, 5.0, 8.0, 7.0, 9.0, 10.0, 16.0, 22.0, 20.0, 17.0, 30.0, 32.0, 37.0, 25.0, 41.0, 35.0, 38.0, 41.0, 34.0, 29.0, 37.0, 40.0, 40.0, 49.0, 32.0, 40.0, 38.0, 30.0, 35.0, 28.0, 22.0, 21.0, 23.0, 17.0, 10.0, 18.0, 13.0, 10.0, 9.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-566.1646118164062, -547.57373046875, -528.9827880859375, -510.39190673828125, -491.8009948730469, -473.2100830078125, -454.61920166015625, -436.0282897949219, -417.4373779296875, -398.8464660644531, -380.25555419921875, -361.6646728515625, -343.0737609863281, -324.48284912109375, -305.8919677734375, -287.3010559082031, -268.71014404296875, -250.11923217773438, -231.52833557128906, -212.93743896484375, -194.34652709960938, -175.755615234375, -157.1647186279297, -138.57382202148438, -119.98291015625, -101.39200592041016, -82.80110168457031, -64.21019744873047, -45.619293212890625, -27.02838897705078, -8.437484741210938, 10.153411865234375, 28.7442626953125, 47.335166931152344, 65.92607116699219, 84.51697540283203, 103.10787963867188, 121.69878387451172, 140.28968811035156, 158.88058471679688, 177.47149658203125, 196.06240844726562, 214.65330505371094, 233.24420166015625, 251.83511352539062, 270.426025390625, 289.01690673828125, 307.6078186035156, 326.19873046875, 344.7896423339844, 363.38055419921875, 381.971435546875, 400.5623474121094, 419.15325927734375, 437.744140625, 456.3350524902344, 474.92596435546875, 493.5168762207031, 512.1077880859375, 530.6986694335938, 549.28955078125, 567.8804931640625, 586.4713745117188, 605.062255859375, 623.6531982421875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 12.0, 8.0, 23.0, 16.0, 28.0, 67.0, 90.0, 145.0, 194.0, 333.0, 544.0, 928.0, 1480.0, 2787.0, 5027.0, 9733.0, 18793.0, 39736.0, 87738.0, 204591.0, 331554.0, 188855.0, 81194.0, 36934.0, 17896.0, 8915.0, 4702.0, 2480.0, 1436.0, 877.0, 539.0, 341.0, 218.0, 135.0, 67.0, 44.0, 27.0, 26.0, 19.0, 10.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-79.4375, -77.19677734375, -74.9560546875, -72.71533203125, -70.474609375, -68.23388671875, -65.9931640625, -63.75244140625, -61.51171875, -59.27099609375, -57.0302734375, -54.78955078125, -52.548828125, -50.30810546875, -48.0673828125, -45.82666015625, -43.5859375, -41.34521484375, -39.1044921875, -36.86376953125, -34.623046875, -32.38232421875, -30.1416015625, -27.90087890625, -25.66015625, -23.41943359375, -21.1787109375, -18.93798828125, -16.697265625, -14.45654296875, -12.2158203125, -9.97509765625, -7.734375, -5.49365234375, -3.2529296875, -1.01220703125, 1.228515625, 3.46923828125, 5.7099609375, 7.95068359375, 10.19140625, 12.43212890625, 14.6728515625, 16.91357421875, 19.154296875, 21.39501953125, 23.6357421875, 25.87646484375, 28.1171875, 30.35791015625, 32.5986328125, 34.83935546875, 37.080078125, 39.32080078125, 41.5615234375, 43.80224609375, 46.04296875, 48.28369140625, 50.5244140625, 52.76513671875, 55.005859375, 57.24658203125, 59.4873046875, 61.72802734375, 63.96875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 7.0, 6.0, 10.0, 7.0, 7.0, 11.0, 19.0, 19.0, 24.0, 19.0, 31.0, 38.0, 30.0, 35.0, 42.0, 51.0, 47.0, 42.0, 49.0, 40.0, 50.0, 52.0, 47.0, 43.0, 36.0, 27.0, 35.0, 32.0, 21.0, 17.0, 22.0, 14.0, 13.0, 8.0, 10.0, 5.0, 7.0, 10.0, 6.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-71.75, -69.5888671875, -67.427734375, -65.2666015625, -63.10546875, -60.9443359375, -58.783203125, -56.6220703125, -54.4609375, -52.2998046875, -50.138671875, -47.9775390625, -45.81640625, -43.6552734375, -41.494140625, -39.3330078125, -37.171875, -35.0107421875, -32.849609375, -30.6884765625, -28.52734375, -26.3662109375, -24.205078125, -22.0439453125, -19.8828125, -17.7216796875, -15.560546875, -13.3994140625, -11.23828125, -9.0771484375, -6.916015625, -4.7548828125, -2.59375, -0.4326171875, 1.728515625, 3.8896484375, 6.05078125, 8.2119140625, 10.373046875, 12.5341796875, 14.6953125, 16.8564453125, 19.017578125, 21.1787109375, 23.33984375, 25.5009765625, 27.662109375, 29.8232421875, 31.984375, 34.1455078125, 36.306640625, 38.4677734375, 40.62890625, 42.7900390625, 44.951171875, 47.1123046875, 49.2734375, 51.4345703125, 53.595703125, 55.7568359375, 57.91796875, 60.0791015625, 62.240234375, 64.4013671875, 66.5625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 7.0, 4.0, 4.0, 2.0, 5.0, 10.0, 13.0, 16.0, 23.0, 25.0, 49.0, 45.0, 90.0, 123.0, 213.0, 363.0, 679.0, 1400.0, 3719.0, 13234.0, 77974.0, 765463.0, 154751.0, 21104.0, 5387.0, 1947.0, 797.0, 423.0, 225.0, 135.0, 94.0, 66.0, 34.0, 22.0, 21.0, 20.0, 15.0, 13.0, 5.0, 9.0, 6.0, 7.0, 7.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.375, -202.962890625, -196.55078125, -190.138671875, -183.7265625, -177.314453125, -170.90234375, -164.490234375, -158.078125, -151.666015625, -145.25390625, -138.841796875, -132.4296875, -126.017578125, -119.60546875, -113.193359375, -106.78125, -100.369140625, -93.95703125, -87.544921875, -81.1328125, -74.720703125, -68.30859375, -61.896484375, -55.484375, -49.072265625, -42.66015625, -36.248046875, -29.8359375, -23.423828125, -17.01171875, -10.599609375, -4.1875, 2.224609375, 8.63671875, 15.048828125, 21.4609375, 27.873046875, 34.28515625, 40.697265625, 47.109375, 53.521484375, 59.93359375, 66.345703125, 72.7578125, 79.169921875, 85.58203125, 91.994140625, 98.40625, 104.818359375, 111.23046875, 117.642578125, 124.0546875, 130.466796875, 136.87890625, 143.291015625, 149.703125, 156.115234375, 162.52734375, 168.939453125, 175.3515625, 181.763671875, 188.17578125, 194.587890625, 201.0]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 1.0, 2.0, 10.0, 8.0, 11.0, 14.0, 32.0, 40.0, 33.0, 36.0, 47.0, 56.0, 70.0, 84.0, 86.0, 81.0, 71.0, 48.0, 69.0, 44.0, 50.0, 28.0, 18.0, 12.0, 14.0, 7.0, 6.0, 3.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-435.75, -423.56640625, -411.3828125, -399.19921875, -387.015625, -374.83203125, -362.6484375, -350.46484375, -338.28125, -326.09765625, -313.9140625, -301.73046875, -289.546875, -277.36328125, -265.1796875, -252.99609375, -240.8125, -228.62890625, -216.4453125, -204.26171875, -192.078125, -179.89453125, -167.7109375, -155.52734375, -143.34375, -131.16015625, -118.9765625, -106.79296875, -94.609375, -82.42578125, -70.2421875, -58.05859375, -45.875, -33.69140625, -21.5078125, -9.32421875, 2.859375, 15.04296875, 27.2265625, 39.41015625, 51.59375, 63.77734375, 75.9609375, 88.14453125, 100.328125, 112.51171875, 124.6953125, 136.87890625, 149.0625, 161.24609375, 173.4296875, 185.61328125, 197.796875, 209.98046875, 222.1640625, 234.34765625, 246.53125, 258.71484375, 270.8984375, 283.08203125, 295.265625, 307.44921875, 319.6328125, 331.81640625, 344.0]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 9.0, 7.0, 15.0, 20.0, 20.0, 43.0, 45.0, 78.0, 137.0, 224.0, 326.0, 603.0, 1142.0, 2304.0, 5096.0, 13131.0, 40058.0, 157232.0, 651623.0, 123544.0, 32657.0, 11319.0, 4386.0, 2092.0, 1009.0, 560.0, 350.0, 176.0, 98.0, 74.0, 55.0, 29.0, 25.0, 22.0, 18.0, 7.0, 4.0, 9.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.65625, -33.29296875, -31.9296875, -30.56640625, -29.203125, -27.83984375, -26.4765625, -25.11328125, -23.75, -22.38671875, -21.0234375, -19.66015625, -18.296875, -16.93359375, -15.5703125, -14.20703125, -12.84375, -11.48046875, -10.1171875, -8.75390625, -7.390625, -6.02734375, -4.6640625, -3.30078125, -1.9375, -0.57421875, 0.7890625, 2.15234375, 3.515625, 4.87890625, 6.2421875, 7.60546875, 8.96875, 10.33203125, 11.6953125, 13.05859375, 14.421875, 15.78515625, 17.1484375, 18.51171875, 19.875, 21.23828125, 22.6015625, 23.96484375, 25.328125, 26.69140625, 28.0546875, 29.41796875, 30.78125, 32.14453125, 33.5078125, 34.87109375, 36.234375, 37.59765625, 38.9609375, 40.32421875, 41.6875, 43.05078125, 44.4140625, 45.77734375, 47.140625, 48.50390625, 49.8671875, 51.23046875, 52.59375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 7.0, 7.0, 11.0, 13.0, 18.0, 25.0, 23.0, 63.0, 72.0, 76.0, 107.0, 157.0, 113.0, 83.0, 55.0, 46.0, 32.0, 23.0, 23.0, 11.0, 7.0, 3.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0198516845703125, -0.019176006317138672, -0.018500328063964844, -0.017824649810791016, -0.017148971557617188, -0.01647329330444336, -0.01579761505126953, -0.015121936798095703, -0.014446258544921875, -0.013770580291748047, -0.013094902038574219, -0.01241922378540039, -0.011743545532226562, -0.011067867279052734, -0.010392189025878906, -0.009716510772705078, -0.00904083251953125, -0.008365154266357422, -0.007689476013183594, -0.007013797760009766, -0.0063381195068359375, -0.005662441253662109, -0.004986763000488281, -0.004311084747314453, -0.003635406494140625, -0.002959728240966797, -0.0022840499877929688, -0.0016083717346191406, -0.0009326934814453125, -0.0002570152282714844, 0.00041866302490234375, 0.0010943412780761719, 0.00177001953125, 0.002445697784423828, 0.0031213760375976562, 0.0037970542907714844, 0.0044727325439453125, 0.005148410797119141, 0.005824089050292969, 0.006499767303466797, 0.007175445556640625, 0.007851123809814453, 0.008526802062988281, 0.00920248031616211, 0.009878158569335938, 0.010553836822509766, 0.011229515075683594, 0.011905193328857422, 0.01258087158203125, 0.013256549835205078, 0.013932228088378906, 0.014607906341552734, 0.015283584594726562, 0.01595926284790039, 0.01663494110107422, 0.017310619354248047, 0.017986297607421875, 0.018661975860595703, 0.01933765411376953, 0.02001333236694336, 0.020689010620117188, 0.021364688873291016, 0.022040367126464844, 0.022716045379638672, 0.0233917236328125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 6.0, 4.0, 12.0, 10.0, 13.0, 21.0, 43.0, 53.0, 63.0, 136.0, 236.0, 371.0, 868.0, 1953.0, 5273.0, 18780.0, 97322.0, 742570.0, 144898.0, 24830.0, 6705.0, 2275.0, 947.0, 498.0, 273.0, 117.0, 81.0, 70.0, 39.0, 22.0, 16.0, 10.0, 6.0, 9.0, 11.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-60.4375, -58.58349609375, -56.7294921875, -54.87548828125, -53.021484375, -51.16748046875, -49.3134765625, -47.45947265625, -45.60546875, -43.75146484375, -41.8974609375, -40.04345703125, -38.189453125, -36.33544921875, -34.4814453125, -32.62744140625, -30.7734375, -28.91943359375, -27.0654296875, -25.21142578125, -23.357421875, -21.50341796875, -19.6494140625, -17.79541015625, -15.94140625, -14.08740234375, -12.2333984375, -10.37939453125, -8.525390625, -6.67138671875, -4.8173828125, -2.96337890625, -1.109375, 0.74462890625, 2.5986328125, 4.45263671875, 6.306640625, 8.16064453125, 10.0146484375, 11.86865234375, 13.72265625, 15.57666015625, 17.4306640625, 19.28466796875, 21.138671875, 22.99267578125, 24.8466796875, 26.70068359375, 28.5546875, 30.40869140625, 32.2626953125, 34.11669921875, 35.970703125, 37.82470703125, 39.6787109375, 41.53271484375, 43.38671875, 45.24072265625, 47.0947265625, 48.94873046875, 50.802734375, 52.65673828125, 54.5107421875, 56.36474609375, 58.21875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 8.0, 8.0, 4.0, 8.0, 14.0, 10.0, 14.0, 18.0, 24.0, 29.0, 25.0, 49.0, 58.0, 55.0, 56.0, 93.0, 71.0, 67.0, 66.0, 58.0, 45.0, 31.0, 33.0, 28.0, 21.0, 12.0, 16.0, 8.0, 8.0, 11.0, 10.0, 8.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0], "bins": [-42.25, -41.017578125, -39.78515625, -38.552734375, -37.3203125, -36.087890625, -34.85546875, -33.623046875, -32.390625, -31.158203125, -29.92578125, -28.693359375, -27.4609375, -26.228515625, -24.99609375, -23.763671875, -22.53125, -21.298828125, -20.06640625, -18.833984375, -17.6015625, -16.369140625, -15.13671875, -13.904296875, -12.671875, -11.439453125, -10.20703125, -8.974609375, -7.7421875, -6.509765625, -5.27734375, -4.044921875, -2.8125, -1.580078125, -0.34765625, 0.884765625, 2.1171875, 3.349609375, 4.58203125, 5.814453125, 7.046875, 8.279296875, 9.51171875, 10.744140625, 11.9765625, 13.208984375, 14.44140625, 15.673828125, 16.90625, 18.138671875, 19.37109375, 20.603515625, 21.8359375, 23.068359375, 24.30078125, 25.533203125, 26.765625, 27.998046875, 29.23046875, 30.462890625, 31.6953125, 32.927734375, 34.16015625, 35.392578125, 36.625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 4.0, 12.0, 5.0, 11.0, 16.0, 27.0, 60.0, 82.0, 140.0, 268.0, 136.0, 101.0, 55.0, 38.0, 12.0, 7.0, 9.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1242.4111328125, -1208.351806640625, -1174.29248046875, -1140.233154296875, -1106.173828125, -1072.114501953125, -1038.05517578125, -1003.9957885742188, -969.9364624023438, -935.8771362304688, -901.8178100585938, -867.7584838867188, -833.6990966796875, -799.6397705078125, -765.5804443359375, -731.5211181640625, -697.4617919921875, -663.4024658203125, -629.3431396484375, -595.2838134765625, -561.2244873046875, -527.1651611328125, -493.10577392578125, -459.04644775390625, -424.98712158203125, -390.92779541015625, -356.86846923828125, -322.8091125488281, -288.7497863769531, -254.69046020507812, -220.63111877441406, -186.57177734375, -152.5123291015625, -118.45299530029297, -84.39366149902344, -50.334327697753906, -16.274993896484375, 17.784332275390625, 51.84367370605469, 85.90301513671875, 119.96234130859375, 154.02166748046875, 188.0810089111328, 222.14035034179688, 256.1996765136719, 290.2590026855469, 324.318359375, 358.377685546875, 392.43701171875, 426.496337890625, 460.5556640625, 494.6150207519531, 528.67431640625, 562.733642578125, 596.7930297851562, 630.8523559570312, 664.9116821289062, 698.9710083007812, 733.0303344726562, 767.0896606445312, 801.1490478515625, 835.2083740234375, 869.2677001953125, 903.3270263671875, 937.3863525390625]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 6.0, 3.0, 5.0, 3.0, 4.0, 2.0, 10.0, 5.0, 9.0, 12.0, 12.0, 14.0, 13.0, 18.0, 18.0, 25.0, 31.0, 26.0, 38.0, 34.0, 53.0, 69.0, 92.0, 98.0, 77.0, 48.0, 42.0, 30.0, 28.0, 28.0, 21.0, 21.0, 24.0, 15.0, 16.0, 9.0, 11.0, 12.0, 4.0, 6.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-854.59912109375, -822.7855224609375, -790.971923828125, -759.1583251953125, -727.3446655273438, -695.5310668945312, -663.7174682617188, -631.9038696289062, -600.0902709960938, -568.2766723632812, -536.4630737304688, -504.6494445800781, -472.8358459472656, -441.022216796875, -409.2086181640625, -377.39501953125, -345.5813903808594, -313.7677917480469, -281.95416259765625, -250.14056396484375, -218.32696533203125, -186.5133514404297, -154.69973754882812, -122.88613891601562, -91.07252502441406, -59.25891876220703, -27.445308685302734, 4.3683013916015625, 36.181907653808594, 67.99551391601562, 99.80912780761719, 131.6227264404297, 163.43634033203125, 195.2499542236328, 227.0635528564453, 258.8771667480469, 290.6907653808594, 322.50439453125, 354.3179931640625, 386.131591796875, 417.9451904296875, 449.7587890625, 481.5724182128906, 513.385986328125, 545.1996459960938, 577.0132446289062, 608.8268432617188, 640.6404418945312, 672.4541015625, 704.2677001953125, 736.081298828125, 767.8948974609375, 799.7085571289062, 831.5221557617188, 863.3357543945312, 895.1493530273438, 926.9629516601562, 958.7765502929688, 990.5901489257812, 1022.40380859375, 1054.2174072265625, 1086.031005859375, 1117.8446044921875, 1149.658203125, 1181.4718017578125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 6.0, 8.0, 12.0, 22.0, 46.0, 71.0, 115.0, 180.0, 318.0, 575.0, 1184.0, 2464.0, 5941.0, 17941.0, 76239.0, 454744.0, 2179492.0, 1188717.0, 207356.0, 40038.0, 10766.0, 4077.0, 1853.0, 942.0, 513.0, 250.0, 166.0, 89.0, 59.0, 32.0, 19.0, 20.0, 9.0, 3.0, 5.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.78125, -57.15673828125, -54.5322265625, -51.90771484375, -49.283203125, -46.65869140625, -44.0341796875, -41.40966796875, -38.78515625, -36.16064453125, -33.5361328125, -30.91162109375, -28.287109375, -25.66259765625, -23.0380859375, -20.41357421875, -17.7890625, -15.16455078125, -12.5400390625, -9.91552734375, -7.291015625, -4.66650390625, -2.0419921875, 0.58251953125, 3.20703125, 5.83154296875, 8.4560546875, 11.08056640625, 13.705078125, 16.32958984375, 18.9541015625, 21.57861328125, 24.203125, 26.82763671875, 29.4521484375, 32.07666015625, 34.701171875, 37.32568359375, 39.9501953125, 42.57470703125, 45.19921875, 47.82373046875, 50.4482421875, 53.07275390625, 55.697265625, 58.32177734375, 60.9462890625, 63.57080078125, 66.1953125, 68.81982421875, 71.4443359375, 74.06884765625, 76.693359375, 79.31787109375, 81.9423828125, 84.56689453125, 87.19140625, 89.81591796875, 92.4404296875, 95.06494140625, 97.689453125, 100.31396484375, 102.9384765625, 105.56298828125, 108.1875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 5.0, 4.0, 6.0, 3.0, 9.0, 6.0, 11.0, 12.0, 26.0, 23.0, 19.0, 22.0, 22.0, 30.0, 37.0, 41.0, 41.0, 35.0, 38.0, 49.0, 59.0, 60.0, 57.0, 36.0, 40.0, 38.0, 36.0, 26.0, 35.0, 33.0, 29.0, 27.0, 15.0, 14.0, 15.0, 6.0, 5.0, 5.0, 7.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.0625, -65.84765625, -63.6328125, -61.41796875, -59.203125, -56.98828125, -54.7734375, -52.55859375, -50.34375, -48.12890625, -45.9140625, -43.69921875, -41.484375, -39.26953125, -37.0546875, -34.83984375, -32.625, -30.41015625, -28.1953125, -25.98046875, -23.765625, -21.55078125, -19.3359375, -17.12109375, -14.90625, -12.69140625, -10.4765625, -8.26171875, -6.046875, -3.83203125, -1.6171875, 0.59765625, 2.8125, 5.02734375, 7.2421875, 9.45703125, 11.671875, 13.88671875, 16.1015625, 18.31640625, 20.53125, 22.74609375, 24.9609375, 27.17578125, 29.390625, 31.60546875, 33.8203125, 36.03515625, 38.25, 40.46484375, 42.6796875, 44.89453125, 47.109375, 49.32421875, 51.5390625, 53.75390625, 55.96875, 58.18359375, 60.3984375, 62.61328125, 64.828125, 67.04296875, 69.2578125, 71.47265625, 73.6875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 5.0, 4.0, 17.0, 21.0, 47.0, 102.0, 253.0, 622.0, 2577.0, 24627.0, 3639374.0, 514231.0, 9854.0, 1638.0, 503.0, 206.0, 82.0, 39.0, 24.0, 12.0, 16.0, 6.0, 1.0, 4.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-331.0, -320.6015625, -310.203125, -299.8046875, -289.40625, -279.0078125, -268.609375, -258.2109375, -247.8125, -237.4140625, -227.015625, -216.6171875, -206.21875, -195.8203125, -185.421875, -175.0234375, -164.625, -154.2265625, -143.828125, -133.4296875, -123.03125, -112.6328125, -102.234375, -91.8359375, -81.4375, -71.0390625, -60.640625, -50.2421875, -39.84375, -29.4453125, -19.046875, -8.6484375, 1.75, 12.1484375, 22.546875, 32.9453125, 43.34375, 53.7421875, 64.140625, 74.5390625, 84.9375, 95.3359375, 105.734375, 116.1328125, 126.53125, 136.9296875, 147.328125, 157.7265625, 168.125, 178.5234375, 188.921875, 199.3203125, 209.71875, 220.1171875, 230.515625, 240.9140625, 251.3125, 261.7109375, 272.109375, 282.5078125, 292.90625, 303.3046875, 313.703125, 324.1015625, 334.5]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 14.0, 12.0, 31.0, 27.0, 71.0, 83.0, 197.0, 413.0, 741.0, 1001.0, 697.0, 327.0, 181.0, 96.0, 72.0, 35.0, 27.0, 16.0, 8.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.625, -136.951171875, -130.27734375, -123.603515625, -116.9296875, -110.255859375, -103.58203125, -96.908203125, -90.234375, -83.560546875, -76.88671875, -70.212890625, -63.5390625, -56.865234375, -50.19140625, -43.517578125, -36.84375, -30.169921875, -23.49609375, -16.822265625, -10.1484375, -3.474609375, 3.19921875, 9.873046875, 16.546875, 23.220703125, 29.89453125, 36.568359375, 43.2421875, 49.916015625, 56.58984375, 63.263671875, 69.9375, 76.611328125, 83.28515625, 89.958984375, 96.6328125, 103.306640625, 109.98046875, 116.654296875, 123.328125, 130.001953125, 136.67578125, 143.349609375, 150.0234375, 156.697265625, 163.37109375, 170.044921875, 176.71875, 183.392578125, 190.06640625, 196.740234375, 203.4140625, 210.087890625, 216.76171875, 223.435546875, 230.109375, 236.783203125, 243.45703125, 250.130859375, 256.8046875, 263.478515625, 270.15234375, 276.826171875, 283.5]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 12.0, 5.0, 13.0, 23.0, 53.0, 43.0, 90.0, 150.0, 162.0, 137.0, 100.0, 70.0, 40.0, 28.0, 21.0, 11.0, 15.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1168.4798583984375, -1135.7244873046875, -1102.9691162109375, -1070.2138671875, -1037.45849609375, -1004.703125, -971.94775390625, -939.1923828125, -906.4370727539062, -873.6817016601562, -840.9263916015625, -808.1710205078125, -775.4156494140625, -742.6603393554688, -709.9049682617188, -677.149658203125, -644.394287109375, -611.638916015625, -578.8836059570312, -546.1282348632812, -513.3729248046875, -480.6175537109375, -447.8621826171875, -415.1068420410156, -382.35150146484375, -349.5961608886719, -316.8408203125, -284.08544921875, -251.33010864257812, -218.57476806640625, -185.8194122314453, -153.06405639648438, -120.30865478515625, -87.55330657958984, -54.79795837402344, -22.04261016845703, 10.712738037109375, 43.46807861328125, 76.22343444824219, 108.97879028320312, 141.734130859375, 174.48947143554688, 207.2448272705078, 240.00018310546875, 272.7555236816406, 305.5108642578125, 338.2662353515625, 371.0215759277344, 403.77691650390625, 436.5322570800781, 469.28759765625, 502.04296875, 534.79833984375, 567.5536499023438, 600.3090209960938, 633.0643310546875, 665.8197021484375, 698.5750732421875, 731.3303833007812, 764.0857543945312, 796.841064453125, 829.596435546875, 862.351806640625, 895.107177734375, 927.8624877929688]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 8.0, 4.0, 6.0, 11.0, 7.0, 17.0, 20.0, 18.0, 25.0, 30.0, 39.0, 41.0, 50.0, 75.0, 83.0, 55.0, 64.0, 58.0, 56.0, 64.0, 55.0, 33.0, 37.0, 24.0, 16.0, 25.0, 17.0, 15.0, 15.0, 2.0, 9.0, 5.0, 11.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-965.2545166015625, -937.2748413085938, -909.2951049804688, -881.3154296875, -853.335693359375, -825.3560180664062, -797.3763427734375, -769.3966064453125, -741.4168701171875, -713.4371948242188, -685.4574584960938, -657.477783203125, -629.498046875, -601.5183715820312, -573.5386962890625, -545.5589599609375, -517.5792846679688, -489.5995788574219, -461.619873046875, -433.64019775390625, -405.66046142578125, -377.6807861328125, -349.7010803222656, -321.72137451171875, -293.7416687011719, -265.761962890625, -237.78225708007812, -209.8025665283203, -181.82286071777344, -153.84315490722656, -125.86346435546875, -97.88375854492188, -69.90399169921875, -41.92428970336914, -13.944587707519531, 14.035110473632812, 42.01481628417969, 69.99452209472656, 97.97421264648438, 125.95391845703125, 153.93362426757812, 181.913330078125, 209.89303588867188, 237.8727264404297, 265.8524169921875, 293.8321533203125, 321.81182861328125, 349.7915344238281, 377.771240234375, 405.7509460449219, 433.73065185546875, 461.7103271484375, 489.6900634765625, 517.6697387695312, 545.6494140625, 573.629150390625, 601.60888671875, 629.5885620117188, 657.5682983398438, 685.5479736328125, 713.5277099609375, 741.5073852539062, 769.487060546875, 797.466796875, 825.4464721679688]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 9.0, 10.0, 22.0, 26.0, 50.0, 55.0, 114.0, 160.0, 302.0, 424.0, 775.0, 1321.0, 2372.0, 4587.0, 9057.0, 20227.0, 47293.0, 125805.0, 348342.0, 304453.0, 106614.0, 41377.0, 17624.0, 8302.0, 4219.0, 2123.0, 1161.0, 662.0, 409.0, 241.0, 157.0, 99.0, 56.0, 44.0, 22.0, 11.0, 11.0, 9.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.6875, -89.8720703125, -87.056640625, -84.2412109375, -81.42578125, -78.6103515625, -75.794921875, -72.9794921875, -70.1640625, -67.3486328125, -64.533203125, -61.7177734375, -58.90234375, -56.0869140625, -53.271484375, -50.4560546875, -47.640625, -44.8251953125, -42.009765625, -39.1943359375, -36.37890625, -33.5634765625, -30.748046875, -27.9326171875, -25.1171875, -22.3017578125, -19.486328125, -16.6708984375, -13.85546875, -11.0400390625, -8.224609375, -5.4091796875, -2.59375, 0.2216796875, 3.037109375, 5.8525390625, 8.66796875, 11.4833984375, 14.298828125, 17.1142578125, 19.9296875, 22.7451171875, 25.560546875, 28.3759765625, 31.19140625, 34.0068359375, 36.822265625, 39.6376953125, 42.453125, 45.2685546875, 48.083984375, 50.8994140625, 53.71484375, 56.5302734375, 59.345703125, 62.1611328125, 64.9765625, 67.7919921875, 70.607421875, 73.4228515625, 76.23828125, 79.0537109375, 81.869140625, 84.6845703125, 87.5]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 4.0, 7.0, 5.0, 8.0, 17.0, 15.0, 15.0, 18.0, 23.0, 15.0, 17.0, 27.0, 35.0, 33.0, 26.0, 38.0, 37.0, 38.0, 52.0, 45.0, 46.0, 53.0, 50.0, 45.0, 46.0, 29.0, 45.0, 32.0, 25.0, 28.0, 25.0, 22.0, 16.0, 9.0, 11.0, 9.0, 8.0, 7.0, 3.0, 3.0, 3.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.65625, -57.58056640625, -55.5048828125, -53.42919921875, -51.353515625, -49.27783203125, -47.2021484375, -45.12646484375, -43.05078125, -40.97509765625, -38.8994140625, -36.82373046875, -34.748046875, -32.67236328125, -30.5966796875, -28.52099609375, -26.4453125, -24.36962890625, -22.2939453125, -20.21826171875, -18.142578125, -16.06689453125, -13.9912109375, -11.91552734375, -9.83984375, -7.76416015625, -5.6884765625, -3.61279296875, -1.537109375, 0.53857421875, 2.6142578125, 4.68994140625, 6.765625, 8.84130859375, 10.9169921875, 12.99267578125, 15.068359375, 17.14404296875, 19.2197265625, 21.29541015625, 23.37109375, 25.44677734375, 27.5224609375, 29.59814453125, 31.673828125, 33.74951171875, 35.8251953125, 37.90087890625, 39.9765625, 42.05224609375, 44.1279296875, 46.20361328125, 48.279296875, 50.35498046875, 52.4306640625, 54.50634765625, 56.58203125, 58.65771484375, 60.7333984375, 62.80908203125, 64.884765625, 66.96044921875, 69.0361328125, 71.11181640625, 73.1875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 6.0, 8.0, 20.0, 27.0, 45.0, 75.0, 93.0, 136.0, 287.0, 512.0, 1048.0, 2917.0, 12828.0, 131012.0, 842090.0, 47045.0, 6710.0, 1904.0, 789.0, 398.0, 222.0, 122.0, 81.0, 53.0, 45.0, 25.0, 13.0, 13.0, 12.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-285.5, -277.4140625, -269.328125, -261.2421875, -253.15625, -245.0703125, -236.984375, -228.8984375, -220.8125, -212.7265625, -204.640625, -196.5546875, -188.46875, -180.3828125, -172.296875, -164.2109375, -156.125, -148.0390625, -139.953125, -131.8671875, -123.78125, -115.6953125, -107.609375, -99.5234375, -91.4375, -83.3515625, -75.265625, -67.1796875, -59.09375, -51.0078125, -42.921875, -34.8359375, -26.75, -18.6640625, -10.578125, -2.4921875, 5.59375, 13.6796875, 21.765625, 29.8515625, 37.9375, 46.0234375, 54.109375, 62.1953125, 70.28125, 78.3671875, 86.453125, 94.5390625, 102.625, 110.7109375, 118.796875, 126.8828125, 134.96875, 143.0546875, 151.140625, 159.2265625, 167.3125, 175.3984375, 183.484375, 191.5703125, 199.65625, 207.7421875, 215.828125, 223.9140625, 232.0]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 11.0, 16.0, 13.0, 14.0, 20.0, 21.0, 23.0, 34.0, 41.0, 51.0, 52.0, 55.0, 61.0, 66.0, 75.0, 68.0, 67.0, 49.0, 50.0, 30.0, 32.0, 28.0, 23.0, 12.0, 17.0, 15.0, 13.0, 5.0, 10.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-348.25, -338.515625, -328.78125, -319.046875, -309.3125, -299.578125, -289.84375, -280.109375, -270.375, -260.640625, -250.90625, -241.171875, -231.4375, -221.703125, -211.96875, -202.234375, -192.5, -182.765625, -173.03125, -163.296875, -153.5625, -143.828125, -134.09375, -124.359375, -114.625, -104.890625, -95.15625, -85.421875, -75.6875, -65.953125, -56.21875, -46.484375, -36.75, -27.015625, -17.28125, -7.546875, 2.1875, 11.921875, 21.65625, 31.390625, 41.125, 50.859375, 60.59375, 70.328125, 80.0625, 89.796875, 99.53125, 109.265625, 119.0, 128.734375, 138.46875, 148.203125, 157.9375, 167.671875, 177.40625, 187.140625, 196.875, 206.609375, 216.34375, 226.078125, 235.8125, 245.546875, 255.28125, 265.015625, 274.75]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 6.0, 2.0, 14.0, 22.0, 29.0, 32.0, 36.0, 65.0, 90.0, 139.0, 204.0, 364.0, 677.0, 1200.0, 2155.0, 4635.0, 10729.0, 28651.0, 101497.0, 650064.0, 176914.0, 43486.0, 15080.0, 6183.0, 2884.0, 1403.0, 770.0, 428.0, 261.0, 174.0, 96.0, 79.0, 51.0, 37.0, 29.0, 20.0, 15.0, 9.0, 3.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.0, -29.95556640625, -28.9111328125, -27.86669921875, -26.822265625, -25.77783203125, -24.7333984375, -23.68896484375, -22.64453125, -21.60009765625, -20.5556640625, -19.51123046875, -18.466796875, -17.42236328125, -16.3779296875, -15.33349609375, -14.2890625, -13.24462890625, -12.2001953125, -11.15576171875, -10.111328125, -9.06689453125, -8.0224609375, -6.97802734375, -5.93359375, -4.88916015625, -3.8447265625, -2.80029296875, -1.755859375, -0.71142578125, 0.3330078125, 1.37744140625, 2.421875, 3.46630859375, 4.5107421875, 5.55517578125, 6.599609375, 7.64404296875, 8.6884765625, 9.73291015625, 10.77734375, 11.82177734375, 12.8662109375, 13.91064453125, 14.955078125, 15.99951171875, 17.0439453125, 18.08837890625, 19.1328125, 20.17724609375, 21.2216796875, 22.26611328125, 23.310546875, 24.35498046875, 25.3994140625, 26.44384765625, 27.48828125, 28.53271484375, 29.5771484375, 30.62158203125, 31.666015625, 32.71044921875, 33.7548828125, 34.79931640625, 35.84375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 5.0, 14.0, 14.0, 18.0, 32.0, 40.0, 62.0, 76.0, 99.0, 121.0, 146.0, 101.0, 76.0, 65.0, 32.0, 26.0, 15.0, 12.0, 12.0, 10.0, 11.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0169219970703125, -0.01629638671875, -0.0156707763671875, -0.015045166015625, -0.0144195556640625, -0.0137939453125, -0.0131683349609375, -0.012542724609375, -0.0119171142578125, -0.01129150390625, -0.0106658935546875, -0.010040283203125, -0.0094146728515625, -0.0087890625, -0.0081634521484375, -0.007537841796875, -0.0069122314453125, -0.00628662109375, -0.0056610107421875, -0.005035400390625, -0.0044097900390625, -0.0037841796875, -0.0031585693359375, -0.002532958984375, -0.0019073486328125, -0.00128173828125, -0.0006561279296875, -3.0517578125e-05, 0.0005950927734375, 0.001220703125, 0.0018463134765625, 0.002471923828125, 0.0030975341796875, 0.00372314453125, 0.0043487548828125, 0.004974365234375, 0.0055999755859375, 0.0062255859375, 0.0068511962890625, 0.007476806640625, 0.0081024169921875, 0.00872802734375, 0.0093536376953125, 0.009979248046875, 0.0106048583984375, 0.01123046875, 0.0118560791015625, 0.012481689453125, 0.0131072998046875, 0.01373291015625, 0.0143585205078125, 0.014984130859375, 0.0156097412109375, 0.0162353515625, 0.0168609619140625, 0.017486572265625, 0.0181121826171875, 0.01873779296875, 0.0193634033203125, 0.019989013671875, 0.0206146240234375, 0.021240234375, 0.0218658447265625, 0.022491455078125, 0.0231170654296875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 9.0, 8.0, 11.0, 16.0, 41.0, 106.0, 201.0, 620.0, 2350.0, 20172.0, 854307.0, 161564.0, 7138.0, 1281.0, 390.0, 152.0, 84.0, 37.0, 27.0, 13.0, 11.0, 1.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-107.6875, -104.5927734375, -101.498046875, -98.4033203125, -95.30859375, -92.2138671875, -89.119140625, -86.0244140625, -82.9296875, -79.8349609375, -76.740234375, -73.6455078125, -70.55078125, -67.4560546875, -64.361328125, -61.2666015625, -58.171875, -55.0771484375, -51.982421875, -48.8876953125, -45.79296875, -42.6982421875, -39.603515625, -36.5087890625, -33.4140625, -30.3193359375, -27.224609375, -24.1298828125, -21.03515625, -17.9404296875, -14.845703125, -11.7509765625, -8.65625, -5.5615234375, -2.466796875, 0.6279296875, 3.72265625, 6.8173828125, 9.912109375, 13.0068359375, 16.1015625, 19.1962890625, 22.291015625, 25.3857421875, 28.48046875, 31.5751953125, 34.669921875, 37.7646484375, 40.859375, 43.9541015625, 47.048828125, 50.1435546875, 53.23828125, 56.3330078125, 59.427734375, 62.5224609375, 65.6171875, 68.7119140625, 71.806640625, 74.9013671875, 77.99609375, 81.0908203125, 84.185546875, 87.2802734375, 90.375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 4.0, 4.0, 12.0, 15.0, 24.0, 48.0, 79.0, 116.0, 133.0, 141.0, 120.0, 90.0, 78.0, 38.0, 31.0, 24.0, 10.0, 11.0, 8.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-87.6875, -85.2197265625, -82.751953125, -80.2841796875, -77.81640625, -75.3486328125, -72.880859375, -70.4130859375, -67.9453125, -65.4775390625, -63.009765625, -60.5419921875, -58.07421875, -55.6064453125, -53.138671875, -50.6708984375, -48.203125, -45.7353515625, -43.267578125, -40.7998046875, -38.33203125, -35.8642578125, -33.396484375, -30.9287109375, -28.4609375, -25.9931640625, -23.525390625, -21.0576171875, -18.58984375, -16.1220703125, -13.654296875, -11.1865234375, -8.71875, -6.2509765625, -3.783203125, -1.3154296875, 1.15234375, 3.6201171875, 6.087890625, 8.5556640625, 11.0234375, 13.4912109375, 15.958984375, 18.4267578125, 20.89453125, 23.3623046875, 25.830078125, 28.2978515625, 30.765625, 33.2333984375, 35.701171875, 38.1689453125, 40.63671875, 43.1044921875, 45.572265625, 48.0400390625, 50.5078125, 52.9755859375, 55.443359375, 57.9111328125, 60.37890625, 62.8466796875, 65.314453125, 67.7822265625, 70.25]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 14.0, 36.0, 68.0, 191.0, 424.0, 135.0, 67.0, 32.0, 11.0, 11.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1262.30615234375, -1202.849365234375, -1143.3924560546875, -1083.9356689453125, -1024.4788818359375, -965.02197265625, -905.565185546875, -846.1083374023438, -786.6514892578125, -727.1946411132812, -667.7378540039062, -608.281005859375, -548.8241577148438, -489.3673400878906, -429.9105224609375, -370.45367431640625, -310.99688720703125, -251.54005432128906, -192.08322143554688, -132.62640380859375, -73.16957092285156, -13.712738037109375, 45.74407958984375, 105.200927734375, 164.65774536132812, 224.1145782470703, 283.5714111328125, 343.0282287597656, 402.48504638671875, 461.94189453125, 521.398681640625, 580.8555908203125, 640.3123779296875, 699.7692260742188, 759.2260131835938, 818.682861328125, 878.1397094726562, 937.5965576171875, 997.0533447265625, 1056.51025390625, 1115.967041015625, 1175.423828125, 1234.8807373046875, 1294.3375244140625, 1353.7943115234375, 1413.251220703125, 1472.7080078125, 1532.164794921875, 1591.62158203125, 1651.078369140625, 1710.5352783203125, 1769.9920654296875, 1829.4488525390625, 1888.90576171875, 1948.362548828125, 2007.8193359375, 2067.2763671875, 2126.733154296875, 2186.18994140625, 2245.64697265625, 2305.103759765625, 2364.560546875, 2424.017333984375, 2483.47412109375, 2542.930908203125]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 5.0, 5.0, 9.0, 14.0, 9.0, 20.0, 24.0, 23.0, 22.0, 27.0, 28.0, 39.0, 46.0, 82.0, 185.0, 126.0, 71.0, 54.0, 38.0, 36.0, 25.0, 21.0, 26.0, 23.0, 10.0, 17.0, 11.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1369.1583251953125, -1328.6373291015625, -1288.1162109375, -1247.59521484375, -1207.07421875, -1166.55322265625, -1126.0321044921875, -1085.5111083984375, -1044.989990234375, -1004.4689331054688, -963.9479370117188, -923.4268798828125, -882.9058837890625, -842.3848266601562, -801.86376953125, -761.3427734375, -720.82177734375, -680.3007202148438, -639.7797241210938, -599.2586669921875, -558.7376708984375, -518.2166137695312, -477.695556640625, -437.1745300292969, -396.65350341796875, -356.1324768066406, -315.6114501953125, -275.09039306640625, -234.56936645507812, -194.04833984375, -153.5272979736328, -113.00625610351562, -72.4853515625, -31.964317321777344, 8.556716918945312, 49.07775115966797, 89.59878540039062, 130.11981201171875, 170.64085388183594, 211.16189575195312, 251.68292236328125, 292.2039489746094, 332.7249755859375, 373.24603271484375, 413.7670593261719, 454.2880859375, 494.80914306640625, 535.3302001953125, 575.8511962890625, 616.3722534179688, 656.8932495117188, 697.414306640625, 737.935302734375, 778.4563598632812, 818.9774169921875, 859.4984130859375, 900.0194702148438, 940.54052734375, 981.0615234375, 1021.5825805664062, 1062.1036376953125, 1102.6246337890625, 1143.1456298828125, 1183.666748046875, 1224.187744140625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 8.0, 8.0, 21.0, 19.0, 33.0, 33.0, 41.0, 61.0, 107.0, 151.0, 243.0, 430.0, 834.0, 1858.0, 4716.0, 13847.0, 56659.0, 426810.0, 2466978.0, 1060649.0, 124662.0, 24012.0, 7044.0, 2487.0, 1149.0, 562.0, 278.0, 187.0, 144.0, 75.0, 41.0, 48.0, 21.0, 22.0, 16.0, 13.0, 4.0, 1.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-151.625, -146.84375, -142.0625, -137.28125, -132.5, -127.71875, -122.9375, -118.15625, -113.375, -108.59375, -103.8125, -99.03125, -94.25, -89.46875, -84.6875, -79.90625, -75.125, -70.34375, -65.5625, -60.78125, -56.0, -51.21875, -46.4375, -41.65625, -36.875, -32.09375, -27.3125, -22.53125, -17.75, -12.96875, -8.1875, -3.40625, 1.375, 6.15625, 10.9375, 15.71875, 20.5, 25.28125, 30.0625, 34.84375, 39.625, 44.40625, 49.1875, 53.96875, 58.75, 63.53125, 68.3125, 73.09375, 77.875, 82.65625, 87.4375, 92.21875, 97.0, 101.78125, 106.5625, 111.34375, 116.125, 120.90625, 125.6875, 130.46875, 135.25, 140.03125, 144.8125, 149.59375, 154.375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 4.0, 10.0, 5.0, 17.0, 18.0, 15.0, 30.0, 27.0, 27.0, 28.0, 34.0, 43.0, 44.0, 50.0, 45.0, 48.0, 48.0, 49.0, 43.0, 46.0, 45.0, 39.0, 35.0, 46.0, 38.0, 26.0, 22.0, 20.0, 15.0, 22.0, 17.0, 8.0, 10.0, 5.0, 6.0, 1.0, 3.0, 2.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.5, -78.2666015625, -76.033203125, -73.7998046875, -71.56640625, -69.3330078125, -67.099609375, -64.8662109375, -62.6328125, -60.3994140625, -58.166015625, -55.9326171875, -53.69921875, -51.4658203125, -49.232421875, -46.9990234375, -44.765625, -42.5322265625, -40.298828125, -38.0654296875, -35.83203125, -33.5986328125, -31.365234375, -29.1318359375, -26.8984375, -24.6650390625, -22.431640625, -20.1982421875, -17.96484375, -15.7314453125, -13.498046875, -11.2646484375, -9.03125, -6.7978515625, -4.564453125, -2.3310546875, -0.09765625, 2.1357421875, 4.369140625, 6.6025390625, 8.8359375, 11.0693359375, 13.302734375, 15.5361328125, 17.76953125, 20.0029296875, 22.236328125, 24.4697265625, 26.703125, 28.9365234375, 31.169921875, 33.4033203125, 35.63671875, 37.8701171875, 40.103515625, 42.3369140625, 44.5703125, 46.8037109375, 49.037109375, 51.2705078125, 53.50390625, 55.7373046875, 57.970703125, 60.2041015625, 62.4375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 7.0, 12.0, 17.0, 31.0, 75.0, 266.0, 1060.0, 16194.0, 4164208.0, 11096.0, 941.0, 239.0, 75.0, 39.0, 14.0, 9.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1395.0, -1358.7265625, -1322.453125, -1286.1796875, -1249.90625, -1213.6328125, -1177.359375, -1141.0859375, -1104.8125, -1068.5390625, -1032.265625, -995.9921875, -959.71875, -923.4453125, -887.171875, -850.8984375, -814.625, -778.3515625, -742.078125, -705.8046875, -669.53125, -633.2578125, -596.984375, -560.7109375, -524.4375, -488.1640625, -451.890625, -415.6171875, -379.34375, -343.0703125, -306.796875, -270.5234375, -234.25, -197.9765625, -161.703125, -125.4296875, -89.15625, -52.8828125, -16.609375, 19.6640625, 55.9375, 92.2109375, 128.484375, 164.7578125, 201.03125, 237.3046875, 273.578125, 309.8515625, 346.125, 382.3984375, 418.671875, 454.9453125, 491.21875, 527.4921875, 563.765625, 600.0390625, 636.3125, 672.5859375, 708.859375, 745.1328125, 781.40625, 817.6796875, 853.953125, 890.2265625, 926.5]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 12.0, 26.0, 31.0, 84.0, 179.0, 428.0, 1015.0, 1367.0, 504.0, 236.0, 87.0, 58.0, 25.0, 10.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-692.0, -675.953125, -659.90625, -643.859375, -627.8125, -611.765625, -595.71875, -579.671875, -563.625, -547.578125, -531.53125, -515.484375, -499.4375, -483.390625, -467.34375, -451.296875, -435.25, -419.203125, -403.15625, -387.109375, -371.0625, -355.015625, -338.96875, -322.921875, -306.875, -290.828125, -274.78125, -258.734375, -242.6875, -226.640625, -210.59375, -194.546875, -178.5, -162.453125, -146.40625, -130.359375, -114.3125, -98.265625, -82.21875, -66.171875, -50.125, -34.078125, -18.03125, -1.984375, 14.0625, 30.109375, 46.15625, 62.203125, 78.25, 94.296875, 110.34375, 126.390625, 142.4375, 158.484375, 174.53125, 190.578125, 206.625, 222.671875, 238.71875, 254.765625, 270.8125, 286.859375, 302.90625, 318.953125, 335.0]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 7.0, 4.0, 7.0, 16.0, 32.0, 40.0, 67.0, 99.0, 138.0, 169.0, 145.0, 99.0, 67.0, 33.0, 31.0, 8.0, 10.0, 10.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2266.616943359375, -2194.469970703125, -2122.322998046875, -2050.176025390625, -1978.0291748046875, -1905.8822021484375, -1833.7353515625, -1761.58837890625, -1689.44140625, -1617.29443359375, -1545.1474609375, -1473.0006103515625, -1400.8536376953125, -1328.7066650390625, -1256.559814453125, -1184.412841796875, -1112.265869140625, -1040.118896484375, -967.9719848632812, -895.8250732421875, -823.6781005859375, -751.5311279296875, -679.3842163085938, -607.2373046875, -535.09033203125, -462.9433898925781, -390.79644775390625, -318.6495056152344, -246.5025634765625, -174.35562133789062, -102.20867919921875, -30.061737060546875, 42.085205078125, 114.23214721679688, 186.37908935546875, 258.5260314941406, 330.6729736328125, 402.8199157714844, 474.96685791015625, 547.11376953125, 619.2607421875, 691.40771484375, 763.5546264648438, 835.7015380859375, 907.8485107421875, 979.9954833984375, 1052.142333984375, 1124.289306640625, 1196.436279296875, 1268.583251953125, 1340.730224609375, 1412.8770751953125, 1485.0240478515625, 1557.1710205078125, 1629.31787109375, 1701.46484375, 1773.61181640625, 1845.7587890625, 1917.90576171875, 1990.0526123046875, 2062.19970703125, 2134.346435546875, 2206.493408203125, 2278.640380859375, 2350.787353515625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 5.0, 2.0, 4.0, 2.0, 8.0, 8.0, 7.0, 10.0, 8.0, 16.0, 12.0, 24.0, 16.0, 17.0, 25.0, 19.0, 22.0, 26.0, 31.0, 41.0, 50.0, 46.0, 42.0, 54.0, 37.0, 51.0, 43.0, 43.0, 37.0, 32.0, 36.0, 29.0, 28.0, 30.0, 21.0, 25.0, 20.0, 11.0, 12.0, 12.0, 10.0, 8.0, 9.0, 4.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-1103.2652587890625, -1070.904052734375, -1038.54296875, -1006.1817626953125, -973.820556640625, -941.4593505859375, -909.0982055664062, -876.737060546875, -844.3758544921875, -812.0146484375, -779.6535034179688, -747.2923583984375, -714.93115234375, -682.5699462890625, -650.2088012695312, -617.84765625, -585.4864501953125, -553.125244140625, -520.7640991210938, -488.4029235839844, -456.041748046875, -423.6805725097656, -391.31939697265625, -358.9582214355469, -326.5970458984375, -294.2358703613281, -261.87469482421875, -229.51351928710938, -197.15234375, -164.79116821289062, -132.42999267578125, -100.06881713867188, -67.7076416015625, -35.346466064453125, -2.98529052734375, 29.375885009765625, 61.737060546875, 94.09823608398438, 126.45941162109375, 158.82058715820312, 191.1817626953125, 223.54293823242188, 255.90411376953125, 288.2652893066406, 320.62646484375, 352.9876403808594, 385.34881591796875, 417.7099914550781, 450.0711669921875, 482.4323425292969, 514.7935180664062, 547.1546630859375, 579.515869140625, 611.8770751953125, 644.2382202148438, 676.599365234375, 708.9605712890625, 741.32177734375, 773.6829223632812, 806.0440673828125, 838.4052734375, 870.7664794921875, 903.1276245117188, 935.48876953125, 967.8499755859375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 10.0, 16.0, 16.0, 27.0, 25.0, 31.0, 47.0, 70.0, 104.0, 154.0, 258.0, 457.0, 765.0, 1356.0, 2606.0, 5341.0, 11515.0, 28246.0, 79388.0, 319286.0, 438819.0, 99121.0, 34393.0, 13667.0, 6168.0, 2956.0, 1486.0, 840.0, 505.0, 306.0, 209.0, 105.0, 67.0, 44.0, 33.0, 29.0, 19.0, 15.0, 15.0, 8.0, 9.0, 8.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-134.625, -130.6767578125, -126.728515625, -122.7802734375, -118.83203125, -114.8837890625, -110.935546875, -106.9873046875, -103.0390625, -99.0908203125, -95.142578125, -91.1943359375, -87.24609375, -83.2978515625, -79.349609375, -75.4013671875, -71.453125, -67.5048828125, -63.556640625, -59.6083984375, -55.66015625, -51.7119140625, -47.763671875, -43.8154296875, -39.8671875, -35.9189453125, -31.970703125, -28.0224609375, -24.07421875, -20.1259765625, -16.177734375, -12.2294921875, -8.28125, -4.3330078125, -0.384765625, 3.5634765625, 7.51171875, 11.4599609375, 15.408203125, 19.3564453125, 23.3046875, 27.2529296875, 31.201171875, 35.1494140625, 39.09765625, 43.0458984375, 46.994140625, 50.9423828125, 54.890625, 58.8388671875, 62.787109375, 66.7353515625, 70.68359375, 74.6318359375, 78.580078125, 82.5283203125, 86.4765625, 90.4248046875, 94.373046875, 98.3212890625, 102.26953125, 106.2177734375, 110.166015625, 114.1142578125, 118.0625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 6.0, 12.0, 14.0, 9.0, 26.0, 35.0, 47.0, 50.0, 54.0, 76.0, 76.0, 81.0, 83.0, 85.0, 79.0, 67.0, 39.0, 40.0, 35.0, 22.0, 13.0, 14.0, 15.0, 3.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-212.75, -207.6630859375, -202.576171875, -197.4892578125, -192.40234375, -187.3154296875, -182.228515625, -177.1416015625, -172.0546875, -166.9677734375, -161.880859375, -156.7939453125, -151.70703125, -146.6201171875, -141.533203125, -136.4462890625, -131.359375, -126.2724609375, -121.185546875, -116.0986328125, -111.01171875, -105.9248046875, -100.837890625, -95.7509765625, -90.6640625, -85.5771484375, -80.490234375, -75.4033203125, -70.31640625, -65.2294921875, -60.142578125, -55.0556640625, -49.96875, -44.8818359375, -39.794921875, -34.7080078125, -29.62109375, -24.5341796875, -19.447265625, -14.3603515625, -9.2734375, -4.1865234375, 0.900390625, 5.9873046875, 11.07421875, 16.1611328125, 21.248046875, 26.3349609375, 31.421875, 36.5087890625, 41.595703125, 46.6826171875, 51.76953125, 56.8564453125, 61.943359375, 67.0302734375, 72.1171875, 77.2041015625, 82.291015625, 87.3779296875, 92.46484375, 97.5517578125, 102.638671875, 107.7255859375, 112.8125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 4.0, 5.0, 10.0, 9.0, 17.0, 32.0, 35.0, 56.0, 112.0, 206.0, 388.0, 806.0, 2227.0, 8347.0, 75714.0, 919307.0, 33382.0, 5256.0, 1452.0, 560.0, 278.0, 147.0, 82.0, 37.0, 22.0, 23.0, 13.0, 11.0, 4.0, 4.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-377.5, -367.65625, -357.8125, -347.96875, -338.125, -328.28125, -318.4375, -308.59375, -298.75, -288.90625, -279.0625, -269.21875, -259.375, -249.53125, -239.6875, -229.84375, -220.0, -210.15625, -200.3125, -190.46875, -180.625, -170.78125, -160.9375, -151.09375, -141.25, -131.40625, -121.5625, -111.71875, -101.875, -92.03125, -82.1875, -72.34375, -62.5, -52.65625, -42.8125, -32.96875, -23.125, -13.28125, -3.4375, 6.40625, 16.25, 26.09375, 35.9375, 45.78125, 55.625, 65.46875, 75.3125, 85.15625, 95.0, 104.84375, 114.6875, 124.53125, 134.375, 144.21875, 154.0625, 163.90625, 173.75, 183.59375, 193.4375, 203.28125, 213.125, 222.96875, 232.8125, 242.65625, 252.5]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 6.0, 3.0, 8.0, 13.0, 16.0, 10.0, 14.0, 24.0, 28.0, 45.0, 56.0, 60.0, 89.0, 110.0, 94.0, 95.0, 65.0, 46.0, 35.0, 28.0, 24.0, 19.0, 19.0, 16.0, 12.0, 13.0, 10.0, 8.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-627.0, -609.09375, -591.1875, -573.28125, -555.375, -537.46875, -519.5625, -501.65625, -483.75, -465.84375, -447.9375, -430.03125, -412.125, -394.21875, -376.3125, -358.40625, -340.5, -322.59375, -304.6875, -286.78125, -268.875, -250.96875, -233.0625, -215.15625, -197.25, -179.34375, -161.4375, -143.53125, -125.625, -107.71875, -89.8125, -71.90625, -54.0, -36.09375, -18.1875, -0.28125, 17.625, 35.53125, 53.4375, 71.34375, 89.25, 107.15625, 125.0625, 142.96875, 160.875, 178.78125, 196.6875, 214.59375, 232.5, 250.40625, 268.3125, 286.21875, 304.125, 322.03125, 339.9375, 357.84375, 375.75, 393.65625, 411.5625, 429.46875, 447.375, 465.28125, 483.1875, 501.09375, 519.0]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 6.0, 8.0, 16.0, 26.0, 33.0, 30.0, 78.0, 118.0, 140.0, 238.0, 369.0, 525.0, 940.0, 1736.0, 3098.0, 6532.0, 14557.0, 36848.0, 125883.0, 731061.0, 78087.0, 26233.0, 11096.0, 4959.0, 2580.0, 1295.0, 757.0, 448.0, 314.0, 142.0, 105.0, 83.0, 57.0, 39.0, 36.0, 27.0, 16.0, 10.0, 10.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-32.65625, -31.73193359375, -30.8076171875, -29.88330078125, -28.958984375, -28.03466796875, -27.1103515625, -26.18603515625, -25.26171875, -24.33740234375, -23.4130859375, -22.48876953125, -21.564453125, -20.64013671875, -19.7158203125, -18.79150390625, -17.8671875, -16.94287109375, -16.0185546875, -15.09423828125, -14.169921875, -13.24560546875, -12.3212890625, -11.39697265625, -10.47265625, -9.54833984375, -8.6240234375, -7.69970703125, -6.775390625, -5.85107421875, -4.9267578125, -4.00244140625, -3.078125, -2.15380859375, -1.2294921875, -0.30517578125, 0.619140625, 1.54345703125, 2.4677734375, 3.39208984375, 4.31640625, 5.24072265625, 6.1650390625, 7.08935546875, 8.013671875, 8.93798828125, 9.8623046875, 10.78662109375, 11.7109375, 12.63525390625, 13.5595703125, 14.48388671875, 15.408203125, 16.33251953125, 17.2568359375, 18.18115234375, 19.10546875, 20.02978515625, 20.9541015625, 21.87841796875, 22.802734375, 23.72705078125, 24.6513671875, 25.57568359375, 26.5]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 10.0, 9.0, 16.0, 11.0, 17.0, 30.0, 32.0, 54.0, 60.0, 100.0, 102.0, 110.0, 114.0, 75.0, 45.0, 24.0, 18.0, 20.0, 23.0, 28.0, 10.0, 13.0, 6.0, 11.0, 6.0, 8.0, 2.0, 5.0, 9.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0151824951171875, -0.014662981033325195, -0.01414346694946289, -0.013623952865600586, -0.013104438781738281, -0.012584924697875977, -0.012065410614013672, -0.011545896530151367, -0.011026382446289062, -0.010506868362426758, -0.009987354278564453, -0.009467840194702148, -0.008948326110839844, -0.008428812026977539, -0.007909297943115234, -0.00738978385925293, -0.006870269775390625, -0.00635075569152832, -0.005831241607666016, -0.005311727523803711, -0.004792213439941406, -0.0042726993560791016, -0.003753185272216797, -0.003233671188354492, -0.0027141571044921875, -0.002194643020629883, -0.0016751289367675781, -0.0011556148529052734, -0.0006361007690429688, -0.00011658668518066406, 0.0004029273986816406, 0.0009224414825439453, 0.00144195556640625, 0.0019614696502685547, 0.0024809837341308594, 0.003000497817993164, 0.0035200119018554688, 0.0040395259857177734, 0.004559040069580078, 0.005078554153442383, 0.0055980682373046875, 0.006117582321166992, 0.006637096405029297, 0.0071566104888916016, 0.007676124572753906, 0.008195638656616211, 0.008715152740478516, 0.00923466682434082, 0.009754180908203125, 0.01027369499206543, 0.010793209075927734, 0.011312723159790039, 0.011832237243652344, 0.012351751327514648, 0.012871265411376953, 0.013390779495239258, 0.013910293579101562, 0.014429807662963867, 0.014949321746826172, 0.015468835830688477, 0.01598834991455078, 0.016507863998413086, 0.01702737808227539, 0.017546892166137695, 0.01806640625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 0.0, 8.0, 4.0, 6.0, 7.0, 10.0, 23.0, 32.0, 33.0, 45.0, 72.0, 105.0, 126.0, 184.0, 328.0, 541.0, 866.0, 1414.0, 2353.0, 4595.0, 9504.0, 21076.0, 58059.0, 628716.0, 239931.0, 45726.0, 17461.0, 8073.0, 4024.0, 2032.0, 1185.0, 673.0, 481.0, 277.0, 181.0, 122.0, 63.0, 49.0, 36.0, 44.0, 20.0, 21.0, 10.0, 10.0, 6.0, 7.0, 7.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-25.796875, -24.9619140625, -24.126953125, -23.2919921875, -22.45703125, -21.6220703125, -20.787109375, -19.9521484375, -19.1171875, -18.2822265625, -17.447265625, -16.6123046875, -15.77734375, -14.9423828125, -14.107421875, -13.2724609375, -12.4375, -11.6025390625, -10.767578125, -9.9326171875, -9.09765625, -8.2626953125, -7.427734375, -6.5927734375, -5.7578125, -4.9228515625, -4.087890625, -3.2529296875, -2.41796875, -1.5830078125, -0.748046875, 0.0869140625, 0.921875, 1.7568359375, 2.591796875, 3.4267578125, 4.26171875, 5.0966796875, 5.931640625, 6.7666015625, 7.6015625, 8.4365234375, 9.271484375, 10.1064453125, 10.94140625, 11.7763671875, 12.611328125, 13.4462890625, 14.28125, 15.1162109375, 15.951171875, 16.7861328125, 17.62109375, 18.4560546875, 19.291015625, 20.1259765625, 20.9609375, 21.7958984375, 22.630859375, 23.4658203125, 24.30078125, 25.1357421875, 25.970703125, 26.8056640625, 27.640625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 5.0, 1.0, 3.0, 6.0, 6.0, 4.0, 13.0, 9.0, 5.0, 13.0, 8.0, 20.0, 25.0, 8.0, 36.0, 32.0, 29.0, 65.0, 60.0, 76.0, 75.0, 83.0, 72.0, 55.0, 59.0, 43.0, 27.0, 19.0, 21.0, 22.0, 13.0, 21.0, 4.0, 5.0, 11.0, 4.0, 7.0, 8.0, 2.0, 4.0, 6.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0], "bins": [-53.28125, -51.8720703125, -50.462890625, -49.0537109375, -47.64453125, -46.2353515625, -44.826171875, -43.4169921875, -42.0078125, -40.5986328125, -39.189453125, -37.7802734375, -36.37109375, -34.9619140625, -33.552734375, -32.1435546875, -30.734375, -29.3251953125, -27.916015625, -26.5068359375, -25.09765625, -23.6884765625, -22.279296875, -20.8701171875, -19.4609375, -18.0517578125, -16.642578125, -15.2333984375, -13.82421875, -12.4150390625, -11.005859375, -9.5966796875, -8.1875, -6.7783203125, -5.369140625, -3.9599609375, -2.55078125, -1.1416015625, 0.267578125, 1.6767578125, 3.0859375, 4.4951171875, 5.904296875, 7.3134765625, 8.72265625, 10.1318359375, 11.541015625, 12.9501953125, 14.359375, 15.7685546875, 17.177734375, 18.5869140625, 19.99609375, 21.4052734375, 22.814453125, 24.2236328125, 25.6328125, 27.0419921875, 28.451171875, 29.8603515625, 31.26953125, 32.6787109375, 34.087890625, 35.4970703125, 36.90625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 14.0, 21.0, 64.0, 132.0, 566.0, 121.0, 43.0, 18.0, 8.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3842.87158203125, -3745.427734375, -3647.983642578125, -3550.53955078125, -3453.095703125, -3355.65185546875, -3258.207763671875, -3160.763671875, -3063.31982421875, -2965.8759765625, -2868.431884765625, -2770.98779296875, -2673.5439453125, -2576.10009765625, -2478.656005859375, -2381.2119140625, -2283.76806640625, -2186.32421875, -2088.880126953125, -1991.4361572265625, -1893.9921875, -1796.5482177734375, -1699.104248046875, -1601.6602783203125, -1504.21630859375, -1406.7723388671875, -1309.328369140625, -1211.8843994140625, -1114.4404296875, -1016.9964599609375, -919.552490234375, -822.1085205078125, -724.664794921875, -627.2208251953125, -529.77685546875, -432.3328857421875, -334.888916015625, -237.4449462890625, -140.0009765625, -42.5570068359375, 54.886962890625, 152.3309326171875, 249.77490234375, 347.2188720703125, 444.662841796875, 542.1068115234375, 639.55078125, 736.9947509765625, 834.438720703125, 931.8826904296875, 1029.32666015625, 1126.7706298828125, 1224.214599609375, 1321.6585693359375, 1419.1025390625, 1516.5465087890625, 1613.990478515625, 1711.4344482421875, 1808.87841796875, 1906.3223876953125, 2003.766357421875, 2101.21044921875, 2198.654296875, 2296.09814453125, 2393.542236328125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 6.0, 3.0, 11.0, 6.0, 10.0, 8.0, 14.0, 11.0, 18.0, 25.0, 22.0, 22.0, 22.0, 24.0, 33.0, 42.0, 101.0, 224.0, 131.0, 39.0, 28.0, 28.0, 24.0, 17.0, 16.0, 16.0, 15.0, 8.0, 22.0, 9.0, 4.0, 6.0, 5.0, 13.0, 3.0, 8.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1208.075927734375, -1169.9229736328125, -1131.77001953125, -1093.6170654296875, -1055.464111328125, -1017.3110961914062, -979.1581420898438, -941.005126953125, -902.8521728515625, -864.69921875, -826.5462646484375, -788.393310546875, -750.2402954101562, -712.0873413085938, -673.9343872070312, -635.7813720703125, -597.6284790039062, -559.4755249023438, -521.3225708007812, -483.1695861816406, -445.0166015625, -406.8636474609375, -368.710693359375, -330.5577087402344, -292.4047546386719, -254.2517852783203, -216.09881591796875, -177.94586181640625, -139.7928924560547, -101.63992309570312, -63.486968994140625, -25.333984375, 12.8189697265625, 50.9719352722168, 89.1249008178711, 127.27786254882812, 165.4308319091797, 203.58380126953125, 241.73675537109375, 279.8897399902344, 318.0426940917969, 356.1956481933594, 394.3486328125, 432.5015869140625, 470.654541015625, 508.8075256347656, 546.96044921875, 585.1134643554688, 623.2664184570312, 661.4193725585938, 699.5723266601562, 737.725341796875, 775.8782958984375, 814.03125, 852.1842041015625, 890.337158203125, 928.4901123046875, 966.64306640625, 1004.7960205078125, 1042.948974609375, 1081.1019287109375, 1119.2548828125, 1157.407958984375, 1195.5609130859375, 1233.7138671875]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 11.0, 12.0, 14.0, 11.0, 22.0, 14.0, 20.0, 21.0, 24.0, 28.0, 34.0, 45.0, 62.0, 141.0, 155.0, 65.0, 45.0, 41.0, 25.0, 34.0, 22.0, 21.0, 29.0, 17.0, 22.0, 10.0, 7.0, 9.0, 7.0, 4.0, 5.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-128.0, -124.71875, -121.4375, -118.15625, -114.875, -111.59375, -108.3125, -105.03125, -101.75, -98.46875, -95.1875, -91.90625, -88.625, -85.34375, -82.0625, -78.78125, -75.5, -72.21875, -68.9375, -65.65625, -62.375, -59.09375, -55.8125, -52.53125, -49.25, -45.96875, -42.6875, -39.40625, -36.125, -32.84375, -29.5625, -26.28125, -23.0, -19.71875, -16.4375, -13.15625, -9.875, -6.59375, -3.3125, -0.03125, 3.25, 6.53125, 9.8125, 13.09375, 16.375, 19.65625, 22.9375, 26.21875, 29.5, 32.78125, 36.0625, 39.34375, 42.625, 45.90625, 49.1875, 52.46875, 55.75, 59.03125, 62.3125, 65.59375, 68.875, 72.15625, 75.4375, 78.71875, 82.0]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 2.0, 4.0, 16.0, 18.0, 24.0, 34.0, 46.0, 44.0, 61.0, 163.0, 252.0, 621.0, 1768.0, 7060.0, 399539.0, 7967438.0, 8207.0, 1950.0, 641.0, 266.0, 141.0, 94.0, 40.0, 46.0, 26.0, 17.0, 7.0, 7.0, 15.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-734.0562744140625, -713.1082763671875, -692.1602172851562, -671.212158203125, -650.26416015625, -629.316162109375, -608.3681030273438, -587.4200439453125, -566.4720458984375, -545.5240478515625, -524.5759887695312, -503.6279602050781, -482.679931640625, -461.7319030761719, -440.78387451171875, -419.8358459472656, -398.8878173828125, -377.9397888183594, -356.99176025390625, -336.0437316894531, -315.095703125, -294.1476745605469, -273.19964599609375, -252.25161743164062, -231.3035888671875, -210.35556030273438, -189.40753173828125, -168.45950317382812, -147.511474609375, -126.56344604492188, -105.61541748046875, -84.66738891601562, -63.7193603515625, -42.771331787109375, -21.82330322265625, -0.875274658203125, 20.07275390625, 41.020782470703125, 61.96881103515625, 82.91683959960938, 103.8648681640625, 124.81289672851562, 145.76092529296875, 166.70895385742188, 187.656982421875, 208.60501098632812, 229.55303955078125, 250.50106811523438, 271.4490966796875, 292.3971252441406, 313.34515380859375, 334.2931823730469, 355.2412109375, 376.1892395019531, 397.13726806640625, 418.0852966308594, 439.0333251953125, 459.9813537597656, 480.92938232421875, 501.8774108886719, 522.825439453125, 543.7734375, 564.7214965820312, 585.6695556640625, 606.6175537109375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 6.0, 8.0, 5.0, 4.0, 2.0, 5.0, 3.0, 7.0, 2.0, 6.0, 3.0, 4.0, 4.0, 1.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-653.5410766601562, -628.9877319335938, -604.434326171875, -579.8809814453125, -555.3275756835938, -530.7742309570312, -506.2208557128906, -481.66748046875, -457.1141052246094, -432.56072998046875, -408.0073547363281, -383.4539794921875, -358.900634765625, -334.34722900390625, -309.79388427734375, -285.2405090332031, -260.6871337890625, -236.13375854492188, -211.58038330078125, -187.0270233154297, -162.47364807128906, -137.92027282714844, -113.36691284179688, -88.81353759765625, -64.26016235351562, -39.706790924072266, -15.153419494628906, 9.399948120117188, 33.95332336425781, 58.50669860839844, 83.06005859375, 107.61343383789062, 132.166748046875, 156.72012329101562, 181.27349853515625, 205.8268585205078, 230.38023376464844, 254.93360900878906, 279.4869689941406, 304.04034423828125, 328.5937194824219, 353.1470947265625, 377.7004699707031, 402.25384521484375, 426.80718994140625, 451.360595703125, 475.9139404296875, 500.4673156738281, 525.0206909179688, 549.5740356445312, 574.12744140625, 598.6807861328125, 623.2341918945312, 647.7875366210938, 672.3409423828125, 696.894287109375, 721.4476318359375, 746.0009765625, 770.5543823242188, 795.1077270507812, 819.6611328125, 844.2144775390625, 868.767822265625, 893.3212280273438, 917.8746337890625]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 8.0, 6.0, 10.0, 11.0, 32.0, 25.0, 33.0, 46.0, 56.0, 57.0, 58.0, 60.0, 53.0, 69.0, 61.0, 69.0, 51.0, 65.0, 50.0, 32.0, 36.0, 23.0, 24.0, 17.0, 9.0, 6.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-103.1875, -100.443359375, -97.69921875, -94.955078125, -92.2109375, -89.466796875, -86.72265625, -83.978515625, -81.234375, -78.490234375, -75.74609375, -73.001953125, -70.2578125, -67.513671875, -64.76953125, -62.025390625, -59.28125, -56.537109375, -53.79296875, -51.048828125, -48.3046875, -45.560546875, -42.81640625, -40.072265625, -37.328125, -34.583984375, -31.83984375, -29.095703125, -26.3515625, -23.607421875, -20.86328125, -18.119140625, -15.375, -12.630859375, -9.88671875, -7.142578125, -4.3984375, -1.654296875, 1.08984375, 3.833984375, 6.578125, 9.322265625, 12.06640625, 14.810546875, 17.5546875, 20.298828125, 23.04296875, 25.787109375, 28.53125, 31.275390625, 34.01953125, 36.763671875, 39.5078125, 42.251953125, 44.99609375, 47.740234375, 50.484375, 53.228515625, 55.97265625, 58.716796875, 61.4609375, 64.205078125, 66.94921875, 69.693359375, 72.4375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 13.0, 13.0, 29.0, 36.0, 58.0, 111.0, 197.0, 379.0, 885.0, 1997.0, 5121.0, 14731.0, 46749.0, 157176.0, 199396.0, 65588.0, 19744.0, 7078.0, 2651.0, 1068.0, 579.0, 279.0, 162.0, 82.0, 54.0, 21.0, 17.0, 14.0, 7.0, 9.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-595.0, -574.578125, -554.15625, -533.734375, -513.3125, -492.890625, -472.46875, -452.046875, -431.625, -411.203125, -390.78125, -370.359375, -349.9375, -329.515625, -309.09375, -288.671875, -268.25, -247.828125, -227.40625, -206.984375, -186.5625, -166.140625, -145.71875, -125.296875, -104.875, -84.453125, -64.03125, -43.609375, -23.1875, -2.765625, 17.65625, 38.078125, 58.5, 78.921875, 99.34375, 119.765625, 140.1875, 160.609375, 181.03125, 201.453125, 221.875, 242.296875, 262.71875, 283.140625, 303.5625, 323.984375, 344.40625, 364.828125, 385.25, 405.671875, 426.09375, 446.515625, 466.9375, 487.359375, 507.78125, 528.203125, 548.625, 569.046875, 589.46875, 609.890625, 630.3125, 650.734375, 671.15625, 691.578125, 712.0]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 5.0, 3.0, 6.0, 6.0, 4.0, 10.0, 11.0, 14.0, 11.0, 18.0, 16.0, 23.0, 26.0, 51.0, 46.0, 40.0, 48.0, 49.0, 37.0, 49.0, 53.0, 57.0, 54.0, 47.0, 36.0, 42.0, 42.0, 34.0, 26.0, 25.0, 17.0, 14.0, 17.0, 17.0, 10.0, 6.0, 4.0, 12.0, 6.0, 4.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-83.1875, -80.6728515625, -78.158203125, -75.6435546875, -73.12890625, -70.6142578125, -68.099609375, -65.5849609375, -63.0703125, -60.5556640625, -58.041015625, -55.5263671875, -53.01171875, -50.4970703125, -47.982421875, -45.4677734375, -42.953125, -40.4384765625, -37.923828125, -35.4091796875, -32.89453125, -30.3798828125, -27.865234375, -25.3505859375, -22.8359375, -20.3212890625, -17.806640625, -15.2919921875, -12.77734375, -10.2626953125, -7.748046875, -5.2333984375, -2.71875, -0.2041015625, 2.310546875, 4.8251953125, 7.33984375, 9.8544921875, 12.369140625, 14.8837890625, 17.3984375, 19.9130859375, 22.427734375, 24.9423828125, 27.45703125, 29.9716796875, 32.486328125, 35.0009765625, 37.515625, 40.0302734375, 42.544921875, 45.0595703125, 47.57421875, 50.0888671875, 52.603515625, 55.1181640625, 57.6328125, 60.1474609375, 62.662109375, 65.1767578125, 67.69140625, 70.2060546875, 72.720703125, 75.2353515625, 77.75]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 2.0, 3.0, 6.0, 1.0, 5.0, 9.0, 20.0, 45.0, 53.0, 75.0, 69.0, 70.0, 32.0, 31.0, 13.0, 8.0, 6.0, 4.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-642.891845703125, -625.7798461914062, -608.6679077148438, -591.555908203125, -574.4439086914062, -557.3319091796875, -540.219970703125, -523.1079711914062, -505.9959716796875, -488.8840026855469, -471.7720031738281, -454.6600341796875, -437.54803466796875, -420.4360656738281, -403.3240966796875, -386.21209716796875, -369.1001281738281, -351.9881591796875, -334.87615966796875, -317.7641906738281, -300.6521911621094, -283.54022216796875, -266.42822265625, -249.31625366210938, -232.2042694091797, -215.09228515625, -197.9803009033203, -180.86831665039062, -163.75634765625, -146.64434814453125, -129.53237915039062, -112.42039489746094, -95.30838012695312, -78.19639587402344, -61.084415435791016, -43.972434997558594, -26.860450744628906, -9.748466491699219, 7.3635101318359375, 24.475494384765625, 41.58747863769531, 58.699462890625, 75.81144714355469, 92.92342376708984, 110.03540802001953, 127.14739227294922, 144.25936889648438, 161.37135314941406, 178.48333740234375, 195.59532165527344, 212.70730590820312, 229.81927490234375, 246.9312744140625, 264.0432434082031, 281.15521240234375, 298.2672119140625, 315.37921142578125, 332.4911804199219, 349.6031799316406, 366.71514892578125, 383.8271484375, 400.9391174316406, 418.05108642578125, 435.1630859375, 452.2750549316406]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 4.0, 5.0, 1.0, 8.0, 2.0, 0.0, 5.0, 5.0, 4.0, 4.0, 4.0, 8.0, 10.0, 20.0, 52.0, 59.0, 80.0, 79.0, 37.0, 23.0, 16.0, 16.0, 11.0, 2.0, 3.0, 5.0, 1.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-445.65655517578125, -431.13250732421875, -416.6084289550781, -402.0843811035156, -387.5603332519531, -373.0362548828125, -358.51220703125, -343.9881591796875, -329.464111328125, -314.9400634765625, -300.4159851074219, -285.8919372558594, -271.3678894042969, -256.84381103515625, -242.31976318359375, -227.79571533203125, -213.27163696289062, -198.74757385253906, -184.22352600097656, -169.699462890625, -155.1754150390625, -140.65135192871094, -126.12728881835938, -111.60323333740234, -97.07917785644531, -82.55512237548828, -68.03106689453125, -53.50700378417969, -38.982948303222656, -24.458892822265625, -9.934829711914062, 4.589225769042969, 19.11328125, 33.63733673095703, 48.16139602661133, 62.685455322265625, 77.20951080322266, 91.73356628417969, 106.25762939453125, 120.78168487548828, 135.3057403564453, 149.82980346679688, 164.35385131835938, 178.87791442871094, 193.4019775390625, 207.926025390625, 222.45008850097656, 236.97415161132812, 251.49819946289062, 266.0222473144531, 280.54632568359375, 295.07037353515625, 309.59442138671875, 324.11846923828125, 338.6425476074219, 353.1665954589844, 367.690673828125, 382.2147216796875, 396.7388000488281, 411.2628479003906, 425.7868957519531, 440.31097412109375, 454.83502197265625, 469.35906982421875, 483.88311767578125]}, "eval/loss": 0.7146373391151428, "eval/wer": 0.09962316541055137, "eval/runtime": 901.9992, "eval/samples_per_second": 2.929, "eval/steps_per_second": 0.367, "train/train_runtime": 35320.0928, "train/train_samples_per_second": 20.2, "train/train_steps_per_second": 0.631, "train/total_flos": 0.0, "train/train_loss": 0.08645637407097047} \ No newline at end of file